We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 5dd80d3, commit 81ce2a4 (Copy full SHA for 81ce2a4)
vllm/model_executor/models/mixtral.py
@@ -251,7 +251,7 @@ def sparse_transpose(
251
return column_indices_t, offsets_t, block_offsets_t
252
253
def topology(self, x: torch.Tensor,
254
- padded_bins: torch.Tensor) -> stk.Matrix:
+ padded_bins: torch.Tensor) -> "stk.Matrix":
255
padded_tokens, _ = x.size()
256
assert padded_tokens % self.blocking == 0
257
assert self.ffn_dim_per_partition % self.blocking == 0
0 commit comments