We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 25e4e87, commit 93ee1c5. Copy full SHA for 93ee1c5
vllm/model_executor/layers/utils.py
@@ -110,7 +110,10 @@ def rocm_unquantized_gemm_impl(
110
from vllm.platforms.rocm import on_gfx9
111
k = weight.shape[1]
112
m = weight.shape[0]
113
- x_view = x.view(-1, x.size(-1))
+ if x.is_contiguous():
114
+ x_view = x.view(-1, x.size(-1))
115
+ else:
116
+ x_view = x.reshape(-1, x.size(-1))
117
n = x_view.shape[0]
118
use_skinny = (envs.VLLM_ROCM_USE_SKINNY_GEMM and on_gfx9() and \
119
x.dtype in [torch.float16, torch.bfloat16] \
0 commit comments