We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 41f17bf, commit 4d7c1d5 (Copy full SHA for 4d7c1d5)
vllm/model_executor/layers/rotary_embedding/mrope.py
@@ -300,6 +300,15 @@ def forward_cuda(
300
key = torch.cat((key_rot, key_pass), dim=-1).reshape(key_shape)
301
return query, key
302
303
def forward_xpu(
    self,
    positions: torch.Tensor,
    query: torch.Tensor,
    key: Optional[torch.Tensor] = None,
    offsets: Optional[torch.Tensor] = None,
) -> tuple[torch.Tensor, Optional[torch.Tensor]]:
    """Run the rotary embedding for the XPU path via ``forward_native``.

    This method contains no logic of its own: all four arguments are
    forwarded positionally, unchanged, to ``self.forward_native`` and
    whatever that call returns is handed back to the caller.

    NOTE(review): the method name suggests this is the XPU-specific
    entry point; how it is selected is not visible here -- confirm
    against the enclosing class.

    Args:
        positions: Passed through as the first argument.
        query: Passed through as the second argument.
        key: Optional; passed through as the third argument.
        offsets: Optional; passed through as the fourth argument.

    Returns:
        The result of ``self.forward_native(positions, query, key,
        offsets)``, annotated as a ``(query, key)`` tuple.
    """
    native_result = self.forward_native(positions, query, key, offsets)
    return native_result
311
+
312
def forward_cpu(
313
self,
314
positions: torch.Tensor,
0 commit comments