Skip to content

Commit f5d1740

Browse files
[Bugfix] Add OOT backend option (vllm-project#32471)
Signed-off-by: Iryna Boiko <[email protected]>
1 parent eebc58d commit f5d1740

File tree

1 file changed

+4
-0
lines changed

1 file changed

+4
-0
lines changed

vllm/model_executor/layers/fused_moe/oracle/unquantized.py

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -33,6 +33,7 @@ class UnquantizedMoeBackend(Enum):
     CPU = "CPU"
     XPU = "XPU"
     TPU = "TPU"
+    OOT = "OOT"
 
 
 # NOTE(zyongye): Unsupported backend means backend
@@ -42,6 +43,7 @@ class UnquantizedMoeBackend(Enum):
     UnquantizedMoeBackend.CPU,
     UnquantizedMoeBackend.XPU,
     UnquantizedMoeBackend.TPU,
+    UnquantizedMoeBackend.OOT,
 ]
 
 
@@ -95,6 +97,8 @@ def _make_log_backend(backend: UnquantizedMoeBackend):
         backend = UnquantizedMoeBackend.CPU
     if current_platform.is_tpu():
         backend = UnquantizedMoeBackend.TPU
+    if current_platform.is_out_of_tree():
+        backend = UnquantizedMoeBackend.OOT
 
     logger.info_once(_make_log_backend(backend), scope="local")
     return backend

0 commit comments

Comments
 (0)