2 files changed: +6 -1 lines changed

Original file line number | Diff line number | Diff line change
30 30           from aiter import flash_attn_func, flash_attn_varlen_func  # noqa: F401
31 31       except (ImportError, ModuleNotFoundError):
32 32           pass
   33 + elif current_omni_platform.is_xpu():
   34 +     try:
   35 +         from vllm.v1.attention.backends.fa_utils import flash_attn_varlen_func  # noqa: F401
   36 +     except (ImportError, ModuleNotFoundError):
   37 +         pass
33 38   else:
34 39       # CUDA: try FA3 -> FA2 fallback chain
35 40       # Try FA3 from fa3-fwd PyPI package
Original file line number | Diff line number | Diff line change
30 30   from vllm.model_executor.layers.vocab_parallel_embedding import VocabParallelEmbedding
31 31   from vllm.model_executor.model_loader.weight_utils import default_weight_loader
32 32   from vllm.transformers_utils.configs.bagel import BagelConfig
33    - from vllm.vllm_flash_attn import flash_attn_varlen_func
34 33
   34 + from vllm_omni.diffusion.attention.backends.utils.fa import flash_attn_varlen_func
35 35   from vllm_omni.diffusion.layers.rope import RotaryEmbedding
36 36
37 37
You can’t perform that action at this time.
0 commit comments