Skip to content

Commit ad6eca4

Browse files
leiwen83 and wenlei03 authored
Fix early CUDA init via get_architecture_class_name import (#3770)
Signed-off-by: Lei Wen <[email protected]> Co-authored-by: Lei Wen <[email protected]>
1 parent 205b949 commit ad6eca4

File tree

1 file changed

+2 -1 lines changed (2 additions, 1 deletion)

1 file changed

+2 -1 lines changed (2 additions, 1 deletion)

vllm/engine/llm_engine.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -13,7 +13,6 @@
 from vllm.executor.executor_base import ExecutorBase
 from vllm.logger import init_logger
 from vllm.lora.request import LoRARequest
-from vllm.model_executor.model_loader import get_architecture_class_name
 from vllm.outputs import RequestOutput
 from vllm.sampling_params import SamplingParams
 from vllm.sequence import (MultiModalData, SamplerOutput, Sequence,
@@ -115,6 +114,8 @@ def __init__(
 
         # If usage stat is enabled, collect relevant info.
         if is_usage_stats_enabled():
+            from vllm.model_executor.model_loader import (
+                get_architecture_class_name)
             usage_message.report_usage(
                 get_architecture_class_name(model_config),
                 usage_context,

0 commit comments

Comments
 (0)