Skip to content

Commit 57f560a

Browse files
authored
[BugFix] Use args.trust_remote_code (#7121)
1 parent 003f8ee commit 57f560a

File tree

1 file changed

+3
-3
lines changed

1 file changed

+3
-3
lines changed

vllm/entrypoints/openai/api_server.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -60,11 +60,11 @@
6060
_running_tasks: Set[asyncio.Task] = set()
6161

6262

63-
def model_is_embedding(model_name: str) -> bool:
63+
def model_is_embedding(model_name: str, trust_remote_code: bool) -> bool:
6464
return ModelConfig(model=model_name,
6565
tokenizer=model_name,
6666
tokenizer_mode="auto",
67-
trust_remote_code=False,
67+
trust_remote_code=trust_remote_code,
6868
seed=0,
6969
dtype="float16").embedding_mode
7070

@@ -97,7 +97,7 @@ async def build_async_engine_client(args) -> AsyncIterator[AsyncEngineClient]:
9797

9898
# If manually triggered or embedding model, use AsyncLLMEngine in process.
9999
# TODO: support embedding model via RPC.
100-
if (model_is_embedding(args.model)
100+
if (model_is_embedding(args.model, args.trust_remote_code)
101101
or args.disable_frontend_multiprocessing):
102102
async_engine_client = AsyncLLMEngine.from_engine_args(
103103
engine_args, usage_context=UsageContext.OPENAI_API_SERVER)

0 commit comments

Comments
 (0)