Skip to content
This repository was archived by the owner on Sep 4, 2025. It is now read-only.

Commit 1e44f5e

Browse files
committed
grpc_server: fix tokenizer group usage
1 parent 926c25c commit 1e44f5e

File tree

1 file changed

+5
-2
lines changed

1 file changed

+5
-2
lines changed

vllm/entrypoints/grpc/grpc_server.py

Lines changed: 5 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -92,7 +92,6 @@ def __init__(self, engine: AsyncLLMEngine, args: argparse.Namespace):
         self.engine: AsyncLLMEngine = engine
 
         # These set in _post_init()
-        self.tokenizer_group: BaseTokenizerGroup = None
         self.tokenizer: Union[PreTrainedTokenizer,
                               PreTrainedTokenizerFast] = None
         self.config: ModelConfig = None
@@ -101,9 +100,13 @@ def __init__(self, engine: AsyncLLMEngine, args: argparse.Namespace):
         self.skip_special_tokens = not args.output_special_tokens
         self.default_include_stop_seqs = args.default_include_stop_seqs
 
+    @property
+    def tokenizer_group(self) -> BaseTokenizerGroup:
+        return self.engine.engine
+
+
     async def _post_init(self):
         self.config = await self.engine.get_model_config()
-        self.tokenizer_group = await self.engine.get_tokenizer_group()
         self.tokenizer = await self.engine.get_tokenizer()
 
         # Swap in the special TGIS stats logger

0 commit comments

Comments
 (0)