Skip to content

Commit 1c4ab1a

Browse files
[python] offload setting block size to neuron (#2705)
1 parent 950dc7b commit 1c4ab1a

File tree

1 file changed

+0
-3
lines changed

1 file changed

+0
-3
lines changed

engines/python/setup/djl_python/properties_manager/vllm_rb_properties.py

Lines changed: 0 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -187,9 +187,6 @@ def generate_vllm_engine_arg_dict(self,
187 187           if self.max_rolling_batch_prefill_tokens is not None:
188 188               vllm_engine_args[
189 189                   'max_num_batched_tokens'] = self.max_rolling_batch_prefill_tokens
190     -         if self.device == 'neuron':
191     -             vllm_engine_args['block_size'] = passthrough_vllm_engine_args.get(
192     -                 "max_model_len")
193 190           vllm_engine_args.update(passthrough_vllm_engine_args)
194 191           return vllm_engine_args
195 192

0 commit comments

Comments
 (0)