File tree Expand file tree Collapse file tree 3 files changed +2
-7
lines changed Expand file tree Collapse file tree 3 files changed +2
-7
lines changed Original file line number Diff line number Diff line change @@ -28,7 +28,7 @@ COPY ./requirements-neuron.txt /app/vllm/requirements-neuron.txt
28
28
RUN cd /app/vllm \
29
29
&& python3 -m pip install -U -r requirements-neuron.txt
30
30
31
- ENV VLLM_BUILD_WITH_NEURON 1
31
+ ENV VLLM_TARGET_DEVICE neuron
32
32
RUN cd /app/vllm \
33
33
&& pip install -e . \
34
34
&& cd ..
Original file line number Diff line number Diff line change @@ -222,7 +222,7 @@ def _is_neuron() -> bool:
222
222
subprocess .run (["neuron-ls" ], capture_output = True , check = True )
223
223
except (FileNotFoundError , PermissionError , subprocess .CalledProcessError ):
224
224
torch_neuronx_installed = False
225
- return torch_neuronx_installed or envs . VLLM_BUILD_WITH_NEURON
225
+ return torch_neuronx_installed or VLLM_TARGET_DEVICE == "neuron"
226
226
227
227
228
228
def _is_cpu () -> bool :
Original file line number Diff line number Diff line change 33
33
VLLM_TARGET_DEVICE : str = "cuda"
34
34
MAX_JOBS : Optional [str ] = None
35
35
NVCC_THREADS : Optional [str ] = None
36
- VLLM_BUILD_WITH_NEURON : bool = False
37
36
VLLM_USE_PRECOMPILED : bool = False
38
37
VLLM_INSTALL_PUNICA_KERNELS : bool = False
39
38
CMAKE_BUILD_TYPE : Optional [str ] = None
63
62
"NVCC_THREADS" :
64
63
lambda : os .getenv ("NVCC_THREADS" , None ),
65
64
66
- # If set, vllm will build with Neuron support
67
- "VLLM_BUILD_WITH_NEURON" :
68
- lambda : bool (os .environ .get ("VLLM_BUILD_WITH_NEURON" , False )),
69
-
70
65
# If set, vllm will use precompiled binaries (*.so)
71
66
"VLLM_USE_PRECOMPILED" :
72
67
lambda : bool (os .environ .get ("VLLM_USE_PRECOMPILED" )),
You can’t perform that action at this time.
0 commit comments