File tree: 2 files changed, +4 -10 lines changed
deploy/genai_vllm_server_docker: 2 files changed, +4 -10 lines changed
Original file line number | Diff line number | Diff line change
@@ -13,9 +13,10 @@ RUN python -m pip install "paddlex${PADDLEX_VERSION}"
1313
1414ARG BUILD_FOR_SM120=false
1515RUN if [ "${BUILD_FOR_SM120}" = 'true' ]; then \
16- python -m pip install https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.8.3+cu128torch2.8-cp310-cp310-linux_x86_64.whl \
16+ python -m pip install https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.8.3+cu128torch2.8-cp310-cp310-linux_x86_64.whl; \
1717 else \
18- python -m pip install https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.8.2+cu128torch2.8-cp310-cp310-linux_x86_64.whl \
18+ python -m pip install https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.8.2+cu128torch2.8-cp310-cp310-linux_x86_64.whl; \
19+ fi \
1920 && paddlex --install genai-vllm-server
2021
2122EXPOSE 8080
Original file line number | Diff line number | Diff line change
3636 is_dep_available ,
3737 is_paddle2onnx_plugin_available ,
3838)
39- from .utils .env import (
40- get_gpu_compute_capability ,
41- get_paddle_cuda_version ,
42- is_cuda_available ,
43- )
39+ from .utils .env import get_gpu_compute_capability , get_paddle_cuda_version
4440from .utils .install import install_packages , uninstall_packages
4541from .utils .interactive_get_pipeline import interactive_get_pipeline
4642from .utils .pipeline_arguments import PIPELINE_ARGUMENTS
@@ -324,9 +320,6 @@ def _install_hpi_deps(device_type):
324320 )
325321
326322 def _install_genai_deps (plugin_types ):
327- if not is_cuda_available ():
328- sys .exit ("Currently, only GPU devices are supported." )
329-
330323 fd_plugin_types = []
331324 not_fd_plugin_types = []
332325 for plugin_type in plugin_types :
You can’t perform that action at this time.
0 commit comments