Skip to content

Commit b833bd1

Browse files
authored
Fix bugs (#4707)
1 parent d5fd5ae commit b833bd1

File tree

2 files changed

+4
-10
lines changed

2 files changed

+4
-10
lines changed

deploy/genai_vllm_server_docker/Dockerfile

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -13,9 +13,10 @@ RUN python -m pip install "paddlex${PADDLEX_VERSION}"
13 13

14 14
ARG BUILD_FOR_SM120=false
15 15
RUN if [ "${BUILD_FOR_SM120}" = 'true' ]; then \
16-
python -m pip install https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.8.3+cu128torch2.8-cp310-cp310-linux_x86_64.whl \
16+
python -m pip install https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.8.3+cu128torch2.8-cp310-cp310-linux_x86_64.whl; \
17 17
else \
18-
python -m pip install https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.8.2+cu128torch2.8-cp310-cp310-linux_x86_64.whl \
18+
python -m pip install https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.8.2+cu128torch2.8-cp310-cp310-linux_x86_64.whl; \
19+
fi \
19 20
&& paddlex --install genai-vllm-server
20 21

21 22
EXPOSE 8080

paddlex/paddlex_cli.py

Lines changed: 1 addition & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -36,11 +36,7 @@
36 36
is_dep_available,
37 37
is_paddle2onnx_plugin_available,
38 38
)
39-
from .utils.env import (
40-
get_gpu_compute_capability,
41-
get_paddle_cuda_version,
42-
is_cuda_available,
43-
)
39+
from .utils.env import get_gpu_compute_capability, get_paddle_cuda_version
44 40
from .utils.install import install_packages, uninstall_packages
45 41
from .utils.interactive_get_pipeline import interactive_get_pipeline
46 42
from .utils.pipeline_arguments import PIPELINE_ARGUMENTS
@@ -324,9 +320,6 @@ def _install_hpi_deps(device_type):
324 320
)
325 321

326 322
def _install_genai_deps(plugin_types):
327-
if not is_cuda_available():
328-
sys.exit("Currently, only GPU devices are supported.")
329-
330 323
fd_plugin_types = []
331 324
not_fd_plugin_types = []
332 325
for plugin_type in plugin_types:

0 commit comments

Comments
 (0)