File tree Expand file tree Collapse file tree 2 files changed +12
-6
lines changed Expand file tree Collapse file tree 2 files changed +12
-6
lines changed Original file line number Diff line number Diff line change @@ -13,16 +13,16 @@ All scripts accept a positional argument as workspace path for staging the build
13
13
14
14
## Usage
15
15
16
- ### Single-node
17
-
18
16
``` bash
19
- bash install_python_libraries.sh
17
+ # for hopper
18
+ TORCH_CUDA_ARCH_LIST="9.0" bash install_python_libraries.sh
19
+ # for blackwell
20
+ TORCH_CUDA_ARCH_LIST="10.0" bash install_python_libraries.sh
20
21
```
21
22
22
- ### Multi-node
23
+ Additional step for multi-node deployment:
23
24
24
25
``` bash
25
- bash install_python_libraries.sh
26
26
sudo bash configure_system_drivers.sh
27
27
sudo reboot # Reboot is required to load the new driver
28
28
```
Original file line number Diff line number Diff line change @@ -29,6 +29,12 @@ if [ -z "$CUDA_HOME" ]; then
29
29
exit 1
30
30
fi
31
31
32
+ # assume TORCH_CUDA_ARCH_LIST is set correctly
33
+ if [ -z "$TORCH_CUDA_ARCH_LIST" ]; then
34
+ echo "TORCH_CUDA_ARCH_LIST is not set, please set it to your desired architecture."
35
+ exit 1
36
+ fi
37
+
32
38
# disable all features except IBGDA
33
39
export NVSHMEM_IBGDA_SUPPORT=1
34
40
@@ -95,7 +101,7 @@ clone_repo "https://github.com/ppl-ai/pplx-kernels" "pplx-kernels" "setup.py"
95
101
cd pplx-kernels
96
102
# see https://github.com/pypa/pip/issues/9955#issuecomment-838065925
97
103
# PIP_NO_BUILD_ISOLATION=0 disables build isolation
98
- PIP_NO_BUILD_ISOLATION=0 TORCH_CUDA_ARCH_LIST=9.0a+PTX pip install -vvv -e .
104
+ PIP_NO_BUILD_ISOLATION=0 pip install -vvv -e .
99
105
popd
100
106
101
107
# build and install deepep, require pytorch installed
You can’t perform that action at this time.
0 commit comments