Skip to content

Commit f310db9

Browse files
committed
Attempt to add CUDA support to the distributed CI pipeline
1 parent 522f08c commit f310db9

File tree

4 files changed

+14
-10
lines changed

4 files changed

+14
-10
lines changed

ci/distributed.yml

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -80,7 +80,8 @@ build_distributed_cpu:
8080
parallel:
8181
matrix:
8282
- COMPONENT: [atmosphere/diffusion, atmosphere/dycore, common]
83-
BACKEND: [embedded, gtfn_cpu, dace_cpu]
83+
# BACKEND: [embedded, gtfn_cpu, dace_cpu, dace_gpu]
84+
BACKEND: [dace_cpu, dace_gpu]
8485
rules:
8586
- if: $COMPONENT == 'atmosphere/diffusion'
8687
variables:

ci/docker/base_mpi.Dockerfile

Lines changed: 9 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -5,22 +5,23 @@ ENV LC_ALL C.UTF-8
55

66
ARG DEBIAN_FRONTEND=noninteractive
77
# Install the build toolchain, MPI/Boost development libraries and the CUDA
# toolkit (added for the GPU CI jobs) in a single layer. Packages are listed
# one per line in alphabetical order to keep diffs small.
#
# The `&&` must come only after the LAST package: placing it mid-list ends the
# `apt-get install` command early and makes the shell try to execute the next
# package name as a command, which fails the build before the cleanup runs.
# The apt package index is removed in the same layer so it never reaches the image.
RUN apt-get update -qq && apt-get install -qq -y --no-install-recommends \
    autoconf \
    automake \
    build-essential \
    ca-certificates \
    curl \
    git \
    libboost-dev \
    libnuma-dev \
    libopenmpi-dev \
    libreadline-dev \
    libssl-dev \
    libtool \
    nvidia-cuda-toolkit \
    pkg-config \
    strace \
    tar \
    wget && \
    rm -rf /var/lib/apt/lists/*
2526

2627
# Install uv: https://docs.astral.sh/uv/guides/integration/docker

ci/docker/checkout_mpi.Dockerfile

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -8,4 +8,4 @@ ARG PYVERSION
88
ARG VENV
99
ENV UV_PROJECT_ENVIRONMENT=$VENV
1010
ENV MPI4PY_BUILD_BACKEND="scikit-build-core"
11-
RUN uv sync --extra distributed --python=$PYVERSION
11+
RUN uv sync --extra all --python=$PYVERSION

scripts/ci-mpi-wrapper.sh

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -17,6 +17,8 @@ else
1717
exit 1
1818
fi
1919

20+
# Restrict this process to the single GPU whose index equals its rank.
# NOTE(review): presumably `rank` is the node-local rank; if it is the global
# MPI rank, ranks on a second node (or ranks beyond the GPU count) would point
# at device indices that do not exist — TODO confirm against how `rank` is set.
export CUDA_VISIBLE_DEVICES="${rank}"
21+
2022
log_file="${CI_PROJECT_DIR:+${CI_PROJECT_DIR}/}pytest-log-rank-${rank}.txt"
2123

2224
if [[ "${rank}" -eq 0 ]]; then

0 commit comments

Comments
 (0)