Skip to content

Commit 2146a4e

Browse files
committed
Update tests container
Signed-off-by: ajrasane <[email protected]>
1 parent 918d081 commit 2146a4e

File tree

2 files changed

+42
-1
lines changed

2 files changed

+42
-1
lines changed

.github/workflows/gpu_tests.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -62,7 +62,7 @@ jobs:
6262
runs-on: linux-amd64-gpu-l4-latest-1
6363
timeout-minutes: 120
6464
container: &gpu_container
65-
image: nvcr.io/nvidia/pytorch:25.06-py3
65+
image: nvcr.io/nvidia/pytorch:25.08-py3
6666
env:
6767
GIT_DEPTH: 1000 # For correct version for tests/gpu/torch/quantization/plugins/test_megatron.py
6868
PIP_CONSTRAINT: "" # Disable pip constraint for upgrading packages

.gitlab/tests.yml

Lines changed: 41 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -13,6 +13,47 @@
1313
example-onnx-bash:
1414
extends: .tests-default
1515
timeout: 90m
16+
image: nvcr.io/nvidia/pytorch:25.08-py3
17+
variables:
18+
GIT_DEPTH: 1000 # For correct version for tests/gpu/torch/quantization/plugins/test_megatron.py
19+
tags: [docker, linux, 2-gpu]
20+
before_script:
21+
# Add libcudnn*.so and libnv*.so to path
22+
- export LD_LIBRARY_PATH="${LD_LIBRARY_PATH}:/usr/include:/usr/lib/x86_64-linux-gnu"
23+
# Install git-lfs for Daring-Anteater dataset
24+
- apt-get update && apt-get install -y git-lfs
25+
- git lfs install --system
26+
27+
multi-gpu:
28+
extends: .multi-gpu-tests-default
29+
script:
30+
# Use pre-installed packages without a new venv with tox-current-env
31+
- pip install tox-current-env
32+
- tox -e py312-cuda12-gpu --current-env
33+
34+
##### Example Tests #####
35+
example-torch:
36+
extends: .multi-gpu-tests-default
37+
timeout: 30m
38+
parallel:
39+
matrix:
40+
- EXAMPLE: [llm_distill, llm_qat, llm_sparsity, speculative_decoding]
41+
script:
42+
- pip install ".[hf,dev-test]"
43+
- find examples/$EXAMPLE -name "requirements.txt" | while read req_file; do pip install -r "$req_file" || exit 1; done
44+
- pytest -s tests/examples/$EXAMPLE
45+
46+
example-trtllm:
47+
extends: example-torch
48+
timeout: 60m
49+
image: nvcr.io/nvidia/tensorrt-llm/release:1.1.0rc2.post2
50+
tags: [docker, linux, 2-gpu, sm>=89]
51+
parallel:
52+
matrix:
53+
- EXAMPLE: [llm_autodeploy, llm_eval, llm_ptq, vlm_ptq]
54+
55+
example-onnx:
56+
extends: example-torch
1657
image: nvcr.io/nvidia/tensorrt:25.08-py3
1758
tags: [docker, linux, 2-gpu, sm>=89]
1859
parallel:

0 commit comments

Comments
 (0)