diff --git a/.github/workflows/slow_tests.yaml b/.github/workflows/slow_tests.yaml index a1f68f9d4..3d5e63e9a 100644 --- a/.github/workflows/slow_tests.yaml +++ b/.github/workflows/slow_tests.yaml @@ -42,4 +42,10 @@ jobs: run: nvidia-smi - name: Run tests - run: uv run pytest --disable-pytest-warnings --runslow tests/slow_tests/ + run: | + uv run pytest --disable-pytest-warnings --runslow tests/slow_tests/test_accelerate_model.py + nvidia-smi + uv run pytest --disable-pytest-warnings --runslow tests/slow_tests/test_vllm_model.py + nvidia-smi + export VLLM_WORKER_MULTIPROC_METHOD=spawn && uv run pytest --disable-pytest-warnings --runslow tests/slow_tests/test_accelerate_vlm_model.py + nvidia-smi diff --git a/pyproject.toml b/pyproject.toml index 45b88d1f2..85da4147d 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -98,7 +98,7 @@ nanotron = [ "tensorboardX" ] tensorboardX = ["tensorboardX"] -vllm = ["vllm>=0.10.0,<0.10.2", "ray", "more_itertools"] +vllm = ["vllm>=0.10.0", "ray", "more_itertools"] sglang = ["sglang"] quality = ["ruff>=v0.11.0","pre-commit"] tests = ["pytest>=7.4.0","deepdiff","pip>=25.2"]