We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 6431be8 commit 20db99c — Copy full SHA for 20db99c
tests/quantization/test_blackwell_moe.py
@@ -15,7 +15,15 @@
15
"This test only runs on Blackwell GPUs (SM100).", allow_module_level=True
16
)
17
18
-os.environ["FLASHINFER_NVCC_THREADS"] = "16"
+
19
+@pytest.fixture(scope="module", autouse=True)
20
+def set_test_environment():
21
+ """Sets environment variables required for this test module."""
22
+ # Make sure TRTLLM attention is available
23
+ os.environ["VLLM_HAS_FLASHINFER_CUBIN"] = "1"
24
+ # Set compilation threads to 16 to speed up startup
25
+ os.environ["FLASHINFER_NVCC_THREADS"] = "16"
26
27
28
# dummy_hf_overrides = {"num_layers": 4, "num_hidden_layers": 4,
29
# "text_config": {"num_layers": 4, "num_hidden_layers": 4}}
0 commit comments