Skip to content

Commit 9fdecf5

Browse files
authored
Enable bitsandbytes unit tests on Radeon
1 parent 42c26bd commit 9fdecf5

File tree

1 file changed

+3
-2
lines changed

1 file changed

+3
-2
lines changed

tests/models/quantization/test_bitsandbytes.py

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -10,13 +10,14 @@
1010

1111
from tests.quantization.utils import is_quant_method_supported
1212
from vllm.platforms import current_platform
13+
from vllm.platforms.rocm import on_gfx9
1314

1415
from ...utils import compare_two_settings, multi_gpu_test
1516
from ..utils import check_embeddings_close, check_logprobs_close
1617

1718
pytestmark = pytest.mark.skipif(
18-
current_platform.is_rocm(),
19-
reason="bitsandbytes quantization not supported on ROCm (CUDA-only kernels)",
19+
current_platform.is_rocm() and on_gfx9(),
20+
reason="bitsandbytes quantization not supported on Instinct (warp size 64 limitation)",
2021
)
2122

2223
models_4bit_to_test = [

0 commit comments

Comments
 (0)