Skip to content

Commit 3835163

Browse files
authored
Disable LDL/STL checks, for failures seen with NVRTC 13.1 (#7054)
* Add comment
* Alias to avoid shadowing `cuda`

Co-authored-by: Ashwin Srinath <[email protected]>
1 parent b380110 commit 3835163

File tree

2 files changed

+15
-4
lines changed

2 files changed

+15
-4
lines changed

python/cuda_cccl/tests/compute/test_radix_sort.py

Lines changed: 4 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -256,7 +256,8 @@ def test_radix_sort_keys_double_buffer(dtype, num_items, monkeypatch):
256256
)
257257
def test_radix_sort_pairs_double_buffer(dtype, num_items, monkeypatch):
258258
cc_major, _ = numba.cuda.get_current_device().compute_capability
259-
if cc_major >= 9 or np.isdtype(dtype, np.uint32):
259+
# NOTE: int16 failures seen only with NVRTC 13.1:
260+
if cc_major >= 9 or np.isdtype(dtype, (np.int16, np.uint32)):
260261
import cuda.compute._cccl_interop
261262

262263
monkeypatch.setattr(
@@ -306,7 +307,8 @@ def test_radix_sort_pairs_double_buffer(dtype, num_items, monkeypatch):
306307
)
307308
def test_radix_sort_pairs_bit_window(dtype, num_items, monkeypatch):
308309
cc_major, _ = numba.cuda.get_current_device().compute_capability
309-
if cc_major >= 9 or np.isdtype(dtype, np.uint32):
310+
# NOTE: int16 failures seen only with NVRTC 13.1:
311+
if cc_major >= 9 or np.isdtype(dtype, (np.int16, np.uint32)):
310312
import cuda.compute._cccl_interop
311313

312314
monkeypatch.setattr(

python/cuda_cccl/tests/compute/test_three_way_partition.py

Lines changed: 11 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -66,7 +66,17 @@ def _host_three_way_partition(h_in: np.ndarray, less_than_op, greater_equal_op):
6666

6767

6868
@pytest.mark.parametrize("dtype,num_items", three_way_partition_params)
69-
def test_three_way_partition_basic(dtype, num_items):
69+
def test_three_way_partition_basic(dtype, num_items, monkeypatch):
70+
# NOTE: the SASS check failure is seen only with NVRTC 13.1:
71+
if np.isdtype(dtype, np.float16):
72+
import cuda.compute._cccl_interop as cccl_interop
73+
74+
monkeypatch.setattr(
75+
cccl_interop,
76+
"_check_sass",
77+
False,
78+
)
79+
7080
h_in = random_array(num_items, dtype, max_value=100)
7181

7282
def less_than_op(x):
@@ -80,7 +90,6 @@ def greater_equal_op(x):
8090
d_second = cp.empty_like(d_in)
8191
d_unselected = cp.empty_like(d_in)
8292
d_num_selected = cp.empty(2, dtype=np.int32)
83-
8493
cuda.compute.three_way_partition(
8594
d_in,
8695
d_first,

0 commit comments

Comments
 (0)