Add ABI version (abi = "500") to the ROCDL target attribute and attach-target pass in GPU tests (#139)

makslevental · web-flow · commit ebb00615a2a3 · 2025-04-09T21:26:23.000Z
diff --git a/tests/test_gpu.py b/tests/test_gpu.py
@@ -760,15 +760,15 @@ def mat_product_kernel(
     hip_check(hip.hipGetDeviceProperties(props, 0))
     arch = props.gcnArchName.decode()
 
-    @module("naive", [f'#rocdl.target<chip = "{arch}">'])
+    @module("naive", [f'#rocdl.target<chip = "{arch}", abi = "500">'])
     def gpu_module():
         mat_product_kernel.emit()
 
     lowered_module = run_pipeline(
         gpu_module,
         Pipeline()
         .Gpu(Pipeline().convert_gpu_to_rocdl(use_bare_ptr_memref_call_conv=True))
-        .rocdl_attach_target(chip=arch)
+        .rocdl_attach_target(chip=arch, abi="500")
         .gpu_to_llvm()
         .lower_to_llvm()
         .gpu_module_to_binary(),
@@ -871,15 +871,15 @@ def mat_product_kernel(
     hip_check(hip.hipGetDeviceProperties(props, 0))
     arch = props.gcnArchName.decode()
 
-    @module("naive", [f'#rocdl.target<chip = "{arch}">'])
+    @module("naive", [f'#rocdl.target<chip = "{arch}", abi = "500">'])
     def gpu_module():
         mat_product_kernel.emit()
 
     lowered_module = run_pipeline(
         gpu_module,
         Pipeline()
         .Gpu(Pipeline().convert_gpu_to_rocdl(use_bare_ptr_memref_call_conv=True))
-        .rocdl_attach_target(chip=arch)
+        .rocdl_attach_target(chip=arch, abi="500")
         .gpu_to_llvm()
         .lower_to_llvm()
         .gpu_module_to_binary(),
@@ -998,15 +998,15 @@ def smol_matmul(
     hip_check(hip.hipGetDeviceProperties(props, 0))
     arch = props.gcnArchName.decode()
 
-    @module("naive", [f'#rocdl.target<chip = "{arch}">'])
+    @module("naive", [f'#rocdl.target<chip = "{arch}", abi = "500">'])
     def gpu_module():
         smol_matmul.emit()
 
     lowered_module = run_pipeline(
         gpu_module,
         Pipeline()
         .Gpu(Pipeline().convert_gpu_to_rocdl(use_bare_ptr_memref_call_conv=True))
-        .rocdl_attach_target(chip=arch)
+        .rocdl_attach_target(chip=arch, abi="500")
         .gpu_to_llvm()
         .lower_to_llvm()
         .gpu_module_to_binary(),
@@ -1106,7 +1106,7 @@ def all_bank_conflicts(A: T.memref(M, M, T.f32()), B: T.memref(M, M, T.f32())):
     hip_check(hip.hipGetDeviceProperties(props, 0))
     arch = props.gcnArchName.decode()
 
-    @module("naive", [f'#rocdl.target<chip = "{arch}">'])
+    @module("naive", [f'#rocdl.target<chip = "{arch}", abi = "500">'])
     def gpu_module():
         no_bank_conflicts.emit()
         all_bank_conflicts.emit()
@@ -1115,7 +1115,7 @@ def gpu_module():
         gpu_module,
         Pipeline()
         .Gpu(Pipeline().convert_gpu_to_rocdl(use_bare_ptr_memref_call_conv=True))
-        .rocdl_attach_target(chip=arch)
+        .rocdl_attach_target(chip=arch, abi="500")
         .gpu_to_llvm()
         .lower_to_llvm()
         .gpu_module_to_binary(),