@@ -760,15 +760,15 @@ def mat_product_kernel(
760
760
hip_check (hip .hipGetDeviceProperties (props , 0 ))
761
761
arch = props .gcnArchName .decode ()
762
762
763
- @module ("naive" , [f'#rocdl.target<chip = "{ arch } ">' ])
763
+ @module ("naive" , [f'#rocdl.target<chip = "{ arch } ", abi = "500" >' ])
764
764
def gpu_module ():
765
765
mat_product_kernel .emit ()
766
766
767
767
lowered_module = run_pipeline (
768
768
gpu_module ,
769
769
Pipeline ()
770
770
.Gpu (Pipeline ().convert_gpu_to_rocdl (use_bare_ptr_memref_call_conv = True ))
771
- .rocdl_attach_target (chip = arch )
771
+ .rocdl_attach_target (chip = arch , abi = "500" )
772
772
.gpu_to_llvm ()
773
773
.lower_to_llvm ()
774
774
.gpu_module_to_binary (),
@@ -871,15 +871,15 @@ def mat_product_kernel(
871
871
hip_check (hip .hipGetDeviceProperties (props , 0 ))
872
872
arch = props .gcnArchName .decode ()
873
873
874
- @module ("naive" , [f'#rocdl.target<chip = "{ arch } ">' ])
874
+ @module ("naive" , [f'#rocdl.target<chip = "{ arch } ", abi = "500" >' ])
875
875
def gpu_module ():
876
876
mat_product_kernel .emit ()
877
877
878
878
lowered_module = run_pipeline (
879
879
gpu_module ,
880
880
Pipeline ()
881
881
.Gpu (Pipeline ().convert_gpu_to_rocdl (use_bare_ptr_memref_call_conv = True ))
882
- .rocdl_attach_target (chip = arch )
882
+ .rocdl_attach_target (chip = arch , abi = "500" )
883
883
.gpu_to_llvm ()
884
884
.lower_to_llvm ()
885
885
.gpu_module_to_binary (),
@@ -998,15 +998,15 @@ def smol_matmul(
998
998
hip_check (hip .hipGetDeviceProperties (props , 0 ))
999
999
arch = props .gcnArchName .decode ()
1000
1000
1001
- @module ("naive" , [f'#rocdl.target<chip = "{ arch } ">' ])
1001
+ @module ("naive" , [f'#rocdl.target<chip = "{ arch } ", abi = "500" >' ])
1002
1002
def gpu_module ():
1003
1003
smol_matmul .emit ()
1004
1004
1005
1005
lowered_module = run_pipeline (
1006
1006
gpu_module ,
1007
1007
Pipeline ()
1008
1008
.Gpu (Pipeline ().convert_gpu_to_rocdl (use_bare_ptr_memref_call_conv = True ))
1009
- .rocdl_attach_target (chip = arch )
1009
+ .rocdl_attach_target (chip = arch , abi = "500" )
1010
1010
.gpu_to_llvm ()
1011
1011
.lower_to_llvm ()
1012
1012
.gpu_module_to_binary (),
@@ -1106,7 +1106,7 @@ def all_bank_conflicts(A: T.memref(M, M, T.f32()), B: T.memref(M, M, T.f32())):
1106
1106
hip_check (hip .hipGetDeviceProperties (props , 0 ))
1107
1107
arch = props .gcnArchName .decode ()
1108
1108
1109
- @module ("naive" , [f'#rocdl.target<chip = "{ arch } ">' ])
1109
+ @module ("naive" , [f'#rocdl.target<chip = "{ arch } ", abi = "500" >' ])
1110
1110
def gpu_module ():
1111
1111
no_bank_conflicts .emit ()
1112
1112
all_bank_conflicts .emit ()
@@ -1115,7 +1115,7 @@ def gpu_module():
1115
1115
gpu_module ,
1116
1116
Pipeline ()
1117
1117
.Gpu (Pipeline ().convert_gpu_to_rocdl (use_bare_ptr_memref_call_conv = True ))
1118
- .rocdl_attach_target (chip = arch )
1118
+ .rocdl_attach_target (chip = arch , abi = "500" )
1119
1119
.gpu_to_llvm ()
1120
1120
.lower_to_llvm ()
1121
1121
.gpu_module_to_binary (),
0 commit comments