// half2: a two-element vector of half, declared via the ext_vector_type(2) attribute.
// NOTE(review): the leading digits on this line look like line-number residue from a
// diff view rather than part of the declaration -- confirm before compiling.
99typedef half __attribute__ ((ext_vector_type (2 ))) half2 ;
1010
1111// CHECK-LABEL: test_global_add_f64
12- // CHECK: = atomicrmw fadd ptr addrspace(1) %{{.+}}, double %{{.+}} syncscope("agent") seq_cst , align 8, !amdgpu.no.fine.grained.memory !{{[0-9]+$}}
12+ // CHECK: = atomicrmw fadd ptr addrspace(1) %{{.+}}, double %{{.+}} syncscope("agent") monotonic , align 8, !amdgpu.no.fine.grained.memory !{{[0-9]+$}}
1313// GFX90A-LABEL: test_global_add_f64$local:
1414// GFX90A: global_atomic_add_f64
1515void test_global_add_f64 (__global double * addr , double x ) {
@@ -99,7 +99,7 @@ void test_flat_global_max_f64(__global double *addr, double x){
9999}
100100
101101// CHECK-LABEL: test_ds_add_local_f64
102- // CHECK: = atomicrmw fadd ptr addrspace(3) %{{.+}}, double %{{.+}} seq_cst , align 8
102+ // CHECK: = atomicrmw fadd ptr addrspace(3) %{{.+}}, double %{{.+}} monotonic , align 8
103103// GFX90A: test_ds_add_local_f64$local
104104// GFX90A: ds_add_rtn_f64
105105void test_ds_add_local_f64 (__local double * addr , double x ){
@@ -108,7 +108,7 @@ void test_ds_add_local_f64(__local double *addr, double x){
108108}
109109
110110// CHECK-LABEL: test_ds_addf_local_f32
111- // CHECK: = atomicrmw fadd ptr addrspace(3) %{{.+}}, float %{{.+}} seq_cst , align 4
111+ // CHECK: = atomicrmw fadd ptr addrspace(3) %{{.+}}, float %{{.+}} monotonic , align 4
112112// GFX90A-LABEL: test_ds_addf_local_f32$local
113113// GFX90A: ds_add_rtn_f32
114114void test_ds_addf_local_f32 (__local float * addr , float x ){
@@ -117,7 +117,7 @@ void test_ds_addf_local_f32(__local float *addr, float x){
117117}
118118
119119// CHECK-LABEL: @test_global_add_f32
120- // CHECK: = atomicrmw fadd ptr addrspace(1) %{{.+}}, float %{{.+}} syncscope("agent") seq_cst , align 4, !amdgpu.no.fine.grained.memory !{{[0-9]+}}, !amdgpu.ignore.denormal.mode !{{[0-9]+$}}
120+ // CHECK: = atomicrmw fadd ptr addrspace(1) %{{.+}}, float %{{.+}} syncscope("agent") monotonic , align 4, !amdgpu.no.fine.grained.memory !{{[0-9]+}}, !amdgpu.ignore.denormal.mode !{{[0-9]+$}}
// Calls __builtin_amdgcn_global_atomic_fadd_f32 on the global float pointer addr
// with operand x and stores the builtin's return value through rtn.
// NOTE(review): the leading digits on each line look like line-number residue from a
// diff view rather than part of the function -- confirm before compiling.
121121void test_global_add_f32 (float * rtn , global float * addr , float x ) {
122122 * rtn = __builtin_amdgcn_global_atomic_fadd_f32 (addr , x );
123123}
0 commit comments