@@ -115,7 +115,7 @@ define amdgpu_kernel void @v_fneg_add_fneg_x_f32(float addrspace(1)* %out, float
115115; GCN-SAFE: v_xor_b32_e32 v{{[0-9]+}}, 0x80000000, [[ADD]]
116116
117117; GCN-NSZ: v_sub_f32_e32 [[ADD:v[0-9]+]], [[B]], [[A]]
118- ; GCN-NSZ-NEXT : flat_store_dword v{{\[[0-9]+:[0-9]+\]}}, [[ADD]]
118+ ; GCN-NSZ: flat_store_dword v{{\[[0-9]+:[0-9]+\]}}, [[ADD]]
119119define amdgpu_kernel void @v_fneg_add_x_fneg_f32 (float addrspace (1 )* %out , float addrspace (1 )* %a.ptr , float addrspace (1 )* %b.ptr ) #0 {
120120 %tid = call i32 @llvm.amdgcn.workitem.id.x ()
121121 %tid.ext = sext i32 %tid to i64
@@ -139,7 +139,7 @@ define amdgpu_kernel void @v_fneg_add_x_fneg_f32(float addrspace(1)* %out, float
139139; GCN-SAFE: v_xor_b32_e32 v{{[0-9]+}}, 0x80000000, [[ADD]]
140140
141141; GCN-NSZ: v_add_f32_e32 [[ADD:v[0-9]+]], [[A]], [[B]]
142- ; GCN-NSZ-NEXT : flat_store_dword v{{\[[0-9]+:[0-9]+\]}}, [[ADD]]
142+ ; GCN-NSZ: flat_store_dword v{{\[[0-9]+:[0-9]+\]}}, [[ADD]]
143143define amdgpu_kernel void @v_fneg_add_fneg_fneg_f32 (float addrspace (1 )* %out , float addrspace (1 )* %a.ptr , float addrspace (1 )* %b.ptr ) #0 {
144144 %tid = call i32 @llvm.amdgcn.workitem.id.x ()
145145 %tid.ext = sext i32 %tid to i64
@@ -157,9 +157,9 @@ define amdgpu_kernel void @v_fneg_add_fneg_fneg_f32(float addrspace(1)* %out, fl
157157}
158158
159159; GCN-LABEL: {{^}}v_fneg_add_store_use_fneg_x_f32:
160- ; GCN-SAFE: s_brev_b32 [[SIGNBIT:s[0-9]+]], 1{{$}}
161- ; GCN: {{buffer|flat}}_load_dword [[A:v[0-9]+]]
162- ; GCN: {{buffer|flat}}_load_dword [[B:v[0-9]+]]
160+ ; GCN-SAFE-DAG : s_brev_b32 [[SIGNBIT:s[0-9]+]], 1{{$}}
161+ ; GCN-DAG : {{buffer|flat}}_load_dword [[A:v[0-9]+]]
162+ ; GCN-DAG : {{buffer|flat}}_load_dword [[B:v[0-9]+]]
163163
164164; GCN-SAFE: v_xor_b32_e32 [[NEG_A:v[0-9]+]], [[SIGNBIT]], [[A]]
165165; GCN-SAFE: v_sub_f32_e32 [[ADD:v[0-9]+]], [[B]], [[A]]
@@ -329,7 +329,7 @@ define amdgpu_kernel void @v_fneg_mul_multi_use_mul_f32(float addrspace(1)* %out
329329; GCN: {{buffer|flat}}_load_dword [[A:v[0-9]+]]
330330; GCN: {{buffer|flat}}_load_dword [[B:v[0-9]+]]
331331; GCN: v_mul_f32_e32 [[ADD:v[0-9]+]], [[A]], [[B]]
332- ; GCN-NEXT : flat_store_dword v{{\[[0-9]+:[0-9]+\]}}, [[ADD]]
332+ ; GCN: flat_store_dword v{{\[[0-9]+:[0-9]+\]}}, [[ADD]]
333333define amdgpu_kernel void @v_fneg_mul_fneg_x_f32 (float addrspace (1 )* %out , float addrspace (1 )* %a.ptr , float addrspace (1 )* %b.ptr ) #0 {
334334 %tid = call i32 @llvm.amdgcn.workitem.id.x ()
335335 %tid.ext = sext i32 %tid to i64
@@ -349,7 +349,7 @@ define amdgpu_kernel void @v_fneg_mul_fneg_x_f32(float addrspace(1)* %out, float
349349; GCN: {{buffer|flat}}_load_dword [[A:v[0-9]+]]
350350; GCN: {{buffer|flat}}_load_dword [[B:v[0-9]+]]
351351; GCN: v_mul_f32_e32 [[ADD:v[0-9]+]], [[A]], [[B]]
352- ; GCN-NEXT : flat_store_dword v{{\[[0-9]+:[0-9]+\]}}, [[ADD]]
352+ ; GCN: flat_store_dword v{{\[[0-9]+:[0-9]+\]}}, [[ADD]]
353353define amdgpu_kernel void @v_fneg_mul_x_fneg_f32 (float addrspace (1 )* %out , float addrspace (1 )* %a.ptr , float addrspace (1 )* %b.ptr ) #0 {
354354 %tid = call i32 @llvm.amdgcn.workitem.id.x ()
355355 %tid.ext = sext i32 %tid to i64
@@ -369,7 +369,7 @@ define amdgpu_kernel void @v_fneg_mul_x_fneg_f32(float addrspace(1)* %out, float
369369; GCN: {{buffer|flat}}_load_dword [[A:v[0-9]+]]
370370; GCN: {{buffer|flat}}_load_dword [[B:v[0-9]+]]
371371; GCN: v_mul_f32_e64 [[ADD:v[0-9]+]], [[A]], -[[B]]
372- ; GCN-NEXT : flat_store_dword v{{\[[0-9]+:[0-9]+\]}}, [[ADD]]
372+ ; GCN: flat_store_dword v{{\[[0-9]+:[0-9]+\]}}, [[ADD]]
373373define amdgpu_kernel void @v_fneg_mul_fneg_fneg_f32 (float addrspace (1 )* %out , float addrspace (1 )* %a.ptr , float addrspace (1 )* %b.ptr ) #0 {
374374 %tid = call i32 @llvm.amdgcn.workitem.id.x ()
375375 %tid.ext = sext i32 %tid to i64
@@ -1902,7 +1902,7 @@ define amdgpu_kernel void @v_fneg_mul_legacy_multi_use_mul_legacy_f32(float addr
19021902; GCN: {{buffer|flat}}_load_dword [[A:v[0-9]+]]
19031903; GCN: {{buffer|flat}}_load_dword [[B:v[0-9]+]]
19041904; GCN: v_mul_legacy_f32_e32 [[ADD:v[0-9]+]], [[A]], [[B]]
1905- ; GCN-NEXT : flat_store_dword v{{\[[0-9]+:[0-9]+\]}}, [[ADD]]
1905+ ; GCN: flat_store_dword v{{\[[0-9]+:[0-9]+\]}}, [[ADD]]
19061906define amdgpu_kernel void @v_fneg_mul_legacy_fneg_x_f32 (float addrspace (1 )* %out , float addrspace (1 )* %a.ptr , float addrspace (1 )* %b.ptr ) #0 {
19071907 %tid = call i32 @llvm.amdgcn.workitem.id.x ()
19081908 %tid.ext = sext i32 %tid to i64
@@ -1922,7 +1922,7 @@ define amdgpu_kernel void @v_fneg_mul_legacy_fneg_x_f32(float addrspace(1)* %out
19221922; GCN: {{buffer|flat}}_load_dword [[A:v[0-9]+]]
19231923; GCN: {{buffer|flat}}_load_dword [[B:v[0-9]+]]
19241924; GCN: v_mul_legacy_f32_e32 [[ADD:v[0-9]+]], [[A]], [[B]]
1925- ; GCN-NEXT : flat_store_dword v{{\[[0-9]+:[0-9]+\]}}, [[ADD]]
1925+ ; GCN: flat_store_dword v{{\[[0-9]+:[0-9]+\]}}, [[ADD]]
19261926define amdgpu_kernel void @v_fneg_mul_legacy_x_fneg_f32 (float addrspace (1 )* %out , float addrspace (1 )* %a.ptr , float addrspace (1 )* %b.ptr ) #0 {
19271927 %tid = call i32 @llvm.amdgcn.workitem.id.x ()
19281928 %tid.ext = sext i32 %tid to i64
@@ -1942,7 +1942,7 @@ define amdgpu_kernel void @v_fneg_mul_legacy_x_fneg_f32(float addrspace(1)* %out
19421942; GCN: {{buffer|flat}}_load_dword [[A:v[0-9]+]]
19431943; GCN: {{buffer|flat}}_load_dword [[B:v[0-9]+]]
19441944; GCN: v_mul_legacy_f32_e64 [[ADD:v[0-9]+]], [[A]], -[[B]]
1945- ; GCN-NEXT : flat_store_dword v{{\[[0-9]+:[0-9]+\]}}, [[ADD]]
1945+ ; GCN: flat_store_dword v{{\[[0-9]+:[0-9]+\]}}, [[ADD]]
19461946define amdgpu_kernel void @v_fneg_mul_legacy_fneg_fneg_f32 (float addrspace (1 )* %out , float addrspace (1 )* %a.ptr , float addrspace (1 )* %b.ptr ) #0 {
19471947 %tid = call i32 @llvm.amdgcn.workitem.id.x ()
19481948 %tid.ext = sext i32 %tid to i64
0 commit comments