Skip to content

Commit 2d8bd10

Browse files
[AMDGPU] revert xor.ll si-annotate-cf.ll changes
1 parent b953c51 commit 2d8bd10

File tree

2 files changed

+11
-23
lines changed

2 files changed

+11
-23
lines changed

llvm/test/CodeGen/AMDGPU/si-annotate-cf.ll

Lines changed: 8 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -7,17 +7,15 @@ define amdgpu_kernel void @break_inserted_outside_of_loop(ptr addrspace(1) %out,
77
; SI: ; %bb.0: ; %main_body
88
; SI-NEXT: s_load_dword s0, s[2:3], 0xb
99
; SI-NEXT: v_mbcnt_lo_u32_b32_e64 v0, -1, 0
10+
; SI-NEXT: s_waitcnt lgkmcnt(0)
11+
; SI-NEXT: v_and_b32_e32 v0, s0, v0
1012
; SI-NEXT: v_and_b32_e32 v0, 1, v0
1113
; SI-NEXT: v_cmp_eq_u32_e32 vcc, 1, v0
12-
; SI-NEXT: s_waitcnt lgkmcnt(0)
13-
; SI-NEXT: s_bitcmp1_b32 s0, 0
14-
; SI-NEXT: s_cselect_b64 s[0:1], -1, 0
15-
; SI-NEXT: s_and_b64 s[4:5], s[0:1], vcc
1614
; SI-NEXT: s_mov_b64 s[0:1], 0
1715
; SI-NEXT: .LBB0_1: ; %ENDIF
1816
; SI-NEXT: ; =>This Inner Loop Header: Depth=1
19-
; SI-NEXT: s_and_b64 s[6:7], exec, s[4:5]
20-
; SI-NEXT: s_or_b64 s[0:1], s[6:7], s[0:1]
17+
; SI-NEXT: s_and_b64 s[4:5], exec, vcc
18+
; SI-NEXT: s_or_b64 s[0:1], s[4:5], s[0:1]
2119
; SI-NEXT: s_andn2_b64 exec, exec, s[0:1]
2220
; SI-NEXT: s_cbranch_execnz .LBB0_1
2321
; SI-NEXT: ; %bb.2: ; %ENDLOOP
@@ -34,17 +32,15 @@ define amdgpu_kernel void @break_inserted_outside_of_loop(ptr addrspace(1) %out,
3432
; FLAT: ; %bb.0: ; %main_body
3533
; FLAT-NEXT: s_load_dword s0, s[2:3], 0x2c
3634
; FLAT-NEXT: v_mbcnt_lo_u32_b32 v0, -1, 0
35+
; FLAT-NEXT: s_waitcnt lgkmcnt(0)
36+
; FLAT-NEXT: v_and_b32_e32 v0, s0, v0
3737
; FLAT-NEXT: v_and_b32_e32 v0, 1, v0
3838
; FLAT-NEXT: v_cmp_eq_u32_e32 vcc, 1, v0
39-
; FLAT-NEXT: s_waitcnt lgkmcnt(0)
40-
; FLAT-NEXT: s_bitcmp1_b32 s0, 0
41-
; FLAT-NEXT: s_cselect_b64 s[0:1], -1, 0
42-
; FLAT-NEXT: s_and_b64 s[4:5], s[0:1], vcc
4339
; FLAT-NEXT: s_mov_b64 s[0:1], 0
4440
; FLAT-NEXT: .LBB0_1: ; %ENDIF
4541
; FLAT-NEXT: ; =>This Inner Loop Header: Depth=1
46-
; FLAT-NEXT: s_and_b64 s[6:7], exec, s[4:5]
47-
; FLAT-NEXT: s_or_b64 s[0:1], s[6:7], s[0:1]
42+
; FLAT-NEXT: s_and_b64 s[4:5], exec, vcc
43+
; FLAT-NEXT: s_or_b64 s[0:1], s[4:5], s[0:1]
4844
; FLAT-NEXT: s_andn2_b64 exec, exec, s[0:1]
4945
; FLAT-NEXT: s_cbranch_execnz .LBB0_1
5046
; FLAT-NEXT: ; %bb.2: ; %ENDLOOP

llvm/test/CodeGen/AMDGPU/xor.ll

Lines changed: 3 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -182,12 +182,8 @@ define amdgpu_kernel void @v_xor_i1(ptr addrspace(1) %out, ptr addrspace(1) %in0
182182
; SI-NEXT: s_waitcnt vmcnt(0)
183183
; SI-NEXT: s_mov_b32 s8, s4
184184
; SI-NEXT: s_mov_b32 s9, s5
185+
; SI-NEXT: v_xor_b32_e32 v0, v0, v1
185186
; SI-NEXT: v_and_b32_e32 v0, 1, v0
186-
; SI-NEXT: v_and_b32_e32 v1, 1, v1
187-
; SI-NEXT: v_cmp_eq_u32_e32 vcc, 1, v0
188-
; SI-NEXT: v_cmp_eq_u32_e64 s[0:1], 1, v1
189-
; SI-NEXT: s_xor_b64 s[0:1], vcc, s[0:1]
190-
; SI-NEXT: v_cndmask_b32_e64 v0, 0, 1, s[0:1]
191187
; SI-NEXT: buffer_store_byte v0, off, s[8:11], 0
192188
; SI-NEXT: s_endpgm
193189
;
@@ -206,12 +202,8 @@ define amdgpu_kernel void @v_xor_i1(ptr addrspace(1) %out, ptr addrspace(1) %in0
206202
; VI-NEXT: s_waitcnt vmcnt(0)
207203
; VI-NEXT: v_mov_b32_e32 v0, s4
208204
; VI-NEXT: v_mov_b32_e32 v1, s5
209-
; VI-NEXT: v_and_b32_e32 v3, 1, v4
205+
; VI-NEXT: v_xor_b32_e32 v2, v4, v2
210206
; VI-NEXT: v_and_b32_e32 v2, 1, v2
211-
; VI-NEXT: v_cmp_eq_u32_e32 vcc, 1, v3
212-
; VI-NEXT: v_cmp_eq_u32_e64 s[0:1], 1, v2
213-
; VI-NEXT: s_xor_b64 s[0:1], vcc, s[0:1]
214-
; VI-NEXT: v_cndmask_b32_e64 v2, 0, 1, s[0:1]
215207
; VI-NEXT: flat_store_byte v[0:1], v2
216208
; VI-NEXT: s_endpgm
217209
%a = load volatile i1, ptr addrspace(1) %in0
@@ -820,4 +812,4 @@ define amdgpu_kernel void @vector_xor_literal_i64(ptr addrspace(1) %out, ptr add
820812
%or = xor i64 %loada, 22470723082367
821813
store i64 %or, ptr addrspace(1) %out
822814
ret void
823-
}
815+
}

0 commit comments

Comments
 (0)