Skip to content

Commit 63f4320

Browse files
committed
fixup! Automatically updated tests
1 parent b1af424 commit 63f4320

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

47 files changed

+1321
-1510
lines changed

llvm/test/CodeGen/AArch64/aarch64-matrix-umull-smull.ll

Lines changed: 23 additions & 23 deletions
Original file line numberDiff line numberDiff line change
@@ -632,20 +632,18 @@ define i16 @red_mla_dup_ext_u8_s8_s16(ptr noalias nocapture noundef readonly %A,
632632
;
633633
; CHECK-GI-LABEL: red_mla_dup_ext_u8_s8_s16:
634634
; CHECK-GI: // %bb.0: // %entry
635-
; CHECK-GI-NEXT: cbz w2, .LBB5_3
635+
; CHECK-GI-NEXT: mov w8, wzr
636+
; CHECK-GI-NEXT: cbz w2, .LBB5_9
636637
; CHECK-GI-NEXT: // %bb.1: // %for.body.preheader
637638
; CHECK-GI-NEXT: cmp w2, #16
638639
; CHECK-GI-NEXT: mov w8, w2
639-
; CHECK-GI-NEXT: b.hs .LBB5_4
640+
; CHECK-GI-NEXT: b.hs .LBB5_3
640641
; CHECK-GI-NEXT: // %bb.2:
641642
; CHECK-GI-NEXT: mov w10, #0 // =0x0
642643
; CHECK-GI-NEXT: mov x9, xzr
643644
; CHECK-GI-NEXT: fmov s0, w10
644-
; CHECK-GI-NEXT: b .LBB5_8
645-
; CHECK-GI-NEXT: .LBB5_3:
646-
; CHECK-GI-NEXT: mov w0, wzr
647-
; CHECK-GI-NEXT: ret
648-
; CHECK-GI-NEXT: .LBB5_4: // %vector.ph
645+
; CHECK-GI-NEXT: b .LBB5_7
646+
; CHECK-GI-NEXT: .LBB5_3: // %vector.ph
649647
; CHECK-GI-NEXT: lsl w9, w1, #8
650648
; CHECK-GI-NEXT: movi v0.2d, #0000000000000000
651649
; CHECK-GI-NEXT: movi v1.2d, #0000000000000000
@@ -654,7 +652,7 @@ define i16 @red_mla_dup_ext_u8_s8_s16(ptr noalias nocapture noundef readonly %A,
654652
; CHECK-GI-NEXT: dup v2.8h, w9
655653
; CHECK-GI-NEXT: and x9, x8, #0xfffffff0
656654
; CHECK-GI-NEXT: mov x11, x9
657-
; CHECK-GI-NEXT: .LBB5_5: // %vector.body
655+
; CHECK-GI-NEXT: .LBB5_4: // %vector.body
658656
; CHECK-GI-NEXT: // =>This Inner Loop Header: Depth=1
659657
; CHECK-GI-NEXT: ldp d3, d4, [x10, #-8]
660658
; CHECK-GI-NEXT: subs x11, x11, #16
@@ -663,29 +661,31 @@ define i16 @red_mla_dup_ext_u8_s8_s16(ptr noalias nocapture noundef readonly %A,
663661
; CHECK-GI-NEXT: ushll v4.8h, v4.8b, #0
664662
; CHECK-GI-NEXT: mla v0.8h, v2.8h, v3.8h
665663
; CHECK-GI-NEXT: mla v1.8h, v2.8h, v4.8h
666-
; CHECK-GI-NEXT: b.ne .LBB5_5
667-
; CHECK-GI-NEXT: // %bb.6: // %middle.block
664+
; CHECK-GI-NEXT: b.ne .LBB5_4
665+
; CHECK-GI-NEXT: // %bb.5: // %middle.block
668666
; CHECK-GI-NEXT: add v0.8h, v1.8h, v0.8h
669667
; CHECK-GI-NEXT: cmp x9, x8
670668
; CHECK-GI-NEXT: addv h0, v0.8h
671-
; CHECK-GI-NEXT: b.ne .LBB5_8
672-
; CHECK-GI-NEXT: // %bb.7:
673-
; CHECK-GI-NEXT: fmov w0, s0
669+
; CHECK-GI-NEXT: b.ne .LBB5_7
670+
; CHECK-GI-NEXT: // %bb.6:
671+
; CHECK-GI-NEXT: fmov w8, s0
672+
; CHECK-GI-NEXT: mov w0, w8
674673
; CHECK-GI-NEXT: ret
675-
; CHECK-GI-NEXT: .LBB5_8: // %for.body.preheader1
674+
; CHECK-GI-NEXT: .LBB5_7: // %for.body.preheader1
676675
; CHECK-GI-NEXT: sxtb w10, w1
677-
; CHECK-GI-NEXT: sub x8, x8, x9
676+
; CHECK-GI-NEXT: sub x11, x8, x9
678677
; CHECK-GI-NEXT: add x9, x0, x9
679-
; CHECK-GI-NEXT: .LBB5_9: // %for.body
678+
; CHECK-GI-NEXT: .LBB5_8: // %for.body
680679
; CHECK-GI-NEXT: // =>This Inner Loop Header: Depth=1
681-
; CHECK-GI-NEXT: ldrb w11, [x9], #1
680+
; CHECK-GI-NEXT: ldrb w8, [x9], #1
682681
; CHECK-GI-NEXT: fmov w12, s0
683-
; CHECK-GI-NEXT: subs x8, x8, #1
684-
; CHECK-GI-NEXT: mul w11, w11, w10
685-
; CHECK-GI-NEXT: add w0, w11, w12, uxth
686-
; CHECK-GI-NEXT: fmov s0, w0
687-
; CHECK-GI-NEXT: b.ne .LBB5_9
688-
; CHECK-GI-NEXT: // %bb.10: // %for.cond.cleanup
682+
; CHECK-GI-NEXT: subs x11, x11, #1
683+
; CHECK-GI-NEXT: mul w8, w8, w10
684+
; CHECK-GI-NEXT: add w8, w8, w12, uxth
685+
; CHECK-GI-NEXT: fmov s0, w8
686+
; CHECK-GI-NEXT: b.ne .LBB5_8
687+
; CHECK-GI-NEXT: .LBB5_9: // %for.cond.cleanup
688+
; CHECK-GI-NEXT: mov w0, w8
689689
; CHECK-GI-NEXT: ret
690690
entry:
691691
%conv2 = sext i8 %B to i16

llvm/test/CodeGen/AArch64/swifterror.ll

Lines changed: 2 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -412,6 +412,7 @@ define float @foo_if(ptr swifterror %error_ptr_ref, i32 %cc) {
412412
; CHECK-APPLE-NEXT: .cfi_def_cfa w29, 16
413413
; CHECK-APPLE-NEXT: .cfi_offset w30, -8
414414
; CHECK-APPLE-NEXT: .cfi_offset w29, -16
415+
; CHECK-APPLE-NEXT: movi d0, #0000000000000000
415416
; CHECK-APPLE-NEXT: cbz w0, LBB3_2
416417
; CHECK-APPLE-NEXT: ; %bb.1: ; %gen_error
417418
; CHECK-APPLE-NEXT: mov w0, #16 ; =0x10
@@ -420,10 +421,7 @@ define float @foo_if(ptr swifterror %error_ptr_ref, i32 %cc) {
420421
; CHECK-APPLE-NEXT: fmov s0, #1.00000000
421422
; CHECK-APPLE-NEXT: mov w8, #1 ; =0x1
422423
; CHECK-APPLE-NEXT: strb w8, [x0, #8]
423-
; CHECK-APPLE-NEXT: ldp x29, x30, [sp], #16 ; 16-byte Folded Reload
424-
; CHECK-APPLE-NEXT: ret
425-
; CHECK-APPLE-NEXT: LBB3_2:
426-
; CHECK-APPLE-NEXT: movi d0, #0000000000000000
424+
; CHECK-APPLE-NEXT: LBB3_2: ; %common.ret
427425
; CHECK-APPLE-NEXT: ldp x29, x30, [sp], #16 ; 16-byte Folded Reload
428426
; CHECK-APPLE-NEXT: ret
429427
;

llvm/test/CodeGen/AMDGPU/GlobalISel/sdiv.i64.ll

Lines changed: 5 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -200,6 +200,7 @@ define amdgpu_ps i64 @s_sdiv_i64(i64 inreg %num, i64 inreg %den) {
200200
; CHECK-NEXT: s_and_b64 s[0:1], s[0:1], s[6:7]
201201
; CHECK-NEXT: v_cmp_ne_u64_e64 vcc, s[0:1], 0
202202
; CHECK-NEXT: s_mov_b32 s0, 1
203+
; CHECK-NEXT: ; implicit-def: $vgpr0_vgpr1
203204
; CHECK-NEXT: s_cbranch_vccz .LBB1_2
204205
; CHECK-NEXT: ; %bb.1:
205206
; CHECK-NEXT: s_ashr_i32 s6, s3, 31
@@ -330,15 +331,12 @@ define amdgpu_ps i64 @s_sdiv_i64(i64 inreg %num, i64 inreg %den) {
330331
; CHECK-NEXT: v_xor_b32_e32 v0, s6, v0
331332
; CHECK-NEXT: s_mov_b32 s0, 0
332333
; CHECK-NEXT: v_subrev_i32_e32 v0, vcc, s6, v0
333-
; CHECK-NEXT: s_branch .LBB1_3
334-
; CHECK-NEXT: .LBB1_2:
335-
; CHECK-NEXT: ; implicit-def: $vgpr0_vgpr1
336-
; CHECK-NEXT: .LBB1_3: ; %Flow
334+
; CHECK-NEXT: .LBB1_2: ; %Flow
337335
; CHECK-NEXT: s_xor_b32 s0, s0, 1
338336
; CHECK-NEXT: s_and_b32 s0, s0, 1
339337
; CHECK-NEXT: s_cmp_lg_u32 s0, 0
340-
; CHECK-NEXT: s_cbranch_scc1 .LBB1_5
341-
; CHECK-NEXT: ; %bb.4:
338+
; CHECK-NEXT: s_cbranch_scc1 .LBB1_4
339+
; CHECK-NEXT: ; %bb.3:
342340
; CHECK-NEXT: v_cvt_f32_u32_e32 v0, s4
343341
; CHECK-NEXT: s_sub_i32 s0, 0, s4
344342
; CHECK-NEXT: v_rcp_iflag_f32_e32 v0, v0
@@ -358,7 +356,7 @@ define amdgpu_ps i64 @s_sdiv_i64(i64 inreg %num, i64 inreg %den) {
358356
; CHECK-NEXT: v_add_i32_e32 v2, vcc, 1, v0
359357
; CHECK-NEXT: v_cmp_le_u32_e32 vcc, s4, v1
360358
; CHECK-NEXT: v_cndmask_b32_e32 v0, v0, v2, vcc
361-
; CHECK-NEXT: .LBB1_5:
359+
; CHECK-NEXT: .LBB1_4:
362360
; CHECK-NEXT: v_readfirstlane_b32 s0, v0
363361
; CHECK-NEXT: s_mov_b32 s1, s0
364362
; CHECK-NEXT: ; return to shader part epilog

llvm/test/CodeGen/AMDGPU/GlobalISel/srem.i64.ll

Lines changed: 5 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -194,6 +194,7 @@ define amdgpu_ps i64 @s_srem_i64(i64 inreg %num, i64 inreg %den) {
194194
; CHECK-NEXT: s_and_b64 s[0:1], s[0:1], s[6:7]
195195
; CHECK-NEXT: v_cmp_ne_u64_e64 vcc, s[0:1], 0
196196
; CHECK-NEXT: s_mov_b32 s7, 1
197+
; CHECK-NEXT: ; implicit-def: $vgpr0_vgpr1
197198
; CHECK-NEXT: s_cbranch_vccz .LBB1_2
198199
; CHECK-NEXT: ; %bb.1:
199200
; CHECK-NEXT: s_ashr_i32 s6, s3, 31
@@ -322,15 +323,12 @@ define amdgpu_ps i64 @s_srem_i64(i64 inreg %num, i64 inreg %den) {
322323
; CHECK-NEXT: v_cndmask_b32_e32 v0, v0, v1, vcc
323324
; CHECK-NEXT: v_xor_b32_e32 v0, s6, v0
324325
; CHECK-NEXT: v_subrev_i32_e32 v0, vcc, s6, v0
325-
; CHECK-NEXT: s_branch .LBB1_3
326-
; CHECK-NEXT: .LBB1_2:
327-
; CHECK-NEXT: ; implicit-def: $vgpr0_vgpr1
328-
; CHECK-NEXT: .LBB1_3: ; %Flow
326+
; CHECK-NEXT: .LBB1_2: ; %Flow
329327
; CHECK-NEXT: s_xor_b32 s0, s7, 1
330328
; CHECK-NEXT: s_and_b32 s0, s0, 1
331329
; CHECK-NEXT: s_cmp_lg_u32 s0, 0
332-
; CHECK-NEXT: s_cbranch_scc1 .LBB1_5
333-
; CHECK-NEXT: ; %bb.4:
330+
; CHECK-NEXT: s_cbranch_scc1 .LBB1_4
331+
; CHECK-NEXT: ; %bb.3:
334332
; CHECK-NEXT: v_cvt_f32_u32_e32 v0, s4
335333
; CHECK-NEXT: s_sub_i32 s0, 0, s4
336334
; CHECK-NEXT: v_rcp_iflag_f32_e32 v0, v0
@@ -348,7 +346,7 @@ define amdgpu_ps i64 @s_srem_i64(i64 inreg %num, i64 inreg %den) {
348346
; CHECK-NEXT: v_subrev_i32_e32 v1, vcc, s4, v0
349347
; CHECK-NEXT: v_cmp_le_u32_e32 vcc, s4, v0
350348
; CHECK-NEXT: v_cndmask_b32_e32 v0, v0, v1, vcc
351-
; CHECK-NEXT: .LBB1_5:
349+
; CHECK-NEXT: .LBB1_4:
352350
; CHECK-NEXT: v_readfirstlane_b32 s0, v0
353351
; CHECK-NEXT: s_mov_b32 s1, s0
354352
; CHECK-NEXT: ; return to shader part epilog

llvm/test/CodeGen/AMDGPU/GlobalISel/udiv.i64.ll

Lines changed: 5 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -193,6 +193,7 @@ define amdgpu_ps i64 @s_udiv_i64(i64 inreg %num, i64 inreg %den) {
193193
; CHECK-NEXT: v_cmp_ne_u64_e64 vcc, s[4:5], 0
194194
; CHECK-NEXT: s_mov_b32 s6, 1
195195
; CHECK-NEXT: v_cvt_f32_u32_e32 v2, s2
196+
; CHECK-NEXT: ; implicit-def: $vgpr0_vgpr1
196197
; CHECK-NEXT: s_cbranch_vccz .LBB1_2
197198
; CHECK-NEXT: ; %bb.1:
198199
; CHECK-NEXT: v_mov_b32_e32 v0, s3
@@ -318,15 +319,12 @@ define amdgpu_ps i64 @s_udiv_i64(i64 inreg %num, i64 inreg %den) {
318319
; CHECK-NEXT: v_cndmask_b32_e32 v0, v9, v5, vcc
319320
; CHECK-NEXT: v_cmp_ne_u32_e32 vcc, 0, v3
320321
; CHECK-NEXT: v_cndmask_b32_e32 v0, v1, v0, vcc
321-
; CHECK-NEXT: s_branch .LBB1_3
322-
; CHECK-NEXT: .LBB1_2:
323-
; CHECK-NEXT: ; implicit-def: $vgpr0_vgpr1
324-
; CHECK-NEXT: .LBB1_3: ; %Flow
322+
; CHECK-NEXT: .LBB1_2: ; %Flow
325323
; CHECK-NEXT: s_xor_b32 s1, s6, 1
326324
; CHECK-NEXT: s_and_b32 s1, s1, 1
327325
; CHECK-NEXT: s_cmp_lg_u32 s1, 0
328-
; CHECK-NEXT: s_cbranch_scc1 .LBB1_5
329-
; CHECK-NEXT: ; %bb.4:
326+
; CHECK-NEXT: s_cbranch_scc1 .LBB1_4
327+
; CHECK-NEXT: ; %bb.3:
330328
; CHECK-NEXT: v_rcp_iflag_f32_e32 v0, v2
331329
; CHECK-NEXT: s_sub_i32 s1, 0, s2
332330
; CHECK-NEXT: v_mul_f32_e32 v0, 0x4f7ffffe, v0
@@ -345,7 +343,7 @@ define amdgpu_ps i64 @s_udiv_i64(i64 inreg %num, i64 inreg %den) {
345343
; CHECK-NEXT: v_add_i32_e32 v2, vcc, 1, v0
346344
; CHECK-NEXT: v_cmp_le_u32_e32 vcc, s2, v1
347345
; CHECK-NEXT: v_cndmask_b32_e32 v0, v0, v2, vcc
348-
; CHECK-NEXT: .LBB1_5:
346+
; CHECK-NEXT: .LBB1_4:
349347
; CHECK-NEXT: v_readfirstlane_b32 s0, v0
350348
; CHECK-NEXT: s_mov_b32 s1, s0
351349
; CHECK-NEXT: ; return to shader part epilog

llvm/test/CodeGen/AMDGPU/GlobalISel/urem.i64.ll

Lines changed: 5 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -190,6 +190,7 @@ define amdgpu_ps i64 @s_urem_i64(i64 inreg %num, i64 inreg %den) {
190190
; CHECK-NEXT: v_cmp_ne_u64_e64 vcc, s[4:5], 0
191191
; CHECK-NEXT: s_mov_b32 s6, 1
192192
; CHECK-NEXT: v_cvt_f32_u32_e32 v2, s2
193+
; CHECK-NEXT: ; implicit-def: $vgpr0_vgpr1
193194
; CHECK-NEXT: s_cbranch_vccz .LBB1_2
194195
; CHECK-NEXT: ; %bb.1:
195196
; CHECK-NEXT: v_mov_b32_e32 v0, s3
@@ -314,15 +315,12 @@ define amdgpu_ps i64 @s_urem_i64(i64 inreg %num, i64 inreg %den) {
314315
; CHECK-NEXT: v_cndmask_b32_e32 v0, v3, v6, vcc
315316
; CHECK-NEXT: v_cmp_ne_u32_e32 vcc, 0, v1
316317
; CHECK-NEXT: v_cndmask_b32_e32 v0, v4, v0, vcc
317-
; CHECK-NEXT: s_branch .LBB1_3
318-
; CHECK-NEXT: .LBB1_2:
319-
; CHECK-NEXT: ; implicit-def: $vgpr0_vgpr1
320-
; CHECK-NEXT: .LBB1_3: ; %Flow
318+
; CHECK-NEXT: .LBB1_2: ; %Flow
321319
; CHECK-NEXT: s_xor_b32 s1, s6, 1
322320
; CHECK-NEXT: s_and_b32 s1, s1, 1
323321
; CHECK-NEXT: s_cmp_lg_u32 s1, 0
324-
; CHECK-NEXT: s_cbranch_scc1 .LBB1_5
325-
; CHECK-NEXT: ; %bb.4:
322+
; CHECK-NEXT: s_cbranch_scc1 .LBB1_4
323+
; CHECK-NEXT: ; %bb.3:
326324
; CHECK-NEXT: v_rcp_iflag_f32_e32 v0, v2
327325
; CHECK-NEXT: s_sub_i32 s1, 0, s2
328326
; CHECK-NEXT: v_mul_f32_e32 v0, 0x4f7ffffe, v0
@@ -339,7 +337,7 @@ define amdgpu_ps i64 @s_urem_i64(i64 inreg %num, i64 inreg %den) {
339337
; CHECK-NEXT: v_subrev_i32_e32 v1, vcc, s2, v0
340338
; CHECK-NEXT: v_cmp_le_u32_e32 vcc, s2, v0
341339
; CHECK-NEXT: v_cndmask_b32_e32 v0, v0, v1, vcc
342-
; CHECK-NEXT: .LBB1_5:
340+
; CHECK-NEXT: .LBB1_4:
343341
; CHECK-NEXT: v_readfirstlane_b32 s0, v0
344342
; CHECK-NEXT: s_mov_b32 s1, s0
345343
; CHECK-NEXT: ; return to shader part epilog

llvm/test/CodeGen/AMDGPU/blender-no-live-segment-at-def-implicit-def.ll

Lines changed: 32 additions & 32 deletions
Original file line numberDiff line numberDiff line change
@@ -9,44 +9,34 @@ define amdgpu_kernel void @blender_no_live_segment_at_def_error(<4 x float> %ext
99
; CHECK-NEXT: s_addc_u32 s13, s13, 0
1010
; CHECK-NEXT: s_setreg_b32 hwreg(HW_REG_FLAT_SCR_LO), s12
1111
; CHECK-NEXT: s_setreg_b32 hwreg(HW_REG_FLAT_SCR_HI), s13
12-
; CHECK-NEXT: s_load_dwordx8 s[36:43], s[8:9], 0x0
12+
; CHECK-NEXT: s_load_dwordx8 s[20:27], s[8:9], 0x0
1313
; CHECK-NEXT: s_add_u32 s0, s0, s17
1414
; CHECK-NEXT: s_addc_u32 s1, s1, 0
15-
; CHECK-NEXT: s_mov_b32 s12, 0
16-
; CHECK-NEXT: s_waitcnt lgkmcnt(0)
17-
; CHECK-NEXT: s_cmp_lg_u32 s40, 0
18-
; CHECK-NEXT: s_cbranch_scc1 .LBB0_8
19-
; CHECK-NEXT: ; %bb.1: ; %if.end13.i.i
20-
; CHECK-NEXT: s_cmp_eq_u32 s42, 0
21-
; CHECK-NEXT: s_cbranch_scc1 .LBB0_4
22-
; CHECK-NEXT: ; %bb.2: ; %if.else251.i.i
23-
; CHECK-NEXT: s_cmp_lg_u32 s43, 0
24-
; CHECK-NEXT: s_mov_b32 s17, 0
25-
; CHECK-NEXT: s_cselect_b32 s12, -1, 0
26-
; CHECK-NEXT: s_and_b32 vcc_lo, exec_lo, s12
27-
; CHECK-NEXT: s_cbranch_vccz .LBB0_5
28-
; CHECK-NEXT: ; %bb.3:
2915
; CHECK-NEXT: s_mov_b32 s36, 0
30-
; CHECK-NEXT: s_andn2_b32 vcc_lo, exec_lo, s12
31-
; CHECK-NEXT: s_cbranch_vccz .LBB0_6
32-
; CHECK-NEXT: s_branch .LBB0_7
33-
; CHECK-NEXT: .LBB0_4:
34-
; CHECK-NEXT: s_mov_b32 s14, s12
35-
; CHECK-NEXT: s_mov_b32 s15, s12
36-
; CHECK-NEXT: s_mov_b32 s13, s12
37-
; CHECK-NEXT: s_mov_b64 s[38:39], s[14:15]
38-
; CHECK-NEXT: s_mov_b64 s[36:37], s[12:13]
16+
; CHECK-NEXT: s_waitcnt lgkmcnt(0)
17+
; CHECK-NEXT: s_cmp_lg_u32 s24, 0
18+
; CHECK-NEXT: s_cbranch_scc0 .LBB0_2
19+
; CHECK-NEXT: ; %bb.1:
20+
; CHECK-NEXT: s_mov_b64 s[38:39], s[22:23]
21+
; CHECK-NEXT: s_mov_b64 s[36:37], s[20:21]
3922
; CHECK-NEXT: s_branch .LBB0_7
40-
; CHECK-NEXT: .LBB0_5: ; %if.then263.i.i
41-
; CHECK-NEXT: v_cmp_lt_f32_e64 s12, s41, 0
42-
; CHECK-NEXT: s_mov_b32 s36, 1.0
43-
; CHECK-NEXT: s_mov_b32 s17, 0x7fc00000
23+
; CHECK-NEXT: .LBB0_2: ; %if.end13.i.i
4424
; CHECK-NEXT: s_mov_b32 s37, s36
4525
; CHECK-NEXT: s_mov_b32 s38, s36
26+
; CHECK-NEXT: s_cmp_eq_u32 s26, 0
4627
; CHECK-NEXT: s_mov_b32 s39, s36
28+
; CHECK-NEXT: s_cbranch_scc1 .LBB0_6
29+
; CHECK-NEXT: ; %bb.3: ; %if.else251.i.i
30+
; CHECK-NEXT: s_cmp_lg_u32 s27, 0
31+
; CHECK-NEXT: s_mov_b32 s17, 0
32+
; CHECK-NEXT: s_cselect_b32 s12, -1, 0
33+
; CHECK-NEXT: s_and_b32 vcc_lo, exec_lo, s12
34+
; CHECK-NEXT: s_cbranch_vccz .LBB0_8
35+
; CHECK-NEXT: ; %bb.4:
36+
; CHECK-NEXT: s_mov_b32 s36, 0
4737
; CHECK-NEXT: s_andn2_b32 vcc_lo, exec_lo, s12
48-
; CHECK-NEXT: s_cbranch_vccnz .LBB0_7
49-
; CHECK-NEXT: .LBB0_6: ; %if.end273.i.i
38+
; CHECK-NEXT: s_cbranch_vccnz .LBB0_6
39+
; CHECK-NEXT: .LBB0_5: ; %if.end273.i.i
5040
; CHECK-NEXT: s_add_u32 s12, s8, 40
5141
; CHECK-NEXT: s_addc_u32 s13, s9, 0
5242
; CHECK-NEXT: s_getpc_b64 s[18:19]
@@ -72,13 +62,13 @@ define amdgpu_kernel void @blender_no_live_segment_at_def_error(<4 x float> %ext
7262
; CHECK-NEXT: s_mov_b32 s37, s36
7363
; CHECK-NEXT: s_mov_b32 s38, s36
7464
; CHECK-NEXT: s_mov_b32 s39, s36
75-
; CHECK-NEXT: .LBB0_7: ; %if.end294.i.i
65+
; CHECK-NEXT: .LBB0_6: ; %if.end294.i.i
7666
; CHECK-NEXT: v_mov_b32_e32 v0, 0
7767
; CHECK-NEXT: buffer_store_dword v0, off, s[0:3], 0 offset:12
7868
; CHECK-NEXT: buffer_store_dword v0, off, s[0:3], 0 offset:8
7969
; CHECK-NEXT: buffer_store_dword v0, off, s[0:3], 0 offset:4
8070
; CHECK-NEXT: buffer_store_dword v0, off, s[0:3], 0
81-
; CHECK-NEXT: .LBB0_8: ; %kernel_direct_lighting.exit
71+
; CHECK-NEXT: .LBB0_7: ; %kernel_direct_lighting.exit
8272
; CHECK-NEXT: s_load_dwordx2 s[4:5], s[8:9], 0x20
8373
; CHECK-NEXT: v_mov_b32_e32 v0, s36
8474
; CHECK-NEXT: v_mov_b32_e32 v4, 0
@@ -88,6 +78,16 @@ define amdgpu_kernel void @blender_no_live_segment_at_def_error(<4 x float> %ext
8878
; CHECK-NEXT: s_waitcnt lgkmcnt(0)
8979
; CHECK-NEXT: global_store_dwordx4 v4, v[0:3], s[4:5]
9080
; CHECK-NEXT: s_endpgm
81+
; CHECK-NEXT: .LBB0_8: ; %if.then263.i.i
82+
; CHECK-NEXT: v_cmp_lt_f32_e64 s12, s25, 0
83+
; CHECK-NEXT: s_mov_b32 s36, 1.0
84+
; CHECK-NEXT: s_mov_b32 s17, 0x7fc00000
85+
; CHECK-NEXT: s_mov_b32 s37, s36
86+
; CHECK-NEXT: s_mov_b32 s38, s36
87+
; CHECK-NEXT: s_mov_b32 s39, s36
88+
; CHECK-NEXT: s_andn2_b32 vcc_lo, exec_lo, s12
89+
; CHECK-NEXT: s_cbranch_vccz .LBB0_5
90+
; CHECK-NEXT: s_branch .LBB0_6
9191
entry:
9292
%cmp5.i.i = icmp eq i32 %cmp5.i.i.arg, 0
9393
br i1 %cmp5.i.i, label %if.end13.i.i, label %kernel_direct_lighting.exit

0 commit comments

Comments
 (0)