Skip to content

Commit 2474bc9

Browse files
committed
Update tests
Signed-off-by: John Lu <[email protected]>
1 parent ff4ae2c commit 2474bc9

File tree

11 files changed

+355
-359
lines changed

11 files changed

+355
-359
lines changed

llvm/lib/Target/AMDGPU/SIISelLowering.cpp

Lines changed: 0 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -5956,10 +5956,6 @@ SITargetLowering::EmitInstrWithCustomInserter(MachineInstr &MI,
59565956
return lowerWaveReduce(MI, *BB, *getSubtarget(), AMDGPU::S_XOR_B64);
59575957
case AMDGPU::S_UADDO_PSEUDO:
59585958
case AMDGPU::S_USUBO_PSEUDO: {
5959-
<<<<<<< HEAD
5960-
=======
5961-
const DebugLoc &DL = MI.getDebugLoc();
5962-
>>>>>>> 27321ddcdbe2 (Clean up code.)
59635959
MachineOperand &Dest0 = MI.getOperand(0);
59645960
MachineOperand &Dest1 = MI.getOperand(1);
59655961
MachineOperand &Src0 = MI.getOperand(2);

llvm/test/CodeGen/AMDGPU/amdgpu-codegenprepare-idiv.ll

Lines changed: 116 additions & 116 deletions
Large diffs are not rendered by default.

llvm/test/CodeGen/AMDGPU/carryout-selection.ll

Lines changed: 41 additions & 41 deletions
Original file line numberDiff line numberDiff line change
@@ -2215,11 +2215,11 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
22152215
; VI-NEXT: s_add_i32 s14, s8, s9
22162216
; VI-NEXT: s_sub_i32 s10, s3, s14
22172217
; VI-NEXT: v_readfirstlane_b32 s8, v0
2218-
; VI-NEXT: s_sub_i32 s15, s2, s8
2218+
; VI-NEXT: s_sub_u32 s15, s2, s8
22192219
; VI-NEXT: s_cselect_b64 s[8:9], 1, 0
22202220
; VI-NEXT: s_cmp_lg_u64 s[8:9], 0
22212221
; VI-NEXT: s_subb_u32 s16, s10, s5
2222-
; VI-NEXT: s_sub_i32 s17, s15, s4
2222+
; VI-NEXT: s_sub_u32 s17, s15, s4
22232223
; VI-NEXT: s_cselect_b64 s[10:11], 1, 0
22242224
; VI-NEXT: s_cmp_lg_u64 s[10:11], 0
22252225
; VI-NEXT: s_subb_u32 s10, s16, 0
@@ -2329,7 +2329,7 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
23292329
; GFX9-NEXT: s_mul_i32 s9, s12, s9
23302330
; GFX9-NEXT: s_add_u32 s9, s13, s9
23312331
; GFX9-NEXT: s_addc_u32 s13, 0, s14
2332-
; GFX9-NEXT: s_add_i32 s14, s8, s9
2332+
; GFX9-NEXT: s_add_u32 s14, s8, s9
23332333
; GFX9-NEXT: s_cselect_b64 s[8:9], 1, 0
23342334
; GFX9-NEXT: s_cmp_lg_u64 s[8:9], 0
23352335
; GFX9-NEXT: s_addc_u32 s12, s12, s13
@@ -2353,21 +2353,21 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
23532353
; GFX9-NEXT: s_mul_i32 s8, s12, s8
23542354
; GFX9-NEXT: s_add_u32 s8, s10, s8
23552355
; GFX9-NEXT: s_addc_u32 s10, 0, s9
2356-
; GFX9-NEXT: s_add_i32 s14, s14, s8
2356+
; GFX9-NEXT: s_add_u32 s11, s14, s8
23572357
; GFX9-NEXT: s_cselect_b64 s[8:9], 1, 0
23582358
; GFX9-NEXT: s_cmp_lg_u64 s[8:9], 0
23592359
; GFX9-NEXT: s_addc_u32 s8, s12, s10
23602360
; GFX9-NEXT: s_mul_i32 s10, s2, s8
2361-
; GFX9-NEXT: s_mul_hi_u32 s11, s2, s14
2361+
; GFX9-NEXT: s_mul_hi_u32 s12, s2, s11
23622362
; GFX9-NEXT: s_mul_hi_u32 s9, s2, s8
2363-
; GFX9-NEXT: s_add_u32 s10, s11, s10
2363+
; GFX9-NEXT: s_add_u32 s10, s12, s10
23642364
; GFX9-NEXT: s_addc_u32 s9, 0, s9
2365-
; GFX9-NEXT: s_mul_i32 s13, s3, s14
2366-
; GFX9-NEXT: s_mul_hi_u32 s12, s3, s14
2367-
; GFX9-NEXT: s_add_u32 s10, s10, s13
2368-
; GFX9-NEXT: s_mul_hi_u32 s11, s3, s8
2369-
; GFX9-NEXT: s_addc_u32 s9, s9, s12
2370-
; GFX9-NEXT: s_addc_u32 s10, s11, 0
2365+
; GFX9-NEXT: s_mul_hi_u32 s13, s3, s11
2366+
; GFX9-NEXT: s_mul_i32 s11, s3, s11
2367+
; GFX9-NEXT: s_add_u32 s10, s10, s11
2368+
; GFX9-NEXT: s_mul_hi_u32 s12, s3, s8
2369+
; GFX9-NEXT: s_addc_u32 s9, s9, s13
2370+
; GFX9-NEXT: s_addc_u32 s10, s12, 0
23712371
; GFX9-NEXT: s_mul_i32 s8, s3, s8
23722372
; GFX9-NEXT: s_add_u32 s12, s9, s8
23732373
; GFX9-NEXT: s_addc_u32 s13, 0, s10
@@ -2378,11 +2378,11 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
23782378
; GFX9-NEXT: s_add_i32 s14, s8, s9
23792379
; GFX9-NEXT: s_sub_i32 s10, s3, s14
23802380
; GFX9-NEXT: s_mul_i32 s8, s6, s12
2381-
; GFX9-NEXT: s_sub_i32 s15, s2, s8
2381+
; GFX9-NEXT: s_sub_u32 s15, s2, s8
23822382
; GFX9-NEXT: s_cselect_b64 s[8:9], 1, 0
23832383
; GFX9-NEXT: s_cmp_lg_u64 s[8:9], 0
23842384
; GFX9-NEXT: s_subb_u32 s16, s10, s7
2385-
; GFX9-NEXT: s_sub_i32 s17, s15, s6
2385+
; GFX9-NEXT: s_sub_u32 s17, s15, s6
23862386
; GFX9-NEXT: s_cselect_b64 s[10:11], 1, 0
23872387
; GFX9-NEXT: s_cmp_lg_u64 s[10:11], 0
23882388
; GFX9-NEXT: s_subb_u32 s10, s16, 0
@@ -2488,7 +2488,7 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
24882488
; GFX1010-NEXT: s_addc_u32 s13, s17, 0
24892489
; GFX1010-NEXT: s_add_u32 s11, s12, s11
24902490
; GFX1010-NEXT: s_addc_u32 s12, 0, s13
2491-
; GFX1010-NEXT: s_add_i32 s8, s8, s11
2491+
; GFX1010-NEXT: s_add_u32 s8, s8, s11
24922492
; GFX1010-NEXT: s_cselect_b32 s11, 1, 0
24932493
; GFX1010-NEXT: s_mul_hi_u32 s13, s9, s8
24942494
; GFX1010-NEXT: s_cmp_lg_u32 s11, 0
@@ -2512,7 +2512,7 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
25122512
; GFX1010-NEXT: s_addc_u32 s11, s11, 0
25132513
; GFX1010-NEXT: s_add_u32 s9, s10, s9
25142514
; GFX1010-NEXT: s_addc_u32 s10, 0, s11
2515-
; GFX1010-NEXT: s_add_i32 s8, s8, s9
2515+
; GFX1010-NEXT: s_add_u32 s8, s8, s9
25162516
; GFX1010-NEXT: s_cselect_b32 s9, 1, 0
25172517
; GFX1010-NEXT: s_mul_hi_u32 s11, s2, s8
25182518
; GFX1010-NEXT: s_cmp_lg_u32 s9, 0
@@ -2537,11 +2537,11 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
25372537
; GFX1010-NEXT: s_mul_i32 s10, s6, s5
25382538
; GFX1010-NEXT: s_add_i32 s9, s9, s11
25392539
; GFX1010-NEXT: s_sub_i32 s11, s3, s9
2540-
; GFX1010-NEXT: s_sub_i32 s10, s2, s10
2540+
; GFX1010-NEXT: s_sub_u32 s10, s2, s10
25412541
; GFX1010-NEXT: s_cselect_b32 s12, 1, 0
25422542
; GFX1010-NEXT: s_cmp_lg_u32 s12, 0
25432543
; GFX1010-NEXT: s_subb_u32 s11, s11, s7
2544-
; GFX1010-NEXT: s_sub_i32 s13, s10, s6
2544+
; GFX1010-NEXT: s_sub_u32 s13, s10, s6
25452545
; GFX1010-NEXT: s_cselect_b32 s14, 1, 0
25462546
; GFX1010-NEXT: s_cmp_lg_u32 s14, 0
25472547
; GFX1010-NEXT: s_subb_u32 s11, s11, 0
@@ -2648,7 +2648,7 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
26482648
; GFX1030W32-NEXT: s_addc_u32 s13, s17, 0
26492649
; GFX1030W32-NEXT: s_add_u32 s11, s12, s11
26502650
; GFX1030W32-NEXT: s_addc_u32 s12, 0, s13
2651-
; GFX1030W32-NEXT: s_add_i32 s8, s8, s11
2651+
; GFX1030W32-NEXT: s_add_u32 s8, s8, s11
26522652
; GFX1030W32-NEXT: s_cselect_b32 s11, 1, 0
26532653
; GFX1030W32-NEXT: s_mul_hi_u32 s13, s9, s8
26542654
; GFX1030W32-NEXT: s_cmp_lg_u32 s11, 0
@@ -2672,7 +2672,7 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
26722672
; GFX1030W32-NEXT: s_addc_u32 s11, s11, 0
26732673
; GFX1030W32-NEXT: s_add_u32 s9, s10, s9
26742674
; GFX1030W32-NEXT: s_addc_u32 s10, 0, s11
2675-
; GFX1030W32-NEXT: s_add_i32 s8, s8, s9
2675+
; GFX1030W32-NEXT: s_add_u32 s8, s8, s9
26762676
; GFX1030W32-NEXT: s_cselect_b32 s9, 1, 0
26772677
; GFX1030W32-NEXT: s_mul_hi_u32 s11, s2, s8
26782678
; GFX1030W32-NEXT: s_cmp_lg_u32 s9, 0
@@ -2697,11 +2697,11 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
26972697
; GFX1030W32-NEXT: s_mul_i32 s10, s4, s7
26982698
; GFX1030W32-NEXT: s_add_i32 s9, s9, s11
26992699
; GFX1030W32-NEXT: s_sub_i32 s11, s3, s9
2700-
; GFX1030W32-NEXT: s_sub_i32 s10, s2, s10
2700+
; GFX1030W32-NEXT: s_sub_u32 s10, s2, s10
27012701
; GFX1030W32-NEXT: s_cselect_b32 s12, 1, 0
27022702
; GFX1030W32-NEXT: s_cmp_lg_u32 s12, 0
27032703
; GFX1030W32-NEXT: s_subb_u32 s11, s11, s5
2704-
; GFX1030W32-NEXT: s_sub_i32 s13, s10, s4
2704+
; GFX1030W32-NEXT: s_sub_u32 s13, s10, s4
27052705
; GFX1030W32-NEXT: s_cselect_b32 s14, 1, 0
27062706
; GFX1030W32-NEXT: s_cmp_lg_u32 s14, 0
27072707
; GFX1030W32-NEXT: s_subb_u32 s11, s11, 0
@@ -2808,7 +2808,7 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
28082808
; GFX1030W64-NEXT: s_addc_u32 s12, s16, 0
28092809
; GFX1030W64-NEXT: s_add_u32 s7, s11, s7
28102810
; GFX1030W64-NEXT: s_addc_u32 s11, 0, s12
2811-
; GFX1030W64-NEXT: s_add_i32 s12, s6, s7
2811+
; GFX1030W64-NEXT: s_add_u32 s12, s6, s7
28122812
; GFX1030W64-NEXT: s_cselect_b64 s[6:7], 1, 0
28132813
; GFX1030W64-NEXT: s_mul_hi_u32 s13, s9, s12
28142814
; GFX1030W64-NEXT: s_cmp_lg_u64 s[6:7], 0
@@ -2832,16 +2832,16 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
28322832
; GFX1030W64-NEXT: s_addc_u32 s7, s10, 0
28332833
; GFX1030W64-NEXT: s_add_u32 s6, s6, s9
28342834
; GFX1030W64-NEXT: s_addc_u32 s9, 0, s7
2835-
; GFX1030W64-NEXT: s_add_i32 s12, s12, s6
2835+
; GFX1030W64-NEXT: s_add_u32 s10, s12, s6
28362836
; GFX1030W64-NEXT: s_cselect_b64 s[6:7], 1, 0
2837-
; GFX1030W64-NEXT: s_mul_hi_u32 s10, s2, s12
2837+
; GFX1030W64-NEXT: s_mul_hi_u32 s11, s2, s10
28382838
; GFX1030W64-NEXT: s_cmp_lg_u64 s[6:7], 0
2839-
; GFX1030W64-NEXT: s_mul_hi_u32 s6, s3, s12
2839+
; GFX1030W64-NEXT: s_mul_hi_u32 s6, s3, s10
28402840
; GFX1030W64-NEXT: s_addc_u32 s7, s8, s9
2841-
; GFX1030W64-NEXT: s_mul_i32 s8, s3, s12
2842-
; GFX1030W64-NEXT: s_mul_i32 s11, s2, s7
2841+
; GFX1030W64-NEXT: s_mul_i32 s8, s3, s10
2842+
; GFX1030W64-NEXT: s_mul_i32 s10, s2, s7
28432843
; GFX1030W64-NEXT: s_mul_hi_u32 s9, s2, s7
2844-
; GFX1030W64-NEXT: s_add_u32 s10, s10, s11
2844+
; GFX1030W64-NEXT: s_add_u32 s10, s11, s10
28452845
; GFX1030W64-NEXT: s_addc_u32 s9, 0, s9
28462846
; GFX1030W64-NEXT: s_mul_hi_u32 s12, s3, s7
28472847
; GFX1030W64-NEXT: s_add_u32 s8, s10, s8
@@ -2857,11 +2857,11 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
28572857
; GFX1030W64-NEXT: s_add_i32 s12, s6, s8
28582858
; GFX1030W64-NEXT: s_mul_i32 s6, s4, s10
28592859
; GFX1030W64-NEXT: s_sub_i32 s8, s3, s12
2860-
; GFX1030W64-NEXT: s_sub_i32 s13, s2, s6
2860+
; GFX1030W64-NEXT: s_sub_u32 s13, s2, s6
28612861
; GFX1030W64-NEXT: s_cselect_b64 s[6:7], 1, 0
28622862
; GFX1030W64-NEXT: s_cmp_lg_u64 s[6:7], 0
28632863
; GFX1030W64-NEXT: s_subb_u32 s14, s8, s5
2864-
; GFX1030W64-NEXT: s_sub_i32 s15, s13, s4
2864+
; GFX1030W64-NEXT: s_sub_u32 s15, s13, s4
28652865
; GFX1030W64-NEXT: s_cselect_b64 s[8:9], 1, 0
28662866
; GFX1030W64-NEXT: s_cmp_lg_u64 s[8:9], 0
28672867
; GFX1030W64-NEXT: s_subb_u32 s8, s14, 0
@@ -2973,7 +2973,7 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
29732973
; GFX11-NEXT: s_addc_u32 s13, s17, 0
29742974
; GFX11-NEXT: s_add_u32 s11, s12, s11
29752975
; GFX11-NEXT: s_addc_u32 s12, 0, s13
2976-
; GFX11-NEXT: s_add_i32 s8, s8, s11
2976+
; GFX11-NEXT: s_add_u32 s8, s8, s11
29772977
; GFX11-NEXT: s_cselect_b32 s11, 1, 0
29782978
; GFX11-NEXT: s_mul_hi_u32 s13, s9, s8
29792979
; GFX11-NEXT: s_cmp_lg_u32 s11, 0
@@ -2997,7 +2997,7 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
29972997
; GFX11-NEXT: s_addc_u32 s11, s11, 0
29982998
; GFX11-NEXT: s_add_u32 s9, s10, s9
29992999
; GFX11-NEXT: s_addc_u32 s10, 0, s11
3000-
; GFX11-NEXT: s_add_i32 s8, s8, s9
3000+
; GFX11-NEXT: s_add_u32 s8, s8, s9
30013001
; GFX11-NEXT: s_cselect_b32 s9, 1, 0
30023002
; GFX11-NEXT: s_mul_hi_u32 s11, s2, s8
30033003
; GFX11-NEXT: s_cmp_lg_u32 s9, 0
@@ -3023,11 +3023,11 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
30233023
; GFX11-NEXT: s_add_i32 s9, s9, s11
30243024
; GFX11-NEXT: s_delay_alu instid0(SALU_CYCLE_1) | instskip(SKIP_2) | instid1(SALU_CYCLE_1)
30253025
; GFX11-NEXT: s_sub_i32 s11, s3, s9
3026-
; GFX11-NEXT: s_sub_i32 s10, s2, s10
3026+
; GFX11-NEXT: s_sub_u32 s10, s2, s10
30273027
; GFX11-NEXT: s_cselect_b32 s12, 1, 0
30283028
; GFX11-NEXT: s_cmp_lg_u32 s12, 0
30293029
; GFX11-NEXT: s_subb_u32 s11, s11, s5
3030-
; GFX11-NEXT: s_sub_i32 s13, s10, s4
3030+
; GFX11-NEXT: s_sub_u32 s13, s10, s4
30313031
; GFX11-NEXT: s_cselect_b32 s14, 1, 0
30323032
; GFX11-NEXT: s_delay_alu instid0(SALU_CYCLE_1) | instskip(SKIP_1) | instid1(SALU_CYCLE_1)
30333033
; GFX11-NEXT: s_cmp_lg_u32 s14, 0
@@ -3105,7 +3105,7 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
31053105
; GFX1250-NEXT: s_wait_kmcnt 0x0
31063106
; GFX1250-NEXT: s_or_b64 s[6:7], s[2:3], s[4:5]
31073107
; GFX1250-NEXT: s_delay_alu instid0(SALU_CYCLE_1) | instskip(NEXT) | instid1(SALU_CYCLE_1)
3108-
; GFX1250-NEXT: s_and_b64 s[6:7], s[6:7], lit64(0xffffffff00000000)
3108+
; GFX1250-NEXT: s_and_b64 s[6:7], s[6:7], 0xffffffff00000000
31093109
; GFX1250-NEXT: s_cmp_lg_u64 s[6:7], 0
31103110
; GFX1250-NEXT: s_cbranch_scc0 .LBB16_4
31113111
; GFX1250-NEXT: ; %bb.1:
@@ -3140,7 +3140,7 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
31403140
; GFX1250-NEXT: s_add_co_ci_u32 s13, s18, 0
31413141
; GFX1250-NEXT: s_delay_alu instid0(SALU_CYCLE_1) | instskip(NEXT) | instid1(SALU_CYCLE_1)
31423142
; GFX1250-NEXT: s_add_nc_u64 s[12:13], s[6:7], s[12:13]
3143-
; GFX1250-NEXT: s_add_co_i32 s8, s8, s12
3143+
; GFX1250-NEXT: s_add_co_u32 s8, s8, s12
31443144
; GFX1250-NEXT: s_cselect_b32 s6, 1, 0
31453145
; GFX1250-NEXT: s_delay_alu instid0(SALU_CYCLE_1) | instskip(SKIP_1) | instid1(SALU_CYCLE_1)
31463146
; GFX1250-NEXT: s_cmp_lg_u32 s6, 0
@@ -3160,7 +3160,7 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
31603160
; GFX1250-NEXT: s_add_co_ci_u32 s11, s16, 0
31613161
; GFX1250-NEXT: s_delay_alu instid0(SALU_CYCLE_1) | instskip(NEXT) | instid1(SALU_CYCLE_1)
31623162
; GFX1250-NEXT: s_add_nc_u64 s[10:11], s[6:7], s[10:11]
3163-
; GFX1250-NEXT: s_add_co_i32 s8, s8, s10
3163+
; GFX1250-NEXT: s_add_co_u32 s8, s8, s10
31643164
; GFX1250-NEXT: s_cselect_b32 s10, 1, 0
31653165
; GFX1250-NEXT: s_mul_hi_u32 s6, s2, s8
31663166
; GFX1250-NEXT: s_cmp_lg_u32 s10, 0
@@ -3177,17 +3177,17 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
31773177
; GFX1250-NEXT: s_add_co_ci_u32 s11, s13, 0
31783178
; GFX1250-NEXT: s_delay_alu instid0(SALU_CYCLE_1) | instskip(NEXT) | instid1(SALU_CYCLE_1)
31793179
; GFX1250-NEXT: s_add_nc_u64 s[8:9], s[6:7], s[10:11]
3180-
; GFX1250-NEXT: s_and_b64 s[10:11], s[8:9], lit64(0xffffffff00000000)
3180+
; GFX1250-NEXT: s_and_b64 s[10:11], s[8:9], 0xffffffff00000000
31813181
; GFX1250-NEXT: s_delay_alu instid0(SALU_CYCLE_1) | instskip(NEXT) | instid1(SALU_CYCLE_1)
31823182
; GFX1250-NEXT: s_or_b32 s10, s10, s8
31833183
; GFX1250-NEXT: s_mul_u64 s[8:9], s[4:5], s[10:11]
31843184
; GFX1250-NEXT: s_delay_alu instid0(SALU_CYCLE_1)
3185-
; GFX1250-NEXT: s_sub_co_i32 s6, s2, s8
3185+
; GFX1250-NEXT: s_sub_co_u32 s6, s2, s8
31863186
; GFX1250-NEXT: s_cselect_b32 s8, 1, 0
31873187
; GFX1250-NEXT: s_sub_co_i32 s12, s3, s9
31883188
; GFX1250-NEXT: s_cmp_lg_u32 s8, 0
31893189
; GFX1250-NEXT: s_sub_co_ci_u32 s12, s12, s5
3190-
; GFX1250-NEXT: s_sub_co_i32 s13, s6, s4
3190+
; GFX1250-NEXT: s_sub_co_u32 s13, s6, s4
31913191
; GFX1250-NEXT: s_cselect_b32 s14, 1, 0
31923192
; GFX1250-NEXT: s_delay_alu instid0(SALU_CYCLE_1) | instskip(SKIP_1) | instid1(SALU_CYCLE_1)
31933193
; GFX1250-NEXT: s_cmp_lg_u32 s14, 0

llvm/test/CodeGen/AMDGPU/expand-scalar-carry-out-select-user.ll

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -11,7 +11,7 @@ define i32 @s_add_co_select_user() {
1111
; GFX7-NEXT: s_mov_b64 s[4:5], 0
1212
; GFX7-NEXT: s_load_dword s6, s[4:5], 0x0
1313
; GFX7-NEXT: s_waitcnt lgkmcnt(0)
14-
; GFX7-NEXT: s_add_i32 s7, s6, s6
14+
; GFX7-NEXT: s_add_u32 s7, s6, s6
1515
; GFX7-NEXT: s_cselect_b64 s[4:5], 1, 0
1616
; GFX7-NEXT: s_or_b32 s4, s4, s5
1717
; GFX7-NEXT: s_cmp_lg_u32 s4, 0
@@ -30,7 +30,7 @@ define i32 @s_add_co_select_user() {
3030
; GFX9-NEXT: s_mov_b64 s[4:5], 0
3131
; GFX9-NEXT: s_load_dword s6, s[4:5], 0x0
3232
; GFX9-NEXT: s_waitcnt lgkmcnt(0)
33-
; GFX9-NEXT: s_add_i32 s7, s6, s6
33+
; GFX9-NEXT: s_add_u32 s7, s6, s6
3434
; GFX9-NEXT: s_cselect_b64 s[4:5], 1, 0
3535
; GFX9-NEXT: s_cmp_lg_u64 s[4:5], 0
3636
; GFX9-NEXT: s_addc_u32 s8, s6, 0
@@ -48,7 +48,7 @@ define i32 @s_add_co_select_user() {
4848
; GFX10-NEXT: s_mov_b64 s[4:5], 0
4949
; GFX10-NEXT: s_load_dword s4, s[4:5], 0x0
5050
; GFX10-NEXT: s_waitcnt lgkmcnt(0)
51-
; GFX10-NEXT: s_add_i32 s5, s4, s4
51+
; GFX10-NEXT: s_add_u32 s5, s4, s4
5252
; GFX10-NEXT: s_cselect_b32 s6, 1, 0
5353
; GFX10-NEXT: s_cmp_lg_u32 s6, 0
5454
; GFX10-NEXT: s_addc_u32 s6, s4, 0
@@ -66,7 +66,7 @@ define i32 @s_add_co_select_user() {
6666
; GFX11-NEXT: s_mov_b64 s[0:1], 0
6767
; GFX11-NEXT: s_load_b32 s0, s[0:1], 0x0
6868
; GFX11-NEXT: s_waitcnt lgkmcnt(0)
69-
; GFX11-NEXT: s_add_i32 s1, s0, s0
69+
; GFX11-NEXT: s_add_u32 s1, s0, s0
7070
; GFX11-NEXT: s_cselect_b32 s2, 1, 0
7171
; GFX11-NEXT: s_delay_alu instid0(SALU_CYCLE_1) | instskip(SKIP_2) | instid1(SALU_CYCLE_1)
7272
; GFX11-NEXT: s_cmp_lg_u32 s2, 0

llvm/test/CodeGen/AMDGPU/s_uaddo_pseudo.ll

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -11,7 +11,7 @@
1111
define amdgpu_ps i32 @s_uaddo_pseudo(i32 inreg %val0) {
1212
; CHECK-LABEL: s_uaddo_pseudo:
1313
; CHECK: ; %bb.0:
14-
; CHECK-NEXT: s_add_i32 s0, s0, 1
14+
; CHECK-NEXT: s_add_u32 s0, s0, 1
1515
; CHECK-NEXT: s_cselect_b64 s[0:1], 1, 0
1616
; CHECK-NEXT: s_cmp_lg_u64 s[0:1], 0
1717
; CHECK-NEXT: s_addc_u32 s0, 1, 0

llvm/test/CodeGen/AMDGPU/sdiv64.ll

Lines changed: 11 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -54,7 +54,7 @@ define amdgpu_kernel void @s_test_sdiv(ptr addrspace(1) %out, i64 %x, i64 %y) {
5454
; GCN-NEXT: s_mul_i32 s1, s14, s1
5555
; GCN-NEXT: s_add_u32 s1, s15, s1
5656
; GCN-NEXT: s_addc_u32 s15, 0, s16
57-
; GCN-NEXT: s_add_i32 s16, s0, s1
57+
; GCN-NEXT: s_add_u32 s16, s0, s1
5858
; GCN-NEXT: v_mov_b32_e32 v0, s16
5959
; GCN-NEXT: s_cselect_b64 s[0:1], 1, 0
6060
; GCN-NEXT: v_mul_hi_u32 v0, s12, v0
@@ -87,7 +87,7 @@ define amdgpu_kernel void @s_test_sdiv(ptr addrspace(1) %out, i64 %x, i64 %y) {
8787
; GCN-NEXT: s_mul_i32 s0, s14, s0
8888
; GCN-NEXT: s_add_u32 s0, s1, s0
8989
; GCN-NEXT: s_addc_u32 s12, 0, s12
90-
; GCN-NEXT: s_add_i32 s15, s16, s0
90+
; GCN-NEXT: s_add_u32 s15, s16, s0
9191
; GCN-NEXT: s_cselect_b64 s[0:1], 1, 0
9292
; GCN-NEXT: s_or_b32 s0, s0, s1
9393
; GCN-NEXT: s_cmp_lg_u32 s0, 0
@@ -128,12 +128,12 @@ define amdgpu_kernel void @s_test_sdiv(ptr addrspace(1) %out, i64 %x, i64 %y) {
128128
; GCN-NEXT: s_add_i32 s16, s4, s5
129129
; GCN-NEXT: s_sub_i32 s17, s7, s16
130130
; GCN-NEXT: s_mul_i32 s4, s10, s14
131-
; GCN-NEXT: s_sub_i32 s6, s6, s4
131+
; GCN-NEXT: s_sub_u32 s6, s6, s4
132132
; GCN-NEXT: s_cselect_b64 s[4:5], 1, 0
133133
; GCN-NEXT: s_or_b32 s18, s4, s5
134134
; GCN-NEXT: s_cmp_lg_u32 s18, 0
135135
; GCN-NEXT: s_subb_u32 s17, s17, s11
136-
; GCN-NEXT: s_sub_i32 s19, s6, s10
136+
; GCN-NEXT: s_sub_u32 s19, s6, s10
137137
; GCN-NEXT: s_cselect_b64 s[4:5], 1, 0
138138
; GCN-NEXT: s_or_b32 s4, s4, s5
139139
; GCN-NEXT: s_cmp_lg_u32 s4, 0
@@ -1190,7 +1190,7 @@ define amdgpu_kernel void @s_test_sdiv_k_num_i64(ptr addrspace(1) %out, i64 %x)
11901190
; GCN-NEXT: s_mul_i32 s9, s11, s9
11911191
; GCN-NEXT: s_add_u32 s9, s12, s9
11921192
; GCN-NEXT: s_addc_u32 s12, 0, s13
1193-
; GCN-NEXT: s_add_i32 s13, s8, s9
1193+
; GCN-NEXT: s_add_u32 s13, s8, s9
11941194
; GCN-NEXT: v_mov_b32_e32 v0, s13
11951195
; GCN-NEXT: s_cselect_b64 s[8:9], 1, 0
11961196
; GCN-NEXT: v_mul_hi_u32 v0, s2, v0
@@ -1223,12 +1223,12 @@ define amdgpu_kernel void @s_test_sdiv_k_num_i64(ptr addrspace(1) %out, i64 %x)
12231223
; GCN-NEXT: s_mul_i32 s8, s11, s8
12241224
; GCN-NEXT: s_add_u32 s2, s2, s8
12251225
; GCN-NEXT: s_addc_u32 s10, 0, s9
1226-
; GCN-NEXT: s_add_i32 s13, s13, s2
1226+
; GCN-NEXT: s_add_u32 s2, s13, s2
12271227
; GCN-NEXT: s_cselect_b64 s[8:9], 1, 0
1228-
; GCN-NEXT: s_or_b32 s2, s8, s9
1229-
; GCN-NEXT: s_cmp_lg_u32 s2, 0
1228+
; GCN-NEXT: s_or_b32 s8, s8, s9
1229+
; GCN-NEXT: s_cmp_lg_u32 s8, 0
12301230
; GCN-NEXT: s_addc_u32 s8, s11, s10
1231-
; GCN-NEXT: v_mul_hi_u32 v1, s13, 24
1231+
; GCN-NEXT: v_mul_hi_u32 v1, s2, 24
12321232
; GCN-NEXT: v_mul_hi_u32 v0, s8, 24
12331233
; GCN-NEXT: s_mul_i32 s8, s8, 24
12341234
; GCN-NEXT: s_mov_b32 s2, -1
@@ -1243,12 +1243,12 @@ define amdgpu_kernel void @s_test_sdiv_k_num_i64(ptr addrspace(1) %out, i64 %x)
12431243
; GCN-NEXT: s_add_i32 s11, s9, s8
12441244
; GCN-NEXT: s_sub_i32 s12, 0, s11
12451245
; GCN-NEXT: s_mul_i32 s8, s6, s10
1246-
; GCN-NEXT: s_sub_i32 s13, 24, s8
1246+
; GCN-NEXT: s_sub_u32 s13, 24, s8
12471247
; GCN-NEXT: s_cselect_b64 s[8:9], 1, 0
12481248
; GCN-NEXT: s_or_b32 s14, s8, s9
12491249
; GCN-NEXT: s_cmp_lg_u32 s14, 0
12501250
; GCN-NEXT: s_subb_u32 s12, s12, s7
1251-
; GCN-NEXT: s_sub_i32 s15, s13, s6
1251+
; GCN-NEXT: s_sub_u32 s15, s13, s6
12521252
; GCN-NEXT: s_cselect_b64 s[8:9], 1, 0
12531253
; GCN-NEXT: s_or_b32 s8, s8, s9
12541254
; GCN-NEXT: s_cmp_lg_u32 s8, 0

0 commit comments

Comments
 (0)