@@ -2216,11 +2216,11 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
2216
2216
; VI-NEXT: s_sub_i32 s10, s3, s14
2217
2217
; VI-NEXT: v_readfirstlane_b32 s8, v0
2218
2218
; VI-NEXT: s_sub_u32 s15, s2, s8
2219
- ; VI-NEXT: s_cselect_b64 s[8:9], 1, 0
2219
+ ; VI-NEXT: s_cselect_b64 s[8:9], - 1, 0
2220
2220
; VI-NEXT: s_cmp_lg_u64 s[8:9], 0
2221
2221
; VI-NEXT: s_subb_u32 s16, s10, s5
2222
2222
; VI-NEXT: s_sub_u32 s17, s15, s4
2223
- ; VI-NEXT: s_cselect_b64 s[10:11], 1, 0
2223
+ ; VI-NEXT: s_cselect_b64 s[10:11], - 1, 0
2224
2224
; VI-NEXT: s_cmp_lg_u64 s[10:11], 0
2225
2225
; VI-NEXT: s_subb_u32 s10, s16, 0
2226
2226
; VI-NEXT: s_cmp_ge_u32 s10, s5
@@ -2330,7 +2330,7 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
2330
2330
; GFX9-NEXT: s_add_u32 s9, s13, s9
2331
2331
; GFX9-NEXT: s_addc_u32 s13, 0, s14
2332
2332
; GFX9-NEXT: s_add_u32 s14, s8, s9
2333
- ; GFX9-NEXT: s_cselect_b64 s[8:9], 1, 0
2333
+ ; GFX9-NEXT: s_cselect_b64 s[8:9], - 1, 0
2334
2334
; GFX9-NEXT: s_cmp_lg_u64 s[8:9], 0
2335
2335
; GFX9-NEXT: s_addc_u32 s12, s12, s13
2336
2336
; GFX9-NEXT: s_mul_i32 s8, s10, s12
@@ -2354,7 +2354,7 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
2354
2354
; GFX9-NEXT: s_add_u32 s8, s10, s8
2355
2355
; GFX9-NEXT: s_addc_u32 s10, 0, s9
2356
2356
; GFX9-NEXT: s_add_u32 s11, s14, s8
2357
- ; GFX9-NEXT: s_cselect_b64 s[8:9], 1, 0
2357
+ ; GFX9-NEXT: s_cselect_b64 s[8:9], - 1, 0
2358
2358
; GFX9-NEXT: s_cmp_lg_u64 s[8:9], 0
2359
2359
; GFX9-NEXT: s_addc_u32 s8, s12, s10
2360
2360
; GFX9-NEXT: s_mul_i32 s10, s2, s8
@@ -2379,11 +2379,11 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
2379
2379
; GFX9-NEXT: s_sub_i32 s10, s3, s14
2380
2380
; GFX9-NEXT: s_mul_i32 s8, s6, s12
2381
2381
; GFX9-NEXT: s_sub_u32 s15, s2, s8
2382
- ; GFX9-NEXT: s_cselect_b64 s[8:9], 1, 0
2382
+ ; GFX9-NEXT: s_cselect_b64 s[8:9], - 1, 0
2383
2383
; GFX9-NEXT: s_cmp_lg_u64 s[8:9], 0
2384
2384
; GFX9-NEXT: s_subb_u32 s16, s10, s7
2385
2385
; GFX9-NEXT: s_sub_u32 s17, s15, s6
2386
- ; GFX9-NEXT: s_cselect_b64 s[10:11], 1, 0
2386
+ ; GFX9-NEXT: s_cselect_b64 s[10:11], - 1, 0
2387
2387
; GFX9-NEXT: s_cmp_lg_u64 s[10:11], 0
2388
2388
; GFX9-NEXT: s_subb_u32 s10, s16, 0
2389
2389
; GFX9-NEXT: s_cmp_ge_u32 s10, s7
@@ -2489,7 +2489,7 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
2489
2489
; GFX1010-NEXT: s_add_u32 s11, s12, s11
2490
2490
; GFX1010-NEXT: s_addc_u32 s12, 0, s13
2491
2491
; GFX1010-NEXT: s_add_u32 s8, s8, s11
2492
- ; GFX1010-NEXT: s_cselect_b32 s11, 1, 0
2492
+ ; GFX1010-NEXT: s_cselect_b32 s11, - 1, 0
2493
2493
; GFX1010-NEXT: s_mul_hi_u32 s13, s9, s8
2494
2494
; GFX1010-NEXT: s_cmp_lg_u32 s11, 0
2495
2495
; GFX1010-NEXT: s_mul_i32 s11, s9, s8
@@ -2513,7 +2513,7 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
2513
2513
; GFX1010-NEXT: s_add_u32 s9, s10, s9
2514
2514
; GFX1010-NEXT: s_addc_u32 s10, 0, s11
2515
2515
; GFX1010-NEXT: s_add_u32 s8, s8, s9
2516
- ; GFX1010-NEXT: s_cselect_b32 s9, 1, 0
2516
+ ; GFX1010-NEXT: s_cselect_b32 s9, - 1, 0
2517
2517
; GFX1010-NEXT: s_mul_hi_u32 s11, s2, s8
2518
2518
; GFX1010-NEXT: s_cmp_lg_u32 s9, 0
2519
2519
; GFX1010-NEXT: s_mul_hi_u32 s9, s3, s8
@@ -2538,11 +2538,11 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
2538
2538
; GFX1010-NEXT: s_add_i32 s9, s9, s11
2539
2539
; GFX1010-NEXT: s_sub_i32 s11, s3, s9
2540
2540
; GFX1010-NEXT: s_sub_u32 s10, s2, s10
2541
- ; GFX1010-NEXT: s_cselect_b32 s12, 1, 0
2541
+ ; GFX1010-NEXT: s_cselect_b32 s12, - 1, 0
2542
2542
; GFX1010-NEXT: s_cmp_lg_u32 s12, 0
2543
2543
; GFX1010-NEXT: s_subb_u32 s11, s11, s7
2544
2544
; GFX1010-NEXT: s_sub_u32 s13, s10, s6
2545
- ; GFX1010-NEXT: s_cselect_b32 s14, 1, 0
2545
+ ; GFX1010-NEXT: s_cselect_b32 s14, - 1, 0
2546
2546
; GFX1010-NEXT: s_cmp_lg_u32 s14, 0
2547
2547
; GFX1010-NEXT: s_subb_u32 s11, s11, 0
2548
2548
; GFX1010-NEXT: s_cmp_ge_u32 s11, s7
@@ -2649,7 +2649,7 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
2649
2649
; GFX1030W32-NEXT: s_add_u32 s11, s12, s11
2650
2650
; GFX1030W32-NEXT: s_addc_u32 s12, 0, s13
2651
2651
; GFX1030W32-NEXT: s_add_u32 s8, s8, s11
2652
- ; GFX1030W32-NEXT: s_cselect_b32 s11, 1, 0
2652
+ ; GFX1030W32-NEXT: s_cselect_b32 s11, - 1, 0
2653
2653
; GFX1030W32-NEXT: s_mul_hi_u32 s13, s9, s8
2654
2654
; GFX1030W32-NEXT: s_cmp_lg_u32 s11, 0
2655
2655
; GFX1030W32-NEXT: s_mul_i32 s11, s9, s8
@@ -2673,7 +2673,7 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
2673
2673
; GFX1030W32-NEXT: s_add_u32 s9, s10, s9
2674
2674
; GFX1030W32-NEXT: s_addc_u32 s10, 0, s11
2675
2675
; GFX1030W32-NEXT: s_add_u32 s8, s8, s9
2676
- ; GFX1030W32-NEXT: s_cselect_b32 s9, 1, 0
2676
+ ; GFX1030W32-NEXT: s_cselect_b32 s9, - 1, 0
2677
2677
; GFX1030W32-NEXT: s_mul_hi_u32 s11, s2, s8
2678
2678
; GFX1030W32-NEXT: s_cmp_lg_u32 s9, 0
2679
2679
; GFX1030W32-NEXT: s_mul_hi_u32 s9, s3, s8
@@ -2698,11 +2698,11 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
2698
2698
; GFX1030W32-NEXT: s_add_i32 s9, s9, s11
2699
2699
; GFX1030W32-NEXT: s_sub_i32 s11, s3, s9
2700
2700
; GFX1030W32-NEXT: s_sub_u32 s10, s2, s10
2701
- ; GFX1030W32-NEXT: s_cselect_b32 s12, 1, 0
2701
+ ; GFX1030W32-NEXT: s_cselect_b32 s12, - 1, 0
2702
2702
; GFX1030W32-NEXT: s_cmp_lg_u32 s12, 0
2703
2703
; GFX1030W32-NEXT: s_subb_u32 s11, s11, s5
2704
2704
; GFX1030W32-NEXT: s_sub_u32 s13, s10, s4
2705
- ; GFX1030W32-NEXT: s_cselect_b32 s14, 1, 0
2705
+ ; GFX1030W32-NEXT: s_cselect_b32 s14, - 1, 0
2706
2706
; GFX1030W32-NEXT: s_cmp_lg_u32 s14, 0
2707
2707
; GFX1030W32-NEXT: s_subb_u32 s11, s11, 0
2708
2708
; GFX1030W32-NEXT: s_cmp_ge_u32 s11, s5
@@ -2809,7 +2809,7 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
2809
2809
; GFX1030W64-NEXT: s_add_u32 s7, s11, s7
2810
2810
; GFX1030W64-NEXT: s_addc_u32 s11, 0, s12
2811
2811
; GFX1030W64-NEXT: s_add_u32 s12, s6, s7
2812
- ; GFX1030W64-NEXT: s_cselect_b64 s[6:7], 1, 0
2812
+ ; GFX1030W64-NEXT: s_cselect_b64 s[6:7], - 1, 0
2813
2813
; GFX1030W64-NEXT: s_mul_hi_u32 s13, s9, s12
2814
2814
; GFX1030W64-NEXT: s_cmp_lg_u64 s[6:7], 0
2815
2815
; GFX1030W64-NEXT: s_mul_i32 s6, s9, s12
@@ -2833,7 +2833,7 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
2833
2833
; GFX1030W64-NEXT: s_add_u32 s6, s6, s9
2834
2834
; GFX1030W64-NEXT: s_addc_u32 s9, 0, s7
2835
2835
; GFX1030W64-NEXT: s_add_u32 s10, s12, s6
2836
- ; GFX1030W64-NEXT: s_cselect_b64 s[6:7], 1, 0
2836
+ ; GFX1030W64-NEXT: s_cselect_b64 s[6:7], - 1, 0
2837
2837
; GFX1030W64-NEXT: s_mul_hi_u32 s11, s2, s10
2838
2838
; GFX1030W64-NEXT: s_cmp_lg_u64 s[6:7], 0
2839
2839
; GFX1030W64-NEXT: s_mul_hi_u32 s6, s3, s10
@@ -2858,11 +2858,11 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
2858
2858
; GFX1030W64-NEXT: s_mul_i32 s6, s4, s10
2859
2859
; GFX1030W64-NEXT: s_sub_i32 s8, s3, s12
2860
2860
; GFX1030W64-NEXT: s_sub_u32 s13, s2, s6
2861
- ; GFX1030W64-NEXT: s_cselect_b64 s[6:7], 1, 0
2861
+ ; GFX1030W64-NEXT: s_cselect_b64 s[6:7], - 1, 0
2862
2862
; GFX1030W64-NEXT: s_cmp_lg_u64 s[6:7], 0
2863
2863
; GFX1030W64-NEXT: s_subb_u32 s14, s8, s5
2864
2864
; GFX1030W64-NEXT: s_sub_u32 s15, s13, s4
2865
- ; GFX1030W64-NEXT: s_cselect_b64 s[8:9], 1, 0
2865
+ ; GFX1030W64-NEXT: s_cselect_b64 s[8:9], - 1, 0
2866
2866
; GFX1030W64-NEXT: s_cmp_lg_u64 s[8:9], 0
2867
2867
; GFX1030W64-NEXT: s_subb_u32 s8, s14, 0
2868
2868
; GFX1030W64-NEXT: s_cmp_ge_u32 s8, s5
@@ -2974,7 +2974,7 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
2974
2974
; GFX11-NEXT: s_add_u32 s11, s12, s11
2975
2975
; GFX11-NEXT: s_addc_u32 s12, 0, s13
2976
2976
; GFX11-NEXT: s_add_u32 s8, s8, s11
2977
- ; GFX11-NEXT: s_cselect_b32 s11, 1, 0
2977
+ ; GFX11-NEXT: s_cselect_b32 s11, - 1, 0
2978
2978
; GFX11-NEXT: s_mul_hi_u32 s13, s9, s8
2979
2979
; GFX11-NEXT: s_cmp_lg_u32 s11, 0
2980
2980
; GFX11-NEXT: s_mul_i32 s11, s9, s8
@@ -2998,7 +2998,7 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
2998
2998
; GFX11-NEXT: s_add_u32 s9, s10, s9
2999
2999
; GFX11-NEXT: s_addc_u32 s10, 0, s11
3000
3000
; GFX11-NEXT: s_add_u32 s8, s8, s9
3001
- ; GFX11-NEXT: s_cselect_b32 s9, 1, 0
3001
+ ; GFX11-NEXT: s_cselect_b32 s9, - 1, 0
3002
3002
; GFX11-NEXT: s_mul_hi_u32 s11, s2, s8
3003
3003
; GFX11-NEXT: s_cmp_lg_u32 s9, 0
3004
3004
; GFX11-NEXT: s_mul_hi_u32 s9, s3, s8
@@ -3024,11 +3024,11 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
3024
3024
; GFX11-NEXT: s_delay_alu instid0(SALU_CYCLE_1) | instskip(SKIP_2) | instid1(SALU_CYCLE_1)
3025
3025
; GFX11-NEXT: s_sub_i32 s11, s3, s9
3026
3026
; GFX11-NEXT: s_sub_u32 s10, s2, s10
3027
- ; GFX11-NEXT: s_cselect_b32 s12, 1, 0
3027
+ ; GFX11-NEXT: s_cselect_b32 s12, - 1, 0
3028
3028
; GFX11-NEXT: s_cmp_lg_u32 s12, 0
3029
3029
; GFX11-NEXT: s_subb_u32 s11, s11, s5
3030
3030
; GFX11-NEXT: s_sub_u32 s13, s10, s4
3031
- ; GFX11-NEXT: s_cselect_b32 s14, 1, 0
3031
+ ; GFX11-NEXT: s_cselect_b32 s14, - 1, 0
3032
3032
; GFX11-NEXT: s_delay_alu instid0(SALU_CYCLE_1) | instskip(SKIP_1) | instid1(SALU_CYCLE_1)
3033
3033
; GFX11-NEXT: s_cmp_lg_u32 s14, 0
3034
3034
; GFX11-NEXT: s_subb_u32 s11, s11, 0
@@ -3141,7 +3141,7 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
3141
3141
; GFX1250-NEXT: s_delay_alu instid0(SALU_CYCLE_1) | instskip(NEXT) | instid1(SALU_CYCLE_1)
3142
3142
; GFX1250-NEXT: s_add_nc_u64 s[12:13], s[6:7], s[12:13]
3143
3143
; GFX1250-NEXT: s_add_co_u32 s8, s8, s12
3144
- ; GFX1250-NEXT: s_cselect_b32 s6, 1, 0
3144
+ ; GFX1250-NEXT: s_cselect_b32 s6, - 1, 0
3145
3145
; GFX1250-NEXT: s_delay_alu instid0(SALU_CYCLE_1) | instskip(SKIP_1) | instid1(SALU_CYCLE_1)
3146
3146
; GFX1250-NEXT: s_cmp_lg_u32 s6, 0
3147
3147
; GFX1250-NEXT: s_add_co_ci_u32 s9, s9, s13
@@ -3161,7 +3161,7 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
3161
3161
; GFX1250-NEXT: s_delay_alu instid0(SALU_CYCLE_1) | instskip(NEXT) | instid1(SALU_CYCLE_1)
3162
3162
; GFX1250-NEXT: s_add_nc_u64 s[10:11], s[6:7], s[10:11]
3163
3163
; GFX1250-NEXT: s_add_co_u32 s8, s8, s10
3164
- ; GFX1250-NEXT: s_cselect_b32 s10, 1, 0
3164
+ ; GFX1250-NEXT: s_cselect_b32 s10, - 1, 0
3165
3165
; GFX1250-NEXT: s_mul_hi_u32 s6, s2, s8
3166
3166
; GFX1250-NEXT: s_cmp_lg_u32 s10, 0
3167
3167
; GFX1250-NEXT: s_mul_hi_u32 s12, s3, s8
@@ -3183,12 +3183,12 @@ define amdgpu_kernel void @sudiv64(ptr addrspace(1) %out, i64 %x, i64 %y) {
3183
3183
; GFX1250-NEXT: s_mul_u64 s[8:9], s[4:5], s[10:11]
3184
3184
; GFX1250-NEXT: s_delay_alu instid0(SALU_CYCLE_1)
3185
3185
; GFX1250-NEXT: s_sub_co_u32 s6, s2, s8
3186
- ; GFX1250-NEXT: s_cselect_b32 s8, 1, 0
3186
+ ; GFX1250-NEXT: s_cselect_b32 s8, - 1, 0
3187
3187
; GFX1250-NEXT: s_sub_co_i32 s12, s3, s9
3188
3188
; GFX1250-NEXT: s_cmp_lg_u32 s8, 0
3189
3189
; GFX1250-NEXT: s_sub_co_ci_u32 s12, s12, s5
3190
3190
; GFX1250-NEXT: s_sub_co_u32 s13, s6, s4
3191
- ; GFX1250-NEXT: s_cselect_b32 s14, 1, 0
3191
+ ; GFX1250-NEXT: s_cselect_b32 s14, - 1, 0
3192
3192
; GFX1250-NEXT: s_delay_alu instid0(SALU_CYCLE_1) | instskip(SKIP_1) | instid1(SALU_CYCLE_1)
3193
3193
; GFX1250-NEXT: s_cmp_lg_u32 s14, 0
3194
3194
; GFX1250-NEXT: s_sub_co_ci_u32 s12, s12, 0
0 commit comments