@@ -24693,8 +24693,7 @@ define bfloat @v_log_bf16(bfloat %a) {
24693
24693
; GCN-NEXT: v_mov_b32_e32 v1, 0x41b17218
24694
24694
; GCN-NEXT: v_and_b32_e32 v0, 0xffff0000, v0
24695
24695
; GCN-NEXT: v_cmp_gt_f32_e32 vcc, s4, v0
24696
- ; GCN-NEXT: v_cndmask_b32_e64 v2, 0, 1, vcc
24697
- ; GCN-NEXT: v_lshlrev_b32_e32 v2, 5, v2
24696
+ ; GCN-NEXT: v_cndmask_b32_e64 v2, 0, 32, vcc
24698
24697
; GCN-NEXT: v_ldexp_f32_e32 v0, v0, v2
24699
24698
; GCN-NEXT: v_log_f32_e32 v0, v0
24700
24699
; GCN-NEXT: v_and_b32_e32 v2, 0xfffff000, v0
@@ -24720,8 +24719,7 @@ define bfloat @v_log_bf16(bfloat %a) {
24720
24719
; GFX7-NEXT: v_and_b32_e32 v0, 0xffff0000, v0
24721
24720
; GFX7-NEXT: s_mov_b32 s4, 0x800000
24722
24721
; GFX7-NEXT: v_cmp_gt_f32_e32 vcc, s4, v0
24723
- ; GFX7-NEXT: v_cndmask_b32_e64 v1, 0, 1, vcc
24724
- ; GFX7-NEXT: v_lshlrev_b32_e32 v1, 5, v1
24722
+ ; GFX7-NEXT: v_cndmask_b32_e64 v1, 0, 32, vcc
24725
24723
; GFX7-NEXT: v_ldexp_f32_e32 v0, v0, v1
24726
24724
; GFX7-NEXT: v_log_f32_e32 v0, v0
24727
24725
; GFX7-NEXT: s_mov_b32 s4, 0x3f317217
@@ -24745,8 +24743,7 @@ define bfloat @v_log_bf16(bfloat %a) {
24745
24743
; GFX8-NEXT: v_lshlrev_b32_e32 v0, 16, v0
24746
24744
; GFX8-NEXT: s_mov_b32 s4, 0x800000
24747
24745
; GFX8-NEXT: v_cmp_gt_f32_e32 vcc, s4, v0
24748
- ; GFX8-NEXT: v_cndmask_b32_e64 v1, 0, 1, vcc
24749
- ; GFX8-NEXT: v_lshlrev_b32_e32 v1, 5, v1
24746
+ ; GFX8-NEXT: v_cndmask_b32_e64 v1, 0, 32, vcc
24750
24747
; GFX8-NEXT: v_ldexp_f32 v0, v0, v1
24751
24748
; GFX8-NEXT: v_log_f32_e32 v0, v0
24752
24749
; GFX8-NEXT: s_mov_b32 s4, 0x7f800000
@@ -24779,8 +24776,7 @@ define bfloat @v_log_bf16(bfloat %a) {
24779
24776
; GFX9-NEXT: v_lshlrev_b32_e32 v0, 16, v0
24780
24777
; GFX9-NEXT: s_mov_b32 s4, 0x800000
24781
24778
; GFX9-NEXT: v_cmp_gt_f32_e32 vcc, s4, v0
24782
- ; GFX9-NEXT: v_cndmask_b32_e64 v1, 0, 1, vcc
24783
- ; GFX9-NEXT: v_lshlrev_b32_e32 v1, 5, v1
24779
+ ; GFX9-NEXT: v_cndmask_b32_e64 v1, 0, 32, vcc
24784
24780
; GFX9-NEXT: v_ldexp_f32 v0, v0, v1
24785
24781
; GFX9-NEXT: v_log_f32_e32 v0, v0
24786
24782
; GFX9-NEXT: s_mov_b32 s4, 0x3f317217
@@ -24809,8 +24805,7 @@ define bfloat @v_log_bf16(bfloat %a) {
24809
24805
; GFX10-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
24810
24806
; GFX10-NEXT: v_lshlrev_b32_e32 v0, 16, v0
24811
24807
; GFX10-NEXT: v_cmp_gt_f32_e32 vcc_lo, 0x800000, v0
24812
- ; GFX10-NEXT: v_cndmask_b32_e64 v1, 0, 1, vcc_lo
24813
- ; GFX10-NEXT: v_lshlrev_b32_e32 v1, 5, v1
24808
+ ; GFX10-NEXT: v_cndmask_b32_e64 v1, 0, 32, vcc_lo
24814
24809
; GFX10-NEXT: v_ldexp_f32 v0, v0, v1
24815
24810
; GFX10-NEXT: v_log_f32_e32 v0, v0
24816
24811
; GFX10-NEXT: v_mul_f32_e32 v1, 0x3f317217, v0
@@ -24835,30 +24830,28 @@ define bfloat @v_log_bf16(bfloat %a) {
24835
24830
; GFX11-NEXT: v_lshlrev_b32_e32 v0, 16, v0
24836
24831
; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_1) | instskip(SKIP_1) | instid1(VALU_DEP_1)
24837
24832
; GFX11-NEXT: v_cmp_gt_f32_e32 vcc_lo, 0x800000, v0
24838
- ; GFX11-NEXT: v_cndmask_b32_e64 v1, 0, 1, vcc_lo
24839
- ; GFX11-NEXT: v_lshlrev_b32_e32 v1, 5, v1
24840
- ; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_1) | instskip(NEXT) | instid1(VALU_DEP_1)
24833
+ ; GFX11-NEXT: v_cndmask_b32_e64 v1, 0, 32, vcc_lo
24841
24834
; GFX11-NEXT: v_ldexp_f32 v0, v0, v1
24835
+ ; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_1) | instskip(SKIP_2) | instid1(VALU_DEP_1)
24842
24836
; GFX11-NEXT: v_log_f32_e32 v0, v0
24843
24837
; GFX11-NEXT: s_waitcnt_depctr 0xfff
24844
24838
; GFX11-NEXT: v_mul_f32_e32 v1, 0x3f317217, v0
24845
- ; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_1) | instskip(NEXT) | instid1(VALU_DEP_1)
24846
24839
; GFX11-NEXT: v_fma_f32 v2, 0x3f317217, v0, -v1
24840
+ ; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_1) | instskip(NEXT) | instid1(VALU_DEP_1)
24847
24841
; GFX11-NEXT: v_fmamk_f32 v2, v0, 0x3377d1cf, v2
24848
- ; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_1) | instskip(SKIP_2) | instid1(VALU_DEP_3)
24849
24842
; GFX11-NEXT: v_add_f32_e32 v1, v1, v2
24850
24843
; GFX11-NEXT: v_cndmask_b32_e64 v2, 0, 0x41b17218, vcc_lo
24851
24844
; GFX11-NEXT: v_cmp_gt_f32_e64 vcc_lo, 0x7f800000, |v0|
24845
+ ; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_3) | instskip(NEXT) | instid1(VALU_DEP_1)
24852
24846
; GFX11-NEXT: v_cndmask_b32_e32 v0, v0, v1, vcc_lo
24853
- ; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_1) | instskip(NEXT) | instid1(VALU_DEP_1)
24854
24847
; GFX11-NEXT: v_sub_f32_e32 v0, v0, v2
24848
+ ; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_1) | instskip(SKIP_2) | instid1(VALU_DEP_3)
24855
24849
; GFX11-NEXT: v_bfe_u32 v1, v0, 16, 1
24856
24850
; GFX11-NEXT: v_or_b32_e32 v2, 0x400000, v0
24857
24851
; GFX11-NEXT: v_cmp_u_f32_e32 vcc_lo, v0, v0
24858
- ; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_3) | instskip(NEXT) | instid1(VALU_DEP_1)
24859
24852
; GFX11-NEXT: v_add3_u32 v1, v1, v0, 0x7fff
24853
+ ; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_1) | instskip(NEXT) | instid1(VALU_DEP_1)
24860
24854
; GFX11-NEXT: v_cndmask_b32_e32 v0, v1, v2, vcc_lo
24861
- ; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_1)
24862
24855
; GFX11-NEXT: v_lshrrev_b32_e32 v0, 16, v0
24863
24856
; GFX11-NEXT: s_setpc_b64 s[30:31]
24864
24857
%op = call bfloat @llvm.log.bf16(bfloat %a)
@@ -24874,8 +24867,7 @@ define bfloat @v_log2_bf16(bfloat %a) {
24874
24867
; GCN-NEXT: v_mov_b32_e32 v1, 0x42000000
24875
24868
; GCN-NEXT: v_and_b32_e32 v0, 0xffff0000, v0
24876
24869
; GCN-NEXT: v_cmp_gt_f32_e32 vcc, s4, v0
24877
- ; GCN-NEXT: v_cndmask_b32_e64 v2, 0, 1, vcc
24878
- ; GCN-NEXT: v_lshlrev_b32_e32 v2, 5, v2
24870
+ ; GCN-NEXT: v_cndmask_b32_e64 v2, 0, 32, vcc
24879
24871
; GCN-NEXT: v_ldexp_f32_e32 v0, v0, v2
24880
24872
; GCN-NEXT: v_log_f32_e32 v0, v0
24881
24873
; GCN-NEXT: v_cndmask_b32_e32 v1, 0, v1, vcc
@@ -24890,8 +24882,7 @@ define bfloat @v_log2_bf16(bfloat %a) {
24890
24882
; GFX7-NEXT: v_and_b32_e32 v0, 0xffff0000, v0
24891
24883
; GFX7-NEXT: s_mov_b32 s4, 0x800000
24892
24884
; GFX7-NEXT: v_cmp_gt_f32_e32 vcc, s4, v0
24893
- ; GFX7-NEXT: v_cndmask_b32_e64 v1, 0, 1, vcc
24894
- ; GFX7-NEXT: v_lshlrev_b32_e32 v1, 5, v1
24885
+ ; GFX7-NEXT: v_cndmask_b32_e64 v1, 0, 32, vcc
24895
24886
; GFX7-NEXT: v_ldexp_f32_e32 v0, v0, v1
24896
24887
; GFX7-NEXT: v_log_f32_e32 v0, v0
24897
24888
; GFX7-NEXT: v_mov_b32_e32 v1, 0x42000000
@@ -24906,8 +24897,7 @@ define bfloat @v_log2_bf16(bfloat %a) {
24906
24897
; GFX8-NEXT: v_lshlrev_b32_e32 v0, 16, v0
24907
24898
; GFX8-NEXT: s_mov_b32 s4, 0x800000
24908
24899
; GFX8-NEXT: v_cmp_gt_f32_e32 vcc, s4, v0
24909
- ; GFX8-NEXT: v_cndmask_b32_e64 v1, 0, 1, vcc
24910
- ; GFX8-NEXT: v_lshlrev_b32_e32 v1, 5, v1
24900
+ ; GFX8-NEXT: v_cndmask_b32_e64 v1, 0, 32, vcc
24911
24901
; GFX8-NEXT: v_ldexp_f32 v0, v0, v1
24912
24902
; GFX8-NEXT: v_log_f32_e32 v0, v0
24913
24903
; GFX8-NEXT: v_mov_b32_e32 v1, 0x42000000
@@ -24928,8 +24918,7 @@ define bfloat @v_log2_bf16(bfloat %a) {
24928
24918
; GFX9-NEXT: v_lshlrev_b32_e32 v0, 16, v0
24929
24919
; GFX9-NEXT: s_mov_b32 s4, 0x800000
24930
24920
; GFX9-NEXT: v_cmp_gt_f32_e32 vcc, s4, v0
24931
- ; GFX9-NEXT: v_cndmask_b32_e64 v2, 0, 1, vcc
24932
- ; GFX9-NEXT: v_lshlrev_b32_e32 v2, 5, v2
24921
+ ; GFX9-NEXT: v_cndmask_b32_e64 v2, 0, 32, vcc
24933
24922
; GFX9-NEXT: v_ldexp_f32 v0, v0, v2
24934
24923
; GFX9-NEXT: v_log_f32_e32 v0, v0
24935
24924
; GFX9-NEXT: v_mov_b32_e32 v1, 0x42000000
@@ -24949,9 +24938,8 @@ define bfloat @v_log2_bf16(bfloat %a) {
24949
24938
; GFX10-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
24950
24939
; GFX10-NEXT: v_lshlrev_b32_e32 v0, 16, v0
24951
24940
; GFX10-NEXT: v_cmp_gt_f32_e32 vcc_lo, 0x800000, v0
24952
- ; GFX10-NEXT: v_cndmask_b32_e64 v2, 0, 1 , vcc_lo
24941
+ ; GFX10-NEXT: v_cndmask_b32_e64 v2, 0, 32 , vcc_lo
24953
24942
; GFX10-NEXT: v_cndmask_b32_e64 v1, 0, 0x42000000, vcc_lo
24954
- ; GFX10-NEXT: v_lshlrev_b32_e32 v2, 5, v2
24955
24943
; GFX10-NEXT: v_ldexp_f32 v0, v0, v2
24956
24944
; GFX10-NEXT: v_log_f32_e32 v0, v0
24957
24945
; GFX10-NEXT: v_sub_f32_e32 v0, v0, v1
@@ -24969,21 +24957,20 @@ define bfloat @v_log2_bf16(bfloat %a) {
24969
24957
; GFX11-NEXT: v_lshlrev_b32_e32 v0, 16, v0
24970
24958
; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_1) | instskip(SKIP_2) | instid1(VALU_DEP_2)
24971
24959
; GFX11-NEXT: v_cmp_gt_f32_e32 vcc_lo, 0x800000, v0
24972
- ; GFX11-NEXT: v_cndmask_b32_e64 v2, 0, 1 , vcc_lo
24960
+ ; GFX11-NEXT: v_cndmask_b32_e64 v2, 0, 32 , vcc_lo
24973
24961
; GFX11-NEXT: v_cndmask_b32_e64 v1, 0, 0x42000000, vcc_lo
24974
- ; GFX11-NEXT: v_lshlrev_b32_e32 v2, 5, v2
24975
- ; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_1) | instskip(NEXT) | instid1(VALU_DEP_1)
24976
24962
; GFX11-NEXT: v_ldexp_f32 v0, v0, v2
24963
+ ; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_1) | instskip(SKIP_2) | instid1(VALU_DEP_1)
24977
24964
; GFX11-NEXT: v_log_f32_e32 v0, v0
24978
24965
; GFX11-NEXT: s_waitcnt_depctr 0xfff
24979
24966
; GFX11-NEXT: v_sub_f32_e32 v0, v0, v1
24980
- ; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_1) | instskip(SKIP_2) | instid1(VALU_DEP_3)
24981
24967
; GFX11-NEXT: v_bfe_u32 v1, v0, 16, 1
24982
24968
; GFX11-NEXT: v_or_b32_e32 v2, 0x400000, v0
24983
24969
; GFX11-NEXT: v_cmp_u_f32_e32 vcc_lo, v0, v0
24970
+ ; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_3) | instskip(NEXT) | instid1(VALU_DEP_1)
24984
24971
; GFX11-NEXT: v_add3_u32 v1, v1, v0, 0x7fff
24985
- ; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_1) | instskip(NEXT) | instid1(VALU_DEP_1)
24986
24972
; GFX11-NEXT: v_cndmask_b32_e32 v0, v1, v2, vcc_lo
24973
+ ; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_1)
24987
24974
; GFX11-NEXT: v_lshrrev_b32_e32 v0, 16, v0
24988
24975
; GFX11-NEXT: s_setpc_b64 s[30:31]
24989
24976
%op = call bfloat @llvm.log2.bf16(bfloat %a)
@@ -25000,8 +24987,7 @@ define bfloat @v_log10_bf16(bfloat %a) {
25000
24987
; GCN-NEXT: v_mov_b32_e32 v1, 0x411a209b
25001
24988
; GCN-NEXT: v_and_b32_e32 v0, 0xffff0000, v0
25002
24989
; GCN-NEXT: v_cmp_gt_f32_e32 vcc, s4, v0
25003
- ; GCN-NEXT: v_cndmask_b32_e64 v2, 0, 1, vcc
25004
- ; GCN-NEXT: v_lshlrev_b32_e32 v2, 5, v2
24990
+ ; GCN-NEXT: v_cndmask_b32_e64 v2, 0, 32, vcc
25005
24991
; GCN-NEXT: v_ldexp_f32_e32 v0, v0, v2
25006
24992
; GCN-NEXT: v_log_f32_e32 v0, v0
25007
24993
; GCN-NEXT: v_and_b32_e32 v2, 0xfffff000, v0
@@ -25027,8 +25013,7 @@ define bfloat @v_log10_bf16(bfloat %a) {
25027
25013
; GFX7-NEXT: v_and_b32_e32 v0, 0xffff0000, v0
25028
25014
; GFX7-NEXT: s_mov_b32 s4, 0x800000
25029
25015
; GFX7-NEXT: v_cmp_gt_f32_e32 vcc, s4, v0
25030
- ; GFX7-NEXT: v_cndmask_b32_e64 v1, 0, 1, vcc
25031
- ; GFX7-NEXT: v_lshlrev_b32_e32 v1, 5, v1
25016
+ ; GFX7-NEXT: v_cndmask_b32_e64 v1, 0, 32, vcc
25032
25017
; GFX7-NEXT: v_ldexp_f32_e32 v0, v0, v1
25033
25018
; GFX7-NEXT: v_log_f32_e32 v0, v0
25034
25019
; GFX7-NEXT: s_mov_b32 s4, 0x3e9a209a
@@ -25052,8 +25037,7 @@ define bfloat @v_log10_bf16(bfloat %a) {
25052
25037
; GFX8-NEXT: v_lshlrev_b32_e32 v0, 16, v0
25053
25038
; GFX8-NEXT: s_mov_b32 s4, 0x800000
25054
25039
; GFX8-NEXT: v_cmp_gt_f32_e32 vcc, s4, v0
25055
- ; GFX8-NEXT: v_cndmask_b32_e64 v1, 0, 1, vcc
25056
- ; GFX8-NEXT: v_lshlrev_b32_e32 v1, 5, v1
25040
+ ; GFX8-NEXT: v_cndmask_b32_e64 v1, 0, 32, vcc
25057
25041
; GFX8-NEXT: v_ldexp_f32 v0, v0, v1
25058
25042
; GFX8-NEXT: v_log_f32_e32 v0, v0
25059
25043
; GFX8-NEXT: s_mov_b32 s4, 0x7f800000
@@ -25086,8 +25070,7 @@ define bfloat @v_log10_bf16(bfloat %a) {
25086
25070
; GFX9-NEXT: v_lshlrev_b32_e32 v0, 16, v0
25087
25071
; GFX9-NEXT: s_mov_b32 s4, 0x800000
25088
25072
; GFX9-NEXT: v_cmp_gt_f32_e32 vcc, s4, v0
25089
- ; GFX9-NEXT: v_cndmask_b32_e64 v1, 0, 1, vcc
25090
- ; GFX9-NEXT: v_lshlrev_b32_e32 v1, 5, v1
25073
+ ; GFX9-NEXT: v_cndmask_b32_e64 v1, 0, 32, vcc
25091
25074
; GFX9-NEXT: v_ldexp_f32 v0, v0, v1
25092
25075
; GFX9-NEXT: v_log_f32_e32 v0, v0
25093
25076
; GFX9-NEXT: s_mov_b32 s4, 0x3e9a209a
@@ -25116,8 +25099,7 @@ define bfloat @v_log10_bf16(bfloat %a) {
25116
25099
; GFX10-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
25117
25100
; GFX10-NEXT: v_lshlrev_b32_e32 v0, 16, v0
25118
25101
; GFX10-NEXT: v_cmp_gt_f32_e32 vcc_lo, 0x800000, v0
25119
- ; GFX10-NEXT: v_cndmask_b32_e64 v1, 0, 1, vcc_lo
25120
- ; GFX10-NEXT: v_lshlrev_b32_e32 v1, 5, v1
25102
+ ; GFX10-NEXT: v_cndmask_b32_e64 v1, 0, 32, vcc_lo
25121
25103
; GFX10-NEXT: v_ldexp_f32 v0, v0, v1
25122
25104
; GFX10-NEXT: v_log_f32_e32 v0, v0
25123
25105
; GFX10-NEXT: v_mul_f32_e32 v1, 0x3e9a209a, v0
@@ -25142,30 +25124,28 @@ define bfloat @v_log10_bf16(bfloat %a) {
25142
25124
; GFX11-NEXT: v_lshlrev_b32_e32 v0, 16, v0
25143
25125
; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_1) | instskip(SKIP_1) | instid1(VALU_DEP_1)
25144
25126
; GFX11-NEXT: v_cmp_gt_f32_e32 vcc_lo, 0x800000, v0
25145
- ; GFX11-NEXT: v_cndmask_b32_e64 v1, 0, 1, vcc_lo
25146
- ; GFX11-NEXT: v_lshlrev_b32_e32 v1, 5, v1
25147
- ; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_1) | instskip(NEXT) | instid1(VALU_DEP_1)
25127
+ ; GFX11-NEXT: v_cndmask_b32_e64 v1, 0, 32, vcc_lo
25148
25128
; GFX11-NEXT: v_ldexp_f32 v0, v0, v1
25129
+ ; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_1) | instskip(SKIP_2) | instid1(VALU_DEP_1)
25149
25130
; GFX11-NEXT: v_log_f32_e32 v0, v0
25150
25131
; GFX11-NEXT: s_waitcnt_depctr 0xfff
25151
25132
; GFX11-NEXT: v_mul_f32_e32 v1, 0x3e9a209a, v0
25152
- ; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_1) | instskip(NEXT) | instid1(VALU_DEP_1)
25153
25133
; GFX11-NEXT: v_fma_f32 v2, 0x3e9a209a, v0, -v1
25134
+ ; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_1) | instskip(NEXT) | instid1(VALU_DEP_1)
25154
25135
; GFX11-NEXT: v_fmamk_f32 v2, v0, 0x3284fbcf, v2
25155
- ; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_1) | instskip(SKIP_2) | instid1(VALU_DEP_3)
25156
25136
; GFX11-NEXT: v_add_f32_e32 v1, v1, v2
25157
25137
; GFX11-NEXT: v_cndmask_b32_e64 v2, 0, 0x411a209b, vcc_lo
25158
25138
; GFX11-NEXT: v_cmp_gt_f32_e64 vcc_lo, 0x7f800000, |v0|
25139
+ ; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_3) | instskip(NEXT) | instid1(VALU_DEP_1)
25159
25140
; GFX11-NEXT: v_cndmask_b32_e32 v0, v0, v1, vcc_lo
25160
- ; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_1) | instskip(NEXT) | instid1(VALU_DEP_1)
25161
25141
; GFX11-NEXT: v_sub_f32_e32 v0, v0, v2
25142
+ ; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_1) | instskip(SKIP_2) | instid1(VALU_DEP_3)
25162
25143
; GFX11-NEXT: v_bfe_u32 v1, v0, 16, 1
25163
25144
; GFX11-NEXT: v_or_b32_e32 v2, 0x400000, v0
25164
25145
; GFX11-NEXT: v_cmp_u_f32_e32 vcc_lo, v0, v0
25165
- ; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_3) | instskip(NEXT) | instid1(VALU_DEP_1)
25166
25146
; GFX11-NEXT: v_add3_u32 v1, v1, v0, 0x7fff
25147
+ ; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_1) | instskip(NEXT) | instid1(VALU_DEP_1)
25167
25148
; GFX11-NEXT: v_cndmask_b32_e32 v0, v1, v2, vcc_lo
25168
- ; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_1)
25169
25149
; GFX11-NEXT: v_lshrrev_b32_e32 v0, 16, v0
25170
25150
; GFX11-NEXT: s_setpc_b64 s[30:31]
25171
25151
%op = call bfloat @llvm.log10.bf16(bfloat %a)
0 commit comments