Skip to content

Commit d49aab1

Browse files
authored
Revert "[AMDGPU][True16][CodeGen] use vgpr16 for zext patterns (#1538… (#154163)
This reverts commit 7c53c61. The patch hit an issue in a HIP test, so it is being reverted for now and will be reopened later.
1 parent 7e8ff2a commit d49aab1

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

45 files changed

+14018
-12480
lines changed

llvm/lib/Target/AMDGPU/SIInstructions.td

Lines changed: 0 additions & 22 deletions
Original file line numberDiff line numberDiff line change
@@ -3056,8 +3056,6 @@ def : GCNPat<
30563056
}
30573057
} // AddedComplexity = 1
30583058

3059-
foreach p = [NotHasTrue16BitInsts, UseFakeTrue16Insts] in
3060-
let True16Predicate = p in {
30613059
def : GCNPat<
30623060
(i32 (DivergentUnaryFrag<zext> i16:$src)),
30633061
(V_AND_B32_e64 (S_MOV_B32 (i32 0xffff)), $src)
@@ -3073,26 +3071,6 @@ def : GCNPat<
30733071
def : GCNPat<
30743072
(i32 (zext (i16 (bitconvert fp16_zeros_high_16bits:$src)))),
30753073
(COPY VSrc_b16:$src)>;
3076-
}
3077-
3078-
let True16Predicate = UseRealTrue16Insts in {
3079-
def : GCNPat<
3080-
(i32 (DivergentUnaryFrag<zext> i16:$src)),
3081-
(REG_SEQUENCE VGPR_32, $src, lo16, (V_MOV_B16_t16_e64 0, (i16 0), 0), hi16)
3082-
>;
3083-
3084-
def : GCNPat<
3085-
(i64 (DivergentUnaryFrag<zext> i16:$src)),
3086-
(REG_SEQUENCE VReg_64,
3087-
(REG_SEQUENCE VGPR_32, $src, lo16, (V_MOV_B16_t16_e64 0, (i16 0), 0), hi16), sub0,
3088-
(S_MOV_B32 (i32 0)), sub1)
3089-
>;
3090-
3091-
def : GCNPat<
3092-
(i32 (zext (i16 (bitconvert fp16_zeros_high_16bits:$src)))),
3093-
(REG_SEQUENCE VGPR_32, $src, lo16, (V_MOV_B16_t16_e64 0, (i16 0), 0), hi16)
3094-
>;
3095-
}
30963074

30973075
def : GCNPat <
30983076
(i32 (trunc i64:$a)),

llvm/test/CodeGen/AMDGPU/GlobalISel/mul.ll

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -164,7 +164,7 @@ define zeroext i16 @v_mul_i16_zeroext(i16 zeroext %num, i16 zeroext %den) {
164164
; GFX11-TRUE16: ; %bb.0:
165165
; GFX11-TRUE16-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
166166
; GFX11-TRUE16-NEXT: v_mul_lo_u16 v0.l, v0.l, v1.l
167-
; GFX11-TRUE16-NEXT: v_mov_b16_e32 v0.h, 0
167+
; GFX11-TRUE16-NEXT: v_and_b32_e32 v0, 0xffff, v0
168168
; GFX11-TRUE16-NEXT: s_setpc_b64 s[30:31]
169169
;
170170
; GFX11-FAKE16-LABEL: v_mul_i16_zeroext:

llvm/test/CodeGen/AMDGPU/amdgcn.bitcast.1024bit.ll

Lines changed: 6265 additions & 5636 deletions
Large diffs are not rendered by default.

llvm/test/CodeGen/AMDGPU/amdgcn.bitcast.128bit.ll

Lines changed: 602 additions & 546 deletions
Large diffs are not rendered by default.

llvm/test/CodeGen/AMDGPU/amdgcn.bitcast.256bit.ll

Lines changed: 700 additions & 620 deletions
Large diffs are not rendered by default.

llvm/test/CodeGen/AMDGPU/amdgcn.bitcast.320bit.ll

Lines changed: 1534 additions & 1352 deletions
Large diffs are not rendered by default.

llvm/test/CodeGen/AMDGPU/amdgcn.bitcast.32bit.ll

Lines changed: 132 additions & 108 deletions
Large diffs are not rendered by default.

llvm/test/CodeGen/AMDGPU/amdgcn.bitcast.512bit.ll

Lines changed: 2877 additions & 2537 deletions
Large diffs are not rendered by default.

llvm/test/CodeGen/AMDGPU/amdgcn.bitcast.64bit.ll

Lines changed: 350 additions & 287 deletions
Large diffs are not rendered by default.

llvm/test/CodeGen/AMDGPU/amdgcn.bitcast.96bit.ll

Lines changed: 311 additions & 283 deletions
Large diffs are not rendered by default.

0 commit comments

Comments
 (0)