|
1 | 1 | # NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py UTC_ARGS: --version 3 |
2 | 2 | # RUN: llc -mtriple=amdgcn -mcpu=gfx1100 -mattr=+real-true16 -run-pass=si-fix-sgpr-copies -verify-machineinstrs -o - %s | FileCheck --check-prefixes=GCN %s |
3 | | -# XFAIL: * |
4 | | -# FIXME-TRUE16 reenable after fix-sgpr-copies is updated for true16 flow |
5 | 3 |
|
6 | 4 | --- |
7 | | -name: cmp_f16 |
| 5 | +name: cvt_hi_f32_f16 |
8 | 6 | body: | |
9 | | - bb.0.entry: |
10 | | - ; GCN-LABEL: name: cmp_f16 |
| 7 | + bb.0: |
| 8 | + ; GCN-LABEL: name: cvt_hi_f32_f16 |
11 | 9 | ; GCN: [[DEF:%[0-9]+]]:vgpr_16 = IMPLICIT_DEF |
12 | | - ; GCN-NEXT: [[DEF1:%[0-9]+]]:sreg_32 = IMPLICIT_DEF |
13 | 10 | ; GCN-NEXT: [[V_CVT_F16_U16_t16_e64_:%[0-9]+]]:vgpr_16 = V_CVT_F16_U16_t16_e64 0, [[DEF]], 0, 0, 0, implicit $mode, implicit $exec |
14 | | - ; GCN-NEXT: [[COPY:%[0-9]+]]:vgpr_32 = COPY [[V_CVT_F16_U16_t16_e64_]] |
15 | | - ; GCN-NEXT: [[COPY1:%[0-9]+]]:vgpr_16 = COPY killed [[COPY]] |
16 | | - ; GCN-NEXT: [[V_CMP_LT_F16_t16_e64_:%[0-9]+]]:sreg_32_xm0_xexec = nofpexcept V_CMP_LT_F16_t16_e64 0, [[COPY1]], 0, [[DEF1]], 0, 0, implicit $mode, implicit $exec |
17 | | - ; GCN-NEXT: [[V_CNDMASK_B32_e64_:%[0-9]+]]:vgpr_32 = V_CNDMASK_B32_e64 0, 0, 0, -1, killed [[V_CMP_LT_F16_t16_e64_]], implicit $exec |
| 11 | + ; GCN-NEXT: [[SUBREG_TO_REG:%[0-9]+]]:vgpr_32 = SUBREG_TO_REG 0, [[V_CVT_F16_U16_t16_e64_]], %subreg.lo16 |
| 12 | + ; GCN-NEXT: [[COPY:%[0-9]+]]:vgpr_32 = COPY [[SUBREG_TO_REG]] |
| 13 | + ; GCN-NEXT: [[V_CVT_F32_F16_t16_e64_:%[0-9]+]]:vgpr_32 = V_CVT_F32_F16_t16_e64 0, [[COPY]].hi16, 0, 0, 0, implicit $mode, implicit $exec |
18 | 14 | %0:vgpr_16 = IMPLICIT_DEF |
19 | | - %1:sreg_32 = IMPLICIT_DEF |
20 | | - %2:vgpr_16 = V_CVT_F16_U16_t16_e64 0, %0:vgpr_16, 0, 0, 0, implicit $mode, implicit $exec |
21 | | - %3:sreg_32 = COPY %2:vgpr_16 |
22 | | - nofpexcept S_CMP_LT_F16 killed %3:sreg_32, %1:sreg_32, implicit-def $scc, implicit $mode |
23 | | - %4:sreg_32_xm0_xexec = COPY $scc |
24 | | - %5:vgpr_32 = V_CNDMASK_B32_e64 0, 0, 0, -1, killed %4, implicit $exec |
| 15 | + %1:vgpr_16 = V_CVT_F16_U16_t16_e64 0, %0:vgpr_16, 0, 0, 0, implicit $mode, implicit $exec |
| 16 | + %2:sreg_32 = COPY %1:vgpr_16 |
| 17 | + %3:sreg_32 = S_CVT_HI_F32_F16 %2:sreg_32, implicit $mode |
25 | 18 | ... |
26 | 19 |
|
27 | 20 | --- |
28 | | -name: cvt_hi_f32_f16 |
| 21 | +name: s_xor_b32 |
29 | 22 | body: | |
30 | 23 | bb.0: |
31 | | - ; GCN-LABEL: name: cvt_hi_f32_f16 |
| 24 | + ; GCN-LABEL: name: s_xor_b32 |
32 | 25 | ; GCN: [[DEF:%[0-9]+]]:vgpr_16 = IMPLICIT_DEF |
33 | 26 | ; GCN-NEXT: [[V_CVT_F16_U16_t16_e64_:%[0-9]+]]:vgpr_16 = V_CVT_F16_U16_t16_e64 0, [[DEF]], 0, 0, 0, implicit $mode, implicit $exec |
34 | | - ; GCN-NEXT: [[COPY:%[0-9]+]]:vgpr_32 = COPY [[V_CVT_F16_U16_t16_e64_]] |
35 | | - ; GCN-NEXT: [[COPY1:%[0-9]+]]:vgpr_32 = COPY [[COPY]] |
36 | | - ; GCN-NEXT: [[V_CVT_F32_F16_t16_e64_:%[0-9]+]]:vgpr_32 = V_CVT_F32_F16_t16_e64 0, [[COPY1]].hi16, 0, 0, 0, implicit $mode, implicit $exec |
| 27 | + ; GCN-NEXT: [[SUBREG_TO_REG:%[0-9]+]]:vgpr_32 = SUBREG_TO_REG 0, [[V_CVT_F16_U16_t16_e64_]], %subreg.lo16 |
| 28 | + ; GCN-NEXT: [[V_OR_B32_e64_:%[0-9]+]]:vgpr_32 = V_OR_B32_e64 [[SUBREG_TO_REG]], [[SUBREG_TO_REG]], implicit $exec |
| 29 | + ; GCN-NEXT: [[V_CVT_F16_U16_t16_e64_1:%[0-9]+]]:vgpr_16 = V_CVT_F16_U16_t16_e64 0, [[V_OR_B32_e64_]].lo16, 0, 0, 0, implicit $mode, implicit $exec |
37 | 30 | %0:vgpr_16 = IMPLICIT_DEF |
38 | 31 | %1:vgpr_16 = V_CVT_F16_U16_t16_e64 0, %0:vgpr_16, 0, 0, 0, implicit $mode, implicit $exec |
39 | 32 | %2:sreg_32 = COPY %1:vgpr_16 |
40 | | - %3:sreg_32 = S_CVT_HI_F32_F16 %2:sreg_32, implicit $mode |
| 33 | + %3:sreg_32 = S_OR_B32 %2:sreg_32, %2:sreg_32, implicit-def $scc |
| 34 | + %4:vgpr_16 = V_CVT_F16_U16_t16_e64 0, %3:sreg_32, 0, 0, 0, implicit $mode, implicit $exec |
41 | 35 | ... |
0 commit comments