1
+ # NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py UTC_ARGS: --version 5
1
2
# RUN: llc -mtriple=amdgcn -run-pass si-fold-operands -verify-machineinstrs %s -o - | FileCheck -check-prefix=GCN %s
2
3
3
- # GCN-LABEL: name: fold-imm-copy
4
- # GCN: V_AND_B32_e32 65535
5
-
6
4
---
7
5
name : fold-imm-copy
8
6
tracksRegLiveness : true
9
7
body : |
10
8
bb.0:
11
9
liveins: $vgpr0, $sgpr0_sgpr1
10
+ ; GCN-LABEL: name: fold-imm-copy
11
+ ; GCN: liveins: $vgpr0, $sgpr0_sgpr1
12
+ ; GCN-NEXT: {{ $}}
13
+ ; GCN-NEXT: [[COPY:%[0-9]+]]:vgpr_32 = COPY $vgpr0
14
+ ; GCN-NEXT: [[COPY1:%[0-9]+]]:sgpr_64 = COPY $sgpr0_sgpr1
15
+ ; GCN-NEXT: [[S_LOAD_DWORDX4_IMM:%[0-9]+]]:sgpr_128 = S_LOAD_DWORDX4_IMM [[COPY1]], 9, 0
16
+ ; GCN-NEXT: [[V_LSHLREV_B32_e64_:%[0-9]+]]:vgpr_32 = V_LSHLREV_B32_e64 2, [[COPY]], implicit $exec
17
+ ; GCN-NEXT: [[V_MOV_B32_e32_:%[0-9]+]]:vgpr_32 = V_MOV_B32_e32 0, implicit $exec
18
+ ; GCN-NEXT: [[REG_SEQUENCE:%[0-9]+]]:vreg_64 = REG_SEQUENCE killed [[V_LSHLREV_B32_e64_]], %subreg.sub0, killed [[V_MOV_B32_e32_]], %subreg.sub1
19
+ ; GCN-NEXT: [[BUFFER_LOAD_DWORD_ADDR64_:%[0-9]+]]:vgpr_32 = BUFFER_LOAD_DWORD_ADDR64 [[REG_SEQUENCE]], [[S_LOAD_DWORDX4_IMM]], 0, 4, 0, 0, implicit $exec
20
+ ; GCN-NEXT: [[V_AND_B32_e32_:%[0-9]+]]:vgpr_32 = V_AND_B32_e32 65535, [[BUFFER_LOAD_DWORD_ADDR64_]], implicit $exec
12
21
%0:vgpr_32 = COPY $vgpr0
13
22
%1:sgpr_64 = COPY $sgpr0_sgpr1
14
23
%2:sgpr_128 = S_LOAD_DWORDX4_IMM %1, 9, 0
@@ -23,14 +32,19 @@ body: |
23
32
...
24
33
25
34
---
26
- # GCN-LABEL: name: no_extra_fold_on_same_opnd
27
35
# The first XOR needs commuting to fold that immediate operand.
28
- # GCN: V_XOR_B32_e32 0, %1
29
- # GCN: V_XOR_B32_e32 %2, %4.sub0
30
36
name : no_extra_fold_on_same_opnd
31
37
tracksRegLiveness : true
32
38
body : |
33
39
bb.0:
40
+ ; GCN-LABEL: name: no_extra_fold_on_same_opnd
41
+ ; GCN: [[DEF:%[0-9]+]]:vgpr_32 = IMPLICIT_DEF
42
+ ; GCN-NEXT: [[DEF1:%[0-9]+]]:vgpr_32 = IMPLICIT_DEF
43
+ ; GCN-NEXT: [[DEF2:%[0-9]+]]:vgpr_32 = IMPLICIT_DEF
44
+ ; GCN-NEXT: [[V_MOV_B32_e32_:%[0-9]+]]:vgpr_32 = V_MOV_B32_e32 0, implicit $exec
45
+ ; GCN-NEXT: [[REG_SEQUENCE:%[0-9]+]]:vreg_64 = REG_SEQUENCE killed [[DEF]], %subreg.sub0, killed [[V_MOV_B32_e32_]], %subreg.sub1
46
+ ; GCN-NEXT: [[V_XOR_B32_e32_:%[0-9]+]]:vgpr_32 = V_XOR_B32_e32 0, [[DEF1]], implicit $exec
47
+ ; GCN-NEXT: [[V_XOR_B32_e32_1:%[0-9]+]]:vgpr_32 = V_XOR_B32_e32 [[DEF2]], [[REG_SEQUENCE]].sub0, implicit $exec
34
48
%0:vgpr_32 = IMPLICIT_DEF
35
49
%1:vgpr_32 = IMPLICIT_DEF
36
50
%2:vgpr_32 = IMPLICIT_DEF
@@ -45,42 +59,44 @@ body: |
45
59
# Make sure the subreg index is not reinterpreted when folding
46
60
# immediates
47
61
#
48
- # GCN-LABEL: name: clear_subreg_imm_fold{{$}}
49
- # GCN: %1:sgpr_32 = S_MOV_B32 4294967288
50
- # GCN: %2:sgpr_32 = S_MOV_B32 4294967295
51
62
name : clear_subreg_imm_fold
52
63
tracksRegLiveness : true
53
64
body : |
54
65
bb.0:
66
+ ; GCN-LABEL: name: clear_subreg_imm_fold
67
+ ; GCN: [[S_MOV_B32_:%[0-9]+]]:sgpr_32 = S_MOV_B32 4294967288
68
+ ; GCN-NEXT: [[S_MOV_B32_1:%[0-9]+]]:sgpr_32 = S_MOV_B32 4294967295
69
+ ; GCN-NEXT: S_ENDPGM 0, implicit [[S_MOV_B32_]], implicit [[S_MOV_B32_1]]
55
70
%0:sreg_64 = S_MOV_B64 -8
56
71
%1:sgpr_32 = COPY %0.sub0
57
72
%2:sgpr_32 = COPY %0.sub1
58
73
S_ENDPGM 0, implicit %1, implicit %2
59
74
60
75
...
61
76
62
- # GCN-LABEL: name: no_fold_imm_into_m0{{$}}
63
- # GCN: %0:sreg_32 = S_MOV_B32 -8
64
- # GCN-NEXT: $m0 = COPY %0
65
-
66
77
---
67
78
name : no_fold_imm_into_m0
68
79
tracksRegLiveness : true
69
80
body : |
70
81
bb.0:
82
+ ; GCN-LABEL: name: no_fold_imm_into_m0
83
+ ; GCN: [[S_MOV_B32_:%[0-9]+]]:sreg_32 = S_MOV_B32 -8
84
+ ; GCN-NEXT: $m0 = COPY [[S_MOV_B32_]]
85
+ ; GCN-NEXT: S_ENDPGM 0, implicit $m0
71
86
%0:sreg_32 = S_MOV_B32 -8
72
87
$m0 = COPY %0
73
88
S_ENDPGM 0, implicit $m0
74
89
75
90
...
76
91
77
- # GCN-LABEL: name: fold_sgpr_imm_to_vgpr_copy{{$}}
78
- # GCN: $vgpr0 = V_MOV_B32_e32 -8, implicit $exec
79
92
---
80
93
name : fold_sgpr_imm_to_vgpr_copy
81
94
tracksRegLiveness : true
82
95
body : |
83
96
bb.0:
97
+ ; GCN-LABEL: name: fold_sgpr_imm_to_vgpr_copy
98
+ ; GCN: $vgpr0 = V_MOV_B32_e32 -8, implicit $exec
99
+ ; GCN-NEXT: S_ENDPGM 0, implicit $vgpr0
84
100
%0:sreg_32 = S_MOV_B32 -8
85
101
$vgpr0 = COPY %0
86
102
S_ENDPGM 0, implicit $vgpr0
@@ -90,16 +106,17 @@ body: |
90
106
# The users of $vgpr1 should not be visited for further immediate
91
107
# folding.
92
108
93
- # GCN-LABEL: name: no_fold_physreg_users_vgpr{{$}}
94
- # GCN: $vgpr1 = V_MOV_B32_e32 0, implicit $exec
95
- # GCN-NEXT: S_NOP 0, implicit-def $vgpr1
96
- # GCN-NEXT: %2:vgpr_32 = COPY $vgpr1
97
- # GCN-NEXT: $vgpr2 = COPY %2
98
109
---
99
110
name : no_fold_physreg_users_vgpr
100
111
tracksRegLiveness : true
101
112
body : |
102
113
bb.0:
114
+ ; GCN-LABEL: name: no_fold_physreg_users_vgpr
115
+ ; GCN: $vgpr1 = V_MOV_B32_e32 0, implicit $exec
116
+ ; GCN-NEXT: S_NOP 0, implicit-def $vgpr1
117
+ ; GCN-NEXT: [[COPY:%[0-9]+]]:vgpr_32 = COPY $vgpr1
118
+ ; GCN-NEXT: $vgpr2 = COPY [[COPY]]
119
+ ; GCN-NEXT: S_ENDPGM 0
103
120
%0:sreg_32 = S_MOV_B32 0
104
121
%1:vgpr_32 = COPY %0
105
122
$vgpr1 = COPY %0
0 commit comments