@@ -16,11 +16,11 @@ define void @t(i8* nocapture %in, i8* nocapture %out, i32* nocapture %rk, i32 %r
16
16
; GENERIC-NEXT: movl (%rdx), %eax
17
17
; GENERIC-NEXT: movl 4(%rdx), %ebx
18
18
; GENERIC-NEXT: decl %ecx
19
- ; GENERIC-NEXT: leaq 20(%rdx), %r11
19
+ ; GENERIC-NEXT: leaq 20(%rdx), %r14
20
20
; GENERIC-NEXT: movq _Te0@{{.*}}(%rip), %r9
21
21
; GENERIC-NEXT: movq _Te1@{{.*}}(%rip), %r8
22
22
; GENERIC-NEXT: movq _Te3@{{.*}}(%rip), %r10
23
- ; GENERIC-NEXT: movq %rcx, %r14
23
+ ; GENERIC-NEXT: movq %rcx, %r11
24
24
; GENERIC-NEXT: .p2align 4, 0x90
25
25
; GENERIC-NEXT: LBB0_1: ## %bb
26
26
; GENERIC-NEXT: ## =>This Inner Loop Header: Depth=1
@@ -32,29 +32,30 @@ define void @t(i8* nocapture %in, i8* nocapture %out, i32* nocapture %rk, i32 %r
32
32
; GENERIC-NEXT: movzbl %bpl, %ebp
33
33
; GENERIC-NEXT: movl (%r8,%rbp,4), %ebp
34
34
; GENERIC-NEXT: xorl (%r9,%rax,4), %ebp
35
- ; GENERIC-NEXT: xorl -12(%r11 ), %ebp
35
+ ; GENERIC-NEXT: xorl -12(%r14 ), %ebp
36
36
; GENERIC-NEXT: shrl $24, %ebx
37
37
; GENERIC-NEXT: movl (%r10,%rdi,4), %edi
38
38
; GENERIC-NEXT: xorl (%r9,%rbx,4), %edi
39
- ; GENERIC-NEXT: xorl -8(%r11 ), %edi
39
+ ; GENERIC-NEXT: xorl -8(%r14 ), %edi
40
40
; GENERIC-NEXT: movl %ebp, %eax
41
41
; GENERIC-NEXT: shrl $24, %eax
42
42
; GENERIC-NEXT: movl (%r9,%rax,4), %eax
43
- ; GENERIC-NEXT: subq $1 , %r14
44
- ; GENERIC-NEXT: jb LBB0_3
43
+ ; GENERIC-NEXT: testq %r11 , %r11
44
+ ; GENERIC-NEXT: je LBB0_3
45
45
; GENERIC-NEXT: ## %bb.2: ## %bb1
46
46
; GENERIC-NEXT: ## in Loop: Header=BB0_1 Depth=1
47
47
; GENERIC-NEXT: movl %edi, %ebx
48
48
; GENERIC-NEXT: shrl $16, %ebx
49
49
; GENERIC-NEXT: movzbl %bl, %ebx
50
50
; GENERIC-NEXT: xorl (%r8,%rbx,4), %eax
51
- ; GENERIC-NEXT: xorl -4(%r11 ), %eax
51
+ ; GENERIC-NEXT: xorl -4(%r14 ), %eax
52
52
; GENERIC-NEXT: shrl $24, %edi
53
53
; GENERIC-NEXT: movzbl %bpl, %ebx
54
54
; GENERIC-NEXT: movl (%r10,%rbx,4), %ebx
55
55
; GENERIC-NEXT: xorl (%r9,%rdi,4), %ebx
56
- ; GENERIC-NEXT: xorl (%r11), %ebx
57
- ; GENERIC-NEXT: addq $16, %r11
56
+ ; GENERIC-NEXT: xorl (%r14), %ebx
57
+ ; GENERIC-NEXT: decq %r11
58
+ ; GENERIC-NEXT: addq $16, %r14
58
59
; GENERIC-NEXT: jmp LBB0_1
59
60
; GENERIC-NEXT: LBB0_3: ## %bb2
60
61
; GENERIC-NEXT: shlq $4, %rcx
@@ -98,12 +99,12 @@ define void @t(i8* nocapture %in, i8* nocapture %out, i32* nocapture %rk, i32 %r
98
99
; ATOM-NEXT: ## kill: def $ecx killed $ecx def $rcx
99
100
; ATOM-NEXT: movl (%rdx), %r15d
100
101
; ATOM-NEXT: movl 4(%rdx), %eax
101
- ; ATOM-NEXT: leaq 20(%rdx), %r11
102
+ ; ATOM-NEXT: leaq 20(%rdx), %r14
102
103
; ATOM-NEXT: movq _Te0@{{.*}}(%rip), %r9
103
104
; ATOM-NEXT: movq _Te1@{{.*}}(%rip), %r8
104
105
; ATOM-NEXT: movq _Te3@{{.*}}(%rip), %r10
105
106
; ATOM-NEXT: decl %ecx
106
- ; ATOM-NEXT: movq %rcx, %r14
107
+ ; ATOM-NEXT: movq %rcx, %r11
107
108
; ATOM-NEXT: .p2align 4, 0x90
108
109
; ATOM-NEXT: LBB0_1: ## %bb
109
110
; ATOM-NEXT: ## =>This Inner Loop Header: Depth=1
@@ -117,27 +118,28 @@ define void @t(i8* nocapture %in, i8* nocapture %out, i32* nocapture %rk, i32 %r
117
118
; ATOM-NEXT: movzbl %r15b, %edi
118
119
; ATOM-NEXT: xorl (%r9,%rbp,4), %ebx
119
120
; ATOM-NEXT: movl (%r10,%rdi,4), %edi
120
- ; ATOM-NEXT: xorl -12(%r11 ), %ebx
121
+ ; ATOM-NEXT: xorl -12(%r14 ), %ebx
121
122
; ATOM-NEXT: xorl (%r9,%rax,4), %edi
122
123
; ATOM-NEXT: movl %ebx, %eax
123
- ; ATOM-NEXT: xorl -8(%r11 ), %edi
124
+ ; ATOM-NEXT: xorl -8(%r14 ), %edi
124
125
; ATOM-NEXT: shrl $24, %eax
125
126
; ATOM-NEXT: movl (%r9,%rax,4), %r15d
126
- ; ATOM-NEXT: subq $1 , %r14
127
+ ; ATOM-NEXT: testq %r11 , %r11
127
128
; ATOM-NEXT: movl %edi, %eax
128
- ; ATOM-NEXT: jb LBB0_3
129
+ ; ATOM-NEXT: je LBB0_3
129
130
; ATOM-NEXT: ## %bb.2: ## %bb1
130
131
; ATOM-NEXT: ## in Loop: Header=BB0_1 Depth=1
131
132
; ATOM-NEXT: shrl $16, %eax
132
133
; ATOM-NEXT: shrl $24, %edi
133
- ; ATOM-NEXT: movzbl %al, %eax
134
- ; ATOM-NEXT: xorl (%r8,%rax,4), %r15d
134
+ ; ATOM-NEXT: decq %r11
135
+ ; ATOM-NEXT: movzbl %al, %ebp
135
136
; ATOM-NEXT: movzbl %bl, %eax
136
137
; ATOM-NEXT: movl (%r10,%rax,4), %eax
137
- ; ATOM-NEXT: xorl -4(%r11 ), %r15d
138
+ ; ATOM-NEXT: xorl (%r8,%rbp,4 ), %r15d
138
139
; ATOM-NEXT: xorl (%r9,%rdi,4), %eax
139
- ; ATOM-NEXT: xorl (%r11), %eax
140
- ; ATOM-NEXT: addq $16, %r11
140
+ ; ATOM-NEXT: xorl -4(%r14), %r15d
141
+ ; ATOM-NEXT: xorl (%r14), %eax
142
+ ; ATOM-NEXT: addq $16, %r14
141
143
; ATOM-NEXT: jmp LBB0_1
142
144
; ATOM-NEXT: LBB0_3: ## %bb2
143
145
; ATOM-NEXT: shrl $16, %eax
0 commit comments