@@ -16,11 +16,11 @@ define void @t(i8* nocapture %in, i8* nocapture %out, i32* nocapture %rk, i32 %r
16
16
; GENERIC-NEXT: movl (%rdx), %eax
17
17
; GENERIC-NEXT: movl 4(%rdx), %ebx
18
18
; GENERIC-NEXT: decl %ecx
19
- ; GENERIC-NEXT: leaq 20(%rdx), %r14
19
+ ; GENERIC-NEXT: leaq 20(%rdx), %r11
20
20
; GENERIC-NEXT: movq _Te0@{{.*}}(%rip), %r9
21
21
; GENERIC-NEXT: movq _Te1@{{.*}}(%rip), %r8
22
22
; GENERIC-NEXT: movq _Te3@{{.*}}(%rip), %r10
23
- ; GENERIC-NEXT: movq %rcx, %r11
23
+ ; GENERIC-NEXT: movq %rcx, %r14
24
24
; GENERIC-NEXT: .p2align 4, 0x90
25
25
; GENERIC-NEXT: LBB0_1: ## %bb
26
26
; GENERIC-NEXT: ## =>This Inner Loop Header: Depth=1
@@ -32,30 +32,29 @@ define void @t(i8* nocapture %in, i8* nocapture %out, i32* nocapture %rk, i32 %r
32
32
; GENERIC-NEXT: movzbl %bpl, %ebp
33
33
; GENERIC-NEXT: movl (%r8,%rbp,4), %ebp
34
34
; GENERIC-NEXT: xorl (%r9,%rax,4), %ebp
35
- ; GENERIC-NEXT: xorl -12(%r14 ), %ebp
35
+ ; GENERIC-NEXT: xorl -12(%r11 ), %ebp
36
36
; GENERIC-NEXT: shrl $24, %ebx
37
37
; GENERIC-NEXT: movl (%r10,%rdi,4), %edi
38
38
; GENERIC-NEXT: xorl (%r9,%rbx,4), %edi
39
- ; GENERIC-NEXT: xorl -8(%r14 ), %edi
39
+ ; GENERIC-NEXT: xorl -8(%r11 ), %edi
40
40
; GENERIC-NEXT: movl %ebp, %eax
41
41
; GENERIC-NEXT: shrl $24, %eax
42
42
; GENERIC-NEXT: movl (%r9,%rax,4), %eax
43
- ; GENERIC-NEXT: testq %r11 , %r11
44
- ; GENERIC-NEXT: je LBB0_3
43
+ ; GENERIC-NEXT: subq $1 , %r14
44
+ ; GENERIC-NEXT: jb LBB0_3
45
45
; GENERIC-NEXT: ## %bb.2: ## %bb1
46
46
; GENERIC-NEXT: ## in Loop: Header=BB0_1 Depth=1
47
47
; GENERIC-NEXT: movl %edi, %ebx
48
48
; GENERIC-NEXT: shrl $16, %ebx
49
49
; GENERIC-NEXT: movzbl %bl, %ebx
50
50
; GENERIC-NEXT: xorl (%r8,%rbx,4), %eax
51
- ; GENERIC-NEXT: xorl -4(%r14 ), %eax
51
+ ; GENERIC-NEXT: xorl -4(%r11 ), %eax
52
52
; GENERIC-NEXT: shrl $24, %edi
53
53
; GENERIC-NEXT: movzbl %bpl, %ebx
54
54
; GENERIC-NEXT: movl (%r10,%rbx,4), %ebx
55
55
; GENERIC-NEXT: xorl (%r9,%rdi,4), %ebx
56
- ; GENERIC-NEXT: xorl (%r14), %ebx
57
- ; GENERIC-NEXT: decq %r11
58
- ; GENERIC-NEXT: addq $16, %r14
56
+ ; GENERIC-NEXT: xorl (%r11), %ebx
57
+ ; GENERIC-NEXT: addq $16, %r11
59
58
; GENERIC-NEXT: jmp LBB0_1
60
59
; GENERIC-NEXT: LBB0_3: ## %bb2
61
60
; GENERIC-NEXT: shlq $4, %rcx
@@ -99,12 +98,12 @@ define void @t(i8* nocapture %in, i8* nocapture %out, i32* nocapture %rk, i32 %r
99
98
; ATOM-NEXT: ## kill: def $ecx killed $ecx def $rcx
100
99
; ATOM-NEXT: movl (%rdx), %r15d
101
100
; ATOM-NEXT: movl 4(%rdx), %eax
102
- ; ATOM-NEXT: leaq 20(%rdx), %r14
101
+ ; ATOM-NEXT: leaq 20(%rdx), %r11
103
102
; ATOM-NEXT: movq _Te0@{{.*}}(%rip), %r9
104
103
; ATOM-NEXT: movq _Te1@{{.*}}(%rip), %r8
105
104
; ATOM-NEXT: movq _Te3@{{.*}}(%rip), %r10
106
105
; ATOM-NEXT: decl %ecx
107
- ; ATOM-NEXT: movq %rcx, %r11
106
+ ; ATOM-NEXT: movq %rcx, %r14
108
107
; ATOM-NEXT: .p2align 4, 0x90
109
108
; ATOM-NEXT: LBB0_1: ## %bb
110
109
; ATOM-NEXT: ## =>This Inner Loop Header: Depth=1
@@ -118,28 +117,27 @@ define void @t(i8* nocapture %in, i8* nocapture %out, i32* nocapture %rk, i32 %r
118
117
; ATOM-NEXT: movzbl %r15b, %edi
119
118
; ATOM-NEXT: xorl (%r9,%rbp,4), %ebx
120
119
; ATOM-NEXT: movl (%r10,%rdi,4), %edi
121
- ; ATOM-NEXT: xorl -12(%r14 ), %ebx
120
+ ; ATOM-NEXT: xorl -12(%r11 ), %ebx
122
121
; ATOM-NEXT: xorl (%r9,%rax,4), %edi
123
122
; ATOM-NEXT: movl %ebx, %eax
124
- ; ATOM-NEXT: xorl -8(%r14 ), %edi
123
+ ; ATOM-NEXT: xorl -8(%r11 ), %edi
125
124
; ATOM-NEXT: shrl $24, %eax
126
125
; ATOM-NEXT: movl (%r9,%rax,4), %r15d
127
- ; ATOM-NEXT: testq %r11 , %r11
126
+ ; ATOM-NEXT: subq $1 , %r14
128
127
; ATOM-NEXT: movl %edi, %eax
129
- ; ATOM-NEXT: je LBB0_3
128
+ ; ATOM-NEXT: jb LBB0_3
130
129
; ATOM-NEXT: ## %bb.2: ## %bb1
131
130
; ATOM-NEXT: ## in Loop: Header=BB0_1 Depth=1
132
131
; ATOM-NEXT: shrl $16, %eax
133
132
; ATOM-NEXT: shrl $24, %edi
134
- ; ATOM-NEXT: decq %r11
135
- ; ATOM-NEXT: movzbl %al, %ebp
133
+ ; ATOM-NEXT: movzbl %al, %eax
134
+ ; ATOM-NEXT: xorl (%r8,%rax,4), %r15d
136
135
; ATOM-NEXT: movzbl %bl, %eax
137
136
; ATOM-NEXT: movl (%r10,%rax,4), %eax
138
- ; ATOM-NEXT: xorl (%r8,%rbp,4 ), %r15d
137
+ ; ATOM-NEXT: xorl -4(%r11 ), %r15d
139
138
; ATOM-NEXT: xorl (%r9,%rdi,4), %eax
140
- ; ATOM-NEXT: xorl -4(%r14), %r15d
141
- ; ATOM-NEXT: xorl (%r14), %eax
142
- ; ATOM-NEXT: addq $16, %r14
139
+ ; ATOM-NEXT: xorl (%r11), %eax
140
+ ; ATOM-NEXT: addq $16, %r11
143
141
; ATOM-NEXT: jmp LBB0_1
144
142
; ATOM-NEXT: LBB0_3: ## %bb2
145
143
; ATOM-NEXT: shrl $16, %eax
0 commit comments