xref: /freebsd/sys/crypto/openssl/amd64/sha256-mb-x86_64.S (revision c0855eaa3ee9614804b6bd6a255aa9f71e095f43)
1bc3d5698SJohn Baldwin/* Do not modify. This file is auto-generated from sha256-mb-x86_64.pl. */
2bc3d5698SJohn Baldwin.text
3bc3d5698SJohn Baldwin
4bc3d5698SJohn Baldwin
5bc3d5698SJohn Baldwin
6bc3d5698SJohn Baldwin.globl	sha256_multi_block
7bc3d5698SJohn Baldwin.type	sha256_multi_block,@function
8bc3d5698SJohn Baldwin.align	32
9bc3d5698SJohn Baldwinsha256_multi_block:
10bc3d5698SJohn Baldwin.cfi_startproc
11bc3d5698SJohn Baldwin	movq	OPENSSL_ia32cap_P+4(%rip),%rcx
12bc3d5698SJohn Baldwin	btq	$61,%rcx
13bc3d5698SJohn Baldwin	jc	_shaext_shortcut
14bc3d5698SJohn Baldwin	testl	$268435456,%ecx
15bc3d5698SJohn Baldwin	jnz	_avx_shortcut
16bc3d5698SJohn Baldwin	movq	%rsp,%rax
17bc3d5698SJohn Baldwin.cfi_def_cfa_register	%rax
18bc3d5698SJohn Baldwin	pushq	%rbx
19bc3d5698SJohn Baldwin.cfi_offset	%rbx,-16
20bc3d5698SJohn Baldwin	pushq	%rbp
21bc3d5698SJohn Baldwin.cfi_offset	%rbp,-24
22bc3d5698SJohn Baldwin	subq	$288,%rsp
23bc3d5698SJohn Baldwin	andq	$-256,%rsp
24bc3d5698SJohn Baldwin	movq	%rax,272(%rsp)
25bc3d5698SJohn Baldwin.cfi_escape	0x0f,0x06,0x77,0x90,0x02,0x06,0x23,0x08
26bc3d5698SJohn Baldwin.Lbody:
27bc3d5698SJohn Baldwin	leaq	K256+128(%rip),%rbp
28bc3d5698SJohn Baldwin	leaq	256(%rsp),%rbx
29bc3d5698SJohn Baldwin	leaq	128(%rdi),%rdi
30bc3d5698SJohn Baldwin
31bc3d5698SJohn Baldwin.Loop_grande:
32bc3d5698SJohn Baldwin	movl	%edx,280(%rsp)
33bc3d5698SJohn Baldwin	xorl	%edx,%edx
34*c0855eaaSJohn Baldwin
35bc3d5698SJohn Baldwin	movq	0(%rsi),%r8
36*c0855eaaSJohn Baldwin
37bc3d5698SJohn Baldwin	movl	8(%rsi),%ecx
38bc3d5698SJohn Baldwin	cmpl	%edx,%ecx
39bc3d5698SJohn Baldwin	cmovgl	%ecx,%edx
40bc3d5698SJohn Baldwin	testl	%ecx,%ecx
41bc3d5698SJohn Baldwin	movl	%ecx,0(%rbx)
42bc3d5698SJohn Baldwin	cmovleq	%rbp,%r8
43*c0855eaaSJohn Baldwin
44bc3d5698SJohn Baldwin	movq	16(%rsi),%r9
45*c0855eaaSJohn Baldwin
46bc3d5698SJohn Baldwin	movl	24(%rsi),%ecx
47bc3d5698SJohn Baldwin	cmpl	%edx,%ecx
48bc3d5698SJohn Baldwin	cmovgl	%ecx,%edx
49bc3d5698SJohn Baldwin	testl	%ecx,%ecx
50bc3d5698SJohn Baldwin	movl	%ecx,4(%rbx)
51bc3d5698SJohn Baldwin	cmovleq	%rbp,%r9
52*c0855eaaSJohn Baldwin
53bc3d5698SJohn Baldwin	movq	32(%rsi),%r10
54*c0855eaaSJohn Baldwin
55bc3d5698SJohn Baldwin	movl	40(%rsi),%ecx
56bc3d5698SJohn Baldwin	cmpl	%edx,%ecx
57bc3d5698SJohn Baldwin	cmovgl	%ecx,%edx
58bc3d5698SJohn Baldwin	testl	%ecx,%ecx
59bc3d5698SJohn Baldwin	movl	%ecx,8(%rbx)
60bc3d5698SJohn Baldwin	cmovleq	%rbp,%r10
61*c0855eaaSJohn Baldwin
62bc3d5698SJohn Baldwin	movq	48(%rsi),%r11
63*c0855eaaSJohn Baldwin
64bc3d5698SJohn Baldwin	movl	56(%rsi),%ecx
65bc3d5698SJohn Baldwin	cmpl	%edx,%ecx
66bc3d5698SJohn Baldwin	cmovgl	%ecx,%edx
67bc3d5698SJohn Baldwin	testl	%ecx,%ecx
68bc3d5698SJohn Baldwin	movl	%ecx,12(%rbx)
69bc3d5698SJohn Baldwin	cmovleq	%rbp,%r11
70bc3d5698SJohn Baldwin	testl	%edx,%edx
71bc3d5698SJohn Baldwin	jz	.Ldone
72bc3d5698SJohn Baldwin
73bc3d5698SJohn Baldwin	movdqu	0-128(%rdi),%xmm8
74bc3d5698SJohn Baldwin	leaq	128(%rsp),%rax
75bc3d5698SJohn Baldwin	movdqu	32-128(%rdi),%xmm9
76bc3d5698SJohn Baldwin	movdqu	64-128(%rdi),%xmm10
77bc3d5698SJohn Baldwin	movdqu	96-128(%rdi),%xmm11
78bc3d5698SJohn Baldwin	movdqu	128-128(%rdi),%xmm12
79bc3d5698SJohn Baldwin	movdqu	160-128(%rdi),%xmm13
80bc3d5698SJohn Baldwin	movdqu	192-128(%rdi),%xmm14
81bc3d5698SJohn Baldwin	movdqu	224-128(%rdi),%xmm15
82bc3d5698SJohn Baldwin	movdqu	.Lpbswap(%rip),%xmm6
83bc3d5698SJohn Baldwin	jmp	.Loop
84bc3d5698SJohn Baldwin
85bc3d5698SJohn Baldwin.align	32
86bc3d5698SJohn Baldwin.Loop:
87bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm4
88bc3d5698SJohn Baldwin	pxor	%xmm9,%xmm4
89bc3d5698SJohn Baldwin	movd	0(%r8),%xmm5
90bc3d5698SJohn Baldwin	movd	0(%r9),%xmm0
91bc3d5698SJohn Baldwin	movd	0(%r10),%xmm1
92bc3d5698SJohn Baldwin	movd	0(%r11),%xmm2
93bc3d5698SJohn Baldwin	punpckldq	%xmm1,%xmm5
94bc3d5698SJohn Baldwin	punpckldq	%xmm2,%xmm0
95bc3d5698SJohn Baldwin	punpckldq	%xmm0,%xmm5
96bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm7
97bc3d5698SJohn Baldwin.byte	102,15,56,0,238
98bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm2
99bc3d5698SJohn Baldwin
100bc3d5698SJohn Baldwin	psrld	$6,%xmm7
101bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm1
102bc3d5698SJohn Baldwin	pslld	$7,%xmm2
103bc3d5698SJohn Baldwin	movdqa	%xmm5,0-128(%rax)
104bc3d5698SJohn Baldwin	paddd	%xmm15,%xmm5
105bc3d5698SJohn Baldwin
106bc3d5698SJohn Baldwin	psrld	$11,%xmm1
107bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
108bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
109bc3d5698SJohn Baldwin	paddd	-128(%rbp),%xmm5
110bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
111bc3d5698SJohn Baldwin
112bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
113bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm0
114bc3d5698SJohn Baldwin
115bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
116bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm3
117bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
118bc3d5698SJohn Baldwin	pandn	%xmm14,%xmm0
119bc3d5698SJohn Baldwin	pand	%xmm13,%xmm3
120bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
121bc3d5698SJohn Baldwin
122bc3d5698SJohn Baldwin
123bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm1
124bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
125bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm2
126bc3d5698SJohn Baldwin	psrld	$2,%xmm1
127bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
128bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
129bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm3
130bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm7
131bc3d5698SJohn Baldwin	pslld	$10,%xmm2
132bc3d5698SJohn Baldwin	pxor	%xmm8,%xmm3
133bc3d5698SJohn Baldwin
134bc3d5698SJohn Baldwin
135bc3d5698SJohn Baldwin	psrld	$13,%xmm7
136bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
137bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
138bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
139bc3d5698SJohn Baldwin	pand	%xmm3,%xmm4
140bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
141bc3d5698SJohn Baldwin
142bc3d5698SJohn Baldwin
143bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
144bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
145bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm15
146bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
147bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
148bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm15
149bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm11
150bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
151bc3d5698SJohn Baldwin
152bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm15
153bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm15
154bc3d5698SJohn Baldwin	movd	4(%r8),%xmm5
155bc3d5698SJohn Baldwin	movd	4(%r9),%xmm0
156bc3d5698SJohn Baldwin	movd	4(%r10),%xmm1
157bc3d5698SJohn Baldwin	movd	4(%r11),%xmm2
158bc3d5698SJohn Baldwin	punpckldq	%xmm1,%xmm5
159bc3d5698SJohn Baldwin	punpckldq	%xmm2,%xmm0
160bc3d5698SJohn Baldwin	punpckldq	%xmm0,%xmm5
161bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm7
162bc3d5698SJohn Baldwin
163bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm2
164bc3d5698SJohn Baldwin.byte	102,15,56,0,238
165bc3d5698SJohn Baldwin	psrld	$6,%xmm7
166bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm1
167bc3d5698SJohn Baldwin	pslld	$7,%xmm2
168bc3d5698SJohn Baldwin	movdqa	%xmm5,16-128(%rax)
169bc3d5698SJohn Baldwin	paddd	%xmm14,%xmm5
170bc3d5698SJohn Baldwin
171bc3d5698SJohn Baldwin	psrld	$11,%xmm1
172bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
173bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
174bc3d5698SJohn Baldwin	paddd	-96(%rbp),%xmm5
175bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
176bc3d5698SJohn Baldwin
177bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
178bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm0
179bc3d5698SJohn Baldwin
180bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
181bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm4
182bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
183bc3d5698SJohn Baldwin	pandn	%xmm13,%xmm0
184bc3d5698SJohn Baldwin	pand	%xmm12,%xmm4
185bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
186bc3d5698SJohn Baldwin
187bc3d5698SJohn Baldwin
188bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm1
189bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
190bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm2
191bc3d5698SJohn Baldwin	psrld	$2,%xmm1
192bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
193bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
194bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm4
195bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm7
196bc3d5698SJohn Baldwin	pslld	$10,%xmm2
197bc3d5698SJohn Baldwin	pxor	%xmm15,%xmm4
198bc3d5698SJohn Baldwin
199bc3d5698SJohn Baldwin
200bc3d5698SJohn Baldwin	psrld	$13,%xmm7
201bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
202bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
203bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
204bc3d5698SJohn Baldwin	pand	%xmm4,%xmm3
205bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
206bc3d5698SJohn Baldwin
207bc3d5698SJohn Baldwin
208bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
209bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
210bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm14
211bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
212bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
213bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm14
214bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm10
215bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
216bc3d5698SJohn Baldwin
217bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm14
218bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm14
219bc3d5698SJohn Baldwin	movd	8(%r8),%xmm5
220bc3d5698SJohn Baldwin	movd	8(%r9),%xmm0
221bc3d5698SJohn Baldwin	movd	8(%r10),%xmm1
222bc3d5698SJohn Baldwin	movd	8(%r11),%xmm2
223bc3d5698SJohn Baldwin	punpckldq	%xmm1,%xmm5
224bc3d5698SJohn Baldwin	punpckldq	%xmm2,%xmm0
225bc3d5698SJohn Baldwin	punpckldq	%xmm0,%xmm5
226bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm7
227bc3d5698SJohn Baldwin.byte	102,15,56,0,238
228bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm2
229bc3d5698SJohn Baldwin
230bc3d5698SJohn Baldwin	psrld	$6,%xmm7
231bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm1
232bc3d5698SJohn Baldwin	pslld	$7,%xmm2
233bc3d5698SJohn Baldwin	movdqa	%xmm5,32-128(%rax)
234bc3d5698SJohn Baldwin	paddd	%xmm13,%xmm5
235bc3d5698SJohn Baldwin
236bc3d5698SJohn Baldwin	psrld	$11,%xmm1
237bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
238bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
239bc3d5698SJohn Baldwin	paddd	-64(%rbp),%xmm5
240bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
241bc3d5698SJohn Baldwin
242bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
243bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm0
244bc3d5698SJohn Baldwin
245bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
246bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm3
247bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
248bc3d5698SJohn Baldwin	pandn	%xmm12,%xmm0
249bc3d5698SJohn Baldwin	pand	%xmm11,%xmm3
250bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
251bc3d5698SJohn Baldwin
252bc3d5698SJohn Baldwin
253bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm1
254bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
255bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm2
256bc3d5698SJohn Baldwin	psrld	$2,%xmm1
257bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
258bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
259bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm3
260bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm7
261bc3d5698SJohn Baldwin	pslld	$10,%xmm2
262bc3d5698SJohn Baldwin	pxor	%xmm14,%xmm3
263bc3d5698SJohn Baldwin
264bc3d5698SJohn Baldwin
265bc3d5698SJohn Baldwin	psrld	$13,%xmm7
266bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
267bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
268bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
269bc3d5698SJohn Baldwin	pand	%xmm3,%xmm4
270bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
271bc3d5698SJohn Baldwin
272bc3d5698SJohn Baldwin
273bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
274bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
275bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm13
276bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
277bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
278bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm13
279bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm9
280bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
281bc3d5698SJohn Baldwin
282bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm13
283bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm13
284bc3d5698SJohn Baldwin	movd	12(%r8),%xmm5
285bc3d5698SJohn Baldwin	movd	12(%r9),%xmm0
286bc3d5698SJohn Baldwin	movd	12(%r10),%xmm1
287bc3d5698SJohn Baldwin	movd	12(%r11),%xmm2
288bc3d5698SJohn Baldwin	punpckldq	%xmm1,%xmm5
289bc3d5698SJohn Baldwin	punpckldq	%xmm2,%xmm0
290bc3d5698SJohn Baldwin	punpckldq	%xmm0,%xmm5
291bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm7
292bc3d5698SJohn Baldwin
293bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm2
294bc3d5698SJohn Baldwin.byte	102,15,56,0,238
295bc3d5698SJohn Baldwin	psrld	$6,%xmm7
296bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm1
297bc3d5698SJohn Baldwin	pslld	$7,%xmm2
298bc3d5698SJohn Baldwin	movdqa	%xmm5,48-128(%rax)
299bc3d5698SJohn Baldwin	paddd	%xmm12,%xmm5
300bc3d5698SJohn Baldwin
301bc3d5698SJohn Baldwin	psrld	$11,%xmm1
302bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
303bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
304bc3d5698SJohn Baldwin	paddd	-32(%rbp),%xmm5
305bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
306bc3d5698SJohn Baldwin
307bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
308bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm0
309bc3d5698SJohn Baldwin
310bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
311bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm4
312bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
313bc3d5698SJohn Baldwin	pandn	%xmm11,%xmm0
314bc3d5698SJohn Baldwin	pand	%xmm10,%xmm4
315bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
316bc3d5698SJohn Baldwin
317bc3d5698SJohn Baldwin
318bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm1
319bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
320bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm2
321bc3d5698SJohn Baldwin	psrld	$2,%xmm1
322bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
323bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
324bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm4
325bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm7
326bc3d5698SJohn Baldwin	pslld	$10,%xmm2
327bc3d5698SJohn Baldwin	pxor	%xmm13,%xmm4
328bc3d5698SJohn Baldwin
329bc3d5698SJohn Baldwin
330bc3d5698SJohn Baldwin	psrld	$13,%xmm7
331bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
332bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
333bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
334bc3d5698SJohn Baldwin	pand	%xmm4,%xmm3
335bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
336bc3d5698SJohn Baldwin
337bc3d5698SJohn Baldwin
338bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
339bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
340bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm12
341bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
342bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
343bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm12
344bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm8
345bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
346bc3d5698SJohn Baldwin
347bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm12
348bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm12
349bc3d5698SJohn Baldwin	movd	16(%r8),%xmm5
350bc3d5698SJohn Baldwin	movd	16(%r9),%xmm0
351bc3d5698SJohn Baldwin	movd	16(%r10),%xmm1
352bc3d5698SJohn Baldwin	movd	16(%r11),%xmm2
353bc3d5698SJohn Baldwin	punpckldq	%xmm1,%xmm5
354bc3d5698SJohn Baldwin	punpckldq	%xmm2,%xmm0
355bc3d5698SJohn Baldwin	punpckldq	%xmm0,%xmm5
356bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm7
357bc3d5698SJohn Baldwin.byte	102,15,56,0,238
358bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm2
359bc3d5698SJohn Baldwin
360bc3d5698SJohn Baldwin	psrld	$6,%xmm7
361bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm1
362bc3d5698SJohn Baldwin	pslld	$7,%xmm2
363bc3d5698SJohn Baldwin	movdqa	%xmm5,64-128(%rax)
364bc3d5698SJohn Baldwin	paddd	%xmm11,%xmm5
365bc3d5698SJohn Baldwin
366bc3d5698SJohn Baldwin	psrld	$11,%xmm1
367bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
368bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
369bc3d5698SJohn Baldwin	paddd	0(%rbp),%xmm5
370bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
371bc3d5698SJohn Baldwin
372bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
373bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm0
374bc3d5698SJohn Baldwin
375bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
376bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm3
377bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
378bc3d5698SJohn Baldwin	pandn	%xmm10,%xmm0
379bc3d5698SJohn Baldwin	pand	%xmm9,%xmm3
380bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
381bc3d5698SJohn Baldwin
382bc3d5698SJohn Baldwin
383bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm1
384bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
385bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm2
386bc3d5698SJohn Baldwin	psrld	$2,%xmm1
387bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
388bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
389bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm3
390bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm7
391bc3d5698SJohn Baldwin	pslld	$10,%xmm2
392bc3d5698SJohn Baldwin	pxor	%xmm12,%xmm3
393bc3d5698SJohn Baldwin
394bc3d5698SJohn Baldwin
395bc3d5698SJohn Baldwin	psrld	$13,%xmm7
396bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
397bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
398bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
399bc3d5698SJohn Baldwin	pand	%xmm3,%xmm4
400bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
401bc3d5698SJohn Baldwin
402bc3d5698SJohn Baldwin
403bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
404bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
405bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm11
406bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
407bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
408bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm11
409bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm15
410bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
411bc3d5698SJohn Baldwin
412bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm11
413bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm11
414bc3d5698SJohn Baldwin	movd	20(%r8),%xmm5
415bc3d5698SJohn Baldwin	movd	20(%r9),%xmm0
416bc3d5698SJohn Baldwin	movd	20(%r10),%xmm1
417bc3d5698SJohn Baldwin	movd	20(%r11),%xmm2
418bc3d5698SJohn Baldwin	punpckldq	%xmm1,%xmm5
419bc3d5698SJohn Baldwin	punpckldq	%xmm2,%xmm0
420bc3d5698SJohn Baldwin	punpckldq	%xmm0,%xmm5
421bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm7
422bc3d5698SJohn Baldwin
423bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm2
424bc3d5698SJohn Baldwin.byte	102,15,56,0,238
425bc3d5698SJohn Baldwin	psrld	$6,%xmm7
426bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm1
427bc3d5698SJohn Baldwin	pslld	$7,%xmm2
428bc3d5698SJohn Baldwin	movdqa	%xmm5,80-128(%rax)
429bc3d5698SJohn Baldwin	paddd	%xmm10,%xmm5
430bc3d5698SJohn Baldwin
431bc3d5698SJohn Baldwin	psrld	$11,%xmm1
432bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
433bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
434bc3d5698SJohn Baldwin	paddd	32(%rbp),%xmm5
435bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
436bc3d5698SJohn Baldwin
437bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
438bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm0
439bc3d5698SJohn Baldwin
440bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
441bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm4
442bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
443bc3d5698SJohn Baldwin	pandn	%xmm9,%xmm0
444bc3d5698SJohn Baldwin	pand	%xmm8,%xmm4
445bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
446bc3d5698SJohn Baldwin
447bc3d5698SJohn Baldwin
448bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm1
449bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
450bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm2
451bc3d5698SJohn Baldwin	psrld	$2,%xmm1
452bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
453bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
454bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm4
455bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm7
456bc3d5698SJohn Baldwin	pslld	$10,%xmm2
457bc3d5698SJohn Baldwin	pxor	%xmm11,%xmm4
458bc3d5698SJohn Baldwin
459bc3d5698SJohn Baldwin
460bc3d5698SJohn Baldwin	psrld	$13,%xmm7
461bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
462bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
463bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
464bc3d5698SJohn Baldwin	pand	%xmm4,%xmm3
465bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
466bc3d5698SJohn Baldwin
467bc3d5698SJohn Baldwin
468bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
469bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
470bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm10
471bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
472bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
473bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm10
474bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm14
475bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
476bc3d5698SJohn Baldwin
477bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm10
478bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm10
479bc3d5698SJohn Baldwin	movd	24(%r8),%xmm5
480bc3d5698SJohn Baldwin	movd	24(%r9),%xmm0
481bc3d5698SJohn Baldwin	movd	24(%r10),%xmm1
482bc3d5698SJohn Baldwin	movd	24(%r11),%xmm2
483bc3d5698SJohn Baldwin	punpckldq	%xmm1,%xmm5
484bc3d5698SJohn Baldwin	punpckldq	%xmm2,%xmm0
485bc3d5698SJohn Baldwin	punpckldq	%xmm0,%xmm5
486bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm7
487bc3d5698SJohn Baldwin.byte	102,15,56,0,238
488bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm2
489bc3d5698SJohn Baldwin
490bc3d5698SJohn Baldwin	psrld	$6,%xmm7
491bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm1
492bc3d5698SJohn Baldwin	pslld	$7,%xmm2
493bc3d5698SJohn Baldwin	movdqa	%xmm5,96-128(%rax)
494bc3d5698SJohn Baldwin	paddd	%xmm9,%xmm5
495bc3d5698SJohn Baldwin
496bc3d5698SJohn Baldwin	psrld	$11,%xmm1
497bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
498bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
499bc3d5698SJohn Baldwin	paddd	64(%rbp),%xmm5
500bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
501bc3d5698SJohn Baldwin
502bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
503bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm0
504bc3d5698SJohn Baldwin
505bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
506bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm3
507bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
508bc3d5698SJohn Baldwin	pandn	%xmm8,%xmm0
509bc3d5698SJohn Baldwin	pand	%xmm15,%xmm3
510bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
511bc3d5698SJohn Baldwin
512bc3d5698SJohn Baldwin
513bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm1
514bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
515bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm2
516bc3d5698SJohn Baldwin	psrld	$2,%xmm1
517bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
518bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
519bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm3
520bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm7
521bc3d5698SJohn Baldwin	pslld	$10,%xmm2
522bc3d5698SJohn Baldwin	pxor	%xmm10,%xmm3
523bc3d5698SJohn Baldwin
524bc3d5698SJohn Baldwin
525bc3d5698SJohn Baldwin	psrld	$13,%xmm7
526bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
527bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
528bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
529bc3d5698SJohn Baldwin	pand	%xmm3,%xmm4
530bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
531bc3d5698SJohn Baldwin
532bc3d5698SJohn Baldwin
533bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
534bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
535bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm9
536bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
537bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
538bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm9
539bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm13
540bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
541bc3d5698SJohn Baldwin
542bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm9
543bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm9
544bc3d5698SJohn Baldwin	movd	28(%r8),%xmm5
545bc3d5698SJohn Baldwin	movd	28(%r9),%xmm0
546bc3d5698SJohn Baldwin	movd	28(%r10),%xmm1
547bc3d5698SJohn Baldwin	movd	28(%r11),%xmm2
548bc3d5698SJohn Baldwin	punpckldq	%xmm1,%xmm5
549bc3d5698SJohn Baldwin	punpckldq	%xmm2,%xmm0
550bc3d5698SJohn Baldwin	punpckldq	%xmm0,%xmm5
551bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm7
552bc3d5698SJohn Baldwin
553bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm2
554bc3d5698SJohn Baldwin.byte	102,15,56,0,238
555bc3d5698SJohn Baldwin	psrld	$6,%xmm7
556bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm1
557bc3d5698SJohn Baldwin	pslld	$7,%xmm2
558bc3d5698SJohn Baldwin	movdqa	%xmm5,112-128(%rax)
559bc3d5698SJohn Baldwin	paddd	%xmm8,%xmm5
560bc3d5698SJohn Baldwin
561bc3d5698SJohn Baldwin	psrld	$11,%xmm1
562bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
563bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
564bc3d5698SJohn Baldwin	paddd	96(%rbp),%xmm5
565bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
566bc3d5698SJohn Baldwin
567bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
568bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm0
569bc3d5698SJohn Baldwin
570bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
571bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm4
572bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
573bc3d5698SJohn Baldwin	pandn	%xmm15,%xmm0
574bc3d5698SJohn Baldwin	pand	%xmm14,%xmm4
575bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
576bc3d5698SJohn Baldwin
577bc3d5698SJohn Baldwin
578bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm1
579bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
580bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm2
581bc3d5698SJohn Baldwin	psrld	$2,%xmm1
582bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
583bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
584bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm4
585bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm7
586bc3d5698SJohn Baldwin	pslld	$10,%xmm2
587bc3d5698SJohn Baldwin	pxor	%xmm9,%xmm4
588bc3d5698SJohn Baldwin
589bc3d5698SJohn Baldwin
590bc3d5698SJohn Baldwin	psrld	$13,%xmm7
591bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
592bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
593bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
594bc3d5698SJohn Baldwin	pand	%xmm4,%xmm3
595bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
596bc3d5698SJohn Baldwin
597bc3d5698SJohn Baldwin
598bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
599bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
600bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm8
601bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
602bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
603bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm8
604bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm12
605bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
606bc3d5698SJohn Baldwin
607bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm8
608bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm8
609bc3d5698SJohn Baldwin	leaq	256(%rbp),%rbp
610bc3d5698SJohn Baldwin	movd	32(%r8),%xmm5
611bc3d5698SJohn Baldwin	movd	32(%r9),%xmm0
612bc3d5698SJohn Baldwin	movd	32(%r10),%xmm1
613bc3d5698SJohn Baldwin	movd	32(%r11),%xmm2
614bc3d5698SJohn Baldwin	punpckldq	%xmm1,%xmm5
615bc3d5698SJohn Baldwin	punpckldq	%xmm2,%xmm0
616bc3d5698SJohn Baldwin	punpckldq	%xmm0,%xmm5
617bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm7
618bc3d5698SJohn Baldwin.byte	102,15,56,0,238
619bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm2
620bc3d5698SJohn Baldwin
621bc3d5698SJohn Baldwin	psrld	$6,%xmm7
622bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm1
623bc3d5698SJohn Baldwin	pslld	$7,%xmm2
624bc3d5698SJohn Baldwin	movdqa	%xmm5,128-128(%rax)
625bc3d5698SJohn Baldwin	paddd	%xmm15,%xmm5
626bc3d5698SJohn Baldwin
627bc3d5698SJohn Baldwin	psrld	$11,%xmm1
628bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
629bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
630bc3d5698SJohn Baldwin	paddd	-128(%rbp),%xmm5
631bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
632bc3d5698SJohn Baldwin
633bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
634bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm0
635bc3d5698SJohn Baldwin
636bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
637bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm3
638bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
639bc3d5698SJohn Baldwin	pandn	%xmm14,%xmm0
640bc3d5698SJohn Baldwin	pand	%xmm13,%xmm3
641bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
642bc3d5698SJohn Baldwin
643bc3d5698SJohn Baldwin
644bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm1
645bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
646bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm2
647bc3d5698SJohn Baldwin	psrld	$2,%xmm1
648bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
649bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
650bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm3
651bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm7
652bc3d5698SJohn Baldwin	pslld	$10,%xmm2
653bc3d5698SJohn Baldwin	pxor	%xmm8,%xmm3
654bc3d5698SJohn Baldwin
655bc3d5698SJohn Baldwin
656bc3d5698SJohn Baldwin	psrld	$13,%xmm7
657bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
658bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
659bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
660bc3d5698SJohn Baldwin	pand	%xmm3,%xmm4
661bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
662bc3d5698SJohn Baldwin
663bc3d5698SJohn Baldwin
664bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
665bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
666bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm15
667bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
668bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
669bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm15
670bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm11
671bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
672bc3d5698SJohn Baldwin
673bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm15
674bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm15
675bc3d5698SJohn Baldwin	movd	36(%r8),%xmm5
676bc3d5698SJohn Baldwin	movd	36(%r9),%xmm0
677bc3d5698SJohn Baldwin	movd	36(%r10),%xmm1
678bc3d5698SJohn Baldwin	movd	36(%r11),%xmm2
679bc3d5698SJohn Baldwin	punpckldq	%xmm1,%xmm5
680bc3d5698SJohn Baldwin	punpckldq	%xmm2,%xmm0
681bc3d5698SJohn Baldwin	punpckldq	%xmm0,%xmm5
682bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm7
683bc3d5698SJohn Baldwin
684bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm2
685bc3d5698SJohn Baldwin.byte	102,15,56,0,238
686bc3d5698SJohn Baldwin	psrld	$6,%xmm7
687bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm1
688bc3d5698SJohn Baldwin	pslld	$7,%xmm2
689bc3d5698SJohn Baldwin	movdqa	%xmm5,144-128(%rax)
690bc3d5698SJohn Baldwin	paddd	%xmm14,%xmm5
691bc3d5698SJohn Baldwin
692bc3d5698SJohn Baldwin	psrld	$11,%xmm1
693bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
694bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
695bc3d5698SJohn Baldwin	paddd	-96(%rbp),%xmm5
696bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
697bc3d5698SJohn Baldwin
698bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
699bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm0
700bc3d5698SJohn Baldwin
701bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
702bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm4
703bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
704bc3d5698SJohn Baldwin	pandn	%xmm13,%xmm0
705bc3d5698SJohn Baldwin	pand	%xmm12,%xmm4
706bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
707bc3d5698SJohn Baldwin
708bc3d5698SJohn Baldwin
709bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm1
710bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
711bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm2
712bc3d5698SJohn Baldwin	psrld	$2,%xmm1
713bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
714bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
715bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm4
716bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm7
717bc3d5698SJohn Baldwin	pslld	$10,%xmm2
718bc3d5698SJohn Baldwin	pxor	%xmm15,%xmm4
719bc3d5698SJohn Baldwin
720bc3d5698SJohn Baldwin
721bc3d5698SJohn Baldwin	psrld	$13,%xmm7
722bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
723bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
724bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
725bc3d5698SJohn Baldwin	pand	%xmm4,%xmm3
726bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
727bc3d5698SJohn Baldwin
728bc3d5698SJohn Baldwin
729bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
730bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
731bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm14
732bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
733bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
734bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm14
735bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm10
736bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
737bc3d5698SJohn Baldwin
738bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm14
739bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm14
740bc3d5698SJohn Baldwin	movd	40(%r8),%xmm5
741bc3d5698SJohn Baldwin	movd	40(%r9),%xmm0
742bc3d5698SJohn Baldwin	movd	40(%r10),%xmm1
743bc3d5698SJohn Baldwin	movd	40(%r11),%xmm2
744bc3d5698SJohn Baldwin	punpckldq	%xmm1,%xmm5
745bc3d5698SJohn Baldwin	punpckldq	%xmm2,%xmm0
746bc3d5698SJohn Baldwin	punpckldq	%xmm0,%xmm5
747bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm7
748bc3d5698SJohn Baldwin.byte	102,15,56,0,238
749bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm2
750bc3d5698SJohn Baldwin
751bc3d5698SJohn Baldwin	psrld	$6,%xmm7
752bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm1
753bc3d5698SJohn Baldwin	pslld	$7,%xmm2
754bc3d5698SJohn Baldwin	movdqa	%xmm5,160-128(%rax)
755bc3d5698SJohn Baldwin	paddd	%xmm13,%xmm5
756bc3d5698SJohn Baldwin
757bc3d5698SJohn Baldwin	psrld	$11,%xmm1
758bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
759bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
760bc3d5698SJohn Baldwin	paddd	-64(%rbp),%xmm5
761bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
762bc3d5698SJohn Baldwin
763bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
764bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm0
765bc3d5698SJohn Baldwin
766bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
767bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm3
768bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
769bc3d5698SJohn Baldwin	pandn	%xmm12,%xmm0
770bc3d5698SJohn Baldwin	pand	%xmm11,%xmm3
771bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
772bc3d5698SJohn Baldwin
773bc3d5698SJohn Baldwin
774bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm1
775bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
776bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm2
777bc3d5698SJohn Baldwin	psrld	$2,%xmm1
778bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
779bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
780bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm3
781bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm7
782bc3d5698SJohn Baldwin	pslld	$10,%xmm2
783bc3d5698SJohn Baldwin	pxor	%xmm14,%xmm3
784bc3d5698SJohn Baldwin
785bc3d5698SJohn Baldwin
786bc3d5698SJohn Baldwin	psrld	$13,%xmm7
787bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
788bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
789bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
790bc3d5698SJohn Baldwin	pand	%xmm3,%xmm4
791bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
792bc3d5698SJohn Baldwin
793bc3d5698SJohn Baldwin
794bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
795bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
796bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm13
797bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
798bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
799bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm13
800bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm9
801bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
802bc3d5698SJohn Baldwin
803bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm13
804bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm13
805bc3d5698SJohn Baldwin	movd	44(%r8),%xmm5
806bc3d5698SJohn Baldwin	movd	44(%r9),%xmm0
807bc3d5698SJohn Baldwin	movd	44(%r10),%xmm1
808bc3d5698SJohn Baldwin	movd	44(%r11),%xmm2
809bc3d5698SJohn Baldwin	punpckldq	%xmm1,%xmm5
810bc3d5698SJohn Baldwin	punpckldq	%xmm2,%xmm0
811bc3d5698SJohn Baldwin	punpckldq	%xmm0,%xmm5
812bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm7
813bc3d5698SJohn Baldwin
814bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm2
815bc3d5698SJohn Baldwin.byte	102,15,56,0,238
816bc3d5698SJohn Baldwin	psrld	$6,%xmm7
817bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm1
818bc3d5698SJohn Baldwin	pslld	$7,%xmm2
819bc3d5698SJohn Baldwin	movdqa	%xmm5,176-128(%rax)
820bc3d5698SJohn Baldwin	paddd	%xmm12,%xmm5
821bc3d5698SJohn Baldwin
822bc3d5698SJohn Baldwin	psrld	$11,%xmm1
823bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
824bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
825bc3d5698SJohn Baldwin	paddd	-32(%rbp),%xmm5
826bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
827bc3d5698SJohn Baldwin
828bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
829bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm0
830bc3d5698SJohn Baldwin
831bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
832bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm4
833bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
834bc3d5698SJohn Baldwin	pandn	%xmm11,%xmm0
835bc3d5698SJohn Baldwin	pand	%xmm10,%xmm4
836bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
837bc3d5698SJohn Baldwin
838bc3d5698SJohn Baldwin
839bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm1
840bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
841bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm2
842bc3d5698SJohn Baldwin	psrld	$2,%xmm1
843bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
844bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
845bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm4
846bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm7
847bc3d5698SJohn Baldwin	pslld	$10,%xmm2
848bc3d5698SJohn Baldwin	pxor	%xmm13,%xmm4
849bc3d5698SJohn Baldwin
850bc3d5698SJohn Baldwin
851bc3d5698SJohn Baldwin	psrld	$13,%xmm7
852bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
853bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
854bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
855bc3d5698SJohn Baldwin	pand	%xmm4,%xmm3
856bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
857bc3d5698SJohn Baldwin
858bc3d5698SJohn Baldwin
859bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
860bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
861bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm12
862bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
863bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
864bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm12
865bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm8
866bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
867bc3d5698SJohn Baldwin
868bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm12
869bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm12
870bc3d5698SJohn Baldwin	movd	48(%r8),%xmm5
871bc3d5698SJohn Baldwin	movd	48(%r9),%xmm0
872bc3d5698SJohn Baldwin	movd	48(%r10),%xmm1
873bc3d5698SJohn Baldwin	movd	48(%r11),%xmm2
874bc3d5698SJohn Baldwin	punpckldq	%xmm1,%xmm5
875bc3d5698SJohn Baldwin	punpckldq	%xmm2,%xmm0
876bc3d5698SJohn Baldwin	punpckldq	%xmm0,%xmm5
877bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm7
878bc3d5698SJohn Baldwin.byte	102,15,56,0,238
879bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm2
880bc3d5698SJohn Baldwin
881bc3d5698SJohn Baldwin	psrld	$6,%xmm7
882bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm1
883bc3d5698SJohn Baldwin	pslld	$7,%xmm2
884bc3d5698SJohn Baldwin	movdqa	%xmm5,192-128(%rax)
885bc3d5698SJohn Baldwin	paddd	%xmm11,%xmm5
886bc3d5698SJohn Baldwin
887bc3d5698SJohn Baldwin	psrld	$11,%xmm1
888bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
889bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
890bc3d5698SJohn Baldwin	paddd	0(%rbp),%xmm5
891bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
892bc3d5698SJohn Baldwin
893bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
894bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm0
895bc3d5698SJohn Baldwin
896bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
897bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm3
898bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
899bc3d5698SJohn Baldwin	pandn	%xmm10,%xmm0
900bc3d5698SJohn Baldwin	pand	%xmm9,%xmm3
901bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
902bc3d5698SJohn Baldwin
903bc3d5698SJohn Baldwin
904bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm1
905bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
906bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm2
907bc3d5698SJohn Baldwin	psrld	$2,%xmm1
908bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
909bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
910bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm3
911bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm7
912bc3d5698SJohn Baldwin	pslld	$10,%xmm2
913bc3d5698SJohn Baldwin	pxor	%xmm12,%xmm3
914bc3d5698SJohn Baldwin
915bc3d5698SJohn Baldwin
916bc3d5698SJohn Baldwin	psrld	$13,%xmm7
917bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
918bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
919bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
920bc3d5698SJohn Baldwin	pand	%xmm3,%xmm4
921bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
922bc3d5698SJohn Baldwin
923bc3d5698SJohn Baldwin
924bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
925bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
926bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm11
927bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
928bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
929bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm11
930bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm15
931bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
932bc3d5698SJohn Baldwin
933bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm11
934bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm11
935bc3d5698SJohn Baldwin	movd	52(%r8),%xmm5
936bc3d5698SJohn Baldwin	movd	52(%r9),%xmm0
937bc3d5698SJohn Baldwin	movd	52(%r10),%xmm1
938bc3d5698SJohn Baldwin	movd	52(%r11),%xmm2
939bc3d5698SJohn Baldwin	punpckldq	%xmm1,%xmm5
940bc3d5698SJohn Baldwin	punpckldq	%xmm2,%xmm0
941bc3d5698SJohn Baldwin	punpckldq	%xmm0,%xmm5
942bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm7
943bc3d5698SJohn Baldwin
944bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm2
945bc3d5698SJohn Baldwin.byte	102,15,56,0,238
946bc3d5698SJohn Baldwin	psrld	$6,%xmm7
947bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm1
948bc3d5698SJohn Baldwin	pslld	$7,%xmm2
949bc3d5698SJohn Baldwin	movdqa	%xmm5,208-128(%rax)
950bc3d5698SJohn Baldwin	paddd	%xmm10,%xmm5
951bc3d5698SJohn Baldwin
952bc3d5698SJohn Baldwin	psrld	$11,%xmm1
953bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
954bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
955bc3d5698SJohn Baldwin	paddd	32(%rbp),%xmm5
956bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
957bc3d5698SJohn Baldwin
958bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
959bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm0
960bc3d5698SJohn Baldwin
961bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
962bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm4
963bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
964bc3d5698SJohn Baldwin	pandn	%xmm9,%xmm0
965bc3d5698SJohn Baldwin	pand	%xmm8,%xmm4
966bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
967bc3d5698SJohn Baldwin
968bc3d5698SJohn Baldwin
969bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm1
970bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
971bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm2
972bc3d5698SJohn Baldwin	psrld	$2,%xmm1
973bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
974bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
975bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm4
976bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm7
977bc3d5698SJohn Baldwin	pslld	$10,%xmm2
978bc3d5698SJohn Baldwin	pxor	%xmm11,%xmm4
979bc3d5698SJohn Baldwin
980bc3d5698SJohn Baldwin
981bc3d5698SJohn Baldwin	psrld	$13,%xmm7
982bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
983bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
984bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
985bc3d5698SJohn Baldwin	pand	%xmm4,%xmm3
986bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
987bc3d5698SJohn Baldwin
988bc3d5698SJohn Baldwin
989bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
990bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
991bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm10
992bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
993bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
994bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm10
995bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm14
996bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
997bc3d5698SJohn Baldwin
998bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm10
999bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm10
1000bc3d5698SJohn Baldwin	movd	56(%r8),%xmm5
1001bc3d5698SJohn Baldwin	movd	56(%r9),%xmm0
1002bc3d5698SJohn Baldwin	movd	56(%r10),%xmm1
1003bc3d5698SJohn Baldwin	movd	56(%r11),%xmm2
1004bc3d5698SJohn Baldwin	punpckldq	%xmm1,%xmm5
1005bc3d5698SJohn Baldwin	punpckldq	%xmm2,%xmm0
1006bc3d5698SJohn Baldwin	punpckldq	%xmm0,%xmm5
1007bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm7
1008bc3d5698SJohn Baldwin.byte	102,15,56,0,238
1009bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm2
1010bc3d5698SJohn Baldwin
1011bc3d5698SJohn Baldwin	psrld	$6,%xmm7
1012bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm1
1013bc3d5698SJohn Baldwin	pslld	$7,%xmm2
1014bc3d5698SJohn Baldwin	movdqa	%xmm5,224-128(%rax)
1015bc3d5698SJohn Baldwin	paddd	%xmm9,%xmm5
1016bc3d5698SJohn Baldwin
1017bc3d5698SJohn Baldwin	psrld	$11,%xmm1
1018bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1019bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
1020bc3d5698SJohn Baldwin	paddd	64(%rbp),%xmm5
1021bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1022bc3d5698SJohn Baldwin
1023bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
1024bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm0
1025bc3d5698SJohn Baldwin
1026bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1027bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm3
1028bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
1029bc3d5698SJohn Baldwin	pandn	%xmm8,%xmm0
1030bc3d5698SJohn Baldwin	pand	%xmm15,%xmm3
1031bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1032bc3d5698SJohn Baldwin
1033bc3d5698SJohn Baldwin
1034bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm1
1035bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1036bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm2
1037bc3d5698SJohn Baldwin	psrld	$2,%xmm1
1038bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
1039bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
1040bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm3
1041bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm7
1042bc3d5698SJohn Baldwin	pslld	$10,%xmm2
1043bc3d5698SJohn Baldwin	pxor	%xmm10,%xmm3
1044bc3d5698SJohn Baldwin
1045bc3d5698SJohn Baldwin
1046bc3d5698SJohn Baldwin	psrld	$13,%xmm7
1047bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
1048bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
1049bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
1050bc3d5698SJohn Baldwin	pand	%xmm3,%xmm4
1051bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
1052bc3d5698SJohn Baldwin
1053bc3d5698SJohn Baldwin
1054bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
1055bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
1056bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm9
1057bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
1058bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1059bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm9
1060bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm13
1061bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1062bc3d5698SJohn Baldwin
1063bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm9
1064bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm9
1065bc3d5698SJohn Baldwin	movd	60(%r8),%xmm5
1066bc3d5698SJohn Baldwin	leaq	64(%r8),%r8
1067bc3d5698SJohn Baldwin	movd	60(%r9),%xmm0
1068bc3d5698SJohn Baldwin	leaq	64(%r9),%r9
1069bc3d5698SJohn Baldwin	movd	60(%r10),%xmm1
1070bc3d5698SJohn Baldwin	leaq	64(%r10),%r10
1071bc3d5698SJohn Baldwin	movd	60(%r11),%xmm2
1072bc3d5698SJohn Baldwin	leaq	64(%r11),%r11
1073bc3d5698SJohn Baldwin	punpckldq	%xmm1,%xmm5
1074bc3d5698SJohn Baldwin	punpckldq	%xmm2,%xmm0
1075bc3d5698SJohn Baldwin	punpckldq	%xmm0,%xmm5
1076bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm7
1077bc3d5698SJohn Baldwin
1078bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm2
1079bc3d5698SJohn Baldwin.byte	102,15,56,0,238
1080bc3d5698SJohn Baldwin	psrld	$6,%xmm7
1081bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm1
1082bc3d5698SJohn Baldwin	pslld	$7,%xmm2
1083bc3d5698SJohn Baldwin	movdqa	%xmm5,240-128(%rax)
1084bc3d5698SJohn Baldwin	paddd	%xmm8,%xmm5
1085bc3d5698SJohn Baldwin
1086bc3d5698SJohn Baldwin	psrld	$11,%xmm1
1087bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1088bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
1089bc3d5698SJohn Baldwin	paddd	96(%rbp),%xmm5
1090bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1091bc3d5698SJohn Baldwin
1092bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
1093bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm0
1094bc3d5698SJohn Baldwin	prefetcht0	63(%r8)
1095bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1096bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm4
1097bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
1098bc3d5698SJohn Baldwin	pandn	%xmm15,%xmm0
1099bc3d5698SJohn Baldwin	pand	%xmm14,%xmm4
1100bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1101bc3d5698SJohn Baldwin
1102bc3d5698SJohn Baldwin	prefetcht0	63(%r9)
1103bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm1
1104bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1105bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm2
1106bc3d5698SJohn Baldwin	psrld	$2,%xmm1
1107bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
1108bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
1109bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm4
1110bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm7
1111bc3d5698SJohn Baldwin	pslld	$10,%xmm2
1112bc3d5698SJohn Baldwin	pxor	%xmm9,%xmm4
1113bc3d5698SJohn Baldwin
1114bc3d5698SJohn Baldwin	prefetcht0	63(%r10)
1115bc3d5698SJohn Baldwin	psrld	$13,%xmm7
1116bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
1117bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
1118bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
1119bc3d5698SJohn Baldwin	pand	%xmm4,%xmm3
1120bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
1121bc3d5698SJohn Baldwin
1122bc3d5698SJohn Baldwin	prefetcht0	63(%r11)
1123bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
1124bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
1125bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm8
1126bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
1127bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1128bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm8
1129bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm12
1130bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1131bc3d5698SJohn Baldwin
1132bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm8
1133bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm8
1134bc3d5698SJohn Baldwin	leaq	256(%rbp),%rbp
1135bc3d5698SJohn Baldwin	movdqu	0-128(%rax),%xmm5
1136bc3d5698SJohn Baldwin	movl	$3,%ecx
1137bc3d5698SJohn Baldwin	jmp	.Loop_16_xx
1138bc3d5698SJohn Baldwin.align	32
1139bc3d5698SJohn Baldwin.Loop_16_xx:
1140bc3d5698SJohn Baldwin	movdqa	16-128(%rax),%xmm6
1141bc3d5698SJohn Baldwin	paddd	144-128(%rax),%xmm5
1142bc3d5698SJohn Baldwin
1143bc3d5698SJohn Baldwin	movdqa	%xmm6,%xmm7
1144bc3d5698SJohn Baldwin	movdqa	%xmm6,%xmm1
1145bc3d5698SJohn Baldwin	psrld	$3,%xmm7
1146bc3d5698SJohn Baldwin	movdqa	%xmm6,%xmm2
1147bc3d5698SJohn Baldwin
1148bc3d5698SJohn Baldwin	psrld	$7,%xmm1
1149bc3d5698SJohn Baldwin	movdqa	224-128(%rax),%xmm0
1150bc3d5698SJohn Baldwin	pslld	$14,%xmm2
1151bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1152bc3d5698SJohn Baldwin	psrld	$18-7,%xmm1
1153bc3d5698SJohn Baldwin	movdqa	%xmm0,%xmm3
1154bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1155bc3d5698SJohn Baldwin	pslld	$25-14,%xmm2
1156bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1157bc3d5698SJohn Baldwin	psrld	$10,%xmm0
1158bc3d5698SJohn Baldwin	movdqa	%xmm3,%xmm1
1159bc3d5698SJohn Baldwin
1160bc3d5698SJohn Baldwin	psrld	$17,%xmm3
1161bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1162bc3d5698SJohn Baldwin	pslld	$13,%xmm1
1163bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
1164bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
1165bc3d5698SJohn Baldwin	psrld	$19-17,%xmm3
1166bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
1167bc3d5698SJohn Baldwin	pslld	$15-13,%xmm1
1168bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
1169bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
1170bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
1171bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm7
1172bc3d5698SJohn Baldwin
1173bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm2
1174bc3d5698SJohn Baldwin
1175bc3d5698SJohn Baldwin	psrld	$6,%xmm7
1176bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm1
1177bc3d5698SJohn Baldwin	pslld	$7,%xmm2
1178bc3d5698SJohn Baldwin	movdqa	%xmm5,0-128(%rax)
1179bc3d5698SJohn Baldwin	paddd	%xmm15,%xmm5
1180bc3d5698SJohn Baldwin
1181bc3d5698SJohn Baldwin	psrld	$11,%xmm1
1182bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1183bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
1184bc3d5698SJohn Baldwin	paddd	-128(%rbp),%xmm5
1185bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1186bc3d5698SJohn Baldwin
1187bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
1188bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm0
1189bc3d5698SJohn Baldwin
1190bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1191bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm3
1192bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
1193bc3d5698SJohn Baldwin	pandn	%xmm14,%xmm0
1194bc3d5698SJohn Baldwin	pand	%xmm13,%xmm3
1195bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1196bc3d5698SJohn Baldwin
1197bc3d5698SJohn Baldwin
1198bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm1
1199bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1200bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm2
1201bc3d5698SJohn Baldwin	psrld	$2,%xmm1
1202bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
1203bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
1204bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm3
1205bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm7
1206bc3d5698SJohn Baldwin	pslld	$10,%xmm2
1207bc3d5698SJohn Baldwin	pxor	%xmm8,%xmm3
1208bc3d5698SJohn Baldwin
1209bc3d5698SJohn Baldwin
1210bc3d5698SJohn Baldwin	psrld	$13,%xmm7
1211bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
1212bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
1213bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
1214bc3d5698SJohn Baldwin	pand	%xmm3,%xmm4
1215bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
1216bc3d5698SJohn Baldwin
1217bc3d5698SJohn Baldwin
1218bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
1219bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
1220bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm15
1221bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
1222bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1223bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm15
1224bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm11
1225bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1226bc3d5698SJohn Baldwin
1227bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm15
1228bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm15
1229bc3d5698SJohn Baldwin	movdqa	32-128(%rax),%xmm5
1230bc3d5698SJohn Baldwin	paddd	160-128(%rax),%xmm6
1231bc3d5698SJohn Baldwin
1232bc3d5698SJohn Baldwin	movdqa	%xmm5,%xmm7
1233bc3d5698SJohn Baldwin	movdqa	%xmm5,%xmm1
1234bc3d5698SJohn Baldwin	psrld	$3,%xmm7
1235bc3d5698SJohn Baldwin	movdqa	%xmm5,%xmm2
1236bc3d5698SJohn Baldwin
1237bc3d5698SJohn Baldwin	psrld	$7,%xmm1
1238bc3d5698SJohn Baldwin	movdqa	240-128(%rax),%xmm0
1239bc3d5698SJohn Baldwin	pslld	$14,%xmm2
1240bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1241bc3d5698SJohn Baldwin	psrld	$18-7,%xmm1
1242bc3d5698SJohn Baldwin	movdqa	%xmm0,%xmm4
1243bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1244bc3d5698SJohn Baldwin	pslld	$25-14,%xmm2
1245bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1246bc3d5698SJohn Baldwin	psrld	$10,%xmm0
1247bc3d5698SJohn Baldwin	movdqa	%xmm4,%xmm1
1248bc3d5698SJohn Baldwin
1249bc3d5698SJohn Baldwin	psrld	$17,%xmm4
1250bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1251bc3d5698SJohn Baldwin	pslld	$13,%xmm1
1252bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm6
1253bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
1254bc3d5698SJohn Baldwin	psrld	$19-17,%xmm4
1255bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
1256bc3d5698SJohn Baldwin	pslld	$15-13,%xmm1
1257bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
1258bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
1259bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm6
1260bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm7
1261bc3d5698SJohn Baldwin
1262bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm2
1263bc3d5698SJohn Baldwin
1264bc3d5698SJohn Baldwin	psrld	$6,%xmm7
1265bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm1
1266bc3d5698SJohn Baldwin	pslld	$7,%xmm2
1267bc3d5698SJohn Baldwin	movdqa	%xmm6,16-128(%rax)
1268bc3d5698SJohn Baldwin	paddd	%xmm14,%xmm6
1269bc3d5698SJohn Baldwin
1270bc3d5698SJohn Baldwin	psrld	$11,%xmm1
1271bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1272bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
1273bc3d5698SJohn Baldwin	paddd	-96(%rbp),%xmm6
1274bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1275bc3d5698SJohn Baldwin
1276bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
1277bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm0
1278bc3d5698SJohn Baldwin
1279bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1280bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm4
1281bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
1282bc3d5698SJohn Baldwin	pandn	%xmm13,%xmm0
1283bc3d5698SJohn Baldwin	pand	%xmm12,%xmm4
1284bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1285bc3d5698SJohn Baldwin
1286bc3d5698SJohn Baldwin
1287bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm1
1288bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1289bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm2
1290bc3d5698SJohn Baldwin	psrld	$2,%xmm1
1291bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm6
1292bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
1293bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm4
1294bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm7
1295bc3d5698SJohn Baldwin	pslld	$10,%xmm2
1296bc3d5698SJohn Baldwin	pxor	%xmm15,%xmm4
1297bc3d5698SJohn Baldwin
1298bc3d5698SJohn Baldwin
1299bc3d5698SJohn Baldwin	psrld	$13,%xmm7
1300bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
1301bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm6
1302bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
1303bc3d5698SJohn Baldwin	pand	%xmm4,%xmm3
1304bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
1305bc3d5698SJohn Baldwin
1306bc3d5698SJohn Baldwin
1307bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
1308bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
1309bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm14
1310bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
1311bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1312bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm14
1313bc3d5698SJohn Baldwin	paddd	%xmm6,%xmm10
1314bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1315bc3d5698SJohn Baldwin
1316bc3d5698SJohn Baldwin	paddd	%xmm6,%xmm14
1317bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm14
1318bc3d5698SJohn Baldwin	movdqa	48-128(%rax),%xmm6
1319bc3d5698SJohn Baldwin	paddd	176-128(%rax),%xmm5
1320bc3d5698SJohn Baldwin
1321bc3d5698SJohn Baldwin	movdqa	%xmm6,%xmm7
1322bc3d5698SJohn Baldwin	movdqa	%xmm6,%xmm1
1323bc3d5698SJohn Baldwin	psrld	$3,%xmm7
1324bc3d5698SJohn Baldwin	movdqa	%xmm6,%xmm2
1325bc3d5698SJohn Baldwin
1326bc3d5698SJohn Baldwin	psrld	$7,%xmm1
1327bc3d5698SJohn Baldwin	movdqa	0-128(%rax),%xmm0
1328bc3d5698SJohn Baldwin	pslld	$14,%xmm2
1329bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1330bc3d5698SJohn Baldwin	psrld	$18-7,%xmm1
1331bc3d5698SJohn Baldwin	movdqa	%xmm0,%xmm3
1332bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1333bc3d5698SJohn Baldwin	pslld	$25-14,%xmm2
1334bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1335bc3d5698SJohn Baldwin	psrld	$10,%xmm0
1336bc3d5698SJohn Baldwin	movdqa	%xmm3,%xmm1
1337bc3d5698SJohn Baldwin
1338bc3d5698SJohn Baldwin	psrld	$17,%xmm3
1339bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1340bc3d5698SJohn Baldwin	pslld	$13,%xmm1
1341bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
1342bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
1343bc3d5698SJohn Baldwin	psrld	$19-17,%xmm3
1344bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
1345bc3d5698SJohn Baldwin	pslld	$15-13,%xmm1
1346bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
1347bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
1348bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
1349bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm7
1350bc3d5698SJohn Baldwin
1351bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm2
1352bc3d5698SJohn Baldwin
1353bc3d5698SJohn Baldwin	psrld	$6,%xmm7
1354bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm1
1355bc3d5698SJohn Baldwin	pslld	$7,%xmm2
1356bc3d5698SJohn Baldwin	movdqa	%xmm5,32-128(%rax)
1357bc3d5698SJohn Baldwin	paddd	%xmm13,%xmm5
1358bc3d5698SJohn Baldwin
1359bc3d5698SJohn Baldwin	psrld	$11,%xmm1
1360bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1361bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
1362bc3d5698SJohn Baldwin	paddd	-64(%rbp),%xmm5
1363bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1364bc3d5698SJohn Baldwin
1365bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
1366bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm0
1367bc3d5698SJohn Baldwin
1368bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1369bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm3
1370bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
1371bc3d5698SJohn Baldwin	pandn	%xmm12,%xmm0
1372bc3d5698SJohn Baldwin	pand	%xmm11,%xmm3
1373bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1374bc3d5698SJohn Baldwin
1375bc3d5698SJohn Baldwin
1376bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm1
1377bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1378bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm2
1379bc3d5698SJohn Baldwin	psrld	$2,%xmm1
1380bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
1381bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
1382bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm3
1383bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm7
1384bc3d5698SJohn Baldwin	pslld	$10,%xmm2
1385bc3d5698SJohn Baldwin	pxor	%xmm14,%xmm3
1386bc3d5698SJohn Baldwin
1387bc3d5698SJohn Baldwin
1388bc3d5698SJohn Baldwin	psrld	$13,%xmm7
1389bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
1390bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
1391bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
1392bc3d5698SJohn Baldwin	pand	%xmm3,%xmm4
1393bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
1394bc3d5698SJohn Baldwin
1395bc3d5698SJohn Baldwin
1396bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
1397bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
1398bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm13
1399bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
1400bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1401bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm13
1402bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm9
1403bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1404bc3d5698SJohn Baldwin
1405bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm13
1406bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm13
1407bc3d5698SJohn Baldwin	movdqa	64-128(%rax),%xmm5
1408bc3d5698SJohn Baldwin	paddd	192-128(%rax),%xmm6
1409bc3d5698SJohn Baldwin
1410bc3d5698SJohn Baldwin	movdqa	%xmm5,%xmm7
1411bc3d5698SJohn Baldwin	movdqa	%xmm5,%xmm1
1412bc3d5698SJohn Baldwin	psrld	$3,%xmm7
1413bc3d5698SJohn Baldwin	movdqa	%xmm5,%xmm2
1414bc3d5698SJohn Baldwin
1415bc3d5698SJohn Baldwin	psrld	$7,%xmm1
1416bc3d5698SJohn Baldwin	movdqa	16-128(%rax),%xmm0
1417bc3d5698SJohn Baldwin	pslld	$14,%xmm2
1418bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1419bc3d5698SJohn Baldwin	psrld	$18-7,%xmm1
1420bc3d5698SJohn Baldwin	movdqa	%xmm0,%xmm4
1421bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1422bc3d5698SJohn Baldwin	pslld	$25-14,%xmm2
1423bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1424bc3d5698SJohn Baldwin	psrld	$10,%xmm0
1425bc3d5698SJohn Baldwin	movdqa	%xmm4,%xmm1
1426bc3d5698SJohn Baldwin
1427bc3d5698SJohn Baldwin	psrld	$17,%xmm4
1428bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1429bc3d5698SJohn Baldwin	pslld	$13,%xmm1
1430bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm6
1431bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
1432bc3d5698SJohn Baldwin	psrld	$19-17,%xmm4
1433bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
1434bc3d5698SJohn Baldwin	pslld	$15-13,%xmm1
1435bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
1436bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
1437bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm6
1438bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm7
1439bc3d5698SJohn Baldwin
1440bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm2
1441bc3d5698SJohn Baldwin
1442bc3d5698SJohn Baldwin	psrld	$6,%xmm7
1443bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm1
1444bc3d5698SJohn Baldwin	pslld	$7,%xmm2
1445bc3d5698SJohn Baldwin	movdqa	%xmm6,48-128(%rax)
1446bc3d5698SJohn Baldwin	paddd	%xmm12,%xmm6
1447bc3d5698SJohn Baldwin
1448bc3d5698SJohn Baldwin	psrld	$11,%xmm1
1449bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1450bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
1451bc3d5698SJohn Baldwin	paddd	-32(%rbp),%xmm6
1452bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1453bc3d5698SJohn Baldwin
1454bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
1455bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm0
1456bc3d5698SJohn Baldwin
1457bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1458bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm4
1459bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
1460bc3d5698SJohn Baldwin	pandn	%xmm11,%xmm0
1461bc3d5698SJohn Baldwin	pand	%xmm10,%xmm4
1462bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1463bc3d5698SJohn Baldwin
1464bc3d5698SJohn Baldwin
1465bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm1
1466bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1467bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm2
1468bc3d5698SJohn Baldwin	psrld	$2,%xmm1
1469bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm6
1470bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
1471bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm4
1472bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm7
1473bc3d5698SJohn Baldwin	pslld	$10,%xmm2
1474bc3d5698SJohn Baldwin	pxor	%xmm13,%xmm4
1475bc3d5698SJohn Baldwin
1476bc3d5698SJohn Baldwin
1477bc3d5698SJohn Baldwin	psrld	$13,%xmm7
1478bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
1479bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm6
1480bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
1481bc3d5698SJohn Baldwin	pand	%xmm4,%xmm3
1482bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
1483bc3d5698SJohn Baldwin
1484bc3d5698SJohn Baldwin
1485bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
1486bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
1487bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm12
1488bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
1489bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1490bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm12
1491bc3d5698SJohn Baldwin	paddd	%xmm6,%xmm8
1492bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1493bc3d5698SJohn Baldwin
1494bc3d5698SJohn Baldwin	paddd	%xmm6,%xmm12
1495bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm12
1496bc3d5698SJohn Baldwin	movdqa	80-128(%rax),%xmm6
1497bc3d5698SJohn Baldwin	paddd	208-128(%rax),%xmm5
1498bc3d5698SJohn Baldwin
1499bc3d5698SJohn Baldwin	movdqa	%xmm6,%xmm7
1500bc3d5698SJohn Baldwin	movdqa	%xmm6,%xmm1
1501bc3d5698SJohn Baldwin	psrld	$3,%xmm7
1502bc3d5698SJohn Baldwin	movdqa	%xmm6,%xmm2
1503bc3d5698SJohn Baldwin
1504bc3d5698SJohn Baldwin	psrld	$7,%xmm1
1505bc3d5698SJohn Baldwin	movdqa	32-128(%rax),%xmm0
1506bc3d5698SJohn Baldwin	pslld	$14,%xmm2
1507bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1508bc3d5698SJohn Baldwin	psrld	$18-7,%xmm1
1509bc3d5698SJohn Baldwin	movdqa	%xmm0,%xmm3
1510bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1511bc3d5698SJohn Baldwin	pslld	$25-14,%xmm2
1512bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1513bc3d5698SJohn Baldwin	psrld	$10,%xmm0
1514bc3d5698SJohn Baldwin	movdqa	%xmm3,%xmm1
1515bc3d5698SJohn Baldwin
1516bc3d5698SJohn Baldwin	psrld	$17,%xmm3
1517bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1518bc3d5698SJohn Baldwin	pslld	$13,%xmm1
1519bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
1520bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
1521bc3d5698SJohn Baldwin	psrld	$19-17,%xmm3
1522bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
1523bc3d5698SJohn Baldwin	pslld	$15-13,%xmm1
1524bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
1525bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
1526bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
1527bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm7
1528bc3d5698SJohn Baldwin
1529bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm2
1530bc3d5698SJohn Baldwin
1531bc3d5698SJohn Baldwin	psrld	$6,%xmm7
1532bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm1
1533bc3d5698SJohn Baldwin	pslld	$7,%xmm2
1534bc3d5698SJohn Baldwin	movdqa	%xmm5,64-128(%rax)
1535bc3d5698SJohn Baldwin	paddd	%xmm11,%xmm5
1536bc3d5698SJohn Baldwin
1537bc3d5698SJohn Baldwin	psrld	$11,%xmm1
1538bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1539bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
1540bc3d5698SJohn Baldwin	paddd	0(%rbp),%xmm5
1541bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1542bc3d5698SJohn Baldwin
1543bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
1544bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm0
1545bc3d5698SJohn Baldwin
1546bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1547bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm3
1548bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
1549bc3d5698SJohn Baldwin	pandn	%xmm10,%xmm0
1550bc3d5698SJohn Baldwin	pand	%xmm9,%xmm3
1551bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1552bc3d5698SJohn Baldwin
1553bc3d5698SJohn Baldwin
1554bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm1
1555bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1556bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm2
1557bc3d5698SJohn Baldwin	psrld	$2,%xmm1
1558bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
1559bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
1560bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm3
1561bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm7
1562bc3d5698SJohn Baldwin	pslld	$10,%xmm2
1563bc3d5698SJohn Baldwin	pxor	%xmm12,%xmm3
1564bc3d5698SJohn Baldwin
1565bc3d5698SJohn Baldwin
1566bc3d5698SJohn Baldwin	psrld	$13,%xmm7
1567bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
1568bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
1569bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
1570bc3d5698SJohn Baldwin	pand	%xmm3,%xmm4
1571bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
1572bc3d5698SJohn Baldwin
1573bc3d5698SJohn Baldwin
1574bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
1575bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
1576bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm11
1577bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
1578bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1579bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm11
1580bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm15
1581bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1582bc3d5698SJohn Baldwin
1583bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm11
1584bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm11
/*
 * One unrolled SHA-256 step (message schedule + round) of the SSE path.
 * Every packed-dword op works on four 32-bit lanes at once.
 *
 * Schedule: w = xmm6 + 224-128(%rax) + s0(96-128(%rax)) + s1(48-128(%rax))
 *   s0(x) = (x>>3)  ^ rotr(x,7)  ^ rotr(x,18)
 *   s1(x) = (x>>10) ^ rotr(x,17) ^ rotr(x,19)
 *   Each rotr is a psrld/pslld pair XORed together. w is stored to
 *   80-128(%rax). xmm6 is carried in from the preceding step (not loaded
 *   here); xmm5 is left holding the unmodified 96-128(%rax) word.
 * Round (a=xmm11 b=xmm12 c=xmm13 d=xmm14 e=xmm15 f=xmm8 g=xmm9 h=xmm10):
 *   T = h + w + 32(%rbp) + (rotr(e,6)^rotr(e,11)^rotr(e,25)) + ((e&f)^(~e&g))
 *   d += T
 *   h  = T + (rotr(a,2)^rotr(a,13)^rotr(a,22)) + (b ^ ((a^b) & xmm3))
 *   xmm3 is expected to hold b^c on entry (left by the preceding step), which
 *   makes the last term Maj(a,b,c). xmm4 exits holding a^b.
 * Scratch: xmm0, xmm1, xmm2, xmm7; xmm4 is also used as scratch before it
 * receives a^b.
 * NOTE(review): %rax (schedule slots) and %rbp (constant table pointer) are
 * set up outside this block - confirm against the loop prologue.
 */
1585bc3d5698SJohn Baldwin	movdqa	96-128(%rax),%xmm5
1586bc3d5698SJohn Baldwin	paddd	224-128(%rax),%xmm6
1587bc3d5698SJohn Baldwin
1588bc3d5698SJohn Baldwin	movdqa	%xmm5,%xmm7
1589bc3d5698SJohn Baldwin	movdqa	%xmm5,%xmm1
1590bc3d5698SJohn Baldwin	psrld	$3,%xmm7
1591bc3d5698SJohn Baldwin	movdqa	%xmm5,%xmm2
1592bc3d5698SJohn Baldwin
1593bc3d5698SJohn Baldwin	psrld	$7,%xmm1
1594bc3d5698SJohn Baldwin	movdqa	48-128(%rax),%xmm0
1595bc3d5698SJohn Baldwin	pslld	$14,%xmm2
1596bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1597bc3d5698SJohn Baldwin	psrld	$18-7,%xmm1
1598bc3d5698SJohn Baldwin	movdqa	%xmm0,%xmm4
1599bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1600bc3d5698SJohn Baldwin	pslld	$25-14,%xmm2
1601bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1602bc3d5698SJohn Baldwin	psrld	$10,%xmm0
1603bc3d5698SJohn Baldwin	movdqa	%xmm4,%xmm1
1604bc3d5698SJohn Baldwin
1605bc3d5698SJohn Baldwin	psrld	$17,%xmm4
1606bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1607bc3d5698SJohn Baldwin	pslld	$13,%xmm1
/* w += s0 (xmm7) */
1608bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm6
1609bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
1610bc3d5698SJohn Baldwin	psrld	$19-17,%xmm4
1611bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
1612bc3d5698SJohn Baldwin	pslld	$15-13,%xmm1
1613bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
1614bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
/* w += s1 (xmm0) */
1615bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm6
1616bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm7
1617bc3d5698SJohn Baldwin
1618bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm2
1619bc3d5698SJohn Baldwin
1620bc3d5698SJohn Baldwin	psrld	$6,%xmm7
1621bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm1
1622bc3d5698SJohn Baldwin	pslld	$7,%xmm2
/* store the finished schedule word w, then start T = w + h */
1623bc3d5698SJohn Baldwin	movdqa	%xmm6,80-128(%rax)
1624bc3d5698SJohn Baldwin	paddd	%xmm10,%xmm6
1625bc3d5698SJohn Baldwin
1626bc3d5698SJohn Baldwin	psrld	$11,%xmm1
1627bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1628bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
/* T += constant-table vector for this step */
1629bc3d5698SJohn Baldwin	paddd	32(%rbp),%xmm6
1630bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1631bc3d5698SJohn Baldwin
1632bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
1633bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm0
1634bc3d5698SJohn Baldwin
1635bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1636bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm4
1637bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
1638bc3d5698SJohn Baldwin	pandn	%xmm9,%xmm0
1639bc3d5698SJohn Baldwin	pand	%xmm8,%xmm4
1640bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1641bc3d5698SJohn Baldwin
1642bc3d5698SJohn Baldwin
1643bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm1
1644bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1645bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm2
1646bc3d5698SJohn Baldwin	psrld	$2,%xmm1
/* T += rotr(e,6)^rotr(e,11)^rotr(e,25) */
1647bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm6
1648bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
1649bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm4
1650bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm7
1651bc3d5698SJohn Baldwin	pslld	$10,%xmm2
1652bc3d5698SJohn Baldwin	pxor	%xmm11,%xmm4
1653bc3d5698SJohn Baldwin
1654bc3d5698SJohn Baldwin
1655bc3d5698SJohn Baldwin	psrld	$13,%xmm7
1656bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
/* T += (e&f)^(~e&g) */
1657bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm6
1658bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
/* xmm3 = (a^b) & (value carried in xmm3) */
1659bc3d5698SJohn Baldwin	pand	%xmm4,%xmm3
1660bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
1661bc3d5698SJohn Baldwin
1662bc3d5698SJohn Baldwin
1663bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
1664bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
1665bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm10
1666bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
1667bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1668bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm10
/* d += T */
1669bc3d5698SJohn Baldwin	paddd	%xmm6,%xmm14
1670bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1671bc3d5698SJohn Baldwin
/* new h = (b ^ xmm3) + T + rotr(a,2)^rotr(a,13)^rotr(a,22) */
1672bc3d5698SJohn Baldwin	paddd	%xmm6,%xmm10
1673bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm10
/*
 * One unrolled SHA-256 step (message schedule + round) of the SSE path.
 * Every packed-dword op works on four 32-bit lanes at once.
 *
 * Schedule: w = xmm5 + 240-128(%rax) + s0(112-128(%rax)) + s1(64-128(%rax))
 *   s0(x) = (x>>3)  ^ rotr(x,7)  ^ rotr(x,18)
 *   s1(x) = (x>>10) ^ rotr(x,17) ^ rotr(x,19)
 *   Each rotr is a psrld/pslld pair XORed together. w is stored to
 *   96-128(%rax). xmm5 is carried in from the preceding step (not loaded
 *   here); xmm6 is left holding the unmodified 112-128(%rax) word.
 * Round (a=xmm10 b=xmm11 c=xmm12 d=xmm13 e=xmm14 f=xmm15 g=xmm8 h=xmm9):
 *   T = h + w + 64(%rbp) + (rotr(e,6)^rotr(e,11)^rotr(e,25)) + ((e&f)^(~e&g))
 *   d += T
 *   h  = T + (rotr(a,2)^rotr(a,13)^rotr(a,22)) + (b ^ ((a^b) & xmm4))
 *   xmm4 is expected to hold b^c on entry (left by the preceding step), which
 *   makes the last term Maj(a,b,c). xmm3 exits holding a^b.
 * Scratch: xmm0, xmm1, xmm2, xmm7; xmm3 is also used as scratch before it
 * receives a^b.
 * NOTE(review): %rax (schedule slots) and %rbp (constant table pointer) are
 * set up outside this block - confirm against the loop prologue.
 */
1674bc3d5698SJohn Baldwin	movdqa	112-128(%rax),%xmm6
1675bc3d5698SJohn Baldwin	paddd	240-128(%rax),%xmm5
1676bc3d5698SJohn Baldwin
1677bc3d5698SJohn Baldwin	movdqa	%xmm6,%xmm7
1678bc3d5698SJohn Baldwin	movdqa	%xmm6,%xmm1
1679bc3d5698SJohn Baldwin	psrld	$3,%xmm7
1680bc3d5698SJohn Baldwin	movdqa	%xmm6,%xmm2
1681bc3d5698SJohn Baldwin
1682bc3d5698SJohn Baldwin	psrld	$7,%xmm1
1683bc3d5698SJohn Baldwin	movdqa	64-128(%rax),%xmm0
1684bc3d5698SJohn Baldwin	pslld	$14,%xmm2
1685bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1686bc3d5698SJohn Baldwin	psrld	$18-7,%xmm1
1687bc3d5698SJohn Baldwin	movdqa	%xmm0,%xmm3
1688bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1689bc3d5698SJohn Baldwin	pslld	$25-14,%xmm2
1690bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1691bc3d5698SJohn Baldwin	psrld	$10,%xmm0
1692bc3d5698SJohn Baldwin	movdqa	%xmm3,%xmm1
1693bc3d5698SJohn Baldwin
1694bc3d5698SJohn Baldwin	psrld	$17,%xmm3
1695bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1696bc3d5698SJohn Baldwin	pslld	$13,%xmm1
/* w += s0 (xmm7) */
1697bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
1698bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
1699bc3d5698SJohn Baldwin	psrld	$19-17,%xmm3
1700bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
1701bc3d5698SJohn Baldwin	pslld	$15-13,%xmm1
1702bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
1703bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
/* w += s1 (xmm0) */
1704bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
1705bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm7
1706bc3d5698SJohn Baldwin
1707bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm2
1708bc3d5698SJohn Baldwin
1709bc3d5698SJohn Baldwin	psrld	$6,%xmm7
1710bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm1
1711bc3d5698SJohn Baldwin	pslld	$7,%xmm2
/* store the finished schedule word w, then start T = w + h */
1712bc3d5698SJohn Baldwin	movdqa	%xmm5,96-128(%rax)
1713bc3d5698SJohn Baldwin	paddd	%xmm9,%xmm5
1714bc3d5698SJohn Baldwin
1715bc3d5698SJohn Baldwin	psrld	$11,%xmm1
1716bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1717bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
/* T += constant-table vector for this step */
1718bc3d5698SJohn Baldwin	paddd	64(%rbp),%xmm5
1719bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1720bc3d5698SJohn Baldwin
1721bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
1722bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm0
1723bc3d5698SJohn Baldwin
1724bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1725bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm3
1726bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
1727bc3d5698SJohn Baldwin	pandn	%xmm8,%xmm0
1728bc3d5698SJohn Baldwin	pand	%xmm15,%xmm3
1729bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1730bc3d5698SJohn Baldwin
1731bc3d5698SJohn Baldwin
1732bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm1
1733bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1734bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm2
1735bc3d5698SJohn Baldwin	psrld	$2,%xmm1
/* T += rotr(e,6)^rotr(e,11)^rotr(e,25) */
1736bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
1737bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
1738bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm3
1739bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm7
1740bc3d5698SJohn Baldwin	pslld	$10,%xmm2
1741bc3d5698SJohn Baldwin	pxor	%xmm10,%xmm3
1742bc3d5698SJohn Baldwin
1743bc3d5698SJohn Baldwin
1744bc3d5698SJohn Baldwin	psrld	$13,%xmm7
1745bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
/* T += (e&f)^(~e&g) */
1746bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
1747bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
/* xmm4 = (a^b) & (value carried in xmm4) */
1748bc3d5698SJohn Baldwin	pand	%xmm3,%xmm4
1749bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
1750bc3d5698SJohn Baldwin
1751bc3d5698SJohn Baldwin
1752bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
1753bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
1754bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm9
1755bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
1756bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1757bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm9
/* d += T */
1758bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm13
1759bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1760bc3d5698SJohn Baldwin
/* new h = (b ^ xmm4) + T + rotr(a,2)^rotr(a,13)^rotr(a,22) */
1761bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm9
1762bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm9
/*
 * One unrolled SHA-256 step (message schedule + round) of the SSE path,
 * followed by an advance of the constant-table pointer.
 * Every packed-dword op works on four 32-bit lanes at once.
 *
 * Schedule: w = xmm6 + 0-128(%rax) + s0(128-128(%rax)) + s1(80-128(%rax))
 *   s0(x) = (x>>3)  ^ rotr(x,7)  ^ rotr(x,18)
 *   s1(x) = (x>>10) ^ rotr(x,17) ^ rotr(x,19)
 *   Each rotr is a psrld/pslld pair XORed together. w is stored to
 *   112-128(%rax). xmm6 is carried in from the preceding step (not loaded
 *   here); xmm5 is left holding the unmodified 128-128(%rax) word.
 * Round (a=xmm9 b=xmm10 c=xmm11 d=xmm12 e=xmm13 f=xmm14 g=xmm15 h=xmm8):
 *   T = h + w + 96(%rbp) + (rotr(e,6)^rotr(e,11)^rotr(e,25)) + ((e&f)^(~e&g))
 *   d += T
 *   h  = T + (rotr(a,2)^rotr(a,13)^rotr(a,22)) + (b ^ ((a^b) & xmm3))
 *   xmm3 is expected to hold b^c on entry (left by the preceding step), which
 *   makes the last term Maj(a,b,c). xmm4 exits holding a^b.
 * Scratch: xmm0, xmm1, xmm2, xmm7; xmm4 is also used as scratch before it
 * receives a^b.
 * NOTE(review): %rax (schedule slots) and %rbp (constant table pointer) are
 * set up outside this block - confirm against the loop prologue.
 */
1763bc3d5698SJohn Baldwin	movdqa	128-128(%rax),%xmm5
1764bc3d5698SJohn Baldwin	paddd	0-128(%rax),%xmm6
1765bc3d5698SJohn Baldwin
1766bc3d5698SJohn Baldwin	movdqa	%xmm5,%xmm7
1767bc3d5698SJohn Baldwin	movdqa	%xmm5,%xmm1
1768bc3d5698SJohn Baldwin	psrld	$3,%xmm7
1769bc3d5698SJohn Baldwin	movdqa	%xmm5,%xmm2
1770bc3d5698SJohn Baldwin
1771bc3d5698SJohn Baldwin	psrld	$7,%xmm1
1772bc3d5698SJohn Baldwin	movdqa	80-128(%rax),%xmm0
1773bc3d5698SJohn Baldwin	pslld	$14,%xmm2
1774bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1775bc3d5698SJohn Baldwin	psrld	$18-7,%xmm1
1776bc3d5698SJohn Baldwin	movdqa	%xmm0,%xmm4
1777bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1778bc3d5698SJohn Baldwin	pslld	$25-14,%xmm2
1779bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1780bc3d5698SJohn Baldwin	psrld	$10,%xmm0
1781bc3d5698SJohn Baldwin	movdqa	%xmm4,%xmm1
1782bc3d5698SJohn Baldwin
1783bc3d5698SJohn Baldwin	psrld	$17,%xmm4
1784bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1785bc3d5698SJohn Baldwin	pslld	$13,%xmm1
/* w += s0 (xmm7) */
1786bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm6
1787bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
1788bc3d5698SJohn Baldwin	psrld	$19-17,%xmm4
1789bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
1790bc3d5698SJohn Baldwin	pslld	$15-13,%xmm1
1791bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
1792bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
/* w += s1 (xmm0) */
1793bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm6
1794bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm7
1795bc3d5698SJohn Baldwin
1796bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm2
1797bc3d5698SJohn Baldwin
1798bc3d5698SJohn Baldwin	psrld	$6,%xmm7
1799bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm1
1800bc3d5698SJohn Baldwin	pslld	$7,%xmm2
/* store the finished schedule word w, then start T = w + h */
1801bc3d5698SJohn Baldwin	movdqa	%xmm6,112-128(%rax)
1802bc3d5698SJohn Baldwin	paddd	%xmm8,%xmm6
1803bc3d5698SJohn Baldwin
1804bc3d5698SJohn Baldwin	psrld	$11,%xmm1
1805bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1806bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
/* T += constant-table vector for this step */
1807bc3d5698SJohn Baldwin	paddd	96(%rbp),%xmm6
1808bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1809bc3d5698SJohn Baldwin
1810bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
1811bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm0
1812bc3d5698SJohn Baldwin
1813bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1814bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm4
1815bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
1816bc3d5698SJohn Baldwin	pandn	%xmm15,%xmm0
1817bc3d5698SJohn Baldwin	pand	%xmm14,%xmm4
1818bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1819bc3d5698SJohn Baldwin
1820bc3d5698SJohn Baldwin
1821bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm1
1822bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1823bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm2
1824bc3d5698SJohn Baldwin	psrld	$2,%xmm1
/* T += rotr(e,6)^rotr(e,11)^rotr(e,25) */
1825bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm6
1826bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
1827bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm4
1828bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm7
1829bc3d5698SJohn Baldwin	pslld	$10,%xmm2
1830bc3d5698SJohn Baldwin	pxor	%xmm9,%xmm4
1831bc3d5698SJohn Baldwin
1832bc3d5698SJohn Baldwin
1833bc3d5698SJohn Baldwin	psrld	$13,%xmm7
1834bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
/* T += (e&f)^(~e&g) */
1835bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm6
1836bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
/* xmm3 = (a^b) & (value carried in xmm3) */
1837bc3d5698SJohn Baldwin	pand	%xmm4,%xmm3
1838bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
1839bc3d5698SJohn Baldwin
1840bc3d5698SJohn Baldwin
1841bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
1842bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
1843bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm8
1844bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
1845bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1846bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm8
/* d += T */
1847bc3d5698SJohn Baldwin	paddd	%xmm6,%xmm12
1848bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1849bc3d5698SJohn Baldwin
/* new h = (b ^ xmm3) + T + rotr(a,2)^rotr(a,13)^rotr(a,22) */
1850bc3d5698SJohn Baldwin	paddd	%xmm6,%xmm8
1851bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm8
/* step the constant-table pointer forward by 256 bytes */
1852bc3d5698SJohn Baldwin	leaq	256(%rbp),%rbp
/*
 * One unrolled SHA-256 step (message schedule + round) of the SSE path.
 * Every packed-dword op works on four 32-bit lanes at once.
 *
 * Schedule: w = xmm5 + 16-128(%rax) + s0(144-128(%rax)) + s1(96-128(%rax))
 *   s0(x) = (x>>3)  ^ rotr(x,7)  ^ rotr(x,18)
 *   s1(x) = (x>>10) ^ rotr(x,17) ^ rotr(x,19)
 *   Each rotr is a psrld/pslld pair XORed together. w is stored to
 *   128-128(%rax). xmm5 is carried in from the preceding step (not loaded
 *   here); xmm6 is left holding the unmodified 144-128(%rax) word.
 * Round (a=xmm8 b=xmm9 c=xmm10 d=xmm11 e=xmm12 f=xmm13 g=xmm14 h=xmm15):
 *   T = h + w + -128(%rbp) + (rotr(e,6)^rotr(e,11)^rotr(e,25)) + ((e&f)^(~e&g))
 *   d += T
 *   h  = T + (rotr(a,2)^rotr(a,13)^rotr(a,22)) + (b ^ ((a^b) & xmm4))
 *   xmm4 is expected to hold b^c on entry (left by the preceding step), which
 *   makes the last term Maj(a,b,c). xmm3 exits holding a^b.
 * Scratch: xmm0, xmm1, xmm2, xmm7; xmm3 is also used as scratch before it
 * receives a^b.
 * NOTE(review): %rax (schedule slots) and %rbp (constant table pointer) are
 * set up outside this block - confirm against the loop prologue.
 */
1853bc3d5698SJohn Baldwin	movdqa	144-128(%rax),%xmm6
1854bc3d5698SJohn Baldwin	paddd	16-128(%rax),%xmm5
1855bc3d5698SJohn Baldwin
1856bc3d5698SJohn Baldwin	movdqa	%xmm6,%xmm7
1857bc3d5698SJohn Baldwin	movdqa	%xmm6,%xmm1
1858bc3d5698SJohn Baldwin	psrld	$3,%xmm7
1859bc3d5698SJohn Baldwin	movdqa	%xmm6,%xmm2
1860bc3d5698SJohn Baldwin
1861bc3d5698SJohn Baldwin	psrld	$7,%xmm1
1862bc3d5698SJohn Baldwin	movdqa	96-128(%rax),%xmm0
1863bc3d5698SJohn Baldwin	pslld	$14,%xmm2
1864bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1865bc3d5698SJohn Baldwin	psrld	$18-7,%xmm1
1866bc3d5698SJohn Baldwin	movdqa	%xmm0,%xmm3
1867bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1868bc3d5698SJohn Baldwin	pslld	$25-14,%xmm2
1869bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1870bc3d5698SJohn Baldwin	psrld	$10,%xmm0
1871bc3d5698SJohn Baldwin	movdqa	%xmm3,%xmm1
1872bc3d5698SJohn Baldwin
1873bc3d5698SJohn Baldwin	psrld	$17,%xmm3
1874bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1875bc3d5698SJohn Baldwin	pslld	$13,%xmm1
/* w += s0 (xmm7) */
1876bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
1877bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
1878bc3d5698SJohn Baldwin	psrld	$19-17,%xmm3
1879bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
1880bc3d5698SJohn Baldwin	pslld	$15-13,%xmm1
1881bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
1882bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
/* w += s1 (xmm0) */
1883bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
1884bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm7
1885bc3d5698SJohn Baldwin
1886bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm2
1887bc3d5698SJohn Baldwin
1888bc3d5698SJohn Baldwin	psrld	$6,%xmm7
1889bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm1
1890bc3d5698SJohn Baldwin	pslld	$7,%xmm2
/* store the finished schedule word w, then start T = w + h */
1891bc3d5698SJohn Baldwin	movdqa	%xmm5,128-128(%rax)
1892bc3d5698SJohn Baldwin	paddd	%xmm15,%xmm5
1893bc3d5698SJohn Baldwin
1894bc3d5698SJohn Baldwin	psrld	$11,%xmm1
1895bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1896bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
/* T += constant-table vector for this step */
1897bc3d5698SJohn Baldwin	paddd	-128(%rbp),%xmm5
1898bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1899bc3d5698SJohn Baldwin
1900bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
1901bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm0
1902bc3d5698SJohn Baldwin
1903bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1904bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm3
1905bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
1906bc3d5698SJohn Baldwin	pandn	%xmm14,%xmm0
1907bc3d5698SJohn Baldwin	pand	%xmm13,%xmm3
1908bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1909bc3d5698SJohn Baldwin
1910bc3d5698SJohn Baldwin
1911bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm1
1912bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1913bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm2
1914bc3d5698SJohn Baldwin	psrld	$2,%xmm1
/* T += rotr(e,6)^rotr(e,11)^rotr(e,25) */
1915bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
1916bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
1917bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm3
1918bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm7
1919bc3d5698SJohn Baldwin	pslld	$10,%xmm2
1920bc3d5698SJohn Baldwin	pxor	%xmm8,%xmm3
1921bc3d5698SJohn Baldwin
1922bc3d5698SJohn Baldwin
1923bc3d5698SJohn Baldwin	psrld	$13,%xmm7
1924bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
/* T += (e&f)^(~e&g) */
1925bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
1926bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
/* xmm4 = (a^b) & (value carried in xmm4) */
1927bc3d5698SJohn Baldwin	pand	%xmm3,%xmm4
1928bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
1929bc3d5698SJohn Baldwin
1930bc3d5698SJohn Baldwin
1931bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
1932bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
1933bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm15
1934bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
1935bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1936bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm15
/* d += T */
1937bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm11
1938bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1939bc3d5698SJohn Baldwin
/* new h = (b ^ xmm4) + T + rotr(a,2)^rotr(a,13)^rotr(a,22) */
1940bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm15
1941bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm15
/*
 * One unrolled SHA-256 step (message schedule + round) of the SSE path.
 * Every packed-dword op works on four 32-bit lanes at once.
 *
 * Schedule: w = xmm6 + 32-128(%rax) + s0(160-128(%rax)) + s1(112-128(%rax))
 *   s0(x) = (x>>3)  ^ rotr(x,7)  ^ rotr(x,18)
 *   s1(x) = (x>>10) ^ rotr(x,17) ^ rotr(x,19)
 *   Each rotr is a psrld/pslld pair XORed together. w is stored to
 *   144-128(%rax). xmm6 is carried in from the preceding step (not loaded
 *   here); xmm5 is left holding the unmodified 160-128(%rax) word.
 * Round (a=xmm15 b=xmm8 c=xmm9 d=xmm10 e=xmm11 f=xmm12 g=xmm13 h=xmm14):
 *   T = h + w + -96(%rbp) + (rotr(e,6)^rotr(e,11)^rotr(e,25)) + ((e&f)^(~e&g))
 *   d += T
 *   h  = T + (rotr(a,2)^rotr(a,13)^rotr(a,22)) + (b ^ ((a^b) & xmm3))
 *   xmm3 is expected to hold b^c on entry (left by the preceding step), which
 *   makes the last term Maj(a,b,c). xmm4 exits holding a^b.
 * Scratch: xmm0, xmm1, xmm2, xmm7; xmm4 is also used as scratch before it
 * receives a^b.
 * NOTE(review): %rax (schedule slots) and %rbp (constant table pointer) are
 * set up outside this block - confirm against the loop prologue.
 */
1942bc3d5698SJohn Baldwin	movdqa	160-128(%rax),%xmm5
1943bc3d5698SJohn Baldwin	paddd	32-128(%rax),%xmm6
1944bc3d5698SJohn Baldwin
1945bc3d5698SJohn Baldwin	movdqa	%xmm5,%xmm7
1946bc3d5698SJohn Baldwin	movdqa	%xmm5,%xmm1
1947bc3d5698SJohn Baldwin	psrld	$3,%xmm7
1948bc3d5698SJohn Baldwin	movdqa	%xmm5,%xmm2
1949bc3d5698SJohn Baldwin
1950bc3d5698SJohn Baldwin	psrld	$7,%xmm1
1951bc3d5698SJohn Baldwin	movdqa	112-128(%rax),%xmm0
1952bc3d5698SJohn Baldwin	pslld	$14,%xmm2
1953bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1954bc3d5698SJohn Baldwin	psrld	$18-7,%xmm1
1955bc3d5698SJohn Baldwin	movdqa	%xmm0,%xmm4
1956bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1957bc3d5698SJohn Baldwin	pslld	$25-14,%xmm2
1958bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1959bc3d5698SJohn Baldwin	psrld	$10,%xmm0
1960bc3d5698SJohn Baldwin	movdqa	%xmm4,%xmm1
1961bc3d5698SJohn Baldwin
1962bc3d5698SJohn Baldwin	psrld	$17,%xmm4
1963bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1964bc3d5698SJohn Baldwin	pslld	$13,%xmm1
/* w += s0 (xmm7) */
1965bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm6
1966bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
1967bc3d5698SJohn Baldwin	psrld	$19-17,%xmm4
1968bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
1969bc3d5698SJohn Baldwin	pslld	$15-13,%xmm1
1970bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
1971bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
/* w += s1 (xmm0) */
1972bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm6
1973bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm7
1974bc3d5698SJohn Baldwin
1975bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm2
1976bc3d5698SJohn Baldwin
1977bc3d5698SJohn Baldwin	psrld	$6,%xmm7
1978bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm1
1979bc3d5698SJohn Baldwin	pslld	$7,%xmm2
/* store the finished schedule word w, then start T = w + h */
1980bc3d5698SJohn Baldwin	movdqa	%xmm6,144-128(%rax)
1981bc3d5698SJohn Baldwin	paddd	%xmm14,%xmm6
1982bc3d5698SJohn Baldwin
1983bc3d5698SJohn Baldwin	psrld	$11,%xmm1
1984bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1985bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
/* T += constant-table vector for this step */
1986bc3d5698SJohn Baldwin	paddd	-96(%rbp),%xmm6
1987bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1988bc3d5698SJohn Baldwin
1989bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
1990bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm0
1991bc3d5698SJohn Baldwin
1992bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
1993bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm4
1994bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
1995bc3d5698SJohn Baldwin	pandn	%xmm13,%xmm0
1996bc3d5698SJohn Baldwin	pand	%xmm12,%xmm4
1997bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
1998bc3d5698SJohn Baldwin
1999bc3d5698SJohn Baldwin
2000bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm1
2001bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2002bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm2
2003bc3d5698SJohn Baldwin	psrld	$2,%xmm1
/* T += rotr(e,6)^rotr(e,11)^rotr(e,25) */
2004bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm6
2005bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
2006bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm4
2007bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm7
2008bc3d5698SJohn Baldwin	pslld	$10,%xmm2
2009bc3d5698SJohn Baldwin	pxor	%xmm15,%xmm4
2010bc3d5698SJohn Baldwin
2011bc3d5698SJohn Baldwin
2012bc3d5698SJohn Baldwin	psrld	$13,%xmm7
2013bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
/* T += (e&f)^(~e&g) */
2014bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm6
2015bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
/* xmm3 = (a^b) & (value carried in xmm3) */
2016bc3d5698SJohn Baldwin	pand	%xmm4,%xmm3
2017bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
2018bc3d5698SJohn Baldwin
2019bc3d5698SJohn Baldwin
2020bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
2021bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
2022bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm14
2023bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
2024bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2025bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm14
/* d += T */
2026bc3d5698SJohn Baldwin	paddd	%xmm6,%xmm10
2027bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2028bc3d5698SJohn Baldwin
/* new h = (b ^ xmm3) + T + rotr(a,2)^rotr(a,13)^rotr(a,22) */
2029bc3d5698SJohn Baldwin	paddd	%xmm6,%xmm14
2030bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm14
/*
 * One unrolled SHA-256 step (message schedule + round) of the SSE path.
 * Every packed-dword op works on four 32-bit lanes at once.
 *
 * Schedule: w = xmm5 + 48-128(%rax) + s0(176-128(%rax)) + s1(128-128(%rax))
 *   s0(x) = (x>>3)  ^ rotr(x,7)  ^ rotr(x,18)
 *   s1(x) = (x>>10) ^ rotr(x,17) ^ rotr(x,19)
 *   Each rotr is a psrld/pslld pair XORed together. w is stored to
 *   160-128(%rax). xmm5 is carried in from the preceding step (not loaded
 *   here); xmm6 is left holding the unmodified 176-128(%rax) word.
 * Round (a=xmm14 b=xmm15 c=xmm8 d=xmm9 e=xmm10 f=xmm11 g=xmm12 h=xmm13):
 *   T = h + w + -64(%rbp) + (rotr(e,6)^rotr(e,11)^rotr(e,25)) + ((e&f)^(~e&g))
 *   d += T
 *   h  = T + (rotr(a,2)^rotr(a,13)^rotr(a,22)) + (b ^ ((a^b) & xmm4))
 *   xmm4 is expected to hold b^c on entry (left by the preceding step), which
 *   makes the last term Maj(a,b,c). xmm3 exits holding a^b.
 * Scratch: xmm0, xmm1, xmm2, xmm7; xmm3 is also used as scratch before it
 * receives a^b.
 * NOTE(review): %rax (schedule slots) and %rbp (constant table pointer) are
 * set up outside this block - confirm against the loop prologue.
 */
2031bc3d5698SJohn Baldwin	movdqa	176-128(%rax),%xmm6
2032bc3d5698SJohn Baldwin	paddd	48-128(%rax),%xmm5
2033bc3d5698SJohn Baldwin
2034bc3d5698SJohn Baldwin	movdqa	%xmm6,%xmm7
2035bc3d5698SJohn Baldwin	movdqa	%xmm6,%xmm1
2036bc3d5698SJohn Baldwin	psrld	$3,%xmm7
2037bc3d5698SJohn Baldwin	movdqa	%xmm6,%xmm2
2038bc3d5698SJohn Baldwin
2039bc3d5698SJohn Baldwin	psrld	$7,%xmm1
2040bc3d5698SJohn Baldwin	movdqa	128-128(%rax),%xmm0
2041bc3d5698SJohn Baldwin	pslld	$14,%xmm2
2042bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2043bc3d5698SJohn Baldwin	psrld	$18-7,%xmm1
2044bc3d5698SJohn Baldwin	movdqa	%xmm0,%xmm3
2045bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2046bc3d5698SJohn Baldwin	pslld	$25-14,%xmm2
2047bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2048bc3d5698SJohn Baldwin	psrld	$10,%xmm0
2049bc3d5698SJohn Baldwin	movdqa	%xmm3,%xmm1
2050bc3d5698SJohn Baldwin
2051bc3d5698SJohn Baldwin	psrld	$17,%xmm3
2052bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2053bc3d5698SJohn Baldwin	pslld	$13,%xmm1
/* w += s0 (xmm7) */
2054bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
2055bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
2056bc3d5698SJohn Baldwin	psrld	$19-17,%xmm3
2057bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
2058bc3d5698SJohn Baldwin	pslld	$15-13,%xmm1
2059bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
2060bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
/* w += s1 (xmm0) */
2061bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
2062bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm7
2063bc3d5698SJohn Baldwin
2064bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm2
2065bc3d5698SJohn Baldwin
2066bc3d5698SJohn Baldwin	psrld	$6,%xmm7
2067bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm1
2068bc3d5698SJohn Baldwin	pslld	$7,%xmm2
/* store the finished schedule word w, then start T = w + h */
2069bc3d5698SJohn Baldwin	movdqa	%xmm5,160-128(%rax)
2070bc3d5698SJohn Baldwin	paddd	%xmm13,%xmm5
2071bc3d5698SJohn Baldwin
2072bc3d5698SJohn Baldwin	psrld	$11,%xmm1
2073bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2074bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
/* T += constant-table vector for this step */
2075bc3d5698SJohn Baldwin	paddd	-64(%rbp),%xmm5
2076bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2077bc3d5698SJohn Baldwin
2078bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
2079bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm0
2080bc3d5698SJohn Baldwin
2081bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2082bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm3
2083bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
2084bc3d5698SJohn Baldwin	pandn	%xmm12,%xmm0
2085bc3d5698SJohn Baldwin	pand	%xmm11,%xmm3
2086bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2087bc3d5698SJohn Baldwin
2088bc3d5698SJohn Baldwin
2089bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm1
2090bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2091bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm2
2092bc3d5698SJohn Baldwin	psrld	$2,%xmm1
/* T += rotr(e,6)^rotr(e,11)^rotr(e,25) */
2093bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
2094bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
2095bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm3
2096bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm7
2097bc3d5698SJohn Baldwin	pslld	$10,%xmm2
2098bc3d5698SJohn Baldwin	pxor	%xmm14,%xmm3
2099bc3d5698SJohn Baldwin
2100bc3d5698SJohn Baldwin
2101bc3d5698SJohn Baldwin	psrld	$13,%xmm7
2102bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
/* T += (e&f)^(~e&g) */
2103bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
2104bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
/* xmm4 = (a^b) & (value carried in xmm4) */
2105bc3d5698SJohn Baldwin	pand	%xmm3,%xmm4
2106bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
2107bc3d5698SJohn Baldwin
2108bc3d5698SJohn Baldwin
2109bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
2110bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
2111bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm13
2112bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
2113bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2114bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm13
/* d += T */
2115bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm9
2116bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2117bc3d5698SJohn Baldwin
/* new h = (b ^ xmm4) + T + rotr(a,2)^rotr(a,13)^rotr(a,22) */
2118bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm13
2119bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm13
/*
 * One unrolled SHA-256 step (message schedule + round) of the SSE path.
 * Every packed-dword op works on four 32-bit lanes at once.
 *
 * Schedule: w = xmm6 + 64-128(%rax) + s0(192-128(%rax)) + s1(144-128(%rax))
 *   s0(x) = (x>>3)  ^ rotr(x,7)  ^ rotr(x,18)
 *   s1(x) = (x>>10) ^ rotr(x,17) ^ rotr(x,19)
 *   Each rotr is a psrld/pslld pair XORed together. w is stored to
 *   176-128(%rax). xmm6 is carried in from the preceding step (not loaded
 *   here); xmm5 is left holding the unmodified 192-128(%rax) word.
 * Round (a=xmm13 b=xmm14 c=xmm15 d=xmm8 e=xmm9 f=xmm10 g=xmm11 h=xmm12):
 *   T = h + w + -32(%rbp) + (rotr(e,6)^rotr(e,11)^rotr(e,25)) + ((e&f)^(~e&g))
 *   d += T
 *   h  = T + (rotr(a,2)^rotr(a,13)^rotr(a,22)) + (b ^ ((a^b) & xmm3))
 *   xmm3 is expected to hold b^c on entry (left by the preceding step), which
 *   makes the last term Maj(a,b,c). xmm4 exits holding a^b.
 * Scratch: xmm0, xmm1, xmm2, xmm7; xmm4 is also used as scratch before it
 * receives a^b.
 * NOTE(review): %rax (schedule slots) and %rbp (constant table pointer) are
 * set up outside this block - confirm against the loop prologue.
 */
2120bc3d5698SJohn Baldwin	movdqa	192-128(%rax),%xmm5
2121bc3d5698SJohn Baldwin	paddd	64-128(%rax),%xmm6
2122bc3d5698SJohn Baldwin
2123bc3d5698SJohn Baldwin	movdqa	%xmm5,%xmm7
2124bc3d5698SJohn Baldwin	movdqa	%xmm5,%xmm1
2125bc3d5698SJohn Baldwin	psrld	$3,%xmm7
2126bc3d5698SJohn Baldwin	movdqa	%xmm5,%xmm2
2127bc3d5698SJohn Baldwin
2128bc3d5698SJohn Baldwin	psrld	$7,%xmm1
2129bc3d5698SJohn Baldwin	movdqa	144-128(%rax),%xmm0
2130bc3d5698SJohn Baldwin	pslld	$14,%xmm2
2131bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2132bc3d5698SJohn Baldwin	psrld	$18-7,%xmm1
2133bc3d5698SJohn Baldwin	movdqa	%xmm0,%xmm4
2134bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2135bc3d5698SJohn Baldwin	pslld	$25-14,%xmm2
2136bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2137bc3d5698SJohn Baldwin	psrld	$10,%xmm0
2138bc3d5698SJohn Baldwin	movdqa	%xmm4,%xmm1
2139bc3d5698SJohn Baldwin
2140bc3d5698SJohn Baldwin	psrld	$17,%xmm4
2141bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2142bc3d5698SJohn Baldwin	pslld	$13,%xmm1
/* w += s0 (xmm7) */
2143bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm6
2144bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
2145bc3d5698SJohn Baldwin	psrld	$19-17,%xmm4
2146bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
2147bc3d5698SJohn Baldwin	pslld	$15-13,%xmm1
2148bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
2149bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
/* w += s1 (xmm0) */
2150bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm6
2151bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm7
2152bc3d5698SJohn Baldwin
2153bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm2
2154bc3d5698SJohn Baldwin
2155bc3d5698SJohn Baldwin	psrld	$6,%xmm7
2156bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm1
2157bc3d5698SJohn Baldwin	pslld	$7,%xmm2
/* store the finished schedule word w, then start T = w + h */
2158bc3d5698SJohn Baldwin	movdqa	%xmm6,176-128(%rax)
2159bc3d5698SJohn Baldwin	paddd	%xmm12,%xmm6
2160bc3d5698SJohn Baldwin
2161bc3d5698SJohn Baldwin	psrld	$11,%xmm1
2162bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2163bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
/* T += constant-table vector for this step */
2164bc3d5698SJohn Baldwin	paddd	-32(%rbp),%xmm6
2165bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2166bc3d5698SJohn Baldwin
2167bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
2168bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm0
2169bc3d5698SJohn Baldwin
2170bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2171bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm4
2172bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
2173bc3d5698SJohn Baldwin	pandn	%xmm11,%xmm0
2174bc3d5698SJohn Baldwin	pand	%xmm10,%xmm4
2175bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2176bc3d5698SJohn Baldwin
2177bc3d5698SJohn Baldwin
2178bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm1
2179bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2180bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm2
2181bc3d5698SJohn Baldwin	psrld	$2,%xmm1
/* T += rotr(e,6)^rotr(e,11)^rotr(e,25) */
2182bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm6
2183bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
2184bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm4
2185bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm7
2186bc3d5698SJohn Baldwin	pslld	$10,%xmm2
2187bc3d5698SJohn Baldwin	pxor	%xmm13,%xmm4
2188bc3d5698SJohn Baldwin
2189bc3d5698SJohn Baldwin
2190bc3d5698SJohn Baldwin	psrld	$13,%xmm7
2191bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
/* T += (e&f)^(~e&g) */
2192bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm6
2193bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
/* xmm3 = (a^b) & (value carried in xmm3) */
2194bc3d5698SJohn Baldwin	pand	%xmm4,%xmm3
2195bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
2196bc3d5698SJohn Baldwin
2197bc3d5698SJohn Baldwin
2198bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
2199bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
2200bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm12
2201bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
2202bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2203bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm12
/* d += T */
2204bc3d5698SJohn Baldwin	paddd	%xmm6,%xmm8
2205bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2206bc3d5698SJohn Baldwin
/* new h = (b ^ xmm3) + T + rotr(a,2)^rotr(a,13)^rotr(a,22) */
2207bc3d5698SJohn Baldwin	paddd	%xmm6,%xmm12
2208bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm12
/*
 * One unrolled SHA-256 step (message schedule + round) of the SSE path.
 * Every packed-dword op works on four 32-bit lanes at once.
 *
 * Schedule: w = xmm5 + 80-128(%rax) + s0(208-128(%rax)) + s1(160-128(%rax))
 *   s0(x) = (x>>3)  ^ rotr(x,7)  ^ rotr(x,18)
 *   s1(x) = (x>>10) ^ rotr(x,17) ^ rotr(x,19)
 *   Each rotr is a psrld/pslld pair XORed together. w is stored to
 *   192-128(%rax). xmm5 is carried in from the preceding step (not loaded
 *   here); xmm6 is left holding the unmodified 208-128(%rax) word.
 * Round (a=xmm12 b=xmm13 c=xmm14 d=xmm15 e=xmm8 f=xmm9 g=xmm10 h=xmm11):
 *   T = h + w + 0(%rbp) + (rotr(e,6)^rotr(e,11)^rotr(e,25)) + ((e&f)^(~e&g))
 *   d += T
 *   h  = T + (rotr(a,2)^rotr(a,13)^rotr(a,22)) + (b ^ ((a^b) & xmm4))
 *   xmm4 is expected to hold b^c on entry (left by the preceding step), which
 *   makes the last term Maj(a,b,c). xmm3 exits holding a^b.
 * Scratch: xmm0, xmm1, xmm2, xmm7; xmm3 is also used as scratch before it
 * receives a^b.
 * NOTE(review): %rax (schedule slots) and %rbp (constant table pointer) are
 * set up outside this block - confirm against the loop prologue.
 */
2209bc3d5698SJohn Baldwin	movdqa	208-128(%rax),%xmm6
2210bc3d5698SJohn Baldwin	paddd	80-128(%rax),%xmm5
2211bc3d5698SJohn Baldwin
2212bc3d5698SJohn Baldwin	movdqa	%xmm6,%xmm7
2213bc3d5698SJohn Baldwin	movdqa	%xmm6,%xmm1
2214bc3d5698SJohn Baldwin	psrld	$3,%xmm7
2215bc3d5698SJohn Baldwin	movdqa	%xmm6,%xmm2
2216bc3d5698SJohn Baldwin
2217bc3d5698SJohn Baldwin	psrld	$7,%xmm1
2218bc3d5698SJohn Baldwin	movdqa	160-128(%rax),%xmm0
2219bc3d5698SJohn Baldwin	pslld	$14,%xmm2
2220bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2221bc3d5698SJohn Baldwin	psrld	$18-7,%xmm1
2222bc3d5698SJohn Baldwin	movdqa	%xmm0,%xmm3
2223bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2224bc3d5698SJohn Baldwin	pslld	$25-14,%xmm2
2225bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2226bc3d5698SJohn Baldwin	psrld	$10,%xmm0
2227bc3d5698SJohn Baldwin	movdqa	%xmm3,%xmm1
2228bc3d5698SJohn Baldwin
2229bc3d5698SJohn Baldwin	psrld	$17,%xmm3
2230bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2231bc3d5698SJohn Baldwin	pslld	$13,%xmm1
/* w += s0 (xmm7) */
2232bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
2233bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
2234bc3d5698SJohn Baldwin	psrld	$19-17,%xmm3
2235bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
2236bc3d5698SJohn Baldwin	pslld	$15-13,%xmm1
2237bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
2238bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
/* w += s1 (xmm0) */
2239bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
2240bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm7
2241bc3d5698SJohn Baldwin
2242bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm2
2243bc3d5698SJohn Baldwin
2244bc3d5698SJohn Baldwin	psrld	$6,%xmm7
2245bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm1
2246bc3d5698SJohn Baldwin	pslld	$7,%xmm2
/* store the finished schedule word w, then start T = w + h */
2247bc3d5698SJohn Baldwin	movdqa	%xmm5,192-128(%rax)
2248bc3d5698SJohn Baldwin	paddd	%xmm11,%xmm5
2249bc3d5698SJohn Baldwin
2250bc3d5698SJohn Baldwin	psrld	$11,%xmm1
2251bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2252bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
/* T += constant-table vector for this step */
2253bc3d5698SJohn Baldwin	paddd	0(%rbp),%xmm5
2254bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2255bc3d5698SJohn Baldwin
2256bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
2257bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm0
2258bc3d5698SJohn Baldwin
2259bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2260bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm3
2261bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
2262bc3d5698SJohn Baldwin	pandn	%xmm10,%xmm0
2263bc3d5698SJohn Baldwin	pand	%xmm9,%xmm3
2264bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2265bc3d5698SJohn Baldwin
2266bc3d5698SJohn Baldwin
2267bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm1
2268bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2269bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm2
2270bc3d5698SJohn Baldwin	psrld	$2,%xmm1
/* T += rotr(e,6)^rotr(e,11)^rotr(e,25) */
2271bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
2272bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
2273bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm3
2274bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm7
2275bc3d5698SJohn Baldwin	pslld	$10,%xmm2
2276bc3d5698SJohn Baldwin	pxor	%xmm12,%xmm3
2277bc3d5698SJohn Baldwin
2278bc3d5698SJohn Baldwin
2279bc3d5698SJohn Baldwin	psrld	$13,%xmm7
2280bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
/* T += (e&f)^(~e&g) */
2281bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
2282bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
/* xmm4 = (a^b) & (value carried in xmm4) */
2283bc3d5698SJohn Baldwin	pand	%xmm3,%xmm4
2284bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
2285bc3d5698SJohn Baldwin
2286bc3d5698SJohn Baldwin
2287bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
2288bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
2289bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm11
2290bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
2291bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2292bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm11
/* d += T */
2293bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm15
2294bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2295bc3d5698SJohn Baldwin
/* new h = (b ^ xmm4) + T + rotr(a,2)^rotr(a,13)^rotr(a,22) */
2296bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm11
2297bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm11
/*
 * One unrolled SHA-256 step (message schedule + round) of the SSE path.
 * Every packed-dword op works on four 32-bit lanes at once.
 *
 * Schedule: w = xmm6 + 96-128(%rax) + s0(224-128(%rax)) + s1(176-128(%rax))
 *   s0(x) = (x>>3)  ^ rotr(x,7)  ^ rotr(x,18)
 *   s1(x) = (x>>10) ^ rotr(x,17) ^ rotr(x,19)
 *   Each rotr is a psrld/pslld pair XORed together. w is stored to
 *   208-128(%rax). xmm6 is carried in from the preceding step (not loaded
 *   here); xmm5 is left holding the unmodified 224-128(%rax) word.
 * Round (a=xmm11 b=xmm12 c=xmm13 d=xmm14 e=xmm15 f=xmm8 g=xmm9 h=xmm10):
 *   T = h + w + 32(%rbp) + (rotr(e,6)^rotr(e,11)^rotr(e,25)) + ((e&f)^(~e&g))
 *   d += T
 *   h  = T + (rotr(a,2)^rotr(a,13)^rotr(a,22)) + (b ^ ((a^b) & xmm3))
 *   xmm3 is expected to hold b^c on entry (left by the preceding step), which
 *   makes the last term Maj(a,b,c). xmm4 exits holding a^b.
 * Scratch: xmm0, xmm1, xmm2, xmm7; xmm4 is also used as scratch before it
 * receives a^b.
 * NOTE(review): %rax (schedule slots) and %rbp (constant table pointer) are
 * set up outside this block - confirm against the loop prologue.
 */
2298bc3d5698SJohn Baldwin	movdqa	224-128(%rax),%xmm5
2299bc3d5698SJohn Baldwin	paddd	96-128(%rax),%xmm6
2300bc3d5698SJohn Baldwin
2301bc3d5698SJohn Baldwin	movdqa	%xmm5,%xmm7
2302bc3d5698SJohn Baldwin	movdqa	%xmm5,%xmm1
2303bc3d5698SJohn Baldwin	psrld	$3,%xmm7
2304bc3d5698SJohn Baldwin	movdqa	%xmm5,%xmm2
2305bc3d5698SJohn Baldwin
2306bc3d5698SJohn Baldwin	psrld	$7,%xmm1
2307bc3d5698SJohn Baldwin	movdqa	176-128(%rax),%xmm0
2308bc3d5698SJohn Baldwin	pslld	$14,%xmm2
2309bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2310bc3d5698SJohn Baldwin	psrld	$18-7,%xmm1
2311bc3d5698SJohn Baldwin	movdqa	%xmm0,%xmm4
2312bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2313bc3d5698SJohn Baldwin	pslld	$25-14,%xmm2
2314bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2315bc3d5698SJohn Baldwin	psrld	$10,%xmm0
2316bc3d5698SJohn Baldwin	movdqa	%xmm4,%xmm1
2317bc3d5698SJohn Baldwin
2318bc3d5698SJohn Baldwin	psrld	$17,%xmm4
2319bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2320bc3d5698SJohn Baldwin	pslld	$13,%xmm1
/* w += s0 (xmm7) */
2321bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm6
2322bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
2323bc3d5698SJohn Baldwin	psrld	$19-17,%xmm4
2324bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
2325bc3d5698SJohn Baldwin	pslld	$15-13,%xmm1
2326bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
2327bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
/* w += s1 (xmm0) */
2328bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm6
2329bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm7
2330bc3d5698SJohn Baldwin
2331bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm2
2332bc3d5698SJohn Baldwin
2333bc3d5698SJohn Baldwin	psrld	$6,%xmm7
2334bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm1
2335bc3d5698SJohn Baldwin	pslld	$7,%xmm2
/* store the finished schedule word w, then start T = w + h */
2336bc3d5698SJohn Baldwin	movdqa	%xmm6,208-128(%rax)
2337bc3d5698SJohn Baldwin	paddd	%xmm10,%xmm6
2338bc3d5698SJohn Baldwin
2339bc3d5698SJohn Baldwin	psrld	$11,%xmm1
2340bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2341bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
/* T += constant-table vector for this step */
2342bc3d5698SJohn Baldwin	paddd	32(%rbp),%xmm6
2343bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2344bc3d5698SJohn Baldwin
2345bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
2346bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm0
2347bc3d5698SJohn Baldwin
2348bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2349bc3d5698SJohn Baldwin	movdqa	%xmm15,%xmm4
2350bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
2351bc3d5698SJohn Baldwin	pandn	%xmm9,%xmm0
2352bc3d5698SJohn Baldwin	pand	%xmm8,%xmm4
2353bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2354bc3d5698SJohn Baldwin
2355bc3d5698SJohn Baldwin
2356bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm1
2357bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2358bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm2
2359bc3d5698SJohn Baldwin	psrld	$2,%xmm1
/* T += rotr(e,6)^rotr(e,11)^rotr(e,25) */
2360bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm6
2361bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
2362bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm4
2363bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm7
2364bc3d5698SJohn Baldwin	pslld	$10,%xmm2
2365bc3d5698SJohn Baldwin	pxor	%xmm11,%xmm4
2366bc3d5698SJohn Baldwin
2367bc3d5698SJohn Baldwin
2368bc3d5698SJohn Baldwin	psrld	$13,%xmm7
2369bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
/* T += (e&f)^(~e&g) */
2370bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm6
2371bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
/* xmm3 = (a^b) & (value carried in xmm3) */
2372bc3d5698SJohn Baldwin	pand	%xmm4,%xmm3
2373bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
2374bc3d5698SJohn Baldwin
2375bc3d5698SJohn Baldwin
2376bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
2377bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
2378bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm10
2379bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
2380bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2381bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm10
/* d += T */
2382bc3d5698SJohn Baldwin	paddd	%xmm6,%xmm14
2383bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2384bc3d5698SJohn Baldwin
/* new h = (b ^ xmm3) + T + rotr(a,2)^rotr(a,13)^rotr(a,22) */
2385bc3d5698SJohn Baldwin	paddd	%xmm6,%xmm10
2386bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm10
2387bc3d5698SJohn Baldwin	movdqa	240-128(%rax),%xmm6
2388bc3d5698SJohn Baldwin	paddd	112-128(%rax),%xmm5
2389bc3d5698SJohn Baldwin
2390bc3d5698SJohn Baldwin	movdqa	%xmm6,%xmm7
2391bc3d5698SJohn Baldwin	movdqa	%xmm6,%xmm1
2392bc3d5698SJohn Baldwin	psrld	$3,%xmm7
2393bc3d5698SJohn Baldwin	movdqa	%xmm6,%xmm2
2394bc3d5698SJohn Baldwin
2395bc3d5698SJohn Baldwin	psrld	$7,%xmm1
2396bc3d5698SJohn Baldwin	movdqa	192-128(%rax),%xmm0
2397bc3d5698SJohn Baldwin	pslld	$14,%xmm2
2398bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2399bc3d5698SJohn Baldwin	psrld	$18-7,%xmm1
2400bc3d5698SJohn Baldwin	movdqa	%xmm0,%xmm3
2401bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2402bc3d5698SJohn Baldwin	pslld	$25-14,%xmm2
2403bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2404bc3d5698SJohn Baldwin	psrld	$10,%xmm0
2405bc3d5698SJohn Baldwin	movdqa	%xmm3,%xmm1
2406bc3d5698SJohn Baldwin
2407bc3d5698SJohn Baldwin	psrld	$17,%xmm3
2408bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2409bc3d5698SJohn Baldwin	pslld	$13,%xmm1
2410bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
2411bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
2412bc3d5698SJohn Baldwin	psrld	$19-17,%xmm3
2413bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
2414bc3d5698SJohn Baldwin	pslld	$15-13,%xmm1
2415bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
2416bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
2417bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
2418bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm7
2419bc3d5698SJohn Baldwin
2420bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm2
2421bc3d5698SJohn Baldwin
2422bc3d5698SJohn Baldwin	psrld	$6,%xmm7
2423bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm1
2424bc3d5698SJohn Baldwin	pslld	$7,%xmm2
2425bc3d5698SJohn Baldwin	movdqa	%xmm5,224-128(%rax)
2426bc3d5698SJohn Baldwin	paddd	%xmm9,%xmm5
2427bc3d5698SJohn Baldwin
2428bc3d5698SJohn Baldwin	psrld	$11,%xmm1
2429bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2430bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
2431bc3d5698SJohn Baldwin	paddd	64(%rbp),%xmm5
2432bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2433bc3d5698SJohn Baldwin
2434bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
2435bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm0
2436bc3d5698SJohn Baldwin
2437bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2438bc3d5698SJohn Baldwin	movdqa	%xmm14,%xmm3
2439bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
2440bc3d5698SJohn Baldwin	pandn	%xmm8,%xmm0
2441bc3d5698SJohn Baldwin	pand	%xmm15,%xmm3
2442bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2443bc3d5698SJohn Baldwin
2444bc3d5698SJohn Baldwin
2445bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm1
2446bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2447bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm2
2448bc3d5698SJohn Baldwin	psrld	$2,%xmm1
2449bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm5
2450bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm0
2451bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm3
2452bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm7
2453bc3d5698SJohn Baldwin	pslld	$10,%xmm2
2454bc3d5698SJohn Baldwin	pxor	%xmm10,%xmm3
2455bc3d5698SJohn Baldwin
2456bc3d5698SJohn Baldwin
2457bc3d5698SJohn Baldwin	psrld	$13,%xmm7
2458bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
2459bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm5
2460bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
2461bc3d5698SJohn Baldwin	pand	%xmm3,%xmm4
2462bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
2463bc3d5698SJohn Baldwin
2464bc3d5698SJohn Baldwin
2465bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
2466bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
2467bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm9
2468bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
2469bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2470bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm9
2471bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm13
2472bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2473bc3d5698SJohn Baldwin
2474bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm9
2475bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm9
2476bc3d5698SJohn Baldwin	movdqa	0-128(%rax),%xmm5
2477bc3d5698SJohn Baldwin	paddd	128-128(%rax),%xmm6
2478bc3d5698SJohn Baldwin
2479bc3d5698SJohn Baldwin	movdqa	%xmm5,%xmm7
2480bc3d5698SJohn Baldwin	movdqa	%xmm5,%xmm1
2481bc3d5698SJohn Baldwin	psrld	$3,%xmm7
2482bc3d5698SJohn Baldwin	movdqa	%xmm5,%xmm2
2483bc3d5698SJohn Baldwin
2484bc3d5698SJohn Baldwin	psrld	$7,%xmm1
2485bc3d5698SJohn Baldwin	movdqa	208-128(%rax),%xmm0
2486bc3d5698SJohn Baldwin	pslld	$14,%xmm2
2487bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2488bc3d5698SJohn Baldwin	psrld	$18-7,%xmm1
2489bc3d5698SJohn Baldwin	movdqa	%xmm0,%xmm4
2490bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2491bc3d5698SJohn Baldwin	pslld	$25-14,%xmm2
2492bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2493bc3d5698SJohn Baldwin	psrld	$10,%xmm0
2494bc3d5698SJohn Baldwin	movdqa	%xmm4,%xmm1
2495bc3d5698SJohn Baldwin
2496bc3d5698SJohn Baldwin	psrld	$17,%xmm4
2497bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2498bc3d5698SJohn Baldwin	pslld	$13,%xmm1
2499bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm6
2500bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
2501bc3d5698SJohn Baldwin	psrld	$19-17,%xmm4
2502bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
2503bc3d5698SJohn Baldwin	pslld	$15-13,%xmm1
2504bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
2505bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm0
2506bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm6
2507bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm7
2508bc3d5698SJohn Baldwin
2509bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm2
2510bc3d5698SJohn Baldwin
2511bc3d5698SJohn Baldwin	psrld	$6,%xmm7
2512bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm1
2513bc3d5698SJohn Baldwin	pslld	$7,%xmm2
2514bc3d5698SJohn Baldwin	movdqa	%xmm6,240-128(%rax)
2515bc3d5698SJohn Baldwin	paddd	%xmm8,%xmm6
2516bc3d5698SJohn Baldwin
2517bc3d5698SJohn Baldwin	psrld	$11,%xmm1
2518bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2519bc3d5698SJohn Baldwin	pslld	$21-7,%xmm2
2520bc3d5698SJohn Baldwin	paddd	96(%rbp),%xmm6
2521bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2522bc3d5698SJohn Baldwin
2523bc3d5698SJohn Baldwin	psrld	$25-11,%xmm1
2524bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm0
2525bc3d5698SJohn Baldwin
2526bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2527bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm4
2528bc3d5698SJohn Baldwin	pslld	$26-21,%xmm2
2529bc3d5698SJohn Baldwin	pandn	%xmm15,%xmm0
2530bc3d5698SJohn Baldwin	pand	%xmm14,%xmm4
2531bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2532bc3d5698SJohn Baldwin
2533bc3d5698SJohn Baldwin
2534bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm1
2535bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2536bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm2
2537bc3d5698SJohn Baldwin	psrld	$2,%xmm1
2538bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm6
2539bc3d5698SJohn Baldwin	pxor	%xmm4,%xmm0
2540bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm4
2541bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm7
2542bc3d5698SJohn Baldwin	pslld	$10,%xmm2
2543bc3d5698SJohn Baldwin	pxor	%xmm9,%xmm4
2544bc3d5698SJohn Baldwin
2545bc3d5698SJohn Baldwin
2546bc3d5698SJohn Baldwin	psrld	$13,%xmm7
2547bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
2548bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm6
2549bc3d5698SJohn Baldwin	pslld	$19-10,%xmm2
2550bc3d5698SJohn Baldwin	pand	%xmm4,%xmm3
2551bc3d5698SJohn Baldwin	pxor	%xmm7,%xmm1
2552bc3d5698SJohn Baldwin
2553bc3d5698SJohn Baldwin
2554bc3d5698SJohn Baldwin	psrld	$22-13,%xmm7
2555bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm1
2556bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm8
2557bc3d5698SJohn Baldwin	pslld	$30-19,%xmm2
2558bc3d5698SJohn Baldwin	pxor	%xmm1,%xmm7
2559bc3d5698SJohn Baldwin	pxor	%xmm3,%xmm8
2560bc3d5698SJohn Baldwin	paddd	%xmm6,%xmm12
2561bc3d5698SJohn Baldwin	pxor	%xmm2,%xmm7
2562bc3d5698SJohn Baldwin
2563bc3d5698SJohn Baldwin	paddd	%xmm6,%xmm8
2564bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm8
2565bc3d5698SJohn Baldwin	leaq	256(%rbp),%rbp
2566bc3d5698SJohn Baldwin	decl	%ecx
2567bc3d5698SJohn Baldwin	jnz	.Loop_16_xx
2568bc3d5698SJohn Baldwin
2569bc3d5698SJohn Baldwin	movl	$1,%ecx
2570bc3d5698SJohn Baldwin	leaq	K256+128(%rip),%rbp
2571bc3d5698SJohn Baldwin
2572bc3d5698SJohn Baldwin	movdqa	(%rbx),%xmm7
2573bc3d5698SJohn Baldwin	cmpl	0(%rbx),%ecx
2574bc3d5698SJohn Baldwin	pxor	%xmm0,%xmm0
2575bc3d5698SJohn Baldwin	cmovgeq	%rbp,%r8
2576bc3d5698SJohn Baldwin	cmpl	4(%rbx),%ecx
2577bc3d5698SJohn Baldwin	movdqa	%xmm7,%xmm6
2578bc3d5698SJohn Baldwin	cmovgeq	%rbp,%r9
2579bc3d5698SJohn Baldwin	cmpl	8(%rbx),%ecx
2580bc3d5698SJohn Baldwin	pcmpgtd	%xmm0,%xmm6
2581bc3d5698SJohn Baldwin	cmovgeq	%rbp,%r10
2582bc3d5698SJohn Baldwin	cmpl	12(%rbx),%ecx
2583bc3d5698SJohn Baldwin	paddd	%xmm6,%xmm7
2584bc3d5698SJohn Baldwin	cmovgeq	%rbp,%r11
2585bc3d5698SJohn Baldwin
2586bc3d5698SJohn Baldwin	movdqu	0-128(%rdi),%xmm0
2587bc3d5698SJohn Baldwin	pand	%xmm6,%xmm8
2588bc3d5698SJohn Baldwin	movdqu	32-128(%rdi),%xmm1
2589bc3d5698SJohn Baldwin	pand	%xmm6,%xmm9
2590bc3d5698SJohn Baldwin	movdqu	64-128(%rdi),%xmm2
2591bc3d5698SJohn Baldwin	pand	%xmm6,%xmm10
2592bc3d5698SJohn Baldwin	movdqu	96-128(%rdi),%xmm5
2593bc3d5698SJohn Baldwin	pand	%xmm6,%xmm11
2594bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm8
2595bc3d5698SJohn Baldwin	movdqu	128-128(%rdi),%xmm0
2596bc3d5698SJohn Baldwin	pand	%xmm6,%xmm12
2597bc3d5698SJohn Baldwin	paddd	%xmm1,%xmm9
2598bc3d5698SJohn Baldwin	movdqu	160-128(%rdi),%xmm1
2599bc3d5698SJohn Baldwin	pand	%xmm6,%xmm13
2600bc3d5698SJohn Baldwin	paddd	%xmm2,%xmm10
2601bc3d5698SJohn Baldwin	movdqu	192-128(%rdi),%xmm2
2602bc3d5698SJohn Baldwin	pand	%xmm6,%xmm14
2603bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm11
2604bc3d5698SJohn Baldwin	movdqu	224-128(%rdi),%xmm5
2605bc3d5698SJohn Baldwin	pand	%xmm6,%xmm15
2606bc3d5698SJohn Baldwin	paddd	%xmm0,%xmm12
2607bc3d5698SJohn Baldwin	paddd	%xmm1,%xmm13
2608bc3d5698SJohn Baldwin	movdqu	%xmm8,0-128(%rdi)
2609bc3d5698SJohn Baldwin	paddd	%xmm2,%xmm14
2610bc3d5698SJohn Baldwin	movdqu	%xmm9,32-128(%rdi)
2611bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm15
2612bc3d5698SJohn Baldwin	movdqu	%xmm10,64-128(%rdi)
2613bc3d5698SJohn Baldwin	movdqu	%xmm11,96-128(%rdi)
2614bc3d5698SJohn Baldwin	movdqu	%xmm12,128-128(%rdi)
2615bc3d5698SJohn Baldwin	movdqu	%xmm13,160-128(%rdi)
2616bc3d5698SJohn Baldwin	movdqu	%xmm14,192-128(%rdi)
2617bc3d5698SJohn Baldwin	movdqu	%xmm15,224-128(%rdi)
2618bc3d5698SJohn Baldwin
2619bc3d5698SJohn Baldwin	movdqa	%xmm7,(%rbx)
2620bc3d5698SJohn Baldwin	movdqa	.Lpbswap(%rip),%xmm6
2621bc3d5698SJohn Baldwin	decl	%edx
2622bc3d5698SJohn Baldwin	jnz	.Loop
2623bc3d5698SJohn Baldwin
2624bc3d5698SJohn Baldwin	movl	280(%rsp),%edx
2625bc3d5698SJohn Baldwin	leaq	16(%rdi),%rdi
2626bc3d5698SJohn Baldwin	leaq	64(%rsi),%rsi
2627bc3d5698SJohn Baldwin	decl	%edx
2628bc3d5698SJohn Baldwin	jnz	.Loop_grande
2629bc3d5698SJohn Baldwin
2630bc3d5698SJohn Baldwin.Ldone:
2631bc3d5698SJohn Baldwin	movq	272(%rsp),%rax
2632bc3d5698SJohn Baldwin.cfi_def_cfa	%rax,8
2633bc3d5698SJohn Baldwin	movq	-16(%rax),%rbp
2634bc3d5698SJohn Baldwin.cfi_restore	%rbp
2635bc3d5698SJohn Baldwin	movq	-8(%rax),%rbx
2636bc3d5698SJohn Baldwin.cfi_restore	%rbx
2637bc3d5698SJohn Baldwin	leaq	(%rax),%rsp
2638bc3d5698SJohn Baldwin.cfi_def_cfa_register	%rsp
2639bc3d5698SJohn Baldwin.Lepilogue:
2640bc3d5698SJohn Baldwin	.byte	0xf3,0xc3
2641bc3d5698SJohn Baldwin.cfi_endproc
2642bc3d5698SJohn Baldwin.size	sha256_multi_block,.-sha256_multi_block
2643bc3d5698SJohn Baldwin.type	sha256_multi_block_shaext,@function
2644bc3d5698SJohn Baldwin.align	32
2645bc3d5698SJohn Baldwinsha256_multi_block_shaext:
2646bc3d5698SJohn Baldwin.cfi_startproc
2647bc3d5698SJohn Baldwin_shaext_shortcut:
2648bc3d5698SJohn Baldwin	movq	%rsp,%rax
2649bc3d5698SJohn Baldwin.cfi_def_cfa_register	%rax
2650bc3d5698SJohn Baldwin	pushq	%rbx
2651bc3d5698SJohn Baldwin.cfi_offset	%rbx,-16
2652bc3d5698SJohn Baldwin	pushq	%rbp
2653bc3d5698SJohn Baldwin.cfi_offset	%rbp,-24
2654bc3d5698SJohn Baldwin	subq	$288,%rsp
2655bc3d5698SJohn Baldwin	shll	$1,%edx
2656bc3d5698SJohn Baldwin	andq	$-256,%rsp
2657bc3d5698SJohn Baldwin	leaq	128(%rdi),%rdi
2658bc3d5698SJohn Baldwin	movq	%rax,272(%rsp)
2659bc3d5698SJohn Baldwin.Lbody_shaext:
2660bc3d5698SJohn Baldwin	leaq	256(%rsp),%rbx
2661bc3d5698SJohn Baldwin	leaq	K256_shaext+128(%rip),%rbp
2662bc3d5698SJohn Baldwin
2663bc3d5698SJohn Baldwin.Loop_grande_shaext:
2664bc3d5698SJohn Baldwin	movl	%edx,280(%rsp)
2665bc3d5698SJohn Baldwin	xorl	%edx,%edx
2666*c0855eaaSJohn Baldwin
2667bc3d5698SJohn Baldwin	movq	0(%rsi),%r8
2668*c0855eaaSJohn Baldwin
2669bc3d5698SJohn Baldwin	movl	8(%rsi),%ecx
2670bc3d5698SJohn Baldwin	cmpl	%edx,%ecx
2671bc3d5698SJohn Baldwin	cmovgl	%ecx,%edx
2672bc3d5698SJohn Baldwin	testl	%ecx,%ecx
2673bc3d5698SJohn Baldwin	movl	%ecx,0(%rbx)
2674bc3d5698SJohn Baldwin	cmovleq	%rsp,%r8
2675*c0855eaaSJohn Baldwin
2676bc3d5698SJohn Baldwin	movq	16(%rsi),%r9
2677*c0855eaaSJohn Baldwin
2678bc3d5698SJohn Baldwin	movl	24(%rsi),%ecx
2679bc3d5698SJohn Baldwin	cmpl	%edx,%ecx
2680bc3d5698SJohn Baldwin	cmovgl	%ecx,%edx
2681bc3d5698SJohn Baldwin	testl	%ecx,%ecx
2682bc3d5698SJohn Baldwin	movl	%ecx,4(%rbx)
2683bc3d5698SJohn Baldwin	cmovleq	%rsp,%r9
2684bc3d5698SJohn Baldwin	testl	%edx,%edx
2685bc3d5698SJohn Baldwin	jz	.Ldone_shaext
2686bc3d5698SJohn Baldwin
2687bc3d5698SJohn Baldwin	movq	0-128(%rdi),%xmm12
2688bc3d5698SJohn Baldwin	movq	32-128(%rdi),%xmm4
2689bc3d5698SJohn Baldwin	movq	64-128(%rdi),%xmm13
2690bc3d5698SJohn Baldwin	movq	96-128(%rdi),%xmm5
2691bc3d5698SJohn Baldwin	movq	128-128(%rdi),%xmm8
2692bc3d5698SJohn Baldwin	movq	160-128(%rdi),%xmm9
2693bc3d5698SJohn Baldwin	movq	192-128(%rdi),%xmm10
2694bc3d5698SJohn Baldwin	movq	224-128(%rdi),%xmm11
2695bc3d5698SJohn Baldwin
2696bc3d5698SJohn Baldwin	punpckldq	%xmm4,%xmm12
2697bc3d5698SJohn Baldwin	punpckldq	%xmm5,%xmm13
2698bc3d5698SJohn Baldwin	punpckldq	%xmm9,%xmm8
2699bc3d5698SJohn Baldwin	punpckldq	%xmm11,%xmm10
2700bc3d5698SJohn Baldwin	movdqa	K256_shaext-16(%rip),%xmm3
2701bc3d5698SJohn Baldwin
2702bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm14
2703bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm15
2704bc3d5698SJohn Baldwin	punpcklqdq	%xmm8,%xmm12
2705bc3d5698SJohn Baldwin	punpcklqdq	%xmm10,%xmm13
2706bc3d5698SJohn Baldwin	punpckhqdq	%xmm8,%xmm14
2707bc3d5698SJohn Baldwin	punpckhqdq	%xmm10,%xmm15
2708bc3d5698SJohn Baldwin
2709bc3d5698SJohn Baldwin	pshufd	$27,%xmm12,%xmm12
2710bc3d5698SJohn Baldwin	pshufd	$27,%xmm13,%xmm13
2711bc3d5698SJohn Baldwin	pshufd	$27,%xmm14,%xmm14
2712bc3d5698SJohn Baldwin	pshufd	$27,%xmm15,%xmm15
2713bc3d5698SJohn Baldwin	jmp	.Loop_shaext
2714bc3d5698SJohn Baldwin
2715bc3d5698SJohn Baldwin.align	32
2716bc3d5698SJohn Baldwin.Loop_shaext:
2717bc3d5698SJohn Baldwin	movdqu	0(%r8),%xmm4
2718bc3d5698SJohn Baldwin	movdqu	0(%r9),%xmm8
2719bc3d5698SJohn Baldwin	movdqu	16(%r8),%xmm5
2720bc3d5698SJohn Baldwin	movdqu	16(%r9),%xmm9
2721bc3d5698SJohn Baldwin	movdqu	32(%r8),%xmm6
2722bc3d5698SJohn Baldwin.byte	102,15,56,0,227
2723bc3d5698SJohn Baldwin	movdqu	32(%r9),%xmm10
2724bc3d5698SJohn Baldwin.byte	102,68,15,56,0,195
2725bc3d5698SJohn Baldwin	movdqu	48(%r8),%xmm7
2726bc3d5698SJohn Baldwin	leaq	64(%r8),%r8
2727bc3d5698SJohn Baldwin	movdqu	48(%r9),%xmm11
2728bc3d5698SJohn Baldwin	leaq	64(%r9),%r9
2729bc3d5698SJohn Baldwin
2730bc3d5698SJohn Baldwin	movdqa	0-128(%rbp),%xmm0
2731bc3d5698SJohn Baldwin.byte	102,15,56,0,235
2732bc3d5698SJohn Baldwin	paddd	%xmm4,%xmm0
2733bc3d5698SJohn Baldwin	pxor	%xmm12,%xmm4
2734bc3d5698SJohn Baldwin	movdqa	%xmm0,%xmm1
2735bc3d5698SJohn Baldwin	movdqa	0-128(%rbp),%xmm2
2736bc3d5698SJohn Baldwin.byte	102,68,15,56,0,203
2737bc3d5698SJohn Baldwin	paddd	%xmm8,%xmm2
2738bc3d5698SJohn Baldwin	movdqa	%xmm13,80(%rsp)
2739bc3d5698SJohn Baldwin.byte	69,15,56,203,236
2740bc3d5698SJohn Baldwin	pxor	%xmm14,%xmm8
2741bc3d5698SJohn Baldwin	movdqa	%xmm2,%xmm0
2742bc3d5698SJohn Baldwin	movdqa	%xmm15,112(%rsp)
2743bc3d5698SJohn Baldwin.byte	69,15,56,203,254
2744bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm1,%xmm0
2745bc3d5698SJohn Baldwin	pxor	%xmm12,%xmm4
2746bc3d5698SJohn Baldwin	movdqa	%xmm12,64(%rsp)
2747bc3d5698SJohn Baldwin.byte	69,15,56,203,229
2748bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm2,%xmm0
2749bc3d5698SJohn Baldwin	pxor	%xmm14,%xmm8
2750bc3d5698SJohn Baldwin	movdqa	%xmm14,96(%rsp)
2751bc3d5698SJohn Baldwin	movdqa	16-128(%rbp),%xmm1
2752bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm1
2753bc3d5698SJohn Baldwin.byte	102,15,56,0,243
2754bc3d5698SJohn Baldwin.byte	69,15,56,203,247
2755bc3d5698SJohn Baldwin
2756bc3d5698SJohn Baldwin	movdqa	%xmm1,%xmm0
2757bc3d5698SJohn Baldwin	movdqa	16-128(%rbp),%xmm2
2758bc3d5698SJohn Baldwin	paddd	%xmm9,%xmm2
2759bc3d5698SJohn Baldwin.byte	69,15,56,203,236
2760bc3d5698SJohn Baldwin	movdqa	%xmm2,%xmm0
2761bc3d5698SJohn Baldwin	prefetcht0	127(%r8)
2762bc3d5698SJohn Baldwin.byte	102,15,56,0,251
2763bc3d5698SJohn Baldwin.byte	102,68,15,56,0,211
2764bc3d5698SJohn Baldwin	prefetcht0	127(%r9)
2765bc3d5698SJohn Baldwin.byte	69,15,56,203,254
2766bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm1,%xmm0
2767bc3d5698SJohn Baldwin.byte	102,68,15,56,0,219
2768bc3d5698SJohn Baldwin.byte	15,56,204,229
2769bc3d5698SJohn Baldwin.byte	69,15,56,203,229
2770bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm2,%xmm0
2771bc3d5698SJohn Baldwin	movdqa	32-128(%rbp),%xmm1
2772bc3d5698SJohn Baldwin	paddd	%xmm6,%xmm1
2773bc3d5698SJohn Baldwin.byte	69,15,56,203,247
2774bc3d5698SJohn Baldwin
2775bc3d5698SJohn Baldwin	movdqa	%xmm1,%xmm0
2776bc3d5698SJohn Baldwin	movdqa	32-128(%rbp),%xmm2
2777bc3d5698SJohn Baldwin	paddd	%xmm10,%xmm2
2778bc3d5698SJohn Baldwin.byte	69,15,56,203,236
2779bc3d5698SJohn Baldwin.byte	69,15,56,204,193
2780bc3d5698SJohn Baldwin	movdqa	%xmm2,%xmm0
2781bc3d5698SJohn Baldwin	movdqa	%xmm7,%xmm3
2782bc3d5698SJohn Baldwin.byte	69,15,56,203,254
2783bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm1,%xmm0
2784bc3d5698SJohn Baldwin.byte	102,15,58,15,222,4
2785bc3d5698SJohn Baldwin	paddd	%xmm3,%xmm4
2786bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm3
2787bc3d5698SJohn Baldwin.byte	102,65,15,58,15,218,4
2788bc3d5698SJohn Baldwin.byte	15,56,204,238
2789bc3d5698SJohn Baldwin.byte	69,15,56,203,229
2790bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm2,%xmm0
2791bc3d5698SJohn Baldwin	movdqa	48-128(%rbp),%xmm1
2792bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm1
2793bc3d5698SJohn Baldwin.byte	69,15,56,203,247
2794bc3d5698SJohn Baldwin.byte	69,15,56,204,202
2795bc3d5698SJohn Baldwin
2796bc3d5698SJohn Baldwin	movdqa	%xmm1,%xmm0
2797bc3d5698SJohn Baldwin	movdqa	48-128(%rbp),%xmm2
2798bc3d5698SJohn Baldwin	paddd	%xmm3,%xmm8
2799bc3d5698SJohn Baldwin	paddd	%xmm11,%xmm2
2800bc3d5698SJohn Baldwin.byte	15,56,205,231
2801bc3d5698SJohn Baldwin.byte	69,15,56,203,236
2802bc3d5698SJohn Baldwin	movdqa	%xmm2,%xmm0
2803bc3d5698SJohn Baldwin	movdqa	%xmm4,%xmm3
2804bc3d5698SJohn Baldwin.byte	102,15,58,15,223,4
2805bc3d5698SJohn Baldwin.byte	69,15,56,203,254
2806bc3d5698SJohn Baldwin.byte	69,15,56,205,195
2807bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm1,%xmm0
2808bc3d5698SJohn Baldwin	paddd	%xmm3,%xmm5
2809bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm3
2810bc3d5698SJohn Baldwin.byte	102,65,15,58,15,219,4
2811bc3d5698SJohn Baldwin.byte	15,56,204,247
2812bc3d5698SJohn Baldwin.byte	69,15,56,203,229
2813bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm2,%xmm0
2814bc3d5698SJohn Baldwin	movdqa	64-128(%rbp),%xmm1
2815bc3d5698SJohn Baldwin	paddd	%xmm4,%xmm1
2816bc3d5698SJohn Baldwin.byte	69,15,56,203,247
2817bc3d5698SJohn Baldwin.byte	69,15,56,204,211
2818bc3d5698SJohn Baldwin	movdqa	%xmm1,%xmm0
2819bc3d5698SJohn Baldwin	movdqa	64-128(%rbp),%xmm2
2820bc3d5698SJohn Baldwin	paddd	%xmm3,%xmm9
2821bc3d5698SJohn Baldwin	paddd	%xmm8,%xmm2
2822bc3d5698SJohn Baldwin.byte	15,56,205,236
2823bc3d5698SJohn Baldwin.byte	69,15,56,203,236
2824bc3d5698SJohn Baldwin	movdqa	%xmm2,%xmm0
2825bc3d5698SJohn Baldwin	movdqa	%xmm5,%xmm3
2826bc3d5698SJohn Baldwin.byte	102,15,58,15,220,4
2827bc3d5698SJohn Baldwin.byte	69,15,56,203,254
2828bc3d5698SJohn Baldwin.byte	69,15,56,205,200
2829bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm1,%xmm0
2830bc3d5698SJohn Baldwin	paddd	%xmm3,%xmm6
2831bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm3
2832bc3d5698SJohn Baldwin.byte	102,65,15,58,15,216,4
2833bc3d5698SJohn Baldwin.byte	15,56,204,252
2834bc3d5698SJohn Baldwin.byte	69,15,56,203,229
2835bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm2,%xmm0
2836bc3d5698SJohn Baldwin	movdqa	80-128(%rbp),%xmm1
2837bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm1
2838bc3d5698SJohn Baldwin.byte	69,15,56,203,247
2839bc3d5698SJohn Baldwin.byte	69,15,56,204,216
2840bc3d5698SJohn Baldwin	movdqa	%xmm1,%xmm0
2841bc3d5698SJohn Baldwin	movdqa	80-128(%rbp),%xmm2
2842bc3d5698SJohn Baldwin	paddd	%xmm3,%xmm10
2843bc3d5698SJohn Baldwin	paddd	%xmm9,%xmm2
2844bc3d5698SJohn Baldwin.byte	15,56,205,245
2845bc3d5698SJohn Baldwin.byte	69,15,56,203,236
2846bc3d5698SJohn Baldwin	movdqa	%xmm2,%xmm0
2847bc3d5698SJohn Baldwin	movdqa	%xmm6,%xmm3
2848bc3d5698SJohn Baldwin.byte	102,15,58,15,221,4
2849bc3d5698SJohn Baldwin.byte	69,15,56,203,254
2850bc3d5698SJohn Baldwin.byte	69,15,56,205,209
2851bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm1,%xmm0
2852bc3d5698SJohn Baldwin	paddd	%xmm3,%xmm7
2853bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm3
2854bc3d5698SJohn Baldwin.byte	102,65,15,58,15,217,4
2855bc3d5698SJohn Baldwin.byte	15,56,204,229
2856bc3d5698SJohn Baldwin.byte	69,15,56,203,229
2857bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm2,%xmm0
2858bc3d5698SJohn Baldwin	movdqa	96-128(%rbp),%xmm1
2859bc3d5698SJohn Baldwin	paddd	%xmm6,%xmm1
2860bc3d5698SJohn Baldwin.byte	69,15,56,203,247
2861bc3d5698SJohn Baldwin.byte	69,15,56,204,193
2862bc3d5698SJohn Baldwin	movdqa	%xmm1,%xmm0
2863bc3d5698SJohn Baldwin	movdqa	96-128(%rbp),%xmm2
2864bc3d5698SJohn Baldwin	paddd	%xmm3,%xmm11
2865bc3d5698SJohn Baldwin	paddd	%xmm10,%xmm2
2866bc3d5698SJohn Baldwin.byte	15,56,205,254
2867bc3d5698SJohn Baldwin.byte	69,15,56,203,236
2868bc3d5698SJohn Baldwin	movdqa	%xmm2,%xmm0
2869bc3d5698SJohn Baldwin	movdqa	%xmm7,%xmm3
2870bc3d5698SJohn Baldwin.byte	102,15,58,15,222,4
2871bc3d5698SJohn Baldwin.byte	69,15,56,203,254
2872bc3d5698SJohn Baldwin.byte	69,15,56,205,218
2873bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm1,%xmm0
2874bc3d5698SJohn Baldwin	paddd	%xmm3,%xmm4
2875bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm3
2876bc3d5698SJohn Baldwin.byte	102,65,15,58,15,218,4
2877bc3d5698SJohn Baldwin.byte	15,56,204,238
2878bc3d5698SJohn Baldwin.byte	69,15,56,203,229
2879bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm2,%xmm0
2880bc3d5698SJohn Baldwin	movdqa	112-128(%rbp),%xmm1
2881bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm1
2882bc3d5698SJohn Baldwin.byte	69,15,56,203,247
2883bc3d5698SJohn Baldwin.byte	69,15,56,204,202
2884bc3d5698SJohn Baldwin	movdqa	%xmm1,%xmm0
2885bc3d5698SJohn Baldwin	movdqa	112-128(%rbp),%xmm2
2886bc3d5698SJohn Baldwin	paddd	%xmm3,%xmm8
2887bc3d5698SJohn Baldwin	paddd	%xmm11,%xmm2
2888bc3d5698SJohn Baldwin.byte	15,56,205,231
2889bc3d5698SJohn Baldwin.byte	69,15,56,203,236
2890bc3d5698SJohn Baldwin	movdqa	%xmm2,%xmm0
2891bc3d5698SJohn Baldwin	movdqa	%xmm4,%xmm3
2892bc3d5698SJohn Baldwin.byte	102,15,58,15,223,4
2893bc3d5698SJohn Baldwin.byte	69,15,56,203,254
2894bc3d5698SJohn Baldwin.byte	69,15,56,205,195
2895bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm1,%xmm0
2896bc3d5698SJohn Baldwin	paddd	%xmm3,%xmm5
2897bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm3
2898bc3d5698SJohn Baldwin.byte	102,65,15,58,15,219,4
2899bc3d5698SJohn Baldwin.byte	15,56,204,247
2900bc3d5698SJohn Baldwin.byte	69,15,56,203,229
2901bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm2,%xmm0
2902bc3d5698SJohn Baldwin	movdqa	128-128(%rbp),%xmm1
2903bc3d5698SJohn Baldwin	paddd	%xmm4,%xmm1
2904bc3d5698SJohn Baldwin.byte	69,15,56,203,247
2905bc3d5698SJohn Baldwin.byte	69,15,56,204,211
2906bc3d5698SJohn Baldwin	movdqa	%xmm1,%xmm0
2907bc3d5698SJohn Baldwin	movdqa	128-128(%rbp),%xmm2
2908bc3d5698SJohn Baldwin	paddd	%xmm3,%xmm9
2909bc3d5698SJohn Baldwin	paddd	%xmm8,%xmm2
2910bc3d5698SJohn Baldwin.byte	15,56,205,236
2911bc3d5698SJohn Baldwin.byte	69,15,56,203,236
2912bc3d5698SJohn Baldwin	movdqa	%xmm2,%xmm0
2913bc3d5698SJohn Baldwin	movdqa	%xmm5,%xmm3
2914bc3d5698SJohn Baldwin.byte	102,15,58,15,220,4
2915bc3d5698SJohn Baldwin.byte	69,15,56,203,254
2916bc3d5698SJohn Baldwin.byte	69,15,56,205,200
2917bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm1,%xmm0
2918bc3d5698SJohn Baldwin	paddd	%xmm3,%xmm6
2919bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm3
2920bc3d5698SJohn Baldwin.byte	102,65,15,58,15,216,4
2921bc3d5698SJohn Baldwin.byte	15,56,204,252
2922bc3d5698SJohn Baldwin.byte	69,15,56,203,229
2923bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm2,%xmm0
2924bc3d5698SJohn Baldwin	movdqa	144-128(%rbp),%xmm1
2925bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm1
2926bc3d5698SJohn Baldwin.byte	69,15,56,203,247
2927bc3d5698SJohn Baldwin.byte	69,15,56,204,216
2928bc3d5698SJohn Baldwin	movdqa	%xmm1,%xmm0
2929bc3d5698SJohn Baldwin	movdqa	144-128(%rbp),%xmm2
2930bc3d5698SJohn Baldwin	paddd	%xmm3,%xmm10
2931bc3d5698SJohn Baldwin	paddd	%xmm9,%xmm2
2932bc3d5698SJohn Baldwin.byte	15,56,205,245
2933bc3d5698SJohn Baldwin.byte	69,15,56,203,236
2934bc3d5698SJohn Baldwin	movdqa	%xmm2,%xmm0
2935bc3d5698SJohn Baldwin	movdqa	%xmm6,%xmm3
2936bc3d5698SJohn Baldwin.byte	102,15,58,15,221,4
2937bc3d5698SJohn Baldwin.byte	69,15,56,203,254
2938bc3d5698SJohn Baldwin.byte	69,15,56,205,209
2939bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm1,%xmm0
2940bc3d5698SJohn Baldwin	paddd	%xmm3,%xmm7
2941bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm3
2942bc3d5698SJohn Baldwin.byte	102,65,15,58,15,217,4
2943bc3d5698SJohn Baldwin.byte	15,56,204,229
2944bc3d5698SJohn Baldwin.byte	69,15,56,203,229
2945bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm2,%xmm0
2946bc3d5698SJohn Baldwin	movdqa	160-128(%rbp),%xmm1
2947bc3d5698SJohn Baldwin	paddd	%xmm6,%xmm1
2948bc3d5698SJohn Baldwin.byte	69,15,56,203,247
2949bc3d5698SJohn Baldwin.byte	69,15,56,204,193
2950bc3d5698SJohn Baldwin	movdqa	%xmm1,%xmm0
2951bc3d5698SJohn Baldwin	movdqa	160-128(%rbp),%xmm2
2952bc3d5698SJohn Baldwin	paddd	%xmm3,%xmm11
2953bc3d5698SJohn Baldwin	paddd	%xmm10,%xmm2
2954bc3d5698SJohn Baldwin.byte	15,56,205,254
2955bc3d5698SJohn Baldwin.byte	69,15,56,203,236
2956bc3d5698SJohn Baldwin	movdqa	%xmm2,%xmm0
2957bc3d5698SJohn Baldwin	movdqa	%xmm7,%xmm3
2958bc3d5698SJohn Baldwin.byte	102,15,58,15,222,4
2959bc3d5698SJohn Baldwin.byte	69,15,56,203,254
2960bc3d5698SJohn Baldwin.byte	69,15,56,205,218
2961bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm1,%xmm0
2962bc3d5698SJohn Baldwin	paddd	%xmm3,%xmm4
2963bc3d5698SJohn Baldwin	movdqa	%xmm11,%xmm3
2964bc3d5698SJohn Baldwin.byte	102,65,15,58,15,218,4
2965bc3d5698SJohn Baldwin.byte	15,56,204,238
2966bc3d5698SJohn Baldwin.byte	69,15,56,203,229
2967bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm2,%xmm0
2968bc3d5698SJohn Baldwin	movdqa	176-128(%rbp),%xmm1
2969bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm1
2970bc3d5698SJohn Baldwin.byte	69,15,56,203,247
2971bc3d5698SJohn Baldwin.byte	69,15,56,204,202
2972bc3d5698SJohn Baldwin	movdqa	%xmm1,%xmm0
2973bc3d5698SJohn Baldwin	movdqa	176-128(%rbp),%xmm2
2974bc3d5698SJohn Baldwin	paddd	%xmm3,%xmm8
2975bc3d5698SJohn Baldwin	paddd	%xmm11,%xmm2
2976bc3d5698SJohn Baldwin.byte	15,56,205,231
2977bc3d5698SJohn Baldwin.byte	69,15,56,203,236
2978bc3d5698SJohn Baldwin	movdqa	%xmm2,%xmm0
2979bc3d5698SJohn Baldwin	movdqa	%xmm4,%xmm3
2980bc3d5698SJohn Baldwin.byte	102,15,58,15,223,4
2981bc3d5698SJohn Baldwin.byte	69,15,56,203,254
2982bc3d5698SJohn Baldwin.byte	69,15,56,205,195
2983bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm1,%xmm0
2984bc3d5698SJohn Baldwin	paddd	%xmm3,%xmm5
2985bc3d5698SJohn Baldwin	movdqa	%xmm8,%xmm3
2986bc3d5698SJohn Baldwin.byte	102,65,15,58,15,219,4
2987bc3d5698SJohn Baldwin.byte	15,56,204,247
2988bc3d5698SJohn Baldwin.byte	69,15,56,203,229
2989bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm2,%xmm0
2990bc3d5698SJohn Baldwin	movdqa	192-128(%rbp),%xmm1
2991bc3d5698SJohn Baldwin	paddd	%xmm4,%xmm1
2992bc3d5698SJohn Baldwin.byte	69,15,56,203,247
2993bc3d5698SJohn Baldwin.byte	69,15,56,204,211
2994bc3d5698SJohn Baldwin	movdqa	%xmm1,%xmm0
2995bc3d5698SJohn Baldwin	movdqa	192-128(%rbp),%xmm2
2996bc3d5698SJohn Baldwin	paddd	%xmm3,%xmm9
2997bc3d5698SJohn Baldwin	paddd	%xmm8,%xmm2
2998bc3d5698SJohn Baldwin.byte	15,56,205,236
2999bc3d5698SJohn Baldwin.byte	69,15,56,203,236
3000bc3d5698SJohn Baldwin	movdqa	%xmm2,%xmm0
3001bc3d5698SJohn Baldwin	movdqa	%xmm5,%xmm3
3002bc3d5698SJohn Baldwin.byte	102,15,58,15,220,4
3003bc3d5698SJohn Baldwin.byte	69,15,56,203,254
3004bc3d5698SJohn Baldwin.byte	69,15,56,205,200
3005bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm1,%xmm0
3006bc3d5698SJohn Baldwin	paddd	%xmm3,%xmm6
3007bc3d5698SJohn Baldwin	movdqa	%xmm9,%xmm3
3008bc3d5698SJohn Baldwin.byte	102,65,15,58,15,216,4
3009bc3d5698SJohn Baldwin.byte	15,56,204,252
3010bc3d5698SJohn Baldwin.byte	69,15,56,203,229
3011bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm2,%xmm0
3012bc3d5698SJohn Baldwin	movdqa	208-128(%rbp),%xmm1
3013bc3d5698SJohn Baldwin	paddd	%xmm5,%xmm1
3014bc3d5698SJohn Baldwin.byte	69,15,56,203,247
3015bc3d5698SJohn Baldwin.byte	69,15,56,204,216
3016bc3d5698SJohn Baldwin	movdqa	%xmm1,%xmm0
3017bc3d5698SJohn Baldwin	movdqa	208-128(%rbp),%xmm2
3018bc3d5698SJohn Baldwin	paddd	%xmm3,%xmm10
3019bc3d5698SJohn Baldwin	paddd	%xmm9,%xmm2
3020bc3d5698SJohn Baldwin.byte	15,56,205,245
3021bc3d5698SJohn Baldwin.byte	69,15,56,203,236
3022bc3d5698SJohn Baldwin	movdqa	%xmm2,%xmm0
3023bc3d5698SJohn Baldwin	movdqa	%xmm6,%xmm3
3024bc3d5698SJohn Baldwin.byte	102,15,58,15,221,4
3025bc3d5698SJohn Baldwin.byte	69,15,56,203,254
3026bc3d5698SJohn Baldwin.byte	69,15,56,205,209
3027bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm1,%xmm0
3028bc3d5698SJohn Baldwin	paddd	%xmm3,%xmm7
3029bc3d5698SJohn Baldwin	movdqa	%xmm10,%xmm3
3030bc3d5698SJohn Baldwin.byte	102,65,15,58,15,217,4
3031bc3d5698SJohn Baldwin	nop
3032bc3d5698SJohn Baldwin.byte	69,15,56,203,229
3033bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm2,%xmm0
3034bc3d5698SJohn Baldwin	movdqa	224-128(%rbp),%xmm1
3035bc3d5698SJohn Baldwin	paddd	%xmm6,%xmm1
3036bc3d5698SJohn Baldwin.byte	69,15,56,203,247
3037bc3d5698SJohn Baldwin
3038bc3d5698SJohn Baldwin	movdqa	%xmm1,%xmm0
3039bc3d5698SJohn Baldwin	movdqa	224-128(%rbp),%xmm2
3040bc3d5698SJohn Baldwin	paddd	%xmm3,%xmm11
3041bc3d5698SJohn Baldwin	paddd	%xmm10,%xmm2
3042bc3d5698SJohn Baldwin.byte	15,56,205,254
3043bc3d5698SJohn Baldwin	nop
3044bc3d5698SJohn Baldwin.byte	69,15,56,203,236
3045bc3d5698SJohn Baldwin	movdqa	%xmm2,%xmm0
3046bc3d5698SJohn Baldwin	movl	$1,%ecx
3047bc3d5698SJohn Baldwin	pxor	%xmm6,%xmm6
3048bc3d5698SJohn Baldwin.byte	69,15,56,203,254
3049bc3d5698SJohn Baldwin.byte	69,15,56,205,218
3050bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm1,%xmm0
3051bc3d5698SJohn Baldwin	movdqa	240-128(%rbp),%xmm1
3052bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm1
3053bc3d5698SJohn Baldwin	movq	(%rbx),%xmm7
3054bc3d5698SJohn Baldwin	nop
3055bc3d5698SJohn Baldwin.byte	69,15,56,203,229
3056bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm2,%xmm0
3057bc3d5698SJohn Baldwin	movdqa	240-128(%rbp),%xmm2
3058bc3d5698SJohn Baldwin	paddd	%xmm11,%xmm2
3059bc3d5698SJohn Baldwin.byte	69,15,56,203,247
3060bc3d5698SJohn Baldwin
3061bc3d5698SJohn Baldwin	movdqa	%xmm1,%xmm0
3062bc3d5698SJohn Baldwin	cmpl	0(%rbx),%ecx
3063bc3d5698SJohn Baldwin	cmovgeq	%rsp,%r8
3064bc3d5698SJohn Baldwin	cmpl	4(%rbx),%ecx
3065bc3d5698SJohn Baldwin	cmovgeq	%rsp,%r9
3066bc3d5698SJohn Baldwin	pshufd	$0x00,%xmm7,%xmm9
3067bc3d5698SJohn Baldwin.byte	69,15,56,203,236
3068bc3d5698SJohn Baldwin	movdqa	%xmm2,%xmm0
3069bc3d5698SJohn Baldwin	pshufd	$0x55,%xmm7,%xmm10
3070bc3d5698SJohn Baldwin	movdqa	%xmm7,%xmm11
3071bc3d5698SJohn Baldwin.byte	69,15,56,203,254
3072bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm1,%xmm0
3073bc3d5698SJohn Baldwin	pcmpgtd	%xmm6,%xmm9
3074bc3d5698SJohn Baldwin	pcmpgtd	%xmm6,%xmm10
3075bc3d5698SJohn Baldwin.byte	69,15,56,203,229
3076bc3d5698SJohn Baldwin	pshufd	$0x0e,%xmm2,%xmm0
3077bc3d5698SJohn Baldwin	pcmpgtd	%xmm6,%xmm11
3078bc3d5698SJohn Baldwin	movdqa	K256_shaext-16(%rip),%xmm3
3079bc3d5698SJohn Baldwin.byte	69,15,56,203,247
3080bc3d5698SJohn Baldwin
3081bc3d5698SJohn Baldwin	pand	%xmm9,%xmm13
3082bc3d5698SJohn Baldwin	pand	%xmm10,%xmm15
3083bc3d5698SJohn Baldwin	pand	%xmm9,%xmm12
3084bc3d5698SJohn Baldwin	pand	%xmm10,%xmm14
3085bc3d5698SJohn Baldwin	paddd	%xmm7,%xmm11
3086bc3d5698SJohn Baldwin
3087bc3d5698SJohn Baldwin	paddd	80(%rsp),%xmm13
3088bc3d5698SJohn Baldwin	paddd	112(%rsp),%xmm15
3089bc3d5698SJohn Baldwin	paddd	64(%rsp),%xmm12
3090bc3d5698SJohn Baldwin	paddd	96(%rsp),%xmm14
3091bc3d5698SJohn Baldwin
3092bc3d5698SJohn Baldwin	movq	%xmm11,(%rbx)
3093bc3d5698SJohn Baldwin	decl	%edx
3094bc3d5698SJohn Baldwin	jnz	.Loop_shaext
3095bc3d5698SJohn Baldwin
3096bc3d5698SJohn Baldwin	movl	280(%rsp),%edx
3097bc3d5698SJohn Baldwin
3098bc3d5698SJohn Baldwin	pshufd	$27,%xmm12,%xmm12
3099bc3d5698SJohn Baldwin	pshufd	$27,%xmm13,%xmm13
3100bc3d5698SJohn Baldwin	pshufd	$27,%xmm14,%xmm14
3101bc3d5698SJohn Baldwin	pshufd	$27,%xmm15,%xmm15
3102bc3d5698SJohn Baldwin
3103bc3d5698SJohn Baldwin	movdqa	%xmm12,%xmm5
3104bc3d5698SJohn Baldwin	movdqa	%xmm13,%xmm6
3105bc3d5698SJohn Baldwin	punpckldq	%xmm14,%xmm12
3106bc3d5698SJohn Baldwin	punpckhdq	%xmm14,%xmm5
3107bc3d5698SJohn Baldwin	punpckldq	%xmm15,%xmm13
3108bc3d5698SJohn Baldwin	punpckhdq	%xmm15,%xmm6
3109bc3d5698SJohn Baldwin
3110bc3d5698SJohn Baldwin	movq	%xmm12,0-128(%rdi)
3111bc3d5698SJohn Baldwin	psrldq	$8,%xmm12
3112bc3d5698SJohn Baldwin	movq	%xmm5,128-128(%rdi)
3113bc3d5698SJohn Baldwin	psrldq	$8,%xmm5
3114bc3d5698SJohn Baldwin	movq	%xmm12,32-128(%rdi)
3115bc3d5698SJohn Baldwin	movq	%xmm5,160-128(%rdi)
3116bc3d5698SJohn Baldwin
3117bc3d5698SJohn Baldwin	movq	%xmm13,64-128(%rdi)
3118bc3d5698SJohn Baldwin	psrldq	$8,%xmm13
3119bc3d5698SJohn Baldwin	movq	%xmm6,192-128(%rdi)
3120bc3d5698SJohn Baldwin	psrldq	$8,%xmm6
3121bc3d5698SJohn Baldwin	movq	%xmm13,96-128(%rdi)
3122bc3d5698SJohn Baldwin	movq	%xmm6,224-128(%rdi)
3123bc3d5698SJohn Baldwin
3124bc3d5698SJohn Baldwin	leaq	8(%rdi),%rdi
3125bc3d5698SJohn Baldwin	leaq	32(%rsi),%rsi
3126bc3d5698SJohn Baldwin	decl	%edx
3127bc3d5698SJohn Baldwin	jnz	.Loop_grande_shaext
3128bc3d5698SJohn Baldwin
3129bc3d5698SJohn Baldwin.Ldone_shaext:
3130bc3d5698SJohn Baldwin
3131bc3d5698SJohn Baldwin	movq	-16(%rax),%rbp
3132bc3d5698SJohn Baldwin.cfi_restore	%rbp
3133bc3d5698SJohn Baldwin	movq	-8(%rax),%rbx
3134bc3d5698SJohn Baldwin.cfi_restore	%rbx
3135bc3d5698SJohn Baldwin	leaq	(%rax),%rsp
3136bc3d5698SJohn Baldwin.cfi_def_cfa_register	%rsp
3137bc3d5698SJohn Baldwin.Lepilogue_shaext:
3138bc3d5698SJohn Baldwin	.byte	0xf3,0xc3
3139bc3d5698SJohn Baldwin.cfi_endproc
3140bc3d5698SJohn Baldwin.size	sha256_multi_block_shaext,.-sha256_multi_block_shaext
3141bc3d5698SJohn Baldwin.type	sha256_multi_block_avx,@function
3142bc3d5698SJohn Baldwin.align	32
3143bc3d5698SJohn Baldwinsha256_multi_block_avx:
3144bc3d5698SJohn Baldwin.cfi_startproc
3145bc3d5698SJohn Baldwin_avx_shortcut:
3146bc3d5698SJohn Baldwin	shrq	$32,%rcx
3147bc3d5698SJohn Baldwin	cmpl	$2,%edx
3148bc3d5698SJohn Baldwin	jb	.Lavx
3149bc3d5698SJohn Baldwin	testl	$32,%ecx
3150bc3d5698SJohn Baldwin	jnz	_avx2_shortcut
3151bc3d5698SJohn Baldwin	jmp	.Lavx
3152bc3d5698SJohn Baldwin.align	32
3153bc3d5698SJohn Baldwin.Lavx:
3154bc3d5698SJohn Baldwin	movq	%rsp,%rax
3155bc3d5698SJohn Baldwin.cfi_def_cfa_register	%rax
3156bc3d5698SJohn Baldwin	pushq	%rbx
3157bc3d5698SJohn Baldwin.cfi_offset	%rbx,-16
3158bc3d5698SJohn Baldwin	pushq	%rbp
3159bc3d5698SJohn Baldwin.cfi_offset	%rbp,-24
3160bc3d5698SJohn Baldwin	subq	$288,%rsp
3161bc3d5698SJohn Baldwin	andq	$-256,%rsp
3162bc3d5698SJohn Baldwin	movq	%rax,272(%rsp)
3163bc3d5698SJohn Baldwin.cfi_escape	0x0f,0x06,0x77,0x90,0x02,0x06,0x23,0x08
3164bc3d5698SJohn Baldwin.Lbody_avx:
3165bc3d5698SJohn Baldwin	leaq	K256+128(%rip),%rbp
3166bc3d5698SJohn Baldwin	leaq	256(%rsp),%rbx
3167bc3d5698SJohn Baldwin	leaq	128(%rdi),%rdi
3168bc3d5698SJohn Baldwin
3169bc3d5698SJohn Baldwin.Loop_grande_avx:
3170bc3d5698SJohn Baldwin	movl	%edx,280(%rsp)
3171bc3d5698SJohn Baldwin	xorl	%edx,%edx
3172*c0855eaaSJohn Baldwin
3173bc3d5698SJohn Baldwin	movq	0(%rsi),%r8
3174*c0855eaaSJohn Baldwin
3175bc3d5698SJohn Baldwin	movl	8(%rsi),%ecx
3176bc3d5698SJohn Baldwin	cmpl	%edx,%ecx
3177bc3d5698SJohn Baldwin	cmovgl	%ecx,%edx
3178bc3d5698SJohn Baldwin	testl	%ecx,%ecx
3179bc3d5698SJohn Baldwin	movl	%ecx,0(%rbx)
3180bc3d5698SJohn Baldwin	cmovleq	%rbp,%r8
3181*c0855eaaSJohn Baldwin
3182bc3d5698SJohn Baldwin	movq	16(%rsi),%r9
3183*c0855eaaSJohn Baldwin
3184bc3d5698SJohn Baldwin	movl	24(%rsi),%ecx
3185bc3d5698SJohn Baldwin	cmpl	%edx,%ecx
3186bc3d5698SJohn Baldwin	cmovgl	%ecx,%edx
3187bc3d5698SJohn Baldwin	testl	%ecx,%ecx
3188bc3d5698SJohn Baldwin	movl	%ecx,4(%rbx)
3189bc3d5698SJohn Baldwin	cmovleq	%rbp,%r9
3190*c0855eaaSJohn Baldwin
3191bc3d5698SJohn Baldwin	movq	32(%rsi),%r10
3192*c0855eaaSJohn Baldwin
3193bc3d5698SJohn Baldwin	movl	40(%rsi),%ecx
3194bc3d5698SJohn Baldwin	cmpl	%edx,%ecx
3195bc3d5698SJohn Baldwin	cmovgl	%ecx,%edx
3196bc3d5698SJohn Baldwin	testl	%ecx,%ecx
3197bc3d5698SJohn Baldwin	movl	%ecx,8(%rbx)
3198bc3d5698SJohn Baldwin	cmovleq	%rbp,%r10
3199*c0855eaaSJohn Baldwin
3200bc3d5698SJohn Baldwin	movq	48(%rsi),%r11
3201*c0855eaaSJohn Baldwin
3202bc3d5698SJohn Baldwin	movl	56(%rsi),%ecx
3203bc3d5698SJohn Baldwin	cmpl	%edx,%ecx
3204bc3d5698SJohn Baldwin	cmovgl	%ecx,%edx
3205bc3d5698SJohn Baldwin	testl	%ecx,%ecx
3206bc3d5698SJohn Baldwin	movl	%ecx,12(%rbx)
3207bc3d5698SJohn Baldwin	cmovleq	%rbp,%r11
3208bc3d5698SJohn Baldwin	testl	%edx,%edx
3209bc3d5698SJohn Baldwin	jz	.Ldone_avx
3210bc3d5698SJohn Baldwin
3211bc3d5698SJohn Baldwin	vmovdqu	0-128(%rdi),%xmm8
3212bc3d5698SJohn Baldwin	leaq	128(%rsp),%rax
3213bc3d5698SJohn Baldwin	vmovdqu	32-128(%rdi),%xmm9
3214bc3d5698SJohn Baldwin	vmovdqu	64-128(%rdi),%xmm10
3215bc3d5698SJohn Baldwin	vmovdqu	96-128(%rdi),%xmm11
3216bc3d5698SJohn Baldwin	vmovdqu	128-128(%rdi),%xmm12
3217bc3d5698SJohn Baldwin	vmovdqu	160-128(%rdi),%xmm13
3218bc3d5698SJohn Baldwin	vmovdqu	192-128(%rdi),%xmm14
3219bc3d5698SJohn Baldwin	vmovdqu	224-128(%rdi),%xmm15
3220bc3d5698SJohn Baldwin	vmovdqu	.Lpbswap(%rip),%xmm6
3221bc3d5698SJohn Baldwin	jmp	.Loop_avx
3222bc3d5698SJohn Baldwin
3223bc3d5698SJohn Baldwin.align	32
3224bc3d5698SJohn Baldwin.Loop_avx:
3225bc3d5698SJohn Baldwin	vpxor	%xmm9,%xmm10,%xmm4
3226bc3d5698SJohn Baldwin	vmovd	0(%r8),%xmm5
3227bc3d5698SJohn Baldwin	vmovd	0(%r9),%xmm0
3228bc3d5698SJohn Baldwin	vpinsrd	$1,0(%r10),%xmm5,%xmm5
3229bc3d5698SJohn Baldwin	vpinsrd	$1,0(%r11),%xmm0,%xmm0
3230bc3d5698SJohn Baldwin	vpunpckldq	%xmm0,%xmm5,%xmm5
3231bc3d5698SJohn Baldwin	vpshufb	%xmm6,%xmm5,%xmm5
3232bc3d5698SJohn Baldwin	vpsrld	$6,%xmm12,%xmm7
3233bc3d5698SJohn Baldwin	vpslld	$26,%xmm12,%xmm2
3234bc3d5698SJohn Baldwin	vmovdqu	%xmm5,0-128(%rax)
3235bc3d5698SJohn Baldwin	vpaddd	%xmm15,%xmm5,%xmm5
3236bc3d5698SJohn Baldwin
3237bc3d5698SJohn Baldwin	vpsrld	$11,%xmm12,%xmm1
3238bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3239bc3d5698SJohn Baldwin	vpslld	$21,%xmm12,%xmm2
3240bc3d5698SJohn Baldwin	vpaddd	-128(%rbp),%xmm5,%xmm5
3241bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3242bc3d5698SJohn Baldwin
3243bc3d5698SJohn Baldwin	vpsrld	$25,%xmm12,%xmm1
3244bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3245bc3d5698SJohn Baldwin
3246bc3d5698SJohn Baldwin	vpslld	$7,%xmm12,%xmm2
3247bc3d5698SJohn Baldwin	vpandn	%xmm14,%xmm12,%xmm0
3248bc3d5698SJohn Baldwin	vpand	%xmm13,%xmm12,%xmm3
3249bc3d5698SJohn Baldwin
3250bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3251bc3d5698SJohn Baldwin
3252bc3d5698SJohn Baldwin	vpsrld	$2,%xmm8,%xmm15
3253bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3254bc3d5698SJohn Baldwin
3255bc3d5698SJohn Baldwin	vpslld	$30,%xmm8,%xmm1
3256bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm0,%xmm0
3257bc3d5698SJohn Baldwin	vpxor	%xmm8,%xmm9,%xmm3
3258bc3d5698SJohn Baldwin
3259bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm15,%xmm15
3260bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
3261bc3d5698SJohn Baldwin
3262bc3d5698SJohn Baldwin	vpsrld	$13,%xmm8,%xmm1
3263bc3d5698SJohn Baldwin
3264bc3d5698SJohn Baldwin	vpslld	$19,%xmm8,%xmm2
3265bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm5,%xmm5
3266bc3d5698SJohn Baldwin	vpand	%xmm3,%xmm4,%xmm4
3267bc3d5698SJohn Baldwin
3268bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm15,%xmm7
3269bc3d5698SJohn Baldwin
3270bc3d5698SJohn Baldwin	vpsrld	$22,%xmm8,%xmm1
3271bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3272bc3d5698SJohn Baldwin
3273bc3d5698SJohn Baldwin	vpslld	$10,%xmm8,%xmm2
3274bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm9,%xmm15
3275bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm11,%xmm11
3276bc3d5698SJohn Baldwin
3277bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3278bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3279bc3d5698SJohn Baldwin
3280bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm15,%xmm15
3281bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm15,%xmm15
3282bc3d5698SJohn Baldwin	vmovd	4(%r8),%xmm5
3283bc3d5698SJohn Baldwin	vmovd	4(%r9),%xmm0
3284bc3d5698SJohn Baldwin	vpinsrd	$1,4(%r10),%xmm5,%xmm5
3285bc3d5698SJohn Baldwin	vpinsrd	$1,4(%r11),%xmm0,%xmm0
3286bc3d5698SJohn Baldwin	vpunpckldq	%xmm0,%xmm5,%xmm5
3287bc3d5698SJohn Baldwin	vpshufb	%xmm6,%xmm5,%xmm5
3288bc3d5698SJohn Baldwin	vpsrld	$6,%xmm11,%xmm7
3289bc3d5698SJohn Baldwin	vpslld	$26,%xmm11,%xmm2
3290bc3d5698SJohn Baldwin	vmovdqu	%xmm5,16-128(%rax)
3291bc3d5698SJohn Baldwin	vpaddd	%xmm14,%xmm5,%xmm5
3292bc3d5698SJohn Baldwin
3293bc3d5698SJohn Baldwin	vpsrld	$11,%xmm11,%xmm1
3294bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3295bc3d5698SJohn Baldwin	vpslld	$21,%xmm11,%xmm2
3296bc3d5698SJohn Baldwin	vpaddd	-96(%rbp),%xmm5,%xmm5
3297bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3298bc3d5698SJohn Baldwin
3299bc3d5698SJohn Baldwin	vpsrld	$25,%xmm11,%xmm1
3300bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3301bc3d5698SJohn Baldwin
3302bc3d5698SJohn Baldwin	vpslld	$7,%xmm11,%xmm2
3303bc3d5698SJohn Baldwin	vpandn	%xmm13,%xmm11,%xmm0
3304bc3d5698SJohn Baldwin	vpand	%xmm12,%xmm11,%xmm4
3305bc3d5698SJohn Baldwin
3306bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3307bc3d5698SJohn Baldwin
3308bc3d5698SJohn Baldwin	vpsrld	$2,%xmm15,%xmm14
3309bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3310bc3d5698SJohn Baldwin
3311bc3d5698SJohn Baldwin	vpslld	$30,%xmm15,%xmm1
3312bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm0,%xmm0
3313bc3d5698SJohn Baldwin	vpxor	%xmm15,%xmm8,%xmm4
3314bc3d5698SJohn Baldwin
3315bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm14,%xmm14
3316bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
3317bc3d5698SJohn Baldwin
3318bc3d5698SJohn Baldwin	vpsrld	$13,%xmm15,%xmm1
3319bc3d5698SJohn Baldwin
3320bc3d5698SJohn Baldwin	vpslld	$19,%xmm15,%xmm2
3321bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm5,%xmm5
3322bc3d5698SJohn Baldwin	vpand	%xmm4,%xmm3,%xmm3
3323bc3d5698SJohn Baldwin
3324bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm14,%xmm7
3325bc3d5698SJohn Baldwin
3326bc3d5698SJohn Baldwin	vpsrld	$22,%xmm15,%xmm1
3327bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3328bc3d5698SJohn Baldwin
3329bc3d5698SJohn Baldwin	vpslld	$10,%xmm15,%xmm2
3330bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm8,%xmm14
3331bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm10,%xmm10
3332bc3d5698SJohn Baldwin
3333bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3334bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3335bc3d5698SJohn Baldwin
3336bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm14,%xmm14
3337bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm14,%xmm14
3338bc3d5698SJohn Baldwin	vmovd	8(%r8),%xmm5
3339bc3d5698SJohn Baldwin	vmovd	8(%r9),%xmm0
3340bc3d5698SJohn Baldwin	vpinsrd	$1,8(%r10),%xmm5,%xmm5
3341bc3d5698SJohn Baldwin	vpinsrd	$1,8(%r11),%xmm0,%xmm0
3342bc3d5698SJohn Baldwin	vpunpckldq	%xmm0,%xmm5,%xmm5
3343bc3d5698SJohn Baldwin	vpshufb	%xmm6,%xmm5,%xmm5
3344bc3d5698SJohn Baldwin	vpsrld	$6,%xmm10,%xmm7
3345bc3d5698SJohn Baldwin	vpslld	$26,%xmm10,%xmm2
3346bc3d5698SJohn Baldwin	vmovdqu	%xmm5,32-128(%rax)
3347bc3d5698SJohn Baldwin	vpaddd	%xmm13,%xmm5,%xmm5
3348bc3d5698SJohn Baldwin
3349bc3d5698SJohn Baldwin	vpsrld	$11,%xmm10,%xmm1
3350bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3351bc3d5698SJohn Baldwin	vpslld	$21,%xmm10,%xmm2
3352bc3d5698SJohn Baldwin	vpaddd	-64(%rbp),%xmm5,%xmm5
3353bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3354bc3d5698SJohn Baldwin
3355bc3d5698SJohn Baldwin	vpsrld	$25,%xmm10,%xmm1
3356bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3357bc3d5698SJohn Baldwin
3358bc3d5698SJohn Baldwin	vpslld	$7,%xmm10,%xmm2
3359bc3d5698SJohn Baldwin	vpandn	%xmm12,%xmm10,%xmm0
3360bc3d5698SJohn Baldwin	vpand	%xmm11,%xmm10,%xmm3
3361bc3d5698SJohn Baldwin
3362bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3363bc3d5698SJohn Baldwin
3364bc3d5698SJohn Baldwin	vpsrld	$2,%xmm14,%xmm13
3365bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3366bc3d5698SJohn Baldwin
3367bc3d5698SJohn Baldwin	vpslld	$30,%xmm14,%xmm1
3368bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm0,%xmm0
3369bc3d5698SJohn Baldwin	vpxor	%xmm14,%xmm15,%xmm3
3370bc3d5698SJohn Baldwin
3371bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm13,%xmm13
3372bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
3373bc3d5698SJohn Baldwin
3374bc3d5698SJohn Baldwin	vpsrld	$13,%xmm14,%xmm1
3375bc3d5698SJohn Baldwin
3376bc3d5698SJohn Baldwin	vpslld	$19,%xmm14,%xmm2
3377bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm5,%xmm5
3378bc3d5698SJohn Baldwin	vpand	%xmm3,%xmm4,%xmm4
3379bc3d5698SJohn Baldwin
3380bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm13,%xmm7
3381bc3d5698SJohn Baldwin
3382bc3d5698SJohn Baldwin	vpsrld	$22,%xmm14,%xmm1
3383bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3384bc3d5698SJohn Baldwin
3385bc3d5698SJohn Baldwin	vpslld	$10,%xmm14,%xmm2
3386bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm15,%xmm13
3387bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm9,%xmm9
3388bc3d5698SJohn Baldwin
3389bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3390bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3391bc3d5698SJohn Baldwin
3392bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm13,%xmm13
3393bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm13,%xmm13
3394bc3d5698SJohn Baldwin	vmovd	12(%r8),%xmm5
3395bc3d5698SJohn Baldwin	vmovd	12(%r9),%xmm0
3396bc3d5698SJohn Baldwin	vpinsrd	$1,12(%r10),%xmm5,%xmm5
3397bc3d5698SJohn Baldwin	vpinsrd	$1,12(%r11),%xmm0,%xmm0
3398bc3d5698SJohn Baldwin	vpunpckldq	%xmm0,%xmm5,%xmm5
3399bc3d5698SJohn Baldwin	vpshufb	%xmm6,%xmm5,%xmm5
3400bc3d5698SJohn Baldwin	vpsrld	$6,%xmm9,%xmm7
3401bc3d5698SJohn Baldwin	vpslld	$26,%xmm9,%xmm2
3402bc3d5698SJohn Baldwin	vmovdqu	%xmm5,48-128(%rax)
3403bc3d5698SJohn Baldwin	vpaddd	%xmm12,%xmm5,%xmm5
3404bc3d5698SJohn Baldwin
3405bc3d5698SJohn Baldwin	vpsrld	$11,%xmm9,%xmm1
3406bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3407bc3d5698SJohn Baldwin	vpslld	$21,%xmm9,%xmm2
3408bc3d5698SJohn Baldwin	vpaddd	-32(%rbp),%xmm5,%xmm5
3409bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3410bc3d5698SJohn Baldwin
3411bc3d5698SJohn Baldwin	vpsrld	$25,%xmm9,%xmm1
3412bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3413bc3d5698SJohn Baldwin
3414bc3d5698SJohn Baldwin	vpslld	$7,%xmm9,%xmm2
3415bc3d5698SJohn Baldwin	vpandn	%xmm11,%xmm9,%xmm0
3416bc3d5698SJohn Baldwin	vpand	%xmm10,%xmm9,%xmm4
3417bc3d5698SJohn Baldwin
3418bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3419bc3d5698SJohn Baldwin
3420bc3d5698SJohn Baldwin	vpsrld	$2,%xmm13,%xmm12
3421bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3422bc3d5698SJohn Baldwin
3423bc3d5698SJohn Baldwin	vpslld	$30,%xmm13,%xmm1
3424bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm0,%xmm0
3425bc3d5698SJohn Baldwin	vpxor	%xmm13,%xmm14,%xmm4
3426bc3d5698SJohn Baldwin
3427bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm12,%xmm12
3428bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
3429bc3d5698SJohn Baldwin
3430bc3d5698SJohn Baldwin	vpsrld	$13,%xmm13,%xmm1
3431bc3d5698SJohn Baldwin
3432bc3d5698SJohn Baldwin	vpslld	$19,%xmm13,%xmm2
3433bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm5,%xmm5
3434bc3d5698SJohn Baldwin	vpand	%xmm4,%xmm3,%xmm3
3435bc3d5698SJohn Baldwin
3436bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm12,%xmm7
3437bc3d5698SJohn Baldwin
3438bc3d5698SJohn Baldwin	vpsrld	$22,%xmm13,%xmm1
3439bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3440bc3d5698SJohn Baldwin
3441bc3d5698SJohn Baldwin	vpslld	$10,%xmm13,%xmm2
3442bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm14,%xmm12
3443bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm8,%xmm8
3444bc3d5698SJohn Baldwin
3445bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3446bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3447bc3d5698SJohn Baldwin
3448bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm12,%xmm12
3449bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm12,%xmm12
3450bc3d5698SJohn Baldwin	vmovd	16(%r8),%xmm5
3451bc3d5698SJohn Baldwin	vmovd	16(%r9),%xmm0
3452bc3d5698SJohn Baldwin	vpinsrd	$1,16(%r10),%xmm5,%xmm5
3453bc3d5698SJohn Baldwin	vpinsrd	$1,16(%r11),%xmm0,%xmm0
3454bc3d5698SJohn Baldwin	vpunpckldq	%xmm0,%xmm5,%xmm5
3455bc3d5698SJohn Baldwin	vpshufb	%xmm6,%xmm5,%xmm5
3456bc3d5698SJohn Baldwin	vpsrld	$6,%xmm8,%xmm7
3457bc3d5698SJohn Baldwin	vpslld	$26,%xmm8,%xmm2
3458bc3d5698SJohn Baldwin	vmovdqu	%xmm5,64-128(%rax)
3459bc3d5698SJohn Baldwin	vpaddd	%xmm11,%xmm5,%xmm5
3460bc3d5698SJohn Baldwin
3461bc3d5698SJohn Baldwin	vpsrld	$11,%xmm8,%xmm1
3462bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3463bc3d5698SJohn Baldwin	vpslld	$21,%xmm8,%xmm2
3464bc3d5698SJohn Baldwin	vpaddd	0(%rbp),%xmm5,%xmm5
3465bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3466bc3d5698SJohn Baldwin
3467bc3d5698SJohn Baldwin	vpsrld	$25,%xmm8,%xmm1
3468bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3469bc3d5698SJohn Baldwin
3470bc3d5698SJohn Baldwin	vpslld	$7,%xmm8,%xmm2
3471bc3d5698SJohn Baldwin	vpandn	%xmm10,%xmm8,%xmm0
3472bc3d5698SJohn Baldwin	vpand	%xmm9,%xmm8,%xmm3
3473bc3d5698SJohn Baldwin
3474bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3475bc3d5698SJohn Baldwin
3476bc3d5698SJohn Baldwin	vpsrld	$2,%xmm12,%xmm11
3477bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3478bc3d5698SJohn Baldwin
3479bc3d5698SJohn Baldwin	vpslld	$30,%xmm12,%xmm1
3480bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm0,%xmm0
3481bc3d5698SJohn Baldwin	vpxor	%xmm12,%xmm13,%xmm3
3482bc3d5698SJohn Baldwin
3483bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm11,%xmm11
3484bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
3485bc3d5698SJohn Baldwin
3486bc3d5698SJohn Baldwin	vpsrld	$13,%xmm12,%xmm1
3487bc3d5698SJohn Baldwin
3488bc3d5698SJohn Baldwin	vpslld	$19,%xmm12,%xmm2
3489bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm5,%xmm5
3490bc3d5698SJohn Baldwin	vpand	%xmm3,%xmm4,%xmm4
3491bc3d5698SJohn Baldwin
3492bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm11,%xmm7
3493bc3d5698SJohn Baldwin
3494bc3d5698SJohn Baldwin	vpsrld	$22,%xmm12,%xmm1
3495bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3496bc3d5698SJohn Baldwin
3497bc3d5698SJohn Baldwin	vpslld	$10,%xmm12,%xmm2
3498bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm13,%xmm11
3499bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm15,%xmm15
3500bc3d5698SJohn Baldwin
3501bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3502bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3503bc3d5698SJohn Baldwin
3504bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm11,%xmm11
3505bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm11,%xmm11
3506bc3d5698SJohn Baldwin	vmovd	20(%r8),%xmm5
3507bc3d5698SJohn Baldwin	vmovd	20(%r9),%xmm0
3508bc3d5698SJohn Baldwin	vpinsrd	$1,20(%r10),%xmm5,%xmm5
3509bc3d5698SJohn Baldwin	vpinsrd	$1,20(%r11),%xmm0,%xmm0
3510bc3d5698SJohn Baldwin	vpunpckldq	%xmm0,%xmm5,%xmm5
3511bc3d5698SJohn Baldwin	vpshufb	%xmm6,%xmm5,%xmm5
3512bc3d5698SJohn Baldwin	vpsrld	$6,%xmm15,%xmm7
3513bc3d5698SJohn Baldwin	vpslld	$26,%xmm15,%xmm2
3514bc3d5698SJohn Baldwin	vmovdqu	%xmm5,80-128(%rax)
3515bc3d5698SJohn Baldwin	vpaddd	%xmm10,%xmm5,%xmm5
3516bc3d5698SJohn Baldwin
3517bc3d5698SJohn Baldwin	vpsrld	$11,%xmm15,%xmm1
3518bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3519bc3d5698SJohn Baldwin	vpslld	$21,%xmm15,%xmm2
3520bc3d5698SJohn Baldwin	vpaddd	32(%rbp),%xmm5,%xmm5
3521bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3522bc3d5698SJohn Baldwin
3523bc3d5698SJohn Baldwin	vpsrld	$25,%xmm15,%xmm1
3524bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3525bc3d5698SJohn Baldwin
3526bc3d5698SJohn Baldwin	vpslld	$7,%xmm15,%xmm2
3527bc3d5698SJohn Baldwin	vpandn	%xmm9,%xmm15,%xmm0
3528bc3d5698SJohn Baldwin	vpand	%xmm8,%xmm15,%xmm4
3529bc3d5698SJohn Baldwin
3530bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3531bc3d5698SJohn Baldwin
3532bc3d5698SJohn Baldwin	vpsrld	$2,%xmm11,%xmm10
3533bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3534bc3d5698SJohn Baldwin
3535bc3d5698SJohn Baldwin	vpslld	$30,%xmm11,%xmm1
3536bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm0,%xmm0
3537bc3d5698SJohn Baldwin	vpxor	%xmm11,%xmm12,%xmm4
3538bc3d5698SJohn Baldwin
3539bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm10,%xmm10
3540bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
3541bc3d5698SJohn Baldwin
3542bc3d5698SJohn Baldwin	vpsrld	$13,%xmm11,%xmm1
3543bc3d5698SJohn Baldwin
3544bc3d5698SJohn Baldwin	vpslld	$19,%xmm11,%xmm2
3545bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm5,%xmm5
3546bc3d5698SJohn Baldwin	vpand	%xmm4,%xmm3,%xmm3
3547bc3d5698SJohn Baldwin
3548bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm10,%xmm7
3549bc3d5698SJohn Baldwin
3550bc3d5698SJohn Baldwin	vpsrld	$22,%xmm11,%xmm1
3551bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3552bc3d5698SJohn Baldwin
3553bc3d5698SJohn Baldwin	vpslld	$10,%xmm11,%xmm2
3554bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm12,%xmm10
3555bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm14,%xmm14
3556bc3d5698SJohn Baldwin
3557bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3558bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3559bc3d5698SJohn Baldwin
3560bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm10,%xmm10
3561bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm10,%xmm10
3562bc3d5698SJohn Baldwin	vmovd	24(%r8),%xmm5
3563bc3d5698SJohn Baldwin	vmovd	24(%r9),%xmm0
3564bc3d5698SJohn Baldwin	vpinsrd	$1,24(%r10),%xmm5,%xmm5
3565bc3d5698SJohn Baldwin	vpinsrd	$1,24(%r11),%xmm0,%xmm0
3566bc3d5698SJohn Baldwin	vpunpckldq	%xmm0,%xmm5,%xmm5
3567bc3d5698SJohn Baldwin	vpshufb	%xmm6,%xmm5,%xmm5
3568bc3d5698SJohn Baldwin	vpsrld	$6,%xmm14,%xmm7
3569bc3d5698SJohn Baldwin	vpslld	$26,%xmm14,%xmm2
3570bc3d5698SJohn Baldwin	vmovdqu	%xmm5,96-128(%rax)
3571bc3d5698SJohn Baldwin	vpaddd	%xmm9,%xmm5,%xmm5
3572bc3d5698SJohn Baldwin
3573bc3d5698SJohn Baldwin	vpsrld	$11,%xmm14,%xmm1
3574bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3575bc3d5698SJohn Baldwin	vpslld	$21,%xmm14,%xmm2
3576bc3d5698SJohn Baldwin	vpaddd	64(%rbp),%xmm5,%xmm5
3577bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3578bc3d5698SJohn Baldwin
3579bc3d5698SJohn Baldwin	vpsrld	$25,%xmm14,%xmm1
3580bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3581bc3d5698SJohn Baldwin
3582bc3d5698SJohn Baldwin	vpslld	$7,%xmm14,%xmm2
3583bc3d5698SJohn Baldwin	vpandn	%xmm8,%xmm14,%xmm0
3584bc3d5698SJohn Baldwin	vpand	%xmm15,%xmm14,%xmm3
3585bc3d5698SJohn Baldwin
3586bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3587bc3d5698SJohn Baldwin
3588bc3d5698SJohn Baldwin	vpsrld	$2,%xmm10,%xmm9
3589bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3590bc3d5698SJohn Baldwin
3591bc3d5698SJohn Baldwin	vpslld	$30,%xmm10,%xmm1
3592bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm0,%xmm0
3593bc3d5698SJohn Baldwin	vpxor	%xmm10,%xmm11,%xmm3
3594bc3d5698SJohn Baldwin
3595bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm9,%xmm9
3596bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
3597bc3d5698SJohn Baldwin
3598bc3d5698SJohn Baldwin	vpsrld	$13,%xmm10,%xmm1
3599bc3d5698SJohn Baldwin
3600bc3d5698SJohn Baldwin	vpslld	$19,%xmm10,%xmm2
3601bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm5,%xmm5
3602bc3d5698SJohn Baldwin	vpand	%xmm3,%xmm4,%xmm4
3603bc3d5698SJohn Baldwin
3604bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm9,%xmm7
3605bc3d5698SJohn Baldwin
3606bc3d5698SJohn Baldwin	vpsrld	$22,%xmm10,%xmm1
3607bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3608bc3d5698SJohn Baldwin
3609bc3d5698SJohn Baldwin	vpslld	$10,%xmm10,%xmm2
3610bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm11,%xmm9
3611bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm13,%xmm13
3612bc3d5698SJohn Baldwin
3613bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3614bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3615bc3d5698SJohn Baldwin
3616bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm9,%xmm9
3617bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm9,%xmm9
3618bc3d5698SJohn Baldwin	vmovd	28(%r8),%xmm5
3619bc3d5698SJohn Baldwin	vmovd	28(%r9),%xmm0
3620bc3d5698SJohn Baldwin	vpinsrd	$1,28(%r10),%xmm5,%xmm5
3621bc3d5698SJohn Baldwin	vpinsrd	$1,28(%r11),%xmm0,%xmm0
3622bc3d5698SJohn Baldwin	vpunpckldq	%xmm0,%xmm5,%xmm5
3623bc3d5698SJohn Baldwin	vpshufb	%xmm6,%xmm5,%xmm5
3624bc3d5698SJohn Baldwin	vpsrld	$6,%xmm13,%xmm7
3625bc3d5698SJohn Baldwin	vpslld	$26,%xmm13,%xmm2
3626bc3d5698SJohn Baldwin	vmovdqu	%xmm5,112-128(%rax)
3627bc3d5698SJohn Baldwin	vpaddd	%xmm8,%xmm5,%xmm5
3628bc3d5698SJohn Baldwin
3629bc3d5698SJohn Baldwin	vpsrld	$11,%xmm13,%xmm1
3630bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3631bc3d5698SJohn Baldwin	vpslld	$21,%xmm13,%xmm2
3632bc3d5698SJohn Baldwin	vpaddd	96(%rbp),%xmm5,%xmm5
3633bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3634bc3d5698SJohn Baldwin
3635bc3d5698SJohn Baldwin	vpsrld	$25,%xmm13,%xmm1
3636bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3637bc3d5698SJohn Baldwin
3638bc3d5698SJohn Baldwin	vpslld	$7,%xmm13,%xmm2
3639bc3d5698SJohn Baldwin	vpandn	%xmm15,%xmm13,%xmm0
3640bc3d5698SJohn Baldwin	vpand	%xmm14,%xmm13,%xmm4
3641bc3d5698SJohn Baldwin
3642bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3643bc3d5698SJohn Baldwin
3644bc3d5698SJohn Baldwin	vpsrld	$2,%xmm9,%xmm8
3645bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3646bc3d5698SJohn Baldwin
3647bc3d5698SJohn Baldwin	vpslld	$30,%xmm9,%xmm1
3648bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm0,%xmm0
3649bc3d5698SJohn Baldwin	vpxor	%xmm9,%xmm10,%xmm4
3650bc3d5698SJohn Baldwin
3651bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm8,%xmm8
3652bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
3653bc3d5698SJohn Baldwin
3654bc3d5698SJohn Baldwin	vpsrld	$13,%xmm9,%xmm1
3655bc3d5698SJohn Baldwin
3656bc3d5698SJohn Baldwin	vpslld	$19,%xmm9,%xmm2
3657bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm5,%xmm5
3658bc3d5698SJohn Baldwin	vpand	%xmm4,%xmm3,%xmm3
3659bc3d5698SJohn Baldwin
3660bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm8,%xmm7
3661bc3d5698SJohn Baldwin
3662bc3d5698SJohn Baldwin	vpsrld	$22,%xmm9,%xmm1
3663bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3664bc3d5698SJohn Baldwin
3665bc3d5698SJohn Baldwin	vpslld	$10,%xmm9,%xmm2
3666bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm10,%xmm8
3667bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm12,%xmm12
3668bc3d5698SJohn Baldwin
3669bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3670bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3671bc3d5698SJohn Baldwin
3672bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm8,%xmm8
3673bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm8,%xmm8
3674bc3d5698SJohn Baldwin	addq	$256,%rbp
3675bc3d5698SJohn Baldwin	vmovd	32(%r8),%xmm5
3676bc3d5698SJohn Baldwin	vmovd	32(%r9),%xmm0
3677bc3d5698SJohn Baldwin	vpinsrd	$1,32(%r10),%xmm5,%xmm5
3678bc3d5698SJohn Baldwin	vpinsrd	$1,32(%r11),%xmm0,%xmm0
3679bc3d5698SJohn Baldwin	vpunpckldq	%xmm0,%xmm5,%xmm5
3680bc3d5698SJohn Baldwin	vpshufb	%xmm6,%xmm5,%xmm5
3681bc3d5698SJohn Baldwin	vpsrld	$6,%xmm12,%xmm7
3682bc3d5698SJohn Baldwin	vpslld	$26,%xmm12,%xmm2
3683bc3d5698SJohn Baldwin	vmovdqu	%xmm5,128-128(%rax)
3684bc3d5698SJohn Baldwin	vpaddd	%xmm15,%xmm5,%xmm5
3685bc3d5698SJohn Baldwin
3686bc3d5698SJohn Baldwin	vpsrld	$11,%xmm12,%xmm1
3687bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3688bc3d5698SJohn Baldwin	vpslld	$21,%xmm12,%xmm2
3689bc3d5698SJohn Baldwin	vpaddd	-128(%rbp),%xmm5,%xmm5
3690bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3691bc3d5698SJohn Baldwin
3692bc3d5698SJohn Baldwin	vpsrld	$25,%xmm12,%xmm1
3693bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3694bc3d5698SJohn Baldwin
3695bc3d5698SJohn Baldwin	vpslld	$7,%xmm12,%xmm2
3696bc3d5698SJohn Baldwin	vpandn	%xmm14,%xmm12,%xmm0
3697bc3d5698SJohn Baldwin	vpand	%xmm13,%xmm12,%xmm3
3698bc3d5698SJohn Baldwin
3699bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3700bc3d5698SJohn Baldwin
3701bc3d5698SJohn Baldwin	vpsrld	$2,%xmm8,%xmm15
3702bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3703bc3d5698SJohn Baldwin
3704bc3d5698SJohn Baldwin	vpslld	$30,%xmm8,%xmm1
3705bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm0,%xmm0
3706bc3d5698SJohn Baldwin	vpxor	%xmm8,%xmm9,%xmm3
3707bc3d5698SJohn Baldwin
3708bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm15,%xmm15
3709bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
3710bc3d5698SJohn Baldwin
3711bc3d5698SJohn Baldwin	vpsrld	$13,%xmm8,%xmm1
3712bc3d5698SJohn Baldwin
3713bc3d5698SJohn Baldwin	vpslld	$19,%xmm8,%xmm2
3714bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm5,%xmm5
3715bc3d5698SJohn Baldwin	vpand	%xmm3,%xmm4,%xmm4
3716bc3d5698SJohn Baldwin
3717bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm15,%xmm7
3718bc3d5698SJohn Baldwin
3719bc3d5698SJohn Baldwin	vpsrld	$22,%xmm8,%xmm1
3720bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3721bc3d5698SJohn Baldwin
3722bc3d5698SJohn Baldwin	vpslld	$10,%xmm8,%xmm2
3723bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm9,%xmm15
3724bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm11,%xmm11
3725bc3d5698SJohn Baldwin
3726bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3727bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3728bc3d5698SJohn Baldwin
3729bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm15,%xmm15
3730bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm15,%xmm15
3731bc3d5698SJohn Baldwin	vmovd	36(%r8),%xmm5
3732bc3d5698SJohn Baldwin	vmovd	36(%r9),%xmm0
3733bc3d5698SJohn Baldwin	vpinsrd	$1,36(%r10),%xmm5,%xmm5
3734bc3d5698SJohn Baldwin	vpinsrd	$1,36(%r11),%xmm0,%xmm0
3735bc3d5698SJohn Baldwin	vpunpckldq	%xmm0,%xmm5,%xmm5
3736bc3d5698SJohn Baldwin	vpshufb	%xmm6,%xmm5,%xmm5
3737bc3d5698SJohn Baldwin	vpsrld	$6,%xmm11,%xmm7
3738bc3d5698SJohn Baldwin	vpslld	$26,%xmm11,%xmm2
3739bc3d5698SJohn Baldwin	vmovdqu	%xmm5,144-128(%rax)
3740bc3d5698SJohn Baldwin	vpaddd	%xmm14,%xmm5,%xmm5
3741bc3d5698SJohn Baldwin
3742bc3d5698SJohn Baldwin	vpsrld	$11,%xmm11,%xmm1
3743bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3744bc3d5698SJohn Baldwin	vpslld	$21,%xmm11,%xmm2
3745bc3d5698SJohn Baldwin	vpaddd	-96(%rbp),%xmm5,%xmm5
3746bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3747bc3d5698SJohn Baldwin
3748bc3d5698SJohn Baldwin	vpsrld	$25,%xmm11,%xmm1
3749bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3750bc3d5698SJohn Baldwin
3751bc3d5698SJohn Baldwin	vpslld	$7,%xmm11,%xmm2
3752bc3d5698SJohn Baldwin	vpandn	%xmm13,%xmm11,%xmm0
3753bc3d5698SJohn Baldwin	vpand	%xmm12,%xmm11,%xmm4
3754bc3d5698SJohn Baldwin
3755bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3756bc3d5698SJohn Baldwin
3757bc3d5698SJohn Baldwin	vpsrld	$2,%xmm15,%xmm14
3758bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3759bc3d5698SJohn Baldwin
3760bc3d5698SJohn Baldwin	vpslld	$30,%xmm15,%xmm1
3761bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm0,%xmm0
3762bc3d5698SJohn Baldwin	vpxor	%xmm15,%xmm8,%xmm4
3763bc3d5698SJohn Baldwin
3764bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm14,%xmm14
3765bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
3766bc3d5698SJohn Baldwin
3767bc3d5698SJohn Baldwin	vpsrld	$13,%xmm15,%xmm1
3768bc3d5698SJohn Baldwin
3769bc3d5698SJohn Baldwin	vpslld	$19,%xmm15,%xmm2
3770bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm5,%xmm5
3771bc3d5698SJohn Baldwin	vpand	%xmm4,%xmm3,%xmm3
3772bc3d5698SJohn Baldwin
3773bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm14,%xmm7
3774bc3d5698SJohn Baldwin
3775bc3d5698SJohn Baldwin	vpsrld	$22,%xmm15,%xmm1
3776bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3777bc3d5698SJohn Baldwin
3778bc3d5698SJohn Baldwin	vpslld	$10,%xmm15,%xmm2
3779bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm8,%xmm14
3780bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm10,%xmm10
3781bc3d5698SJohn Baldwin
3782bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3783bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3784bc3d5698SJohn Baldwin
3785bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm14,%xmm14
3786bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm14,%xmm14
3787bc3d5698SJohn Baldwin	vmovd	40(%r8),%xmm5
3788bc3d5698SJohn Baldwin	vmovd	40(%r9),%xmm0
3789bc3d5698SJohn Baldwin	vpinsrd	$1,40(%r10),%xmm5,%xmm5
3790bc3d5698SJohn Baldwin	vpinsrd	$1,40(%r11),%xmm0,%xmm0
3791bc3d5698SJohn Baldwin	vpunpckldq	%xmm0,%xmm5,%xmm5
3792bc3d5698SJohn Baldwin	vpshufb	%xmm6,%xmm5,%xmm5
3793bc3d5698SJohn Baldwin	vpsrld	$6,%xmm10,%xmm7
3794bc3d5698SJohn Baldwin	vpslld	$26,%xmm10,%xmm2
3795bc3d5698SJohn Baldwin	vmovdqu	%xmm5,160-128(%rax)
3796bc3d5698SJohn Baldwin	vpaddd	%xmm13,%xmm5,%xmm5
3797bc3d5698SJohn Baldwin
3798bc3d5698SJohn Baldwin	vpsrld	$11,%xmm10,%xmm1
3799bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3800bc3d5698SJohn Baldwin	vpslld	$21,%xmm10,%xmm2
3801bc3d5698SJohn Baldwin	vpaddd	-64(%rbp),%xmm5,%xmm5
3802bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3803bc3d5698SJohn Baldwin
3804bc3d5698SJohn Baldwin	vpsrld	$25,%xmm10,%xmm1
3805bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3806bc3d5698SJohn Baldwin
3807bc3d5698SJohn Baldwin	vpslld	$7,%xmm10,%xmm2
3808bc3d5698SJohn Baldwin	vpandn	%xmm12,%xmm10,%xmm0
3809bc3d5698SJohn Baldwin	vpand	%xmm11,%xmm10,%xmm3
3810bc3d5698SJohn Baldwin
3811bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3812bc3d5698SJohn Baldwin
3813bc3d5698SJohn Baldwin	vpsrld	$2,%xmm14,%xmm13
3814bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3815bc3d5698SJohn Baldwin
3816bc3d5698SJohn Baldwin	vpslld	$30,%xmm14,%xmm1
3817bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm0,%xmm0
3818bc3d5698SJohn Baldwin	vpxor	%xmm14,%xmm15,%xmm3
3819bc3d5698SJohn Baldwin
3820bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm13,%xmm13
3821bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
3822bc3d5698SJohn Baldwin
3823bc3d5698SJohn Baldwin	vpsrld	$13,%xmm14,%xmm1
3824bc3d5698SJohn Baldwin
3825bc3d5698SJohn Baldwin	vpslld	$19,%xmm14,%xmm2
3826bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm5,%xmm5
3827bc3d5698SJohn Baldwin	vpand	%xmm3,%xmm4,%xmm4
3828bc3d5698SJohn Baldwin
3829bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm13,%xmm7
3830bc3d5698SJohn Baldwin
3831bc3d5698SJohn Baldwin	vpsrld	$22,%xmm14,%xmm1
3832bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3833bc3d5698SJohn Baldwin
3834bc3d5698SJohn Baldwin	vpslld	$10,%xmm14,%xmm2
3835bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm15,%xmm13
3836bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm9,%xmm9
3837bc3d5698SJohn Baldwin
3838bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3839bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3840bc3d5698SJohn Baldwin
3841bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm13,%xmm13
3842bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm13,%xmm13
3843bc3d5698SJohn Baldwin	vmovd	44(%r8),%xmm5
3844bc3d5698SJohn Baldwin	vmovd	44(%r9),%xmm0
3845bc3d5698SJohn Baldwin	vpinsrd	$1,44(%r10),%xmm5,%xmm5
3846bc3d5698SJohn Baldwin	vpinsrd	$1,44(%r11),%xmm0,%xmm0
3847bc3d5698SJohn Baldwin	vpunpckldq	%xmm0,%xmm5,%xmm5
3848bc3d5698SJohn Baldwin	vpshufb	%xmm6,%xmm5,%xmm5
3849bc3d5698SJohn Baldwin	vpsrld	$6,%xmm9,%xmm7
3850bc3d5698SJohn Baldwin	vpslld	$26,%xmm9,%xmm2
3851bc3d5698SJohn Baldwin	vmovdqu	%xmm5,176-128(%rax)
3852bc3d5698SJohn Baldwin	vpaddd	%xmm12,%xmm5,%xmm5
3853bc3d5698SJohn Baldwin
3854bc3d5698SJohn Baldwin	vpsrld	$11,%xmm9,%xmm1
3855bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3856bc3d5698SJohn Baldwin	vpslld	$21,%xmm9,%xmm2
3857bc3d5698SJohn Baldwin	vpaddd	-32(%rbp),%xmm5,%xmm5
3858bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3859bc3d5698SJohn Baldwin
3860bc3d5698SJohn Baldwin	vpsrld	$25,%xmm9,%xmm1
3861bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3862bc3d5698SJohn Baldwin
3863bc3d5698SJohn Baldwin	vpslld	$7,%xmm9,%xmm2
3864bc3d5698SJohn Baldwin	vpandn	%xmm11,%xmm9,%xmm0
3865bc3d5698SJohn Baldwin	vpand	%xmm10,%xmm9,%xmm4
3866bc3d5698SJohn Baldwin
3867bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3868bc3d5698SJohn Baldwin
3869bc3d5698SJohn Baldwin	vpsrld	$2,%xmm13,%xmm12
3870bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3871bc3d5698SJohn Baldwin
3872bc3d5698SJohn Baldwin	vpslld	$30,%xmm13,%xmm1
3873bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm0,%xmm0
3874bc3d5698SJohn Baldwin	vpxor	%xmm13,%xmm14,%xmm4
3875bc3d5698SJohn Baldwin
3876bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm12,%xmm12
3877bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
3878bc3d5698SJohn Baldwin
3879bc3d5698SJohn Baldwin	vpsrld	$13,%xmm13,%xmm1
3880bc3d5698SJohn Baldwin
3881bc3d5698SJohn Baldwin	vpslld	$19,%xmm13,%xmm2
3882bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm5,%xmm5
3883bc3d5698SJohn Baldwin	vpand	%xmm4,%xmm3,%xmm3
3884bc3d5698SJohn Baldwin
3885bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm12,%xmm7
3886bc3d5698SJohn Baldwin
3887bc3d5698SJohn Baldwin	vpsrld	$22,%xmm13,%xmm1
3888bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3889bc3d5698SJohn Baldwin
3890bc3d5698SJohn Baldwin	vpslld	$10,%xmm13,%xmm2
3891bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm14,%xmm12
3892bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm8,%xmm8
3893bc3d5698SJohn Baldwin
3894bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3895bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3896bc3d5698SJohn Baldwin
3897bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm12,%xmm12
3898bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm12,%xmm12
3899bc3d5698SJohn Baldwin	vmovd	48(%r8),%xmm5
3900bc3d5698SJohn Baldwin	vmovd	48(%r9),%xmm0
3901bc3d5698SJohn Baldwin	vpinsrd	$1,48(%r10),%xmm5,%xmm5
3902bc3d5698SJohn Baldwin	vpinsrd	$1,48(%r11),%xmm0,%xmm0
3903bc3d5698SJohn Baldwin	vpunpckldq	%xmm0,%xmm5,%xmm5
3904bc3d5698SJohn Baldwin	vpshufb	%xmm6,%xmm5,%xmm5
3905bc3d5698SJohn Baldwin	vpsrld	$6,%xmm8,%xmm7
3906bc3d5698SJohn Baldwin	vpslld	$26,%xmm8,%xmm2
3907bc3d5698SJohn Baldwin	vmovdqu	%xmm5,192-128(%rax)
3908bc3d5698SJohn Baldwin	vpaddd	%xmm11,%xmm5,%xmm5
3909bc3d5698SJohn Baldwin
3910bc3d5698SJohn Baldwin	vpsrld	$11,%xmm8,%xmm1
3911bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3912bc3d5698SJohn Baldwin	vpslld	$21,%xmm8,%xmm2
3913bc3d5698SJohn Baldwin	vpaddd	0(%rbp),%xmm5,%xmm5
3914bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3915bc3d5698SJohn Baldwin
3916bc3d5698SJohn Baldwin	vpsrld	$25,%xmm8,%xmm1
3917bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3918bc3d5698SJohn Baldwin
3919bc3d5698SJohn Baldwin	vpslld	$7,%xmm8,%xmm2
3920bc3d5698SJohn Baldwin	vpandn	%xmm10,%xmm8,%xmm0
3921bc3d5698SJohn Baldwin	vpand	%xmm9,%xmm8,%xmm3
3922bc3d5698SJohn Baldwin
3923bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3924bc3d5698SJohn Baldwin
3925bc3d5698SJohn Baldwin	vpsrld	$2,%xmm12,%xmm11
3926bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3927bc3d5698SJohn Baldwin
3928bc3d5698SJohn Baldwin	vpslld	$30,%xmm12,%xmm1
3929bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm0,%xmm0
3930bc3d5698SJohn Baldwin	vpxor	%xmm12,%xmm13,%xmm3
3931bc3d5698SJohn Baldwin
3932bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm11,%xmm11
3933bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
3934bc3d5698SJohn Baldwin
3935bc3d5698SJohn Baldwin	vpsrld	$13,%xmm12,%xmm1
3936bc3d5698SJohn Baldwin
3937bc3d5698SJohn Baldwin	vpslld	$19,%xmm12,%xmm2
3938bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm5,%xmm5
3939bc3d5698SJohn Baldwin	vpand	%xmm3,%xmm4,%xmm4
3940bc3d5698SJohn Baldwin
3941bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm11,%xmm7
3942bc3d5698SJohn Baldwin
3943bc3d5698SJohn Baldwin	vpsrld	$22,%xmm12,%xmm1
3944bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3945bc3d5698SJohn Baldwin
3946bc3d5698SJohn Baldwin	vpslld	$10,%xmm12,%xmm2
3947bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm13,%xmm11
3948bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm15,%xmm15
3949bc3d5698SJohn Baldwin
3950bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3951bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3952bc3d5698SJohn Baldwin
3953bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm11,%xmm11
3954bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm11,%xmm11
3955bc3d5698SJohn Baldwin	vmovd	52(%r8),%xmm5
3956bc3d5698SJohn Baldwin	vmovd	52(%r9),%xmm0
3957bc3d5698SJohn Baldwin	vpinsrd	$1,52(%r10),%xmm5,%xmm5
3958bc3d5698SJohn Baldwin	vpinsrd	$1,52(%r11),%xmm0,%xmm0
3959bc3d5698SJohn Baldwin	vpunpckldq	%xmm0,%xmm5,%xmm5
3960bc3d5698SJohn Baldwin	vpshufb	%xmm6,%xmm5,%xmm5
3961bc3d5698SJohn Baldwin	vpsrld	$6,%xmm15,%xmm7
3962bc3d5698SJohn Baldwin	vpslld	$26,%xmm15,%xmm2
3963bc3d5698SJohn Baldwin	vmovdqu	%xmm5,208-128(%rax)
3964bc3d5698SJohn Baldwin	vpaddd	%xmm10,%xmm5,%xmm5
3965bc3d5698SJohn Baldwin
3966bc3d5698SJohn Baldwin	vpsrld	$11,%xmm15,%xmm1
3967bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3968bc3d5698SJohn Baldwin	vpslld	$21,%xmm15,%xmm2
3969bc3d5698SJohn Baldwin	vpaddd	32(%rbp),%xmm5,%xmm5
3970bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3971bc3d5698SJohn Baldwin
3972bc3d5698SJohn Baldwin	vpsrld	$25,%xmm15,%xmm1
3973bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3974bc3d5698SJohn Baldwin
3975bc3d5698SJohn Baldwin	vpslld	$7,%xmm15,%xmm2
3976bc3d5698SJohn Baldwin	vpandn	%xmm9,%xmm15,%xmm0
3977bc3d5698SJohn Baldwin	vpand	%xmm8,%xmm15,%xmm4
3978bc3d5698SJohn Baldwin
3979bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
3980bc3d5698SJohn Baldwin
3981bc3d5698SJohn Baldwin	vpsrld	$2,%xmm11,%xmm10
3982bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
3983bc3d5698SJohn Baldwin
3984bc3d5698SJohn Baldwin	vpslld	$30,%xmm11,%xmm1
3985bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm0,%xmm0
3986bc3d5698SJohn Baldwin	vpxor	%xmm11,%xmm12,%xmm4
3987bc3d5698SJohn Baldwin
3988bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm10,%xmm10
3989bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
3990bc3d5698SJohn Baldwin
3991bc3d5698SJohn Baldwin	vpsrld	$13,%xmm11,%xmm1
3992bc3d5698SJohn Baldwin
3993bc3d5698SJohn Baldwin	vpslld	$19,%xmm11,%xmm2
3994bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm5,%xmm5
3995bc3d5698SJohn Baldwin	vpand	%xmm4,%xmm3,%xmm3
3996bc3d5698SJohn Baldwin
3997bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm10,%xmm7
3998bc3d5698SJohn Baldwin
3999bc3d5698SJohn Baldwin	vpsrld	$22,%xmm11,%xmm1
4000bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4001bc3d5698SJohn Baldwin
4002bc3d5698SJohn Baldwin	vpslld	$10,%xmm11,%xmm2
4003bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm12,%xmm10
4004bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm14,%xmm14
4005bc3d5698SJohn Baldwin
4006bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4007bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4008bc3d5698SJohn Baldwin
4009bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm10,%xmm10
4010bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm10,%xmm10
4011bc3d5698SJohn Baldwin	vmovd	56(%r8),%xmm5
4012bc3d5698SJohn Baldwin	vmovd	56(%r9),%xmm0
4013bc3d5698SJohn Baldwin	vpinsrd	$1,56(%r10),%xmm5,%xmm5
4014bc3d5698SJohn Baldwin	vpinsrd	$1,56(%r11),%xmm0,%xmm0
4015bc3d5698SJohn Baldwin	vpunpckldq	%xmm0,%xmm5,%xmm5
4016bc3d5698SJohn Baldwin	vpshufb	%xmm6,%xmm5,%xmm5
4017bc3d5698SJohn Baldwin	vpsrld	$6,%xmm14,%xmm7
4018bc3d5698SJohn Baldwin	vpslld	$26,%xmm14,%xmm2
4019bc3d5698SJohn Baldwin	vmovdqu	%xmm5,224-128(%rax)
4020bc3d5698SJohn Baldwin	vpaddd	%xmm9,%xmm5,%xmm5
4021bc3d5698SJohn Baldwin
4022bc3d5698SJohn Baldwin	vpsrld	$11,%xmm14,%xmm1
4023bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4024bc3d5698SJohn Baldwin	vpslld	$21,%xmm14,%xmm2
4025bc3d5698SJohn Baldwin	vpaddd	64(%rbp),%xmm5,%xmm5
4026bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4027bc3d5698SJohn Baldwin
4028bc3d5698SJohn Baldwin	vpsrld	$25,%xmm14,%xmm1
4029bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4030bc3d5698SJohn Baldwin
4031bc3d5698SJohn Baldwin	vpslld	$7,%xmm14,%xmm2
4032bc3d5698SJohn Baldwin	vpandn	%xmm8,%xmm14,%xmm0
4033bc3d5698SJohn Baldwin	vpand	%xmm15,%xmm14,%xmm3
4034bc3d5698SJohn Baldwin
4035bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4036bc3d5698SJohn Baldwin
4037bc3d5698SJohn Baldwin	vpsrld	$2,%xmm10,%xmm9
4038bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4039bc3d5698SJohn Baldwin
4040bc3d5698SJohn Baldwin	vpslld	$30,%xmm10,%xmm1
4041bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm0,%xmm0
4042bc3d5698SJohn Baldwin	vpxor	%xmm10,%xmm11,%xmm3
4043bc3d5698SJohn Baldwin
4044bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm9,%xmm9
4045bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
4046bc3d5698SJohn Baldwin
4047bc3d5698SJohn Baldwin	vpsrld	$13,%xmm10,%xmm1
4048bc3d5698SJohn Baldwin
4049bc3d5698SJohn Baldwin	vpslld	$19,%xmm10,%xmm2
4050bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm5,%xmm5
4051bc3d5698SJohn Baldwin	vpand	%xmm3,%xmm4,%xmm4
4052bc3d5698SJohn Baldwin
4053bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm9,%xmm7
4054bc3d5698SJohn Baldwin
4055bc3d5698SJohn Baldwin	vpsrld	$22,%xmm10,%xmm1
4056bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4057bc3d5698SJohn Baldwin
4058bc3d5698SJohn Baldwin	vpslld	$10,%xmm10,%xmm2
4059bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm11,%xmm9
4060bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm13,%xmm13
4061bc3d5698SJohn Baldwin
4062bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4063bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4064bc3d5698SJohn Baldwin
4065bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm9,%xmm9
4066bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm9,%xmm9
4067bc3d5698SJohn Baldwin	vmovd	60(%r8),%xmm5
4068bc3d5698SJohn Baldwin	leaq	64(%r8),%r8
4069bc3d5698SJohn Baldwin	vmovd	60(%r9),%xmm0
4070bc3d5698SJohn Baldwin	leaq	64(%r9),%r9
4071bc3d5698SJohn Baldwin	vpinsrd	$1,60(%r10),%xmm5,%xmm5
4072bc3d5698SJohn Baldwin	leaq	64(%r10),%r10
4073bc3d5698SJohn Baldwin	vpinsrd	$1,60(%r11),%xmm0,%xmm0
4074bc3d5698SJohn Baldwin	leaq	64(%r11),%r11
4075bc3d5698SJohn Baldwin	vpunpckldq	%xmm0,%xmm5,%xmm5
4076bc3d5698SJohn Baldwin	vpshufb	%xmm6,%xmm5,%xmm5
4077bc3d5698SJohn Baldwin	vpsrld	$6,%xmm13,%xmm7
4078bc3d5698SJohn Baldwin	vpslld	$26,%xmm13,%xmm2
4079bc3d5698SJohn Baldwin	vmovdqu	%xmm5,240-128(%rax)
4080bc3d5698SJohn Baldwin	vpaddd	%xmm8,%xmm5,%xmm5
4081bc3d5698SJohn Baldwin
4082bc3d5698SJohn Baldwin	vpsrld	$11,%xmm13,%xmm1
4083bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4084bc3d5698SJohn Baldwin	vpslld	$21,%xmm13,%xmm2
4085bc3d5698SJohn Baldwin	vpaddd	96(%rbp),%xmm5,%xmm5
4086bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4087bc3d5698SJohn Baldwin
4088bc3d5698SJohn Baldwin	vpsrld	$25,%xmm13,%xmm1
4089bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4090bc3d5698SJohn Baldwin	prefetcht0	63(%r8)
4091bc3d5698SJohn Baldwin	vpslld	$7,%xmm13,%xmm2
4092bc3d5698SJohn Baldwin	vpandn	%xmm15,%xmm13,%xmm0
4093bc3d5698SJohn Baldwin	vpand	%xmm14,%xmm13,%xmm4
4094bc3d5698SJohn Baldwin	prefetcht0	63(%r9)
4095bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4096bc3d5698SJohn Baldwin
4097bc3d5698SJohn Baldwin	vpsrld	$2,%xmm9,%xmm8
4098bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4099bc3d5698SJohn Baldwin	prefetcht0	63(%r10)
4100bc3d5698SJohn Baldwin	vpslld	$30,%xmm9,%xmm1
4101bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm0,%xmm0
4102bc3d5698SJohn Baldwin	vpxor	%xmm9,%xmm10,%xmm4
4103bc3d5698SJohn Baldwin	prefetcht0	63(%r11)
4104bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm8,%xmm8
4105bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
4106bc3d5698SJohn Baldwin
4107bc3d5698SJohn Baldwin	vpsrld	$13,%xmm9,%xmm1
4108bc3d5698SJohn Baldwin
4109bc3d5698SJohn Baldwin	vpslld	$19,%xmm9,%xmm2
4110bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm5,%xmm5
4111bc3d5698SJohn Baldwin	vpand	%xmm4,%xmm3,%xmm3
4112bc3d5698SJohn Baldwin
4113bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm8,%xmm7
4114bc3d5698SJohn Baldwin
4115bc3d5698SJohn Baldwin	vpsrld	$22,%xmm9,%xmm1
4116bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4117bc3d5698SJohn Baldwin
4118bc3d5698SJohn Baldwin	vpslld	$10,%xmm9,%xmm2
4119bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm10,%xmm8
4120bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm12,%xmm12
4121bc3d5698SJohn Baldwin
4122bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4123bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4124bc3d5698SJohn Baldwin
4125bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm8,%xmm8
4126bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm8,%xmm8
4127bc3d5698SJohn Baldwin	addq	$256,%rbp
4128bc3d5698SJohn Baldwin	vmovdqu	0-128(%rax),%xmm5
4129bc3d5698SJohn Baldwin	movl	$3,%ecx
4130bc3d5698SJohn Baldwin	jmp	.Loop_16_xx_avx
4131bc3d5698SJohn Baldwin.align	32
4132bc3d5698SJohn Baldwin.Loop_16_xx_avx:
4133bc3d5698SJohn Baldwin	vmovdqu	16-128(%rax),%xmm6
4134bc3d5698SJohn Baldwin	vpaddd	144-128(%rax),%xmm5,%xmm5
4135bc3d5698SJohn Baldwin
4136bc3d5698SJohn Baldwin	vpsrld	$3,%xmm6,%xmm7
4137bc3d5698SJohn Baldwin	vpsrld	$7,%xmm6,%xmm1
4138bc3d5698SJohn Baldwin	vpslld	$25,%xmm6,%xmm2
4139bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4140bc3d5698SJohn Baldwin	vpsrld	$18,%xmm6,%xmm1
4141bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4142bc3d5698SJohn Baldwin	vpslld	$14,%xmm6,%xmm2
4143bc3d5698SJohn Baldwin	vmovdqu	224-128(%rax),%xmm0
4144bc3d5698SJohn Baldwin	vpsrld	$10,%xmm0,%xmm3
4145bc3d5698SJohn Baldwin
4146bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4147bc3d5698SJohn Baldwin	vpsrld	$17,%xmm0,%xmm1
4148bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4149bc3d5698SJohn Baldwin	vpslld	$15,%xmm0,%xmm2
4150bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
4151bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm3,%xmm7
4152bc3d5698SJohn Baldwin	vpsrld	$19,%xmm0,%xmm1
4153bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4154bc3d5698SJohn Baldwin	vpslld	$13,%xmm0,%xmm2
4155bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4156bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4157bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
4158bc3d5698SJohn Baldwin	vpsrld	$6,%xmm12,%xmm7
4159bc3d5698SJohn Baldwin	vpslld	$26,%xmm12,%xmm2
4160bc3d5698SJohn Baldwin	vmovdqu	%xmm5,0-128(%rax)
4161bc3d5698SJohn Baldwin	vpaddd	%xmm15,%xmm5,%xmm5
4162bc3d5698SJohn Baldwin
4163bc3d5698SJohn Baldwin	vpsrld	$11,%xmm12,%xmm1
4164bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4165bc3d5698SJohn Baldwin	vpslld	$21,%xmm12,%xmm2
4166bc3d5698SJohn Baldwin	vpaddd	-128(%rbp),%xmm5,%xmm5
4167bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4168bc3d5698SJohn Baldwin
4169bc3d5698SJohn Baldwin	vpsrld	$25,%xmm12,%xmm1
4170bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4171bc3d5698SJohn Baldwin
4172bc3d5698SJohn Baldwin	vpslld	$7,%xmm12,%xmm2
4173bc3d5698SJohn Baldwin	vpandn	%xmm14,%xmm12,%xmm0
4174bc3d5698SJohn Baldwin	vpand	%xmm13,%xmm12,%xmm3
4175bc3d5698SJohn Baldwin
4176bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4177bc3d5698SJohn Baldwin
4178bc3d5698SJohn Baldwin	vpsrld	$2,%xmm8,%xmm15
4179bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4180bc3d5698SJohn Baldwin
4181bc3d5698SJohn Baldwin	vpslld	$30,%xmm8,%xmm1
4182bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm0,%xmm0
4183bc3d5698SJohn Baldwin	vpxor	%xmm8,%xmm9,%xmm3
4184bc3d5698SJohn Baldwin
4185bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm15,%xmm15
4186bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
4187bc3d5698SJohn Baldwin
4188bc3d5698SJohn Baldwin	vpsrld	$13,%xmm8,%xmm1
4189bc3d5698SJohn Baldwin
4190bc3d5698SJohn Baldwin	vpslld	$19,%xmm8,%xmm2
4191bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm5,%xmm5
4192bc3d5698SJohn Baldwin	vpand	%xmm3,%xmm4,%xmm4
4193bc3d5698SJohn Baldwin
4194bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm15,%xmm7
4195bc3d5698SJohn Baldwin
4196bc3d5698SJohn Baldwin	vpsrld	$22,%xmm8,%xmm1
4197bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4198bc3d5698SJohn Baldwin
4199bc3d5698SJohn Baldwin	vpslld	$10,%xmm8,%xmm2
4200bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm9,%xmm15
4201bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm11,%xmm11
4202bc3d5698SJohn Baldwin
4203bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4204bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4205bc3d5698SJohn Baldwin
4206bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm15,%xmm15
4207bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm15,%xmm15
4208bc3d5698SJohn Baldwin	vmovdqu	32-128(%rax),%xmm5
4209bc3d5698SJohn Baldwin	vpaddd	160-128(%rax),%xmm6,%xmm6
4210bc3d5698SJohn Baldwin
4211bc3d5698SJohn Baldwin	vpsrld	$3,%xmm5,%xmm7
4212bc3d5698SJohn Baldwin	vpsrld	$7,%xmm5,%xmm1
4213bc3d5698SJohn Baldwin	vpslld	$25,%xmm5,%xmm2
4214bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4215bc3d5698SJohn Baldwin	vpsrld	$18,%xmm5,%xmm1
4216bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4217bc3d5698SJohn Baldwin	vpslld	$14,%xmm5,%xmm2
4218bc3d5698SJohn Baldwin	vmovdqu	240-128(%rax),%xmm0
4219bc3d5698SJohn Baldwin	vpsrld	$10,%xmm0,%xmm4
4220bc3d5698SJohn Baldwin
4221bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4222bc3d5698SJohn Baldwin	vpsrld	$17,%xmm0,%xmm1
4223bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4224bc3d5698SJohn Baldwin	vpslld	$15,%xmm0,%xmm2
4225bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm6,%xmm6
4226bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm4,%xmm7
4227bc3d5698SJohn Baldwin	vpsrld	$19,%xmm0,%xmm1
4228bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4229bc3d5698SJohn Baldwin	vpslld	$13,%xmm0,%xmm2
4230bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4231bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4232bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm6,%xmm6
4233bc3d5698SJohn Baldwin	vpsrld	$6,%xmm11,%xmm7
4234bc3d5698SJohn Baldwin	vpslld	$26,%xmm11,%xmm2
4235bc3d5698SJohn Baldwin	vmovdqu	%xmm6,16-128(%rax)
4236bc3d5698SJohn Baldwin	vpaddd	%xmm14,%xmm6,%xmm6
4237bc3d5698SJohn Baldwin
4238bc3d5698SJohn Baldwin	vpsrld	$11,%xmm11,%xmm1
4239bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4240bc3d5698SJohn Baldwin	vpslld	$21,%xmm11,%xmm2
4241bc3d5698SJohn Baldwin	vpaddd	-96(%rbp),%xmm6,%xmm6
4242bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4243bc3d5698SJohn Baldwin
4244bc3d5698SJohn Baldwin	vpsrld	$25,%xmm11,%xmm1
4245bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4246bc3d5698SJohn Baldwin
4247bc3d5698SJohn Baldwin	vpslld	$7,%xmm11,%xmm2
4248bc3d5698SJohn Baldwin	vpandn	%xmm13,%xmm11,%xmm0
4249bc3d5698SJohn Baldwin	vpand	%xmm12,%xmm11,%xmm4
4250bc3d5698SJohn Baldwin
4251bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4252bc3d5698SJohn Baldwin
4253bc3d5698SJohn Baldwin	vpsrld	$2,%xmm15,%xmm14
4254bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4255bc3d5698SJohn Baldwin
4256bc3d5698SJohn Baldwin	vpslld	$30,%xmm15,%xmm1
4257bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm0,%xmm0
4258bc3d5698SJohn Baldwin	vpxor	%xmm15,%xmm8,%xmm4
4259bc3d5698SJohn Baldwin
4260bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm14,%xmm14
4261bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm6,%xmm6
4262bc3d5698SJohn Baldwin
4263bc3d5698SJohn Baldwin	vpsrld	$13,%xmm15,%xmm1
4264bc3d5698SJohn Baldwin
4265bc3d5698SJohn Baldwin	vpslld	$19,%xmm15,%xmm2
4266bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm6,%xmm6
4267bc3d5698SJohn Baldwin	vpand	%xmm4,%xmm3,%xmm3
4268bc3d5698SJohn Baldwin
4269bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm14,%xmm7
4270bc3d5698SJohn Baldwin
4271bc3d5698SJohn Baldwin	vpsrld	$22,%xmm15,%xmm1
4272bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4273bc3d5698SJohn Baldwin
4274bc3d5698SJohn Baldwin	vpslld	$10,%xmm15,%xmm2
4275bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm8,%xmm14
4276bc3d5698SJohn Baldwin	vpaddd	%xmm6,%xmm10,%xmm10
4277bc3d5698SJohn Baldwin
4278bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4279bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4280bc3d5698SJohn Baldwin
4281bc3d5698SJohn Baldwin	vpaddd	%xmm6,%xmm14,%xmm14
4282bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm14,%xmm14
4283bc3d5698SJohn Baldwin	vmovdqu	48-128(%rax),%xmm6
4284bc3d5698SJohn Baldwin	vpaddd	176-128(%rax),%xmm5,%xmm5
4285bc3d5698SJohn Baldwin
4286bc3d5698SJohn Baldwin	vpsrld	$3,%xmm6,%xmm7
4287bc3d5698SJohn Baldwin	vpsrld	$7,%xmm6,%xmm1
4288bc3d5698SJohn Baldwin	vpslld	$25,%xmm6,%xmm2
4289bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4290bc3d5698SJohn Baldwin	vpsrld	$18,%xmm6,%xmm1
4291bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4292bc3d5698SJohn Baldwin	vpslld	$14,%xmm6,%xmm2
4293bc3d5698SJohn Baldwin	vmovdqu	0-128(%rax),%xmm0
4294bc3d5698SJohn Baldwin	vpsrld	$10,%xmm0,%xmm3
4295bc3d5698SJohn Baldwin
4296bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4297bc3d5698SJohn Baldwin	vpsrld	$17,%xmm0,%xmm1
4298bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4299bc3d5698SJohn Baldwin	vpslld	$15,%xmm0,%xmm2
4300bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
4301bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm3,%xmm7
4302bc3d5698SJohn Baldwin	vpsrld	$19,%xmm0,%xmm1
4303bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4304bc3d5698SJohn Baldwin	vpslld	$13,%xmm0,%xmm2
4305bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4306bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4307bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
4308bc3d5698SJohn Baldwin	vpsrld	$6,%xmm10,%xmm7
4309bc3d5698SJohn Baldwin	vpslld	$26,%xmm10,%xmm2
4310bc3d5698SJohn Baldwin	vmovdqu	%xmm5,32-128(%rax)
4311bc3d5698SJohn Baldwin	vpaddd	%xmm13,%xmm5,%xmm5
4312bc3d5698SJohn Baldwin
4313bc3d5698SJohn Baldwin	vpsrld	$11,%xmm10,%xmm1
4314bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4315bc3d5698SJohn Baldwin	vpslld	$21,%xmm10,%xmm2
4316bc3d5698SJohn Baldwin	vpaddd	-64(%rbp),%xmm5,%xmm5
4317bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4318bc3d5698SJohn Baldwin
4319bc3d5698SJohn Baldwin	vpsrld	$25,%xmm10,%xmm1
4320bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4321bc3d5698SJohn Baldwin
4322bc3d5698SJohn Baldwin	vpslld	$7,%xmm10,%xmm2
4323bc3d5698SJohn Baldwin	vpandn	%xmm12,%xmm10,%xmm0
4324bc3d5698SJohn Baldwin	vpand	%xmm11,%xmm10,%xmm3
4325bc3d5698SJohn Baldwin
4326bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4327bc3d5698SJohn Baldwin
4328bc3d5698SJohn Baldwin	vpsrld	$2,%xmm14,%xmm13
4329bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4330bc3d5698SJohn Baldwin
4331bc3d5698SJohn Baldwin	vpslld	$30,%xmm14,%xmm1
4332bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm0,%xmm0
4333bc3d5698SJohn Baldwin	vpxor	%xmm14,%xmm15,%xmm3
4334bc3d5698SJohn Baldwin
4335bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm13,%xmm13
4336bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
4337bc3d5698SJohn Baldwin
4338bc3d5698SJohn Baldwin	vpsrld	$13,%xmm14,%xmm1
4339bc3d5698SJohn Baldwin
4340bc3d5698SJohn Baldwin	vpslld	$19,%xmm14,%xmm2
4341bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm5,%xmm5
4342bc3d5698SJohn Baldwin	vpand	%xmm3,%xmm4,%xmm4
4343bc3d5698SJohn Baldwin
4344bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm13,%xmm7
4345bc3d5698SJohn Baldwin
4346bc3d5698SJohn Baldwin	vpsrld	$22,%xmm14,%xmm1
4347bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4348bc3d5698SJohn Baldwin
4349bc3d5698SJohn Baldwin	vpslld	$10,%xmm14,%xmm2
4350bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm15,%xmm13
4351bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm9,%xmm9
4352bc3d5698SJohn Baldwin
4353bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4354bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4355bc3d5698SJohn Baldwin
4356bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm13,%xmm13
4357bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm13,%xmm13
4358bc3d5698SJohn Baldwin	vmovdqu	64-128(%rax),%xmm5
4359bc3d5698SJohn Baldwin	vpaddd	192-128(%rax),%xmm6,%xmm6
4360bc3d5698SJohn Baldwin
4361bc3d5698SJohn Baldwin	vpsrld	$3,%xmm5,%xmm7
4362bc3d5698SJohn Baldwin	vpsrld	$7,%xmm5,%xmm1
4363bc3d5698SJohn Baldwin	vpslld	$25,%xmm5,%xmm2
4364bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4365bc3d5698SJohn Baldwin	vpsrld	$18,%xmm5,%xmm1
4366bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4367bc3d5698SJohn Baldwin	vpslld	$14,%xmm5,%xmm2
4368bc3d5698SJohn Baldwin	vmovdqu	16-128(%rax),%xmm0
4369bc3d5698SJohn Baldwin	vpsrld	$10,%xmm0,%xmm4
4370bc3d5698SJohn Baldwin
4371bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4372bc3d5698SJohn Baldwin	vpsrld	$17,%xmm0,%xmm1
4373bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4374bc3d5698SJohn Baldwin	vpslld	$15,%xmm0,%xmm2
4375bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm6,%xmm6
4376bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm4,%xmm7
4377bc3d5698SJohn Baldwin	vpsrld	$19,%xmm0,%xmm1
4378bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4379bc3d5698SJohn Baldwin	vpslld	$13,%xmm0,%xmm2
4380bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4381bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4382bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm6,%xmm6
4383bc3d5698SJohn Baldwin	vpsrld	$6,%xmm9,%xmm7
4384bc3d5698SJohn Baldwin	vpslld	$26,%xmm9,%xmm2
4385bc3d5698SJohn Baldwin	vmovdqu	%xmm6,48-128(%rax)
4386bc3d5698SJohn Baldwin	vpaddd	%xmm12,%xmm6,%xmm6
4387bc3d5698SJohn Baldwin
4388bc3d5698SJohn Baldwin	vpsrld	$11,%xmm9,%xmm1
4389bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4390bc3d5698SJohn Baldwin	vpslld	$21,%xmm9,%xmm2
4391bc3d5698SJohn Baldwin	vpaddd	-32(%rbp),%xmm6,%xmm6
4392bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4393bc3d5698SJohn Baldwin
4394bc3d5698SJohn Baldwin	vpsrld	$25,%xmm9,%xmm1
4395bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4396bc3d5698SJohn Baldwin
4397bc3d5698SJohn Baldwin	vpslld	$7,%xmm9,%xmm2
4398bc3d5698SJohn Baldwin	vpandn	%xmm11,%xmm9,%xmm0
4399bc3d5698SJohn Baldwin	vpand	%xmm10,%xmm9,%xmm4
4400bc3d5698SJohn Baldwin
4401bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4402bc3d5698SJohn Baldwin
4403bc3d5698SJohn Baldwin	vpsrld	$2,%xmm13,%xmm12
4404bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4405bc3d5698SJohn Baldwin
4406bc3d5698SJohn Baldwin	vpslld	$30,%xmm13,%xmm1
4407bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm0,%xmm0
4408bc3d5698SJohn Baldwin	vpxor	%xmm13,%xmm14,%xmm4
4409bc3d5698SJohn Baldwin
4410bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm12,%xmm12
4411bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm6,%xmm6
4412bc3d5698SJohn Baldwin
4413bc3d5698SJohn Baldwin	vpsrld	$13,%xmm13,%xmm1
4414bc3d5698SJohn Baldwin
4415bc3d5698SJohn Baldwin	vpslld	$19,%xmm13,%xmm2
4416bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm6,%xmm6
4417bc3d5698SJohn Baldwin	vpand	%xmm4,%xmm3,%xmm3
4418bc3d5698SJohn Baldwin
4419bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm12,%xmm7
4420bc3d5698SJohn Baldwin
4421bc3d5698SJohn Baldwin	vpsrld	$22,%xmm13,%xmm1
4422bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4423bc3d5698SJohn Baldwin
4424bc3d5698SJohn Baldwin	vpslld	$10,%xmm13,%xmm2
4425bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm14,%xmm12
4426bc3d5698SJohn Baldwin	vpaddd	%xmm6,%xmm8,%xmm8
4427bc3d5698SJohn Baldwin
4428bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4429bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4430bc3d5698SJohn Baldwin
4431bc3d5698SJohn Baldwin	vpaddd	%xmm6,%xmm12,%xmm12
4432bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm12,%xmm12
4433bc3d5698SJohn Baldwin	vmovdqu	80-128(%rax),%xmm6
4434bc3d5698SJohn Baldwin	vpaddd	208-128(%rax),%xmm5,%xmm5
4435bc3d5698SJohn Baldwin
4436bc3d5698SJohn Baldwin	vpsrld	$3,%xmm6,%xmm7
4437bc3d5698SJohn Baldwin	vpsrld	$7,%xmm6,%xmm1
4438bc3d5698SJohn Baldwin	vpslld	$25,%xmm6,%xmm2
4439bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4440bc3d5698SJohn Baldwin	vpsrld	$18,%xmm6,%xmm1
4441bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4442bc3d5698SJohn Baldwin	vpslld	$14,%xmm6,%xmm2
4443bc3d5698SJohn Baldwin	vmovdqu	32-128(%rax),%xmm0
4444bc3d5698SJohn Baldwin	vpsrld	$10,%xmm0,%xmm3
4445bc3d5698SJohn Baldwin
4446bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4447bc3d5698SJohn Baldwin	vpsrld	$17,%xmm0,%xmm1
4448bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4449bc3d5698SJohn Baldwin	vpslld	$15,%xmm0,%xmm2
4450bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
4451bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm3,%xmm7
4452bc3d5698SJohn Baldwin	vpsrld	$19,%xmm0,%xmm1
4453bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4454bc3d5698SJohn Baldwin	vpslld	$13,%xmm0,%xmm2
4455bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4456bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4457bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
4458bc3d5698SJohn Baldwin	vpsrld	$6,%xmm8,%xmm7
4459bc3d5698SJohn Baldwin	vpslld	$26,%xmm8,%xmm2
4460bc3d5698SJohn Baldwin	vmovdqu	%xmm5,64-128(%rax)
4461bc3d5698SJohn Baldwin	vpaddd	%xmm11,%xmm5,%xmm5
4462bc3d5698SJohn Baldwin
4463bc3d5698SJohn Baldwin	vpsrld	$11,%xmm8,%xmm1
4464bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4465bc3d5698SJohn Baldwin	vpslld	$21,%xmm8,%xmm2
4466bc3d5698SJohn Baldwin	vpaddd	0(%rbp),%xmm5,%xmm5
4467bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4468bc3d5698SJohn Baldwin
4469bc3d5698SJohn Baldwin	vpsrld	$25,%xmm8,%xmm1
4470bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4471bc3d5698SJohn Baldwin
4472bc3d5698SJohn Baldwin	vpslld	$7,%xmm8,%xmm2
4473bc3d5698SJohn Baldwin	vpandn	%xmm10,%xmm8,%xmm0
4474bc3d5698SJohn Baldwin	vpand	%xmm9,%xmm8,%xmm3
4475bc3d5698SJohn Baldwin
4476bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4477bc3d5698SJohn Baldwin
4478bc3d5698SJohn Baldwin	vpsrld	$2,%xmm12,%xmm11
4479bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4480bc3d5698SJohn Baldwin
4481bc3d5698SJohn Baldwin	vpslld	$30,%xmm12,%xmm1
4482bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm0,%xmm0
4483bc3d5698SJohn Baldwin	vpxor	%xmm12,%xmm13,%xmm3
4484bc3d5698SJohn Baldwin
4485bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm11,%xmm11
4486bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
4487bc3d5698SJohn Baldwin
4488bc3d5698SJohn Baldwin	vpsrld	$13,%xmm12,%xmm1
4489bc3d5698SJohn Baldwin
4490bc3d5698SJohn Baldwin	vpslld	$19,%xmm12,%xmm2
4491bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm5,%xmm5
4492bc3d5698SJohn Baldwin	vpand	%xmm3,%xmm4,%xmm4
4493bc3d5698SJohn Baldwin
4494bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm11,%xmm7
4495bc3d5698SJohn Baldwin
4496bc3d5698SJohn Baldwin	vpsrld	$22,%xmm12,%xmm1
4497bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4498bc3d5698SJohn Baldwin
4499bc3d5698SJohn Baldwin	vpslld	$10,%xmm12,%xmm2
4500bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm13,%xmm11
4501bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm15,%xmm15
4502bc3d5698SJohn Baldwin
4503bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4504bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4505bc3d5698SJohn Baldwin
4506bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm11,%xmm11
4507bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm11,%xmm11
4508bc3d5698SJohn Baldwin	vmovdqu	96-128(%rax),%xmm5
4509bc3d5698SJohn Baldwin	vpaddd	224-128(%rax),%xmm6,%xmm6
4510bc3d5698SJohn Baldwin
4511bc3d5698SJohn Baldwin	vpsrld	$3,%xmm5,%xmm7
4512bc3d5698SJohn Baldwin	vpsrld	$7,%xmm5,%xmm1
4513bc3d5698SJohn Baldwin	vpslld	$25,%xmm5,%xmm2
4514bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4515bc3d5698SJohn Baldwin	vpsrld	$18,%xmm5,%xmm1
4516bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4517bc3d5698SJohn Baldwin	vpslld	$14,%xmm5,%xmm2
4518bc3d5698SJohn Baldwin	vmovdqu	48-128(%rax),%xmm0
4519bc3d5698SJohn Baldwin	vpsrld	$10,%xmm0,%xmm4
4520bc3d5698SJohn Baldwin
4521bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4522bc3d5698SJohn Baldwin	vpsrld	$17,%xmm0,%xmm1
4523bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4524bc3d5698SJohn Baldwin	vpslld	$15,%xmm0,%xmm2
4525bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm6,%xmm6
4526bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm4,%xmm7
4527bc3d5698SJohn Baldwin	vpsrld	$19,%xmm0,%xmm1
4528bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4529bc3d5698SJohn Baldwin	vpslld	$13,%xmm0,%xmm2
4530bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4531bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4532bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm6,%xmm6
4533bc3d5698SJohn Baldwin	vpsrld	$6,%xmm15,%xmm7
4534bc3d5698SJohn Baldwin	vpslld	$26,%xmm15,%xmm2
4535bc3d5698SJohn Baldwin	vmovdqu	%xmm6,80-128(%rax)
4536bc3d5698SJohn Baldwin	vpaddd	%xmm10,%xmm6,%xmm6
4537bc3d5698SJohn Baldwin
4538bc3d5698SJohn Baldwin	vpsrld	$11,%xmm15,%xmm1
4539bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4540bc3d5698SJohn Baldwin	vpslld	$21,%xmm15,%xmm2
4541bc3d5698SJohn Baldwin	vpaddd	32(%rbp),%xmm6,%xmm6
4542bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4543bc3d5698SJohn Baldwin
4544bc3d5698SJohn Baldwin	vpsrld	$25,%xmm15,%xmm1
4545bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4546bc3d5698SJohn Baldwin
4547bc3d5698SJohn Baldwin	vpslld	$7,%xmm15,%xmm2
4548bc3d5698SJohn Baldwin	vpandn	%xmm9,%xmm15,%xmm0
4549bc3d5698SJohn Baldwin	vpand	%xmm8,%xmm15,%xmm4
4550bc3d5698SJohn Baldwin
4551bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4552bc3d5698SJohn Baldwin
4553bc3d5698SJohn Baldwin	vpsrld	$2,%xmm11,%xmm10
4554bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4555bc3d5698SJohn Baldwin
4556bc3d5698SJohn Baldwin	vpslld	$30,%xmm11,%xmm1
4557bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm0,%xmm0
4558bc3d5698SJohn Baldwin	vpxor	%xmm11,%xmm12,%xmm4
4559bc3d5698SJohn Baldwin
4560bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm10,%xmm10
4561bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm6,%xmm6
4562bc3d5698SJohn Baldwin
4563bc3d5698SJohn Baldwin	vpsrld	$13,%xmm11,%xmm1
4564bc3d5698SJohn Baldwin
4565bc3d5698SJohn Baldwin	vpslld	$19,%xmm11,%xmm2
4566bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm6,%xmm6
4567bc3d5698SJohn Baldwin	vpand	%xmm4,%xmm3,%xmm3
4568bc3d5698SJohn Baldwin
4569bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm10,%xmm7
4570bc3d5698SJohn Baldwin
4571bc3d5698SJohn Baldwin	vpsrld	$22,%xmm11,%xmm1
4572bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4573bc3d5698SJohn Baldwin
4574bc3d5698SJohn Baldwin	vpslld	$10,%xmm11,%xmm2
4575bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm12,%xmm10
4576bc3d5698SJohn Baldwin	vpaddd	%xmm6,%xmm14,%xmm14
4577bc3d5698SJohn Baldwin
4578bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4579bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4580bc3d5698SJohn Baldwin
4581bc3d5698SJohn Baldwin	vpaddd	%xmm6,%xmm10,%xmm10
4582bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm10,%xmm10
4583bc3d5698SJohn Baldwin	vmovdqu	112-128(%rax),%xmm6
4584bc3d5698SJohn Baldwin	vpaddd	240-128(%rax),%xmm5,%xmm5
4585bc3d5698SJohn Baldwin
4586bc3d5698SJohn Baldwin	vpsrld	$3,%xmm6,%xmm7
4587bc3d5698SJohn Baldwin	vpsrld	$7,%xmm6,%xmm1
4588bc3d5698SJohn Baldwin	vpslld	$25,%xmm6,%xmm2
4589bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4590bc3d5698SJohn Baldwin	vpsrld	$18,%xmm6,%xmm1
4591bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4592bc3d5698SJohn Baldwin	vpslld	$14,%xmm6,%xmm2
4593bc3d5698SJohn Baldwin	vmovdqu	64-128(%rax),%xmm0
4594bc3d5698SJohn Baldwin	vpsrld	$10,%xmm0,%xmm3
4595bc3d5698SJohn Baldwin
4596bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4597bc3d5698SJohn Baldwin	vpsrld	$17,%xmm0,%xmm1
4598bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4599bc3d5698SJohn Baldwin	vpslld	$15,%xmm0,%xmm2
4600bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
4601bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm3,%xmm7
4602bc3d5698SJohn Baldwin	vpsrld	$19,%xmm0,%xmm1
4603bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4604bc3d5698SJohn Baldwin	vpslld	$13,%xmm0,%xmm2
4605bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4606bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4607bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
4608bc3d5698SJohn Baldwin	vpsrld	$6,%xmm14,%xmm7
4609bc3d5698SJohn Baldwin	vpslld	$26,%xmm14,%xmm2
4610bc3d5698SJohn Baldwin	vmovdqu	%xmm5,96-128(%rax)
4611bc3d5698SJohn Baldwin	vpaddd	%xmm9,%xmm5,%xmm5
4612bc3d5698SJohn Baldwin
4613bc3d5698SJohn Baldwin	vpsrld	$11,%xmm14,%xmm1
4614bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4615bc3d5698SJohn Baldwin	vpslld	$21,%xmm14,%xmm2
4616bc3d5698SJohn Baldwin	vpaddd	64(%rbp),%xmm5,%xmm5
4617bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4618bc3d5698SJohn Baldwin
4619bc3d5698SJohn Baldwin	vpsrld	$25,%xmm14,%xmm1
4620bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4621bc3d5698SJohn Baldwin
4622bc3d5698SJohn Baldwin	vpslld	$7,%xmm14,%xmm2
4623bc3d5698SJohn Baldwin	vpandn	%xmm8,%xmm14,%xmm0
4624bc3d5698SJohn Baldwin	vpand	%xmm15,%xmm14,%xmm3
4625bc3d5698SJohn Baldwin
4626bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4627bc3d5698SJohn Baldwin
4628bc3d5698SJohn Baldwin	vpsrld	$2,%xmm10,%xmm9
4629bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4630bc3d5698SJohn Baldwin
4631bc3d5698SJohn Baldwin	vpslld	$30,%xmm10,%xmm1
4632bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm0,%xmm0
4633bc3d5698SJohn Baldwin	vpxor	%xmm10,%xmm11,%xmm3
4634bc3d5698SJohn Baldwin
4635bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm9,%xmm9
4636bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
4637bc3d5698SJohn Baldwin
4638bc3d5698SJohn Baldwin	vpsrld	$13,%xmm10,%xmm1
4639bc3d5698SJohn Baldwin
4640bc3d5698SJohn Baldwin	vpslld	$19,%xmm10,%xmm2
4641bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm5,%xmm5
4642bc3d5698SJohn Baldwin	vpand	%xmm3,%xmm4,%xmm4
4643bc3d5698SJohn Baldwin
4644bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm9,%xmm7
4645bc3d5698SJohn Baldwin
4646bc3d5698SJohn Baldwin	vpsrld	$22,%xmm10,%xmm1
4647bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4648bc3d5698SJohn Baldwin
4649bc3d5698SJohn Baldwin	vpslld	$10,%xmm10,%xmm2
4650bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm11,%xmm9
4651bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm13,%xmm13
4652bc3d5698SJohn Baldwin
4653bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4654bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4655bc3d5698SJohn Baldwin
4656bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm9,%xmm9
4657bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm9,%xmm9
4658bc3d5698SJohn Baldwin	vmovdqu	128-128(%rax),%xmm5
4659bc3d5698SJohn Baldwin	vpaddd	0-128(%rax),%xmm6,%xmm6
4660bc3d5698SJohn Baldwin
4661bc3d5698SJohn Baldwin	vpsrld	$3,%xmm5,%xmm7
4662bc3d5698SJohn Baldwin	vpsrld	$7,%xmm5,%xmm1
4663bc3d5698SJohn Baldwin	vpslld	$25,%xmm5,%xmm2
4664bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4665bc3d5698SJohn Baldwin	vpsrld	$18,%xmm5,%xmm1
4666bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4667bc3d5698SJohn Baldwin	vpslld	$14,%xmm5,%xmm2
4668bc3d5698SJohn Baldwin	vmovdqu	80-128(%rax),%xmm0
4669bc3d5698SJohn Baldwin	vpsrld	$10,%xmm0,%xmm4
4670bc3d5698SJohn Baldwin
4671bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4672bc3d5698SJohn Baldwin	vpsrld	$17,%xmm0,%xmm1
4673bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4674bc3d5698SJohn Baldwin	vpslld	$15,%xmm0,%xmm2
4675bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm6,%xmm6
4676bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm4,%xmm7
4677bc3d5698SJohn Baldwin	vpsrld	$19,%xmm0,%xmm1
4678bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4679bc3d5698SJohn Baldwin	vpslld	$13,%xmm0,%xmm2
4680bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4681bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4682bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm6,%xmm6
4683bc3d5698SJohn Baldwin	vpsrld	$6,%xmm13,%xmm7
4684bc3d5698SJohn Baldwin	vpslld	$26,%xmm13,%xmm2
4685bc3d5698SJohn Baldwin	vmovdqu	%xmm6,112-128(%rax)
4686bc3d5698SJohn Baldwin	vpaddd	%xmm8,%xmm6,%xmm6
4687bc3d5698SJohn Baldwin
4688bc3d5698SJohn Baldwin	vpsrld	$11,%xmm13,%xmm1
4689bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4690bc3d5698SJohn Baldwin	vpslld	$21,%xmm13,%xmm2
4691bc3d5698SJohn Baldwin	vpaddd	96(%rbp),%xmm6,%xmm6
4692bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4693bc3d5698SJohn Baldwin
4694bc3d5698SJohn Baldwin	vpsrld	$25,%xmm13,%xmm1
4695bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4696bc3d5698SJohn Baldwin
4697bc3d5698SJohn Baldwin	vpslld	$7,%xmm13,%xmm2
4698bc3d5698SJohn Baldwin	vpandn	%xmm15,%xmm13,%xmm0
4699bc3d5698SJohn Baldwin	vpand	%xmm14,%xmm13,%xmm4
4700bc3d5698SJohn Baldwin
4701bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4702bc3d5698SJohn Baldwin
4703bc3d5698SJohn Baldwin	vpsrld	$2,%xmm9,%xmm8
4704bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4705bc3d5698SJohn Baldwin
4706bc3d5698SJohn Baldwin	vpslld	$30,%xmm9,%xmm1
4707bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm0,%xmm0
4708bc3d5698SJohn Baldwin	vpxor	%xmm9,%xmm10,%xmm4
4709bc3d5698SJohn Baldwin
4710bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm8,%xmm8
4711bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm6,%xmm6
4712bc3d5698SJohn Baldwin
4713bc3d5698SJohn Baldwin	vpsrld	$13,%xmm9,%xmm1
4714bc3d5698SJohn Baldwin
4715bc3d5698SJohn Baldwin	vpslld	$19,%xmm9,%xmm2
4716bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm6,%xmm6
4717bc3d5698SJohn Baldwin	vpand	%xmm4,%xmm3,%xmm3
4718bc3d5698SJohn Baldwin
4719bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm8,%xmm7
4720bc3d5698SJohn Baldwin
4721bc3d5698SJohn Baldwin	vpsrld	$22,%xmm9,%xmm1
4722bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4723bc3d5698SJohn Baldwin
4724bc3d5698SJohn Baldwin	vpslld	$10,%xmm9,%xmm2
4725bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm10,%xmm8
4726bc3d5698SJohn Baldwin	vpaddd	%xmm6,%xmm12,%xmm12
4727bc3d5698SJohn Baldwin
4728bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4729bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4730bc3d5698SJohn Baldwin
4731bc3d5698SJohn Baldwin	vpaddd	%xmm6,%xmm8,%xmm8
4732bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm8,%xmm8
4733bc3d5698SJohn Baldwin	addq	$256,%rbp
4734bc3d5698SJohn Baldwin	vmovdqu	144-128(%rax),%xmm6
4735bc3d5698SJohn Baldwin	vpaddd	16-128(%rax),%xmm5,%xmm5
4736bc3d5698SJohn Baldwin
4737bc3d5698SJohn Baldwin	vpsrld	$3,%xmm6,%xmm7
4738bc3d5698SJohn Baldwin	vpsrld	$7,%xmm6,%xmm1
4739bc3d5698SJohn Baldwin	vpslld	$25,%xmm6,%xmm2
4740bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4741bc3d5698SJohn Baldwin	vpsrld	$18,%xmm6,%xmm1
4742bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4743bc3d5698SJohn Baldwin	vpslld	$14,%xmm6,%xmm2
4744bc3d5698SJohn Baldwin	vmovdqu	96-128(%rax),%xmm0
4745bc3d5698SJohn Baldwin	vpsrld	$10,%xmm0,%xmm3
4746bc3d5698SJohn Baldwin
4747bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4748bc3d5698SJohn Baldwin	vpsrld	$17,%xmm0,%xmm1
4749bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4750bc3d5698SJohn Baldwin	vpslld	$15,%xmm0,%xmm2
4751bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
4752bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm3,%xmm7
4753bc3d5698SJohn Baldwin	vpsrld	$19,%xmm0,%xmm1
4754bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4755bc3d5698SJohn Baldwin	vpslld	$13,%xmm0,%xmm2
4756bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4757bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4758bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
4759bc3d5698SJohn Baldwin	vpsrld	$6,%xmm12,%xmm7
4760bc3d5698SJohn Baldwin	vpslld	$26,%xmm12,%xmm2
4761bc3d5698SJohn Baldwin	vmovdqu	%xmm5,128-128(%rax)
4762bc3d5698SJohn Baldwin	vpaddd	%xmm15,%xmm5,%xmm5
4763bc3d5698SJohn Baldwin
4764bc3d5698SJohn Baldwin	vpsrld	$11,%xmm12,%xmm1
4765bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4766bc3d5698SJohn Baldwin	vpslld	$21,%xmm12,%xmm2
4767bc3d5698SJohn Baldwin	vpaddd	-128(%rbp),%xmm5,%xmm5
4768bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4769bc3d5698SJohn Baldwin
4770bc3d5698SJohn Baldwin	vpsrld	$25,%xmm12,%xmm1
4771bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4772bc3d5698SJohn Baldwin
4773bc3d5698SJohn Baldwin	vpslld	$7,%xmm12,%xmm2
4774bc3d5698SJohn Baldwin	vpandn	%xmm14,%xmm12,%xmm0
4775bc3d5698SJohn Baldwin	vpand	%xmm13,%xmm12,%xmm3
4776bc3d5698SJohn Baldwin
4777bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4778bc3d5698SJohn Baldwin
4779bc3d5698SJohn Baldwin	vpsrld	$2,%xmm8,%xmm15
4780bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4781bc3d5698SJohn Baldwin
4782bc3d5698SJohn Baldwin	vpslld	$30,%xmm8,%xmm1
4783bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm0,%xmm0
4784bc3d5698SJohn Baldwin	vpxor	%xmm8,%xmm9,%xmm3
4785bc3d5698SJohn Baldwin
4786bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm15,%xmm15
4787bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
4788bc3d5698SJohn Baldwin
4789bc3d5698SJohn Baldwin	vpsrld	$13,%xmm8,%xmm1
4790bc3d5698SJohn Baldwin
4791bc3d5698SJohn Baldwin	vpslld	$19,%xmm8,%xmm2
4792bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm5,%xmm5
4793bc3d5698SJohn Baldwin	vpand	%xmm3,%xmm4,%xmm4
4794bc3d5698SJohn Baldwin
4795bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm15,%xmm7
4796bc3d5698SJohn Baldwin
4797bc3d5698SJohn Baldwin	vpsrld	$22,%xmm8,%xmm1
4798bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4799bc3d5698SJohn Baldwin
4800bc3d5698SJohn Baldwin	vpslld	$10,%xmm8,%xmm2
4801bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm9,%xmm15
4802bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm11,%xmm11
4803bc3d5698SJohn Baldwin
4804bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4805bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4806bc3d5698SJohn Baldwin
4807bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm15,%xmm15
4808bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm15,%xmm15
4809bc3d5698SJohn Baldwin	vmovdqu	160-128(%rax),%xmm5
4810bc3d5698SJohn Baldwin	vpaddd	32-128(%rax),%xmm6,%xmm6
4811bc3d5698SJohn Baldwin
4812bc3d5698SJohn Baldwin	vpsrld	$3,%xmm5,%xmm7
4813bc3d5698SJohn Baldwin	vpsrld	$7,%xmm5,%xmm1
4814bc3d5698SJohn Baldwin	vpslld	$25,%xmm5,%xmm2
4815bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4816bc3d5698SJohn Baldwin	vpsrld	$18,%xmm5,%xmm1
4817bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4818bc3d5698SJohn Baldwin	vpslld	$14,%xmm5,%xmm2
4819bc3d5698SJohn Baldwin	vmovdqu	112-128(%rax),%xmm0
4820bc3d5698SJohn Baldwin	vpsrld	$10,%xmm0,%xmm4
4821bc3d5698SJohn Baldwin
4822bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4823bc3d5698SJohn Baldwin	vpsrld	$17,%xmm0,%xmm1
4824bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4825bc3d5698SJohn Baldwin	vpslld	$15,%xmm0,%xmm2
4826bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm6,%xmm6
4827bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm4,%xmm7
4828bc3d5698SJohn Baldwin	vpsrld	$19,%xmm0,%xmm1
4829bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4830bc3d5698SJohn Baldwin	vpslld	$13,%xmm0,%xmm2
4831bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4832bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4833bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm6,%xmm6
4834bc3d5698SJohn Baldwin	vpsrld	$6,%xmm11,%xmm7
4835bc3d5698SJohn Baldwin	vpslld	$26,%xmm11,%xmm2
4836bc3d5698SJohn Baldwin	vmovdqu	%xmm6,144-128(%rax)
4837bc3d5698SJohn Baldwin	vpaddd	%xmm14,%xmm6,%xmm6
4838bc3d5698SJohn Baldwin
4839bc3d5698SJohn Baldwin	vpsrld	$11,%xmm11,%xmm1
4840bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4841bc3d5698SJohn Baldwin	vpslld	$21,%xmm11,%xmm2
4842bc3d5698SJohn Baldwin	vpaddd	-96(%rbp),%xmm6,%xmm6
4843bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4844bc3d5698SJohn Baldwin
4845bc3d5698SJohn Baldwin	vpsrld	$25,%xmm11,%xmm1
4846bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4847bc3d5698SJohn Baldwin
4848bc3d5698SJohn Baldwin	vpslld	$7,%xmm11,%xmm2
4849bc3d5698SJohn Baldwin	vpandn	%xmm13,%xmm11,%xmm0
4850bc3d5698SJohn Baldwin	vpand	%xmm12,%xmm11,%xmm4
4851bc3d5698SJohn Baldwin
4852bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4853bc3d5698SJohn Baldwin
4854bc3d5698SJohn Baldwin	vpsrld	$2,%xmm15,%xmm14
4855bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4856bc3d5698SJohn Baldwin
4857bc3d5698SJohn Baldwin	vpslld	$30,%xmm15,%xmm1
4858bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm0,%xmm0
4859bc3d5698SJohn Baldwin	vpxor	%xmm15,%xmm8,%xmm4
4860bc3d5698SJohn Baldwin
4861bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm14,%xmm14
4862bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm6,%xmm6
4863bc3d5698SJohn Baldwin
4864bc3d5698SJohn Baldwin	vpsrld	$13,%xmm15,%xmm1
4865bc3d5698SJohn Baldwin
4866bc3d5698SJohn Baldwin	vpslld	$19,%xmm15,%xmm2
4867bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm6,%xmm6
4868bc3d5698SJohn Baldwin	vpand	%xmm4,%xmm3,%xmm3
4869bc3d5698SJohn Baldwin
4870bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm14,%xmm7
4871bc3d5698SJohn Baldwin
4872bc3d5698SJohn Baldwin	vpsrld	$22,%xmm15,%xmm1
4873bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4874bc3d5698SJohn Baldwin
4875bc3d5698SJohn Baldwin	vpslld	$10,%xmm15,%xmm2
4876bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm8,%xmm14
4877bc3d5698SJohn Baldwin	vpaddd	%xmm6,%xmm10,%xmm10
4878bc3d5698SJohn Baldwin
4879bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4880bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4881bc3d5698SJohn Baldwin
4882bc3d5698SJohn Baldwin	vpaddd	%xmm6,%xmm14,%xmm14
4883bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm14,%xmm14
4884bc3d5698SJohn Baldwin	vmovdqu	176-128(%rax),%xmm6
4885bc3d5698SJohn Baldwin	vpaddd	48-128(%rax),%xmm5,%xmm5
4886bc3d5698SJohn Baldwin
4887bc3d5698SJohn Baldwin	vpsrld	$3,%xmm6,%xmm7
4888bc3d5698SJohn Baldwin	vpsrld	$7,%xmm6,%xmm1
4889bc3d5698SJohn Baldwin	vpslld	$25,%xmm6,%xmm2
4890bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4891bc3d5698SJohn Baldwin	vpsrld	$18,%xmm6,%xmm1
4892bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4893bc3d5698SJohn Baldwin	vpslld	$14,%xmm6,%xmm2
4894bc3d5698SJohn Baldwin	vmovdqu	128-128(%rax),%xmm0
4895bc3d5698SJohn Baldwin	vpsrld	$10,%xmm0,%xmm3
4896bc3d5698SJohn Baldwin
4897bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4898bc3d5698SJohn Baldwin	vpsrld	$17,%xmm0,%xmm1
4899bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4900bc3d5698SJohn Baldwin	vpslld	$15,%xmm0,%xmm2
4901bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
4902bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm3,%xmm7
4903bc3d5698SJohn Baldwin	vpsrld	$19,%xmm0,%xmm1
4904bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4905bc3d5698SJohn Baldwin	vpslld	$13,%xmm0,%xmm2
4906bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4907bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4908bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
4909bc3d5698SJohn Baldwin	vpsrld	$6,%xmm10,%xmm7
4910bc3d5698SJohn Baldwin	vpslld	$26,%xmm10,%xmm2
4911bc3d5698SJohn Baldwin	vmovdqu	%xmm5,160-128(%rax)
4912bc3d5698SJohn Baldwin	vpaddd	%xmm13,%xmm5,%xmm5
4913bc3d5698SJohn Baldwin
4914bc3d5698SJohn Baldwin	vpsrld	$11,%xmm10,%xmm1
4915bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4916bc3d5698SJohn Baldwin	vpslld	$21,%xmm10,%xmm2
4917bc3d5698SJohn Baldwin	vpaddd	-64(%rbp),%xmm5,%xmm5
4918bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4919bc3d5698SJohn Baldwin
4920bc3d5698SJohn Baldwin	vpsrld	$25,%xmm10,%xmm1
4921bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4922bc3d5698SJohn Baldwin
4923bc3d5698SJohn Baldwin	vpslld	$7,%xmm10,%xmm2
4924bc3d5698SJohn Baldwin	vpandn	%xmm12,%xmm10,%xmm0
4925bc3d5698SJohn Baldwin	vpand	%xmm11,%xmm10,%xmm3
4926bc3d5698SJohn Baldwin
4927bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4928bc3d5698SJohn Baldwin
4929bc3d5698SJohn Baldwin	vpsrld	$2,%xmm14,%xmm13
4930bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4931bc3d5698SJohn Baldwin
4932bc3d5698SJohn Baldwin	vpslld	$30,%xmm14,%xmm1
4933bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm0,%xmm0
4934bc3d5698SJohn Baldwin	vpxor	%xmm14,%xmm15,%xmm3
4935bc3d5698SJohn Baldwin
4936bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm13,%xmm13
4937bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
4938bc3d5698SJohn Baldwin
4939bc3d5698SJohn Baldwin	vpsrld	$13,%xmm14,%xmm1
4940bc3d5698SJohn Baldwin
4941bc3d5698SJohn Baldwin	vpslld	$19,%xmm14,%xmm2
4942bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm5,%xmm5
4943bc3d5698SJohn Baldwin	vpand	%xmm3,%xmm4,%xmm4
4944bc3d5698SJohn Baldwin
4945bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm13,%xmm7
4946bc3d5698SJohn Baldwin
4947bc3d5698SJohn Baldwin	vpsrld	$22,%xmm14,%xmm1
4948bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4949bc3d5698SJohn Baldwin
4950bc3d5698SJohn Baldwin	vpslld	$10,%xmm14,%xmm2
4951bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm15,%xmm13
4952bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm9,%xmm9
4953bc3d5698SJohn Baldwin
4954bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4955bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4956bc3d5698SJohn Baldwin
4957bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm13,%xmm13
4958bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm13,%xmm13
4959bc3d5698SJohn Baldwin	vmovdqu	192-128(%rax),%xmm5
4960bc3d5698SJohn Baldwin	vpaddd	64-128(%rax),%xmm6,%xmm6
4961bc3d5698SJohn Baldwin
4962bc3d5698SJohn Baldwin	vpsrld	$3,%xmm5,%xmm7
4963bc3d5698SJohn Baldwin	vpsrld	$7,%xmm5,%xmm1
4964bc3d5698SJohn Baldwin	vpslld	$25,%xmm5,%xmm2
4965bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4966bc3d5698SJohn Baldwin	vpsrld	$18,%xmm5,%xmm1
4967bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4968bc3d5698SJohn Baldwin	vpslld	$14,%xmm5,%xmm2
4969bc3d5698SJohn Baldwin	vmovdqu	144-128(%rax),%xmm0
4970bc3d5698SJohn Baldwin	vpsrld	$10,%xmm0,%xmm4
4971bc3d5698SJohn Baldwin
4972bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4973bc3d5698SJohn Baldwin	vpsrld	$17,%xmm0,%xmm1
4974bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4975bc3d5698SJohn Baldwin	vpslld	$15,%xmm0,%xmm2
4976bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm6,%xmm6
4977bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm4,%xmm7
4978bc3d5698SJohn Baldwin	vpsrld	$19,%xmm0,%xmm1
4979bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4980bc3d5698SJohn Baldwin	vpslld	$13,%xmm0,%xmm2
4981bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4982bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4983bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm6,%xmm6
4984bc3d5698SJohn Baldwin	vpsrld	$6,%xmm9,%xmm7
4985bc3d5698SJohn Baldwin	vpslld	$26,%xmm9,%xmm2
4986bc3d5698SJohn Baldwin	vmovdqu	%xmm6,176-128(%rax)
4987bc3d5698SJohn Baldwin	vpaddd	%xmm12,%xmm6,%xmm6
4988bc3d5698SJohn Baldwin
4989bc3d5698SJohn Baldwin	vpsrld	$11,%xmm9,%xmm1
4990bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4991bc3d5698SJohn Baldwin	vpslld	$21,%xmm9,%xmm2
4992bc3d5698SJohn Baldwin	vpaddd	-32(%rbp),%xmm6,%xmm6
4993bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
4994bc3d5698SJohn Baldwin
4995bc3d5698SJohn Baldwin	vpsrld	$25,%xmm9,%xmm1
4996bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
4997bc3d5698SJohn Baldwin
4998bc3d5698SJohn Baldwin	vpslld	$7,%xmm9,%xmm2
4999bc3d5698SJohn Baldwin	vpandn	%xmm11,%xmm9,%xmm0
5000bc3d5698SJohn Baldwin	vpand	%xmm10,%xmm9,%xmm4
5001bc3d5698SJohn Baldwin
5002bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
5003bc3d5698SJohn Baldwin
5004bc3d5698SJohn Baldwin	vpsrld	$2,%xmm13,%xmm12
5005bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5006bc3d5698SJohn Baldwin
5007bc3d5698SJohn Baldwin	vpslld	$30,%xmm13,%xmm1
5008bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm0,%xmm0
5009bc3d5698SJohn Baldwin	vpxor	%xmm13,%xmm14,%xmm4
5010bc3d5698SJohn Baldwin
5011bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm12,%xmm12
5012bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm6,%xmm6
5013bc3d5698SJohn Baldwin
5014bc3d5698SJohn Baldwin	vpsrld	$13,%xmm13,%xmm1
5015bc3d5698SJohn Baldwin
5016bc3d5698SJohn Baldwin	vpslld	$19,%xmm13,%xmm2
5017bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm6,%xmm6
5018bc3d5698SJohn Baldwin	vpand	%xmm4,%xmm3,%xmm3
5019bc3d5698SJohn Baldwin
5020bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm12,%xmm7
5021bc3d5698SJohn Baldwin
5022bc3d5698SJohn Baldwin	vpsrld	$22,%xmm13,%xmm1
5023bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5024bc3d5698SJohn Baldwin
5025bc3d5698SJohn Baldwin	vpslld	$10,%xmm13,%xmm2
5026bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm14,%xmm12
5027bc3d5698SJohn Baldwin	vpaddd	%xmm6,%xmm8,%xmm8
5028bc3d5698SJohn Baldwin
5029bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
5030bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5031bc3d5698SJohn Baldwin
5032bc3d5698SJohn Baldwin	vpaddd	%xmm6,%xmm12,%xmm12
5033bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm12,%xmm12
5034bc3d5698SJohn Baldwin	vmovdqu	208-128(%rax),%xmm6
5035bc3d5698SJohn Baldwin	vpaddd	80-128(%rax),%xmm5,%xmm5
5036bc3d5698SJohn Baldwin
5037bc3d5698SJohn Baldwin	vpsrld	$3,%xmm6,%xmm7
5038bc3d5698SJohn Baldwin	vpsrld	$7,%xmm6,%xmm1
5039bc3d5698SJohn Baldwin	vpslld	$25,%xmm6,%xmm2
5040bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
5041bc3d5698SJohn Baldwin	vpsrld	$18,%xmm6,%xmm1
5042bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5043bc3d5698SJohn Baldwin	vpslld	$14,%xmm6,%xmm2
5044bc3d5698SJohn Baldwin	vmovdqu	160-128(%rax),%xmm0
5045bc3d5698SJohn Baldwin	vpsrld	$10,%xmm0,%xmm3
5046bc3d5698SJohn Baldwin
5047bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
5048bc3d5698SJohn Baldwin	vpsrld	$17,%xmm0,%xmm1
5049bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5050bc3d5698SJohn Baldwin	vpslld	$15,%xmm0,%xmm2
5051bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
5052bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm3,%xmm7
5053bc3d5698SJohn Baldwin	vpsrld	$19,%xmm0,%xmm1
5054bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5055bc3d5698SJohn Baldwin	vpslld	$13,%xmm0,%xmm2
5056bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
5057bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5058bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
5059bc3d5698SJohn Baldwin	vpsrld	$6,%xmm8,%xmm7
5060bc3d5698SJohn Baldwin	vpslld	$26,%xmm8,%xmm2
5061bc3d5698SJohn Baldwin	vmovdqu	%xmm5,192-128(%rax)
5062bc3d5698SJohn Baldwin	vpaddd	%xmm11,%xmm5,%xmm5
5063bc3d5698SJohn Baldwin
5064bc3d5698SJohn Baldwin	vpsrld	$11,%xmm8,%xmm1
5065bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5066bc3d5698SJohn Baldwin	vpslld	$21,%xmm8,%xmm2
5067bc3d5698SJohn Baldwin	vpaddd	0(%rbp),%xmm5,%xmm5
5068bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
5069bc3d5698SJohn Baldwin
5070bc3d5698SJohn Baldwin	vpsrld	$25,%xmm8,%xmm1
5071bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5072bc3d5698SJohn Baldwin
5073bc3d5698SJohn Baldwin	vpslld	$7,%xmm8,%xmm2
5074bc3d5698SJohn Baldwin	vpandn	%xmm10,%xmm8,%xmm0
5075bc3d5698SJohn Baldwin	vpand	%xmm9,%xmm8,%xmm3
5076bc3d5698SJohn Baldwin
5077bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
5078bc3d5698SJohn Baldwin
5079bc3d5698SJohn Baldwin	vpsrld	$2,%xmm12,%xmm11
5080bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5081bc3d5698SJohn Baldwin
5082bc3d5698SJohn Baldwin	vpslld	$30,%xmm12,%xmm1
5083bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm0,%xmm0
5084bc3d5698SJohn Baldwin	vpxor	%xmm12,%xmm13,%xmm3
5085bc3d5698SJohn Baldwin
5086bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm11,%xmm11
5087bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
5088bc3d5698SJohn Baldwin
5089bc3d5698SJohn Baldwin	vpsrld	$13,%xmm12,%xmm1
5090bc3d5698SJohn Baldwin
5091bc3d5698SJohn Baldwin	vpslld	$19,%xmm12,%xmm2
5092bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm5,%xmm5
5093bc3d5698SJohn Baldwin	vpand	%xmm3,%xmm4,%xmm4
5094bc3d5698SJohn Baldwin
5095bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm11,%xmm7
5096bc3d5698SJohn Baldwin
5097bc3d5698SJohn Baldwin	vpsrld	$22,%xmm12,%xmm1
5098bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5099bc3d5698SJohn Baldwin
5100bc3d5698SJohn Baldwin	vpslld	$10,%xmm12,%xmm2
5101bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm13,%xmm11
5102bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm15,%xmm15
5103bc3d5698SJohn Baldwin
5104bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
5105bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5106bc3d5698SJohn Baldwin
5107bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm11,%xmm11
5108bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm11,%xmm11
5109bc3d5698SJohn Baldwin	vmovdqu	224-128(%rax),%xmm5
5110bc3d5698SJohn Baldwin	vpaddd	96-128(%rax),%xmm6,%xmm6
5111bc3d5698SJohn Baldwin
5112bc3d5698SJohn Baldwin	vpsrld	$3,%xmm5,%xmm7
5113bc3d5698SJohn Baldwin	vpsrld	$7,%xmm5,%xmm1
5114bc3d5698SJohn Baldwin	vpslld	$25,%xmm5,%xmm2
5115bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
5116bc3d5698SJohn Baldwin	vpsrld	$18,%xmm5,%xmm1
5117bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5118bc3d5698SJohn Baldwin	vpslld	$14,%xmm5,%xmm2
5119bc3d5698SJohn Baldwin	vmovdqu	176-128(%rax),%xmm0
5120bc3d5698SJohn Baldwin	vpsrld	$10,%xmm0,%xmm4
5121bc3d5698SJohn Baldwin
5122bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
5123bc3d5698SJohn Baldwin	vpsrld	$17,%xmm0,%xmm1
5124bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5125bc3d5698SJohn Baldwin	vpslld	$15,%xmm0,%xmm2
5126bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm6,%xmm6
5127bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm4,%xmm7
5128bc3d5698SJohn Baldwin	vpsrld	$19,%xmm0,%xmm1
5129bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5130bc3d5698SJohn Baldwin	vpslld	$13,%xmm0,%xmm2
5131bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
5132bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5133bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm6,%xmm6
5134bc3d5698SJohn Baldwin	vpsrld	$6,%xmm15,%xmm7
5135bc3d5698SJohn Baldwin	vpslld	$26,%xmm15,%xmm2
5136bc3d5698SJohn Baldwin	vmovdqu	%xmm6,208-128(%rax)
5137bc3d5698SJohn Baldwin	vpaddd	%xmm10,%xmm6,%xmm6
5138bc3d5698SJohn Baldwin
5139bc3d5698SJohn Baldwin	vpsrld	$11,%xmm15,%xmm1
5140bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5141bc3d5698SJohn Baldwin	vpslld	$21,%xmm15,%xmm2
5142bc3d5698SJohn Baldwin	vpaddd	32(%rbp),%xmm6,%xmm6
5143bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
5144bc3d5698SJohn Baldwin
5145bc3d5698SJohn Baldwin	vpsrld	$25,%xmm15,%xmm1
5146bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5147bc3d5698SJohn Baldwin
5148bc3d5698SJohn Baldwin	vpslld	$7,%xmm15,%xmm2
5149bc3d5698SJohn Baldwin	vpandn	%xmm9,%xmm15,%xmm0
5150bc3d5698SJohn Baldwin	vpand	%xmm8,%xmm15,%xmm4
5151bc3d5698SJohn Baldwin
5152bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
5153bc3d5698SJohn Baldwin
5154bc3d5698SJohn Baldwin	vpsrld	$2,%xmm11,%xmm10
5155bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5156bc3d5698SJohn Baldwin
5157bc3d5698SJohn Baldwin	vpslld	$30,%xmm11,%xmm1
5158bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm0,%xmm0
5159bc3d5698SJohn Baldwin	vpxor	%xmm11,%xmm12,%xmm4
5160bc3d5698SJohn Baldwin
5161bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm10,%xmm10
5162bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm6,%xmm6
5163bc3d5698SJohn Baldwin
5164bc3d5698SJohn Baldwin	vpsrld	$13,%xmm11,%xmm1
5165bc3d5698SJohn Baldwin
5166bc3d5698SJohn Baldwin	vpslld	$19,%xmm11,%xmm2
5167bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm6,%xmm6
5168bc3d5698SJohn Baldwin	vpand	%xmm4,%xmm3,%xmm3
5169bc3d5698SJohn Baldwin
5170bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm10,%xmm7
5171bc3d5698SJohn Baldwin
5172bc3d5698SJohn Baldwin	vpsrld	$22,%xmm11,%xmm1
5173bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5174bc3d5698SJohn Baldwin
5175bc3d5698SJohn Baldwin	vpslld	$10,%xmm11,%xmm2
5176bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm12,%xmm10
5177bc3d5698SJohn Baldwin	vpaddd	%xmm6,%xmm14,%xmm14
5178bc3d5698SJohn Baldwin
5179bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
5180bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5181bc3d5698SJohn Baldwin
5182bc3d5698SJohn Baldwin	vpaddd	%xmm6,%xmm10,%xmm10
5183bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm10,%xmm10
5184bc3d5698SJohn Baldwin	vmovdqu	240-128(%rax),%xmm6
5185bc3d5698SJohn Baldwin	vpaddd	112-128(%rax),%xmm5,%xmm5
5186bc3d5698SJohn Baldwin
5187bc3d5698SJohn Baldwin	vpsrld	$3,%xmm6,%xmm7
5188bc3d5698SJohn Baldwin	vpsrld	$7,%xmm6,%xmm1
5189bc3d5698SJohn Baldwin	vpslld	$25,%xmm6,%xmm2
5190bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
5191bc3d5698SJohn Baldwin	vpsrld	$18,%xmm6,%xmm1
5192bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5193bc3d5698SJohn Baldwin	vpslld	$14,%xmm6,%xmm2
5194bc3d5698SJohn Baldwin	vmovdqu	192-128(%rax),%xmm0
5195bc3d5698SJohn Baldwin	vpsrld	$10,%xmm0,%xmm3
5196bc3d5698SJohn Baldwin
5197bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
5198bc3d5698SJohn Baldwin	vpsrld	$17,%xmm0,%xmm1
5199bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5200bc3d5698SJohn Baldwin	vpslld	$15,%xmm0,%xmm2
5201bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
5202bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm3,%xmm7
5203bc3d5698SJohn Baldwin	vpsrld	$19,%xmm0,%xmm1
5204bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5205bc3d5698SJohn Baldwin	vpslld	$13,%xmm0,%xmm2
5206bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
5207bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5208bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
5209bc3d5698SJohn Baldwin	vpsrld	$6,%xmm14,%xmm7
5210bc3d5698SJohn Baldwin	vpslld	$26,%xmm14,%xmm2
5211bc3d5698SJohn Baldwin	vmovdqu	%xmm5,224-128(%rax)
5212bc3d5698SJohn Baldwin	vpaddd	%xmm9,%xmm5,%xmm5
5213bc3d5698SJohn Baldwin
5214bc3d5698SJohn Baldwin	vpsrld	$11,%xmm14,%xmm1
5215bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5216bc3d5698SJohn Baldwin	vpslld	$21,%xmm14,%xmm2
5217bc3d5698SJohn Baldwin	vpaddd	64(%rbp),%xmm5,%xmm5
5218bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
5219bc3d5698SJohn Baldwin
5220bc3d5698SJohn Baldwin	vpsrld	$25,%xmm14,%xmm1
5221bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5222bc3d5698SJohn Baldwin
5223bc3d5698SJohn Baldwin	vpslld	$7,%xmm14,%xmm2
5224bc3d5698SJohn Baldwin	vpandn	%xmm8,%xmm14,%xmm0
5225bc3d5698SJohn Baldwin	vpand	%xmm15,%xmm14,%xmm3
5226bc3d5698SJohn Baldwin
5227bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
5228bc3d5698SJohn Baldwin
5229bc3d5698SJohn Baldwin	vpsrld	$2,%xmm10,%xmm9
5230bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5231bc3d5698SJohn Baldwin
5232bc3d5698SJohn Baldwin	vpslld	$30,%xmm10,%xmm1
5233bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm0,%xmm0
5234bc3d5698SJohn Baldwin	vpxor	%xmm10,%xmm11,%xmm3
5235bc3d5698SJohn Baldwin
5236bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm9,%xmm9
5237bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm5,%xmm5
5238bc3d5698SJohn Baldwin
5239bc3d5698SJohn Baldwin	vpsrld	$13,%xmm10,%xmm1
5240bc3d5698SJohn Baldwin
5241bc3d5698SJohn Baldwin	vpslld	$19,%xmm10,%xmm2
5242bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm5,%xmm5
5243bc3d5698SJohn Baldwin	vpand	%xmm3,%xmm4,%xmm4
5244bc3d5698SJohn Baldwin
5245bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm9,%xmm7
5246bc3d5698SJohn Baldwin
5247bc3d5698SJohn Baldwin	vpsrld	$22,%xmm10,%xmm1
5248bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5249bc3d5698SJohn Baldwin
5250bc3d5698SJohn Baldwin	vpslld	$10,%xmm10,%xmm2
5251bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm11,%xmm9
5252bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm13,%xmm13
5253bc3d5698SJohn Baldwin
5254bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
5255bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5256bc3d5698SJohn Baldwin
5257bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm9,%xmm9
5258bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm9,%xmm9
5259bc3d5698SJohn Baldwin	vmovdqu	0-128(%rax),%xmm5
5260bc3d5698SJohn Baldwin	vpaddd	128-128(%rax),%xmm6,%xmm6
5261bc3d5698SJohn Baldwin
5262bc3d5698SJohn Baldwin	vpsrld	$3,%xmm5,%xmm7
5263bc3d5698SJohn Baldwin	vpsrld	$7,%xmm5,%xmm1
5264bc3d5698SJohn Baldwin	vpslld	$25,%xmm5,%xmm2
5265bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
5266bc3d5698SJohn Baldwin	vpsrld	$18,%xmm5,%xmm1
5267bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5268bc3d5698SJohn Baldwin	vpslld	$14,%xmm5,%xmm2
5269bc3d5698SJohn Baldwin	vmovdqu	208-128(%rax),%xmm0
5270bc3d5698SJohn Baldwin	vpsrld	$10,%xmm0,%xmm4
5271bc3d5698SJohn Baldwin
5272bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
5273bc3d5698SJohn Baldwin	vpsrld	$17,%xmm0,%xmm1
5274bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5275bc3d5698SJohn Baldwin	vpslld	$15,%xmm0,%xmm2
5276bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm6,%xmm6
5277bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm4,%xmm7
5278bc3d5698SJohn Baldwin	vpsrld	$19,%xmm0,%xmm1
5279bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5280bc3d5698SJohn Baldwin	vpslld	$13,%xmm0,%xmm2
5281bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
5282bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5283bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm6,%xmm6
5284bc3d5698SJohn Baldwin	vpsrld	$6,%xmm13,%xmm7
5285bc3d5698SJohn Baldwin	vpslld	$26,%xmm13,%xmm2
5286bc3d5698SJohn Baldwin	vmovdqu	%xmm6,240-128(%rax)
5287bc3d5698SJohn Baldwin	vpaddd	%xmm8,%xmm6,%xmm6
5288bc3d5698SJohn Baldwin
5289bc3d5698SJohn Baldwin	vpsrld	$11,%xmm13,%xmm1
5290bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5291bc3d5698SJohn Baldwin	vpslld	$21,%xmm13,%xmm2
5292bc3d5698SJohn Baldwin	vpaddd	96(%rbp),%xmm6,%xmm6
5293bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
5294bc3d5698SJohn Baldwin
5295bc3d5698SJohn Baldwin	vpsrld	$25,%xmm13,%xmm1
5296bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5297bc3d5698SJohn Baldwin
5298bc3d5698SJohn Baldwin	vpslld	$7,%xmm13,%xmm2
5299bc3d5698SJohn Baldwin	vpandn	%xmm15,%xmm13,%xmm0
5300bc3d5698SJohn Baldwin	vpand	%xmm14,%xmm13,%xmm4
5301bc3d5698SJohn Baldwin
5302bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
5303bc3d5698SJohn Baldwin
5304bc3d5698SJohn Baldwin	vpsrld	$2,%xmm9,%xmm8
5305bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5306bc3d5698SJohn Baldwin
5307bc3d5698SJohn Baldwin	vpslld	$30,%xmm9,%xmm1
5308bc3d5698SJohn Baldwin	vpxor	%xmm4,%xmm0,%xmm0
5309bc3d5698SJohn Baldwin	vpxor	%xmm9,%xmm10,%xmm4
5310bc3d5698SJohn Baldwin
5311bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm8,%xmm8
5312bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm6,%xmm6
5313bc3d5698SJohn Baldwin
5314bc3d5698SJohn Baldwin	vpsrld	$13,%xmm9,%xmm1
5315bc3d5698SJohn Baldwin
5316bc3d5698SJohn Baldwin	vpslld	$19,%xmm9,%xmm2
5317bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm6,%xmm6
5318bc3d5698SJohn Baldwin	vpand	%xmm4,%xmm3,%xmm3
5319bc3d5698SJohn Baldwin
5320bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm8,%xmm7
5321bc3d5698SJohn Baldwin
5322bc3d5698SJohn Baldwin	vpsrld	$22,%xmm9,%xmm1
5323bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5324bc3d5698SJohn Baldwin
5325bc3d5698SJohn Baldwin	vpslld	$10,%xmm9,%xmm2
5326bc3d5698SJohn Baldwin	vpxor	%xmm3,%xmm10,%xmm8
5327bc3d5698SJohn Baldwin	vpaddd	%xmm6,%xmm12,%xmm12
5328bc3d5698SJohn Baldwin
5329bc3d5698SJohn Baldwin	vpxor	%xmm1,%xmm7,%xmm7
5330bc3d5698SJohn Baldwin	vpxor	%xmm2,%xmm7,%xmm7
5331bc3d5698SJohn Baldwin
5332bc3d5698SJohn Baldwin	vpaddd	%xmm6,%xmm8,%xmm8
5333bc3d5698SJohn Baldwin	vpaddd	%xmm7,%xmm8,%xmm8
5334bc3d5698SJohn Baldwin	addq	$256,%rbp
5335bc3d5698SJohn Baldwin	decl	%ecx
5336bc3d5698SJohn Baldwin	jnz	.Loop_16_xx_avx
5337bc3d5698SJohn Baldwin
5338bc3d5698SJohn Baldwin	movl	$1,%ecx
5339bc3d5698SJohn Baldwin	leaq	K256+128(%rip),%rbp
5340bc3d5698SJohn Baldwin	cmpl	0(%rbx),%ecx
5341bc3d5698SJohn Baldwin	cmovgeq	%rbp,%r8
5342bc3d5698SJohn Baldwin	cmpl	4(%rbx),%ecx
5343bc3d5698SJohn Baldwin	cmovgeq	%rbp,%r9
5344bc3d5698SJohn Baldwin	cmpl	8(%rbx),%ecx
5345bc3d5698SJohn Baldwin	cmovgeq	%rbp,%r10
5346bc3d5698SJohn Baldwin	cmpl	12(%rbx),%ecx
5347bc3d5698SJohn Baldwin	cmovgeq	%rbp,%r11
5348bc3d5698SJohn Baldwin	vmovdqa	(%rbx),%xmm7
5349bc3d5698SJohn Baldwin	vpxor	%xmm0,%xmm0,%xmm0
5350bc3d5698SJohn Baldwin	vmovdqa	%xmm7,%xmm6
5351bc3d5698SJohn Baldwin	vpcmpgtd	%xmm0,%xmm6,%xmm6
5352bc3d5698SJohn Baldwin	vpaddd	%xmm6,%xmm7,%xmm7
5353bc3d5698SJohn Baldwin
5354bc3d5698SJohn Baldwin	vmovdqu	0-128(%rdi),%xmm0
5355bc3d5698SJohn Baldwin	vpand	%xmm6,%xmm8,%xmm8
5356bc3d5698SJohn Baldwin	vmovdqu	32-128(%rdi),%xmm1
5357bc3d5698SJohn Baldwin	vpand	%xmm6,%xmm9,%xmm9
5358bc3d5698SJohn Baldwin	vmovdqu	64-128(%rdi),%xmm2
5359bc3d5698SJohn Baldwin	vpand	%xmm6,%xmm10,%xmm10
5360bc3d5698SJohn Baldwin	vmovdqu	96-128(%rdi),%xmm5
5361bc3d5698SJohn Baldwin	vpand	%xmm6,%xmm11,%xmm11
5362bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm8,%xmm8
5363bc3d5698SJohn Baldwin	vmovdqu	128-128(%rdi),%xmm0
5364bc3d5698SJohn Baldwin	vpand	%xmm6,%xmm12,%xmm12
5365bc3d5698SJohn Baldwin	vpaddd	%xmm1,%xmm9,%xmm9
5366bc3d5698SJohn Baldwin	vmovdqu	160-128(%rdi),%xmm1
5367bc3d5698SJohn Baldwin	vpand	%xmm6,%xmm13,%xmm13
5368bc3d5698SJohn Baldwin	vpaddd	%xmm2,%xmm10,%xmm10
5369bc3d5698SJohn Baldwin	vmovdqu	192-128(%rdi),%xmm2
5370bc3d5698SJohn Baldwin	vpand	%xmm6,%xmm14,%xmm14
5371bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm11,%xmm11
5372bc3d5698SJohn Baldwin	vmovdqu	224-128(%rdi),%xmm5
5373bc3d5698SJohn Baldwin	vpand	%xmm6,%xmm15,%xmm15
5374bc3d5698SJohn Baldwin	vpaddd	%xmm0,%xmm12,%xmm12
5375bc3d5698SJohn Baldwin	vpaddd	%xmm1,%xmm13,%xmm13
5376bc3d5698SJohn Baldwin	vmovdqu	%xmm8,0-128(%rdi)
5377bc3d5698SJohn Baldwin	vpaddd	%xmm2,%xmm14,%xmm14
5378bc3d5698SJohn Baldwin	vmovdqu	%xmm9,32-128(%rdi)
5379bc3d5698SJohn Baldwin	vpaddd	%xmm5,%xmm15,%xmm15
5380bc3d5698SJohn Baldwin	vmovdqu	%xmm10,64-128(%rdi)
5381bc3d5698SJohn Baldwin	vmovdqu	%xmm11,96-128(%rdi)
5382bc3d5698SJohn Baldwin	vmovdqu	%xmm12,128-128(%rdi)
5383bc3d5698SJohn Baldwin	vmovdqu	%xmm13,160-128(%rdi)
5384bc3d5698SJohn Baldwin	vmovdqu	%xmm14,192-128(%rdi)
5385bc3d5698SJohn Baldwin	vmovdqu	%xmm15,224-128(%rdi)
5386bc3d5698SJohn Baldwin
5387bc3d5698SJohn Baldwin	vmovdqu	%xmm7,(%rbx)
5388bc3d5698SJohn Baldwin	vmovdqu	.Lpbswap(%rip),%xmm6
5389bc3d5698SJohn Baldwin	decl	%edx
5390bc3d5698SJohn Baldwin	jnz	.Loop_avx
5391bc3d5698SJohn Baldwin
5392bc3d5698SJohn Baldwin	movl	280(%rsp),%edx
5393bc3d5698SJohn Baldwin	leaq	16(%rdi),%rdi
5394bc3d5698SJohn Baldwin	leaq	64(%rsi),%rsi
5395bc3d5698SJohn Baldwin	decl	%edx
5396bc3d5698SJohn Baldwin	jnz	.Loop_grande_avx
5397bc3d5698SJohn Baldwin
5398bc3d5698SJohn Baldwin.Ldone_avx:
5399bc3d5698SJohn Baldwin	movq	272(%rsp),%rax
5400bc3d5698SJohn Baldwin.cfi_def_cfa	%rax,8
5401bc3d5698SJohn Baldwin	vzeroupper
5402bc3d5698SJohn Baldwin	movq	-16(%rax),%rbp
5403bc3d5698SJohn Baldwin.cfi_restore	%rbp
5404bc3d5698SJohn Baldwin	movq	-8(%rax),%rbx
5405bc3d5698SJohn Baldwin.cfi_restore	%rbx
5406bc3d5698SJohn Baldwin	leaq	(%rax),%rsp
5407bc3d5698SJohn Baldwin.cfi_def_cfa_register	%rsp
5408bc3d5698SJohn Baldwin.Lepilogue_avx:
5409bc3d5698SJohn Baldwin	.byte	0xf3,0xc3
5410bc3d5698SJohn Baldwin.cfi_endproc
5411bc3d5698SJohn Baldwin.size	sha256_multi_block_avx,.-sha256_multi_block_avx
5412bc3d5698SJohn Baldwin.type	sha256_multi_block_avx2,@function
5413bc3d5698SJohn Baldwin.align	32
5414bc3d5698SJohn Baldwinsha256_multi_block_avx2:
5415bc3d5698SJohn Baldwin.cfi_startproc
5416bc3d5698SJohn Baldwin_avx2_shortcut:
5417bc3d5698SJohn Baldwin	movq	%rsp,%rax
5418bc3d5698SJohn Baldwin.cfi_def_cfa_register	%rax
5419bc3d5698SJohn Baldwin	pushq	%rbx
5420bc3d5698SJohn Baldwin.cfi_offset	%rbx,-16
5421bc3d5698SJohn Baldwin	pushq	%rbp
5422bc3d5698SJohn Baldwin.cfi_offset	%rbp,-24
5423bc3d5698SJohn Baldwin	pushq	%r12
5424bc3d5698SJohn Baldwin.cfi_offset	%r12,-32
5425bc3d5698SJohn Baldwin	pushq	%r13
5426bc3d5698SJohn Baldwin.cfi_offset	%r13,-40
5427bc3d5698SJohn Baldwin	pushq	%r14
5428bc3d5698SJohn Baldwin.cfi_offset	%r14,-48
5429bc3d5698SJohn Baldwin	pushq	%r15
5430bc3d5698SJohn Baldwin.cfi_offset	%r15,-56
5431bc3d5698SJohn Baldwin	subq	$576,%rsp
5432bc3d5698SJohn Baldwin	andq	$-256,%rsp
5433bc3d5698SJohn Baldwin	movq	%rax,544(%rsp)
5434bc3d5698SJohn Baldwin.cfi_escape	0x0f,0x06,0x77,0xa0,0x04,0x06,0x23,0x08
5435bc3d5698SJohn Baldwin.Lbody_avx2:
5436bc3d5698SJohn Baldwin	leaq	K256+128(%rip),%rbp
5437bc3d5698SJohn Baldwin	leaq	128(%rdi),%rdi
5438bc3d5698SJohn Baldwin
5439bc3d5698SJohn Baldwin.Loop_grande_avx2:
5440bc3d5698SJohn Baldwin	movl	%edx,552(%rsp)
5441bc3d5698SJohn Baldwin	xorl	%edx,%edx
5442bc3d5698SJohn Baldwin	leaq	512(%rsp),%rbx
5443*c0855eaaSJohn Baldwin
5444bc3d5698SJohn Baldwin	movq	0(%rsi),%r12
5445*c0855eaaSJohn Baldwin
5446bc3d5698SJohn Baldwin	movl	8(%rsi),%ecx
5447bc3d5698SJohn Baldwin	cmpl	%edx,%ecx
5448bc3d5698SJohn Baldwin	cmovgl	%ecx,%edx
5449bc3d5698SJohn Baldwin	testl	%ecx,%ecx
5450bc3d5698SJohn Baldwin	movl	%ecx,0(%rbx)
5451bc3d5698SJohn Baldwin	cmovleq	%rbp,%r12
5452*c0855eaaSJohn Baldwin
5453bc3d5698SJohn Baldwin	movq	16(%rsi),%r13
5454*c0855eaaSJohn Baldwin
5455bc3d5698SJohn Baldwin	movl	24(%rsi),%ecx
5456bc3d5698SJohn Baldwin	cmpl	%edx,%ecx
5457bc3d5698SJohn Baldwin	cmovgl	%ecx,%edx
5458bc3d5698SJohn Baldwin	testl	%ecx,%ecx
5459bc3d5698SJohn Baldwin	movl	%ecx,4(%rbx)
5460bc3d5698SJohn Baldwin	cmovleq	%rbp,%r13
5461*c0855eaaSJohn Baldwin
5462bc3d5698SJohn Baldwin	movq	32(%rsi),%r14
5463*c0855eaaSJohn Baldwin
5464bc3d5698SJohn Baldwin	movl	40(%rsi),%ecx
5465bc3d5698SJohn Baldwin	cmpl	%edx,%ecx
5466bc3d5698SJohn Baldwin	cmovgl	%ecx,%edx
5467bc3d5698SJohn Baldwin	testl	%ecx,%ecx
5468bc3d5698SJohn Baldwin	movl	%ecx,8(%rbx)
5469bc3d5698SJohn Baldwin	cmovleq	%rbp,%r14
5470*c0855eaaSJohn Baldwin
5471bc3d5698SJohn Baldwin	movq	48(%rsi),%r15
5472*c0855eaaSJohn Baldwin
5473bc3d5698SJohn Baldwin	movl	56(%rsi),%ecx
5474bc3d5698SJohn Baldwin	cmpl	%edx,%ecx
5475bc3d5698SJohn Baldwin	cmovgl	%ecx,%edx
5476bc3d5698SJohn Baldwin	testl	%ecx,%ecx
5477bc3d5698SJohn Baldwin	movl	%ecx,12(%rbx)
5478bc3d5698SJohn Baldwin	cmovleq	%rbp,%r15
5479*c0855eaaSJohn Baldwin
5480bc3d5698SJohn Baldwin	movq	64(%rsi),%r8
5481*c0855eaaSJohn Baldwin
5482bc3d5698SJohn Baldwin	movl	72(%rsi),%ecx
5483bc3d5698SJohn Baldwin	cmpl	%edx,%ecx
5484bc3d5698SJohn Baldwin	cmovgl	%ecx,%edx
5485bc3d5698SJohn Baldwin	testl	%ecx,%ecx
5486bc3d5698SJohn Baldwin	movl	%ecx,16(%rbx)
5487bc3d5698SJohn Baldwin	cmovleq	%rbp,%r8
5488*c0855eaaSJohn Baldwin
5489bc3d5698SJohn Baldwin	movq	80(%rsi),%r9
5490*c0855eaaSJohn Baldwin
5491bc3d5698SJohn Baldwin	movl	88(%rsi),%ecx
5492bc3d5698SJohn Baldwin	cmpl	%edx,%ecx
5493bc3d5698SJohn Baldwin	cmovgl	%ecx,%edx
5494bc3d5698SJohn Baldwin	testl	%ecx,%ecx
5495bc3d5698SJohn Baldwin	movl	%ecx,20(%rbx)
5496bc3d5698SJohn Baldwin	cmovleq	%rbp,%r9
5497*c0855eaaSJohn Baldwin
5498bc3d5698SJohn Baldwin	movq	96(%rsi),%r10
5499*c0855eaaSJohn Baldwin
5500bc3d5698SJohn Baldwin	movl	104(%rsi),%ecx
5501bc3d5698SJohn Baldwin	cmpl	%edx,%ecx
5502bc3d5698SJohn Baldwin	cmovgl	%ecx,%edx
5503bc3d5698SJohn Baldwin	testl	%ecx,%ecx
5504bc3d5698SJohn Baldwin	movl	%ecx,24(%rbx)
5505bc3d5698SJohn Baldwin	cmovleq	%rbp,%r10
5506*c0855eaaSJohn Baldwin
5507bc3d5698SJohn Baldwin	movq	112(%rsi),%r11
5508*c0855eaaSJohn Baldwin
5509bc3d5698SJohn Baldwin	movl	120(%rsi),%ecx
5510bc3d5698SJohn Baldwin	cmpl	%edx,%ecx
5511bc3d5698SJohn Baldwin	cmovgl	%ecx,%edx
5512bc3d5698SJohn Baldwin	testl	%ecx,%ecx
5513bc3d5698SJohn Baldwin	movl	%ecx,28(%rbx)
5514bc3d5698SJohn Baldwin	cmovleq	%rbp,%r11
5515bc3d5698SJohn Baldwin	vmovdqu	0-128(%rdi),%ymm8
5516bc3d5698SJohn Baldwin	leaq	128(%rsp),%rax
5517bc3d5698SJohn Baldwin	vmovdqu	32-128(%rdi),%ymm9
5518bc3d5698SJohn Baldwin	leaq	256+128(%rsp),%rbx
5519bc3d5698SJohn Baldwin	vmovdqu	64-128(%rdi),%ymm10
5520bc3d5698SJohn Baldwin	vmovdqu	96-128(%rdi),%ymm11
5521bc3d5698SJohn Baldwin	vmovdqu	128-128(%rdi),%ymm12
5522bc3d5698SJohn Baldwin	vmovdqu	160-128(%rdi),%ymm13
5523bc3d5698SJohn Baldwin	vmovdqu	192-128(%rdi),%ymm14
5524bc3d5698SJohn Baldwin	vmovdqu	224-128(%rdi),%ymm15
5525bc3d5698SJohn Baldwin	vmovdqu	.Lpbswap(%rip),%ymm6
5526bc3d5698SJohn Baldwin	jmp	.Loop_avx2
5527bc3d5698SJohn Baldwin
5528bc3d5698SJohn Baldwin.align	32
5529bc3d5698SJohn Baldwin.Loop_avx2:
5530bc3d5698SJohn Baldwin	vpxor	%ymm9,%ymm10,%ymm4
5531bc3d5698SJohn Baldwin	vmovd	0(%r12),%xmm5
5532bc3d5698SJohn Baldwin	vmovd	0(%r8),%xmm0
5533bc3d5698SJohn Baldwin	vmovd	0(%r13),%xmm1
5534bc3d5698SJohn Baldwin	vmovd	0(%r9),%xmm2
5535bc3d5698SJohn Baldwin	vpinsrd	$1,0(%r14),%xmm5,%xmm5
5536bc3d5698SJohn Baldwin	vpinsrd	$1,0(%r10),%xmm0,%xmm0
5537bc3d5698SJohn Baldwin	vpinsrd	$1,0(%r15),%xmm1,%xmm1
5538bc3d5698SJohn Baldwin	vpunpckldq	%ymm1,%ymm5,%ymm5
5539bc3d5698SJohn Baldwin	vpinsrd	$1,0(%r11),%xmm2,%xmm2
5540bc3d5698SJohn Baldwin	vpunpckldq	%ymm2,%ymm0,%ymm0
5541bc3d5698SJohn Baldwin	vinserti128	$1,%xmm0,%ymm5,%ymm5
5542bc3d5698SJohn Baldwin	vpshufb	%ymm6,%ymm5,%ymm5
5543bc3d5698SJohn Baldwin	vpsrld	$6,%ymm12,%ymm7
5544bc3d5698SJohn Baldwin	vpslld	$26,%ymm12,%ymm2
5545bc3d5698SJohn Baldwin	vmovdqu	%ymm5,0-128(%rax)
5546bc3d5698SJohn Baldwin	vpaddd	%ymm15,%ymm5,%ymm5
5547bc3d5698SJohn Baldwin
5548bc3d5698SJohn Baldwin	vpsrld	$11,%ymm12,%ymm1
5549bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5550bc3d5698SJohn Baldwin	vpslld	$21,%ymm12,%ymm2
5551bc3d5698SJohn Baldwin	vpaddd	-128(%rbp),%ymm5,%ymm5
5552bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
5553bc3d5698SJohn Baldwin
5554bc3d5698SJohn Baldwin	vpsrld	$25,%ymm12,%ymm1
5555bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5556bc3d5698SJohn Baldwin
5557bc3d5698SJohn Baldwin	vpslld	$7,%ymm12,%ymm2
5558bc3d5698SJohn Baldwin	vpandn	%ymm14,%ymm12,%ymm0
5559bc3d5698SJohn Baldwin	vpand	%ymm13,%ymm12,%ymm3
5560bc3d5698SJohn Baldwin
5561bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
5562bc3d5698SJohn Baldwin
5563bc3d5698SJohn Baldwin	vpsrld	$2,%ymm8,%ymm15
5564bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5565bc3d5698SJohn Baldwin
5566bc3d5698SJohn Baldwin	vpslld	$30,%ymm8,%ymm1
5567bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm0,%ymm0
5568bc3d5698SJohn Baldwin	vpxor	%ymm8,%ymm9,%ymm3
5569bc3d5698SJohn Baldwin
5570bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm15,%ymm15
5571bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
5572bc3d5698SJohn Baldwin
5573bc3d5698SJohn Baldwin	vpsrld	$13,%ymm8,%ymm1
5574bc3d5698SJohn Baldwin
5575bc3d5698SJohn Baldwin	vpslld	$19,%ymm8,%ymm2
5576bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm5,%ymm5
5577bc3d5698SJohn Baldwin	vpand	%ymm3,%ymm4,%ymm4
5578bc3d5698SJohn Baldwin
5579bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm15,%ymm7
5580bc3d5698SJohn Baldwin
5581bc3d5698SJohn Baldwin	vpsrld	$22,%ymm8,%ymm1
5582bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5583bc3d5698SJohn Baldwin
5584bc3d5698SJohn Baldwin	vpslld	$10,%ymm8,%ymm2
5585bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm9,%ymm15
5586bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm11,%ymm11
5587bc3d5698SJohn Baldwin
5588bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
5589bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5590bc3d5698SJohn Baldwin
5591bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm15,%ymm15
5592bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm15,%ymm15
5593bc3d5698SJohn Baldwin	vmovd	4(%r12),%xmm5
5594bc3d5698SJohn Baldwin	vmovd	4(%r8),%xmm0
5595bc3d5698SJohn Baldwin	vmovd	4(%r13),%xmm1
5596bc3d5698SJohn Baldwin	vmovd	4(%r9),%xmm2
5597bc3d5698SJohn Baldwin	vpinsrd	$1,4(%r14),%xmm5,%xmm5
5598bc3d5698SJohn Baldwin	vpinsrd	$1,4(%r10),%xmm0,%xmm0
5599bc3d5698SJohn Baldwin	vpinsrd	$1,4(%r15),%xmm1,%xmm1
5600bc3d5698SJohn Baldwin	vpunpckldq	%ymm1,%ymm5,%ymm5
5601bc3d5698SJohn Baldwin	vpinsrd	$1,4(%r11),%xmm2,%xmm2
5602bc3d5698SJohn Baldwin	vpunpckldq	%ymm2,%ymm0,%ymm0
5603bc3d5698SJohn Baldwin	vinserti128	$1,%xmm0,%ymm5,%ymm5
5604bc3d5698SJohn Baldwin	vpshufb	%ymm6,%ymm5,%ymm5
5605bc3d5698SJohn Baldwin	vpsrld	$6,%ymm11,%ymm7
5606bc3d5698SJohn Baldwin	vpslld	$26,%ymm11,%ymm2
5607bc3d5698SJohn Baldwin	vmovdqu	%ymm5,32-128(%rax)
5608bc3d5698SJohn Baldwin	vpaddd	%ymm14,%ymm5,%ymm5
5609bc3d5698SJohn Baldwin
5610bc3d5698SJohn Baldwin	vpsrld	$11,%ymm11,%ymm1
5611bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5612bc3d5698SJohn Baldwin	vpslld	$21,%ymm11,%ymm2
5613bc3d5698SJohn Baldwin	vpaddd	-96(%rbp),%ymm5,%ymm5
5614bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
5615bc3d5698SJohn Baldwin
5616bc3d5698SJohn Baldwin	vpsrld	$25,%ymm11,%ymm1
5617bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5618bc3d5698SJohn Baldwin
5619bc3d5698SJohn Baldwin	vpslld	$7,%ymm11,%ymm2
5620bc3d5698SJohn Baldwin	vpandn	%ymm13,%ymm11,%ymm0
5621bc3d5698SJohn Baldwin	vpand	%ymm12,%ymm11,%ymm4
5622bc3d5698SJohn Baldwin
5623bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
5624bc3d5698SJohn Baldwin
5625bc3d5698SJohn Baldwin	vpsrld	$2,%ymm15,%ymm14
5626bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5627bc3d5698SJohn Baldwin
5628bc3d5698SJohn Baldwin	vpslld	$30,%ymm15,%ymm1
5629bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm0,%ymm0
5630bc3d5698SJohn Baldwin	vpxor	%ymm15,%ymm8,%ymm4
5631bc3d5698SJohn Baldwin
5632bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm14,%ymm14
5633bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
5634bc3d5698SJohn Baldwin
5635bc3d5698SJohn Baldwin	vpsrld	$13,%ymm15,%ymm1
5636bc3d5698SJohn Baldwin
5637bc3d5698SJohn Baldwin	vpslld	$19,%ymm15,%ymm2
5638bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm5,%ymm5
5639bc3d5698SJohn Baldwin	vpand	%ymm4,%ymm3,%ymm3
5640bc3d5698SJohn Baldwin
5641bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm14,%ymm7
5642bc3d5698SJohn Baldwin
5643bc3d5698SJohn Baldwin	vpsrld	$22,%ymm15,%ymm1
5644bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5645bc3d5698SJohn Baldwin
5646bc3d5698SJohn Baldwin	vpslld	$10,%ymm15,%ymm2
5647bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm8,%ymm14
5648bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm10,%ymm10
5649bc3d5698SJohn Baldwin
5650bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
5651bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5652bc3d5698SJohn Baldwin
5653bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm14,%ymm14
5654bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm14,%ymm14
5655bc3d5698SJohn Baldwin	vmovd	8(%r12),%xmm5
5656bc3d5698SJohn Baldwin	vmovd	8(%r8),%xmm0
5657bc3d5698SJohn Baldwin	vmovd	8(%r13),%xmm1
5658bc3d5698SJohn Baldwin	vmovd	8(%r9),%xmm2
5659bc3d5698SJohn Baldwin	vpinsrd	$1,8(%r14),%xmm5,%xmm5
5660bc3d5698SJohn Baldwin	vpinsrd	$1,8(%r10),%xmm0,%xmm0
5661bc3d5698SJohn Baldwin	vpinsrd	$1,8(%r15),%xmm1,%xmm1
5662bc3d5698SJohn Baldwin	vpunpckldq	%ymm1,%ymm5,%ymm5
5663bc3d5698SJohn Baldwin	vpinsrd	$1,8(%r11),%xmm2,%xmm2
5664bc3d5698SJohn Baldwin	vpunpckldq	%ymm2,%ymm0,%ymm0
5665bc3d5698SJohn Baldwin	vinserti128	$1,%xmm0,%ymm5,%ymm5
5666bc3d5698SJohn Baldwin	vpshufb	%ymm6,%ymm5,%ymm5
5667bc3d5698SJohn Baldwin	vpsrld	$6,%ymm10,%ymm7
5668bc3d5698SJohn Baldwin	vpslld	$26,%ymm10,%ymm2
5669bc3d5698SJohn Baldwin	vmovdqu	%ymm5,64-128(%rax)
5670bc3d5698SJohn Baldwin	vpaddd	%ymm13,%ymm5,%ymm5
5671bc3d5698SJohn Baldwin
5672bc3d5698SJohn Baldwin	vpsrld	$11,%ymm10,%ymm1
5673bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5674bc3d5698SJohn Baldwin	vpslld	$21,%ymm10,%ymm2
5675bc3d5698SJohn Baldwin	vpaddd	-64(%rbp),%ymm5,%ymm5
5676bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
5677bc3d5698SJohn Baldwin
5678bc3d5698SJohn Baldwin	vpsrld	$25,%ymm10,%ymm1
5679bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5680bc3d5698SJohn Baldwin
5681bc3d5698SJohn Baldwin	vpslld	$7,%ymm10,%ymm2
5682bc3d5698SJohn Baldwin	vpandn	%ymm12,%ymm10,%ymm0
5683bc3d5698SJohn Baldwin	vpand	%ymm11,%ymm10,%ymm3
5684bc3d5698SJohn Baldwin
5685bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
5686bc3d5698SJohn Baldwin
5687bc3d5698SJohn Baldwin	vpsrld	$2,%ymm14,%ymm13
5688bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5689bc3d5698SJohn Baldwin
5690bc3d5698SJohn Baldwin	vpslld	$30,%ymm14,%ymm1
5691bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm0,%ymm0
5692bc3d5698SJohn Baldwin	vpxor	%ymm14,%ymm15,%ymm3
5693bc3d5698SJohn Baldwin
5694bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm13,%ymm13
5695bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
5696bc3d5698SJohn Baldwin
5697bc3d5698SJohn Baldwin	vpsrld	$13,%ymm14,%ymm1
5698bc3d5698SJohn Baldwin
5699bc3d5698SJohn Baldwin	vpslld	$19,%ymm14,%ymm2
5700bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm5,%ymm5
5701bc3d5698SJohn Baldwin	vpand	%ymm3,%ymm4,%ymm4
5702bc3d5698SJohn Baldwin
5703bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm13,%ymm7
5704bc3d5698SJohn Baldwin
5705bc3d5698SJohn Baldwin	vpsrld	$22,%ymm14,%ymm1
5706bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5707bc3d5698SJohn Baldwin
5708bc3d5698SJohn Baldwin	vpslld	$10,%ymm14,%ymm2
5709bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm15,%ymm13
5710bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm9,%ymm9
5711bc3d5698SJohn Baldwin
5712bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
5713bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5714bc3d5698SJohn Baldwin
5715bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm13,%ymm13
5716bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm13,%ymm13
5717bc3d5698SJohn Baldwin	vmovd	12(%r12),%xmm5
5718bc3d5698SJohn Baldwin	vmovd	12(%r8),%xmm0
5719bc3d5698SJohn Baldwin	vmovd	12(%r13),%xmm1
5720bc3d5698SJohn Baldwin	vmovd	12(%r9),%xmm2
5721bc3d5698SJohn Baldwin	vpinsrd	$1,12(%r14),%xmm5,%xmm5
5722bc3d5698SJohn Baldwin	vpinsrd	$1,12(%r10),%xmm0,%xmm0
5723bc3d5698SJohn Baldwin	vpinsrd	$1,12(%r15),%xmm1,%xmm1
5724bc3d5698SJohn Baldwin	vpunpckldq	%ymm1,%ymm5,%ymm5
5725bc3d5698SJohn Baldwin	vpinsrd	$1,12(%r11),%xmm2,%xmm2
5726bc3d5698SJohn Baldwin	vpunpckldq	%ymm2,%ymm0,%ymm0
5727bc3d5698SJohn Baldwin	vinserti128	$1,%xmm0,%ymm5,%ymm5
5728bc3d5698SJohn Baldwin	vpshufb	%ymm6,%ymm5,%ymm5
5729bc3d5698SJohn Baldwin	vpsrld	$6,%ymm9,%ymm7
5730bc3d5698SJohn Baldwin	vpslld	$26,%ymm9,%ymm2
5731bc3d5698SJohn Baldwin	vmovdqu	%ymm5,96-128(%rax)
5732bc3d5698SJohn Baldwin	vpaddd	%ymm12,%ymm5,%ymm5
5733bc3d5698SJohn Baldwin
5734bc3d5698SJohn Baldwin	vpsrld	$11,%ymm9,%ymm1
5735bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5736bc3d5698SJohn Baldwin	vpslld	$21,%ymm9,%ymm2
5737bc3d5698SJohn Baldwin	vpaddd	-32(%rbp),%ymm5,%ymm5
5738bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
5739bc3d5698SJohn Baldwin
5740bc3d5698SJohn Baldwin	vpsrld	$25,%ymm9,%ymm1
5741bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5742bc3d5698SJohn Baldwin
5743bc3d5698SJohn Baldwin	vpslld	$7,%ymm9,%ymm2
5744bc3d5698SJohn Baldwin	vpandn	%ymm11,%ymm9,%ymm0
5745bc3d5698SJohn Baldwin	vpand	%ymm10,%ymm9,%ymm4
5746bc3d5698SJohn Baldwin
5747bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
5748bc3d5698SJohn Baldwin
5749bc3d5698SJohn Baldwin	vpsrld	$2,%ymm13,%ymm12
5750bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5751bc3d5698SJohn Baldwin
5752bc3d5698SJohn Baldwin	vpslld	$30,%ymm13,%ymm1
5753bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm0,%ymm0
5754bc3d5698SJohn Baldwin	vpxor	%ymm13,%ymm14,%ymm4
5755bc3d5698SJohn Baldwin
5756bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm12,%ymm12
5757bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
5758bc3d5698SJohn Baldwin
5759bc3d5698SJohn Baldwin	vpsrld	$13,%ymm13,%ymm1
5760bc3d5698SJohn Baldwin
5761bc3d5698SJohn Baldwin	vpslld	$19,%ymm13,%ymm2
5762bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm5,%ymm5
5763bc3d5698SJohn Baldwin	vpand	%ymm4,%ymm3,%ymm3
5764bc3d5698SJohn Baldwin
5765bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm12,%ymm7
5766bc3d5698SJohn Baldwin
5767bc3d5698SJohn Baldwin	vpsrld	$22,%ymm13,%ymm1
5768bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5769bc3d5698SJohn Baldwin
5770bc3d5698SJohn Baldwin	vpslld	$10,%ymm13,%ymm2
5771bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm14,%ymm12
5772bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm8,%ymm8
5773bc3d5698SJohn Baldwin
5774bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
5775bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5776bc3d5698SJohn Baldwin
5777bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm12,%ymm12
5778bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm12,%ymm12
5779bc3d5698SJohn Baldwin	vmovd	16(%r12),%xmm5
5780bc3d5698SJohn Baldwin	vmovd	16(%r8),%xmm0
5781bc3d5698SJohn Baldwin	vmovd	16(%r13),%xmm1
5782bc3d5698SJohn Baldwin	vmovd	16(%r9),%xmm2
5783bc3d5698SJohn Baldwin	vpinsrd	$1,16(%r14),%xmm5,%xmm5
5784bc3d5698SJohn Baldwin	vpinsrd	$1,16(%r10),%xmm0,%xmm0
5785bc3d5698SJohn Baldwin	vpinsrd	$1,16(%r15),%xmm1,%xmm1
5786bc3d5698SJohn Baldwin	vpunpckldq	%ymm1,%ymm5,%ymm5
5787bc3d5698SJohn Baldwin	vpinsrd	$1,16(%r11),%xmm2,%xmm2
5788bc3d5698SJohn Baldwin	vpunpckldq	%ymm2,%ymm0,%ymm0
5789bc3d5698SJohn Baldwin	vinserti128	$1,%xmm0,%ymm5,%ymm5
5790bc3d5698SJohn Baldwin	vpshufb	%ymm6,%ymm5,%ymm5
5791bc3d5698SJohn Baldwin	vpsrld	$6,%ymm8,%ymm7
5792bc3d5698SJohn Baldwin	vpslld	$26,%ymm8,%ymm2
5793bc3d5698SJohn Baldwin	vmovdqu	%ymm5,128-128(%rax)
5794bc3d5698SJohn Baldwin	vpaddd	%ymm11,%ymm5,%ymm5
5795bc3d5698SJohn Baldwin
5796bc3d5698SJohn Baldwin	vpsrld	$11,%ymm8,%ymm1
5797bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5798bc3d5698SJohn Baldwin	vpslld	$21,%ymm8,%ymm2
5799bc3d5698SJohn Baldwin	vpaddd	0(%rbp),%ymm5,%ymm5
5800bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
5801bc3d5698SJohn Baldwin
5802bc3d5698SJohn Baldwin	vpsrld	$25,%ymm8,%ymm1
5803bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5804bc3d5698SJohn Baldwin
5805bc3d5698SJohn Baldwin	vpslld	$7,%ymm8,%ymm2
5806bc3d5698SJohn Baldwin	vpandn	%ymm10,%ymm8,%ymm0
5807bc3d5698SJohn Baldwin	vpand	%ymm9,%ymm8,%ymm3
5808bc3d5698SJohn Baldwin
5809bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
5810bc3d5698SJohn Baldwin
5811bc3d5698SJohn Baldwin	vpsrld	$2,%ymm12,%ymm11
5812bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5813bc3d5698SJohn Baldwin
5814bc3d5698SJohn Baldwin	vpslld	$30,%ymm12,%ymm1
5815bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm0,%ymm0
5816bc3d5698SJohn Baldwin	vpxor	%ymm12,%ymm13,%ymm3
5817bc3d5698SJohn Baldwin
5818bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm11,%ymm11
5819bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
5820bc3d5698SJohn Baldwin
5821bc3d5698SJohn Baldwin	vpsrld	$13,%ymm12,%ymm1
5822bc3d5698SJohn Baldwin
5823bc3d5698SJohn Baldwin	vpslld	$19,%ymm12,%ymm2
5824bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm5,%ymm5
5825bc3d5698SJohn Baldwin	vpand	%ymm3,%ymm4,%ymm4
5826bc3d5698SJohn Baldwin
5827bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm11,%ymm7
5828bc3d5698SJohn Baldwin
5829bc3d5698SJohn Baldwin	vpsrld	$22,%ymm12,%ymm1
5830bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5831bc3d5698SJohn Baldwin
5832bc3d5698SJohn Baldwin	vpslld	$10,%ymm12,%ymm2
5833bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm13,%ymm11
5834bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm15,%ymm15
5835bc3d5698SJohn Baldwin
5836bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
5837bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5838bc3d5698SJohn Baldwin
5839bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm11,%ymm11
5840bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm11,%ymm11
5841bc3d5698SJohn Baldwin	vmovd	20(%r12),%xmm5
5842bc3d5698SJohn Baldwin	vmovd	20(%r8),%xmm0
5843bc3d5698SJohn Baldwin	vmovd	20(%r13),%xmm1
5844bc3d5698SJohn Baldwin	vmovd	20(%r9),%xmm2
5845bc3d5698SJohn Baldwin	vpinsrd	$1,20(%r14),%xmm5,%xmm5
5846bc3d5698SJohn Baldwin	vpinsrd	$1,20(%r10),%xmm0,%xmm0
5847bc3d5698SJohn Baldwin	vpinsrd	$1,20(%r15),%xmm1,%xmm1
5848bc3d5698SJohn Baldwin	vpunpckldq	%ymm1,%ymm5,%ymm5
5849bc3d5698SJohn Baldwin	vpinsrd	$1,20(%r11),%xmm2,%xmm2
5850bc3d5698SJohn Baldwin	vpunpckldq	%ymm2,%ymm0,%ymm0
5851bc3d5698SJohn Baldwin	vinserti128	$1,%xmm0,%ymm5,%ymm5
5852bc3d5698SJohn Baldwin	vpshufb	%ymm6,%ymm5,%ymm5
5853bc3d5698SJohn Baldwin	vpsrld	$6,%ymm15,%ymm7
5854bc3d5698SJohn Baldwin	vpslld	$26,%ymm15,%ymm2
5855bc3d5698SJohn Baldwin	vmovdqu	%ymm5,160-128(%rax)
5856bc3d5698SJohn Baldwin	vpaddd	%ymm10,%ymm5,%ymm5
5857bc3d5698SJohn Baldwin
5858bc3d5698SJohn Baldwin	vpsrld	$11,%ymm15,%ymm1
5859bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5860bc3d5698SJohn Baldwin	vpslld	$21,%ymm15,%ymm2
5861bc3d5698SJohn Baldwin	vpaddd	32(%rbp),%ymm5,%ymm5
5862bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
5863bc3d5698SJohn Baldwin
5864bc3d5698SJohn Baldwin	vpsrld	$25,%ymm15,%ymm1
5865bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5866bc3d5698SJohn Baldwin
5867bc3d5698SJohn Baldwin	vpslld	$7,%ymm15,%ymm2
5868bc3d5698SJohn Baldwin	vpandn	%ymm9,%ymm15,%ymm0
5869bc3d5698SJohn Baldwin	vpand	%ymm8,%ymm15,%ymm4
5870bc3d5698SJohn Baldwin
5871bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
5872bc3d5698SJohn Baldwin
5873bc3d5698SJohn Baldwin	vpsrld	$2,%ymm11,%ymm10
5874bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5875bc3d5698SJohn Baldwin
5876bc3d5698SJohn Baldwin	vpslld	$30,%ymm11,%ymm1
5877bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm0,%ymm0
5878bc3d5698SJohn Baldwin	vpxor	%ymm11,%ymm12,%ymm4
5879bc3d5698SJohn Baldwin
5880bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm10,%ymm10
5881bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
5882bc3d5698SJohn Baldwin
5883bc3d5698SJohn Baldwin	vpsrld	$13,%ymm11,%ymm1
5884bc3d5698SJohn Baldwin
5885bc3d5698SJohn Baldwin	vpslld	$19,%ymm11,%ymm2
5886bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm5,%ymm5
5887bc3d5698SJohn Baldwin	vpand	%ymm4,%ymm3,%ymm3
5888bc3d5698SJohn Baldwin
5889bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm10,%ymm7
5890bc3d5698SJohn Baldwin
5891bc3d5698SJohn Baldwin	vpsrld	$22,%ymm11,%ymm1
5892bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5893bc3d5698SJohn Baldwin
5894bc3d5698SJohn Baldwin	vpslld	$10,%ymm11,%ymm2
5895bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm12,%ymm10
5896bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm14,%ymm14
5897bc3d5698SJohn Baldwin
5898bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
5899bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5900bc3d5698SJohn Baldwin
5901bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm10,%ymm10
5902bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm10,%ymm10
/*
 * SHA-256 round for message word 6 (byte offset 24 of each input block),
 * computed for eight independent lanes at once.
 * Register roles in this round, as used by the instructions below:
 *   a=%ymm10 b=%ymm11 c=%ymm12 d=%ymm13 e=%ymm14 f=%ymm15 g=%ymm8 h=%ymm9
 *   %ymm5 = W, then T1; %ymm7 = Sigma1(e), then Sigma0(a); %ymm0-%ymm2 scratch.
 * %ymm4 is consumed as b^c; %ymm3 leaves holding a^b.
 * Result: new a in %ymm9 (the old h register), new e in %ymm13 (the old d).
 * The steps are interleaved; each comment labels the instruction right after it.
 */
/* Gather one dword per lane: low 128 bits = r12,r13,r14,r15; high = r8,r9,r10,r11. */
5903bc3d5698SJohn Baldwin	vmovd	24(%r12),%xmm5
5904bc3d5698SJohn Baldwin	vmovd	24(%r8),%xmm0
5905bc3d5698SJohn Baldwin	vmovd	24(%r13),%xmm1
5906bc3d5698SJohn Baldwin	vmovd	24(%r9),%xmm2
5907bc3d5698SJohn Baldwin	vpinsrd	$1,24(%r14),%xmm5,%xmm5
5908bc3d5698SJohn Baldwin	vpinsrd	$1,24(%r10),%xmm0,%xmm0
5909bc3d5698SJohn Baldwin	vpinsrd	$1,24(%r15),%xmm1,%xmm1
5910bc3d5698SJohn Baldwin	vpunpckldq	%ymm1,%ymm5,%ymm5
5911bc3d5698SJohn Baldwin	vpinsrd	$1,24(%r11),%xmm2,%xmm2
5912bc3d5698SJohn Baldwin	vpunpckldq	%ymm2,%ymm0,%ymm0
5913bc3d5698SJohn Baldwin	vinserti128	$1,%xmm0,%ymm5,%ymm5
/* Byte shuffle by the mask in %ymm6 (loaded outside this chunk; presumably the big-endian swap -- confirm). */
5914bc3d5698SJohn Baldwin	vpshufb	%ymm6,%ymm5,%ymm5
5915bc3d5698SJohn Baldwin	vpsrld	$6,%ymm14,%ymm7
5916bc3d5698SJohn Baldwin	vpslld	$26,%ymm14,%ymm2
/* Save W in schedule slot 6 (32 bytes per slot, -128 bias on %rax). */
5917bc3d5698SJohn Baldwin	vmovdqu	%ymm5,192-128(%rax)
/* T1 = W + h */
5918bc3d5698SJohn Baldwin	vpaddd	%ymm9,%ymm5,%ymm5
5919bc3d5698SJohn Baldwin
5920bc3d5698SJohn Baldwin	vpsrld	$11,%ymm14,%ymm1
5921bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5922bc3d5698SJohn Baldwin	vpslld	$21,%ymm14,%ymm2
/* T1 += 32-byte constant entry at %rbp (presumably the K256 round constant; %rbp setup is outside this chunk). */
5923bc3d5698SJohn Baldwin	vpaddd	64(%rbp),%ymm5,%ymm5
5924bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
5925bc3d5698SJohn Baldwin
5926bc3d5698SJohn Baldwin	vpsrld	$25,%ymm14,%ymm1
5927bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5928bc3d5698SJohn Baldwin
5929bc3d5698SJohn Baldwin	vpslld	$7,%ymm14,%ymm2
/* Ch(e,f,g) halves: %ymm0 = ~e & g, %ymm3 = e & f */
5930bc3d5698SJohn Baldwin	vpandn	%ymm8,%ymm14,%ymm0
5931bc3d5698SJohn Baldwin	vpand	%ymm15,%ymm14,%ymm3
5932bc3d5698SJohn Baldwin
5933bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
5934bc3d5698SJohn Baldwin
/* h is already folded into T1, so its register starts accumulating rotr2(a). */
5935bc3d5698SJohn Baldwin	vpsrld	$2,%ymm10,%ymm9
/* %ymm7 = Sigma1(e) = rotr6 ^ rotr11 ^ rotr25 (each rotate is a shr/shl pair) */
5936bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5937bc3d5698SJohn Baldwin
5938bc3d5698SJohn Baldwin	vpslld	$30,%ymm10,%ymm1
/* %ymm0 = Ch(e,f,g) */
5939bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm0,%ymm0
/* %ymm3 = a ^ b, used for Maj here and left for the following round */
5940bc3d5698SJohn Baldwin	vpxor	%ymm10,%ymm11,%ymm3
5941bc3d5698SJohn Baldwin
5942bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm9,%ymm9
/* T1 += Sigma1(e) */
5943bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
5944bc3d5698SJohn Baldwin
5945bc3d5698SJohn Baldwin	vpsrld	$13,%ymm10,%ymm1
5946bc3d5698SJohn Baldwin
5947bc3d5698SJohn Baldwin	vpslld	$19,%ymm10,%ymm2
/* T1 += Ch(e,f,g) */
5948bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm5,%ymm5
/* %ymm4 = (a^b) & (b^c) */
5949bc3d5698SJohn Baldwin	vpand	%ymm3,%ymm4,%ymm4
5950bc3d5698SJohn Baldwin
5951bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm9,%ymm7
5952bc3d5698SJohn Baldwin
5953bc3d5698SJohn Baldwin	vpsrld	$22,%ymm10,%ymm1
5954bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5955bc3d5698SJohn Baldwin
5956bc3d5698SJohn Baldwin	vpslld	$10,%ymm10,%ymm2
/* Maj(a,b,c) = b ^ ((a^b) & (b^c)), written to the new-a register */
5957bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm11,%ymm9
/* d += T1 (this register is e in the next round) */
5958bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm13,%ymm13
5959bc3d5698SJohn Baldwin
5960bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
/* %ymm7 = Sigma0(a) = rotr2 ^ rotr13 ^ rotr22 */
5961bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5962bc3d5698SJohn Baldwin
/* new a = Maj + T1 + Sigma0(a) */
5963bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm9,%ymm9
5964bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm9,%ymm9
/*
 * SHA-256 round for message word 7 (byte offset 28 of each input block),
 * eight lanes in parallel.
 * Register roles in this round, as used by the instructions below:
 *   a=%ymm9 b=%ymm10 c=%ymm11 d=%ymm12 e=%ymm13 f=%ymm14 g=%ymm15 h=%ymm8
 *   %ymm5 = W, then T1; %ymm7 = Sigma1(e), then Sigma0(a); %ymm0-%ymm2 scratch.
 * %ymm3 is consumed as b^c; %ymm4 leaves holding a^b.
 * Result: new a in %ymm8 (the old h register), new e in %ymm12 (the old d).
 * The steps are interleaved; each comment labels the instruction right after it.
 */
/* Gather one dword per lane: low 128 bits = r12,r13,r14,r15; high = r8,r9,r10,r11. */
5965bc3d5698SJohn Baldwin	vmovd	28(%r12),%xmm5
5966bc3d5698SJohn Baldwin	vmovd	28(%r8),%xmm0
5967bc3d5698SJohn Baldwin	vmovd	28(%r13),%xmm1
5968bc3d5698SJohn Baldwin	vmovd	28(%r9),%xmm2
5969bc3d5698SJohn Baldwin	vpinsrd	$1,28(%r14),%xmm5,%xmm5
5970bc3d5698SJohn Baldwin	vpinsrd	$1,28(%r10),%xmm0,%xmm0
5971bc3d5698SJohn Baldwin	vpinsrd	$1,28(%r15),%xmm1,%xmm1
5972bc3d5698SJohn Baldwin	vpunpckldq	%ymm1,%ymm5,%ymm5
5973bc3d5698SJohn Baldwin	vpinsrd	$1,28(%r11),%xmm2,%xmm2
5974bc3d5698SJohn Baldwin	vpunpckldq	%ymm2,%ymm0,%ymm0
5975bc3d5698SJohn Baldwin	vinserti128	$1,%xmm0,%ymm5,%ymm5
/* Byte shuffle by the mask in %ymm6 (loaded outside this chunk; presumably the big-endian swap -- confirm). */
5976bc3d5698SJohn Baldwin	vpshufb	%ymm6,%ymm5,%ymm5
5977bc3d5698SJohn Baldwin	vpsrld	$6,%ymm13,%ymm7
5978bc3d5698SJohn Baldwin	vpslld	$26,%ymm13,%ymm2
/* Save W in schedule slot 7 (32 bytes per slot, -128 bias on %rax). */
5979bc3d5698SJohn Baldwin	vmovdqu	%ymm5,224-128(%rax)
/* T1 = W + h */
5980bc3d5698SJohn Baldwin	vpaddd	%ymm8,%ymm5,%ymm5
5981bc3d5698SJohn Baldwin
5982bc3d5698SJohn Baldwin	vpsrld	$11,%ymm13,%ymm1
5983bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5984bc3d5698SJohn Baldwin	vpslld	$21,%ymm13,%ymm2
/* T1 += 32-byte constant entry at %rbp (presumably the K256 round constant; %rbp setup is outside this chunk). */
5985bc3d5698SJohn Baldwin	vpaddd	96(%rbp),%ymm5,%ymm5
5986bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
5987bc3d5698SJohn Baldwin
5988bc3d5698SJohn Baldwin	vpsrld	$25,%ymm13,%ymm1
5989bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5990bc3d5698SJohn Baldwin
5991bc3d5698SJohn Baldwin	vpslld	$7,%ymm13,%ymm2
/* Ch(e,f,g) halves: %ymm0 = ~e & g, %ymm4 = e & f */
5992bc3d5698SJohn Baldwin	vpandn	%ymm15,%ymm13,%ymm0
5993bc3d5698SJohn Baldwin	vpand	%ymm14,%ymm13,%ymm4
5994bc3d5698SJohn Baldwin
5995bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
5996bc3d5698SJohn Baldwin
/* h is already folded into T1, so its register starts accumulating rotr2(a). */
5997bc3d5698SJohn Baldwin	vpsrld	$2,%ymm9,%ymm8
/* %ymm7 = Sigma1(e) = rotr6 ^ rotr11 ^ rotr25 */
5998bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
5999bc3d5698SJohn Baldwin
6000bc3d5698SJohn Baldwin	vpslld	$30,%ymm9,%ymm1
/* %ymm0 = Ch(e,f,g) */
6001bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm0,%ymm0
/* %ymm4 = a ^ b, used for Maj here and left for the following round */
6002bc3d5698SJohn Baldwin	vpxor	%ymm9,%ymm10,%ymm4
6003bc3d5698SJohn Baldwin
6004bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm8,%ymm8
/* T1 += Sigma1(e) */
6005bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
6006bc3d5698SJohn Baldwin
6007bc3d5698SJohn Baldwin	vpsrld	$13,%ymm9,%ymm1
6008bc3d5698SJohn Baldwin
6009bc3d5698SJohn Baldwin	vpslld	$19,%ymm9,%ymm2
/* T1 += Ch(e,f,g) */
6010bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm5,%ymm5
/* %ymm3 = (a^b) & (b^c) */
6011bc3d5698SJohn Baldwin	vpand	%ymm4,%ymm3,%ymm3
6012bc3d5698SJohn Baldwin
6013bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm8,%ymm7
6014bc3d5698SJohn Baldwin
6015bc3d5698SJohn Baldwin	vpsrld	$22,%ymm9,%ymm1
6016bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6017bc3d5698SJohn Baldwin
6018bc3d5698SJohn Baldwin	vpslld	$10,%ymm9,%ymm2
/* Maj(a,b,c) = b ^ ((a^b) & (b^c)), written to the new-a register */
6019bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm10,%ymm8
/* d += T1 (this register is e in the next round) */
6020bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm12,%ymm12
6021bc3d5698SJohn Baldwin
6022bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
/* %ymm7 = Sigma0(a) = rotr2 ^ rotr13 ^ rotr22 */
6023bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6024bc3d5698SJohn Baldwin
/* new a = Maj + T1 + Sigma0(a) */
6025bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm8,%ymm8
6026bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm8,%ymm8
/*
 * SHA-256 round for message word 8 (byte offset 32 of each input block),
 * eight lanes in parallel.
 * Register roles in this round, as used by the instructions below:
 *   a=%ymm8 b=%ymm9 c=%ymm10 d=%ymm11 e=%ymm12 f=%ymm13 g=%ymm14 h=%ymm15
 *   %ymm5 = W, then T1; %ymm7 = Sigma1(e), then Sigma0(a); %ymm0-%ymm2 scratch.
 * %ymm4 is consumed as b^c; %ymm3 leaves holding a^b.
 * Result: new a in %ymm15 (the old h register), new e in %ymm11 (the old d).
 * The steps are interleaved; each comment labels the instruction right after it.
 */
/* Step the constant pointer by 256 bytes (8 entries of 32 bytes) so this and the next seven rounds use displacements -128..96. */
6027bc3d5698SJohn Baldwin	addq	$256,%rbp
/* Gather one dword per lane: low 128 bits = r12,r13,r14,r15; high = r8,r9,r10,r11. */
6028bc3d5698SJohn Baldwin	vmovd	32(%r12),%xmm5
6029bc3d5698SJohn Baldwin	vmovd	32(%r8),%xmm0
6030bc3d5698SJohn Baldwin	vmovd	32(%r13),%xmm1
6031bc3d5698SJohn Baldwin	vmovd	32(%r9),%xmm2
6032bc3d5698SJohn Baldwin	vpinsrd	$1,32(%r14),%xmm5,%xmm5
6033bc3d5698SJohn Baldwin	vpinsrd	$1,32(%r10),%xmm0,%xmm0
6034bc3d5698SJohn Baldwin	vpinsrd	$1,32(%r15),%xmm1,%xmm1
6035bc3d5698SJohn Baldwin	vpunpckldq	%ymm1,%ymm5,%ymm5
6036bc3d5698SJohn Baldwin	vpinsrd	$1,32(%r11),%xmm2,%xmm2
6037bc3d5698SJohn Baldwin	vpunpckldq	%ymm2,%ymm0,%ymm0
6038bc3d5698SJohn Baldwin	vinserti128	$1,%xmm0,%ymm5,%ymm5
/* Byte shuffle by the mask in %ymm6 (loaded outside this chunk; presumably the big-endian swap -- confirm). */
6039bc3d5698SJohn Baldwin	vpshufb	%ymm6,%ymm5,%ymm5
6040bc3d5698SJohn Baldwin	vpsrld	$6,%ymm12,%ymm7
6041bc3d5698SJohn Baldwin	vpslld	$26,%ymm12,%ymm2
/* Save W in schedule slot 8; slots 8..15 are addressed off %rbx (presumably %rbx = %rax + 256 -- confirm). */
6042bc3d5698SJohn Baldwin	vmovdqu	%ymm5,256-256-128(%rbx)
/* T1 = W + h */
6043bc3d5698SJohn Baldwin	vpaddd	%ymm15,%ymm5,%ymm5
6044bc3d5698SJohn Baldwin
6045bc3d5698SJohn Baldwin	vpsrld	$11,%ymm12,%ymm1
6046bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6047bc3d5698SJohn Baldwin	vpslld	$21,%ymm12,%ymm2
/* T1 += 32-byte constant entry at %rbp (presumably the K256 round constant; %rbp setup is outside this chunk). */
6048bc3d5698SJohn Baldwin	vpaddd	-128(%rbp),%ymm5,%ymm5
6049bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6050bc3d5698SJohn Baldwin
6051bc3d5698SJohn Baldwin	vpsrld	$25,%ymm12,%ymm1
6052bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6053bc3d5698SJohn Baldwin
6054bc3d5698SJohn Baldwin	vpslld	$7,%ymm12,%ymm2
/* Ch(e,f,g) halves: %ymm0 = ~e & g, %ymm3 = e & f */
6055bc3d5698SJohn Baldwin	vpandn	%ymm14,%ymm12,%ymm0
6056bc3d5698SJohn Baldwin	vpand	%ymm13,%ymm12,%ymm3
6057bc3d5698SJohn Baldwin
6058bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6059bc3d5698SJohn Baldwin
/* h is already folded into T1, so its register starts accumulating rotr2(a). */
6060bc3d5698SJohn Baldwin	vpsrld	$2,%ymm8,%ymm15
/* %ymm7 = Sigma1(e) = rotr6 ^ rotr11 ^ rotr25 */
6061bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6062bc3d5698SJohn Baldwin
6063bc3d5698SJohn Baldwin	vpslld	$30,%ymm8,%ymm1
/* %ymm0 = Ch(e,f,g) */
6064bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm0,%ymm0
/* %ymm3 = a ^ b, used for Maj here and left for the following round */
6065bc3d5698SJohn Baldwin	vpxor	%ymm8,%ymm9,%ymm3
6066bc3d5698SJohn Baldwin
6067bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm15,%ymm15
/* T1 += Sigma1(e) */
6068bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
6069bc3d5698SJohn Baldwin
6070bc3d5698SJohn Baldwin	vpsrld	$13,%ymm8,%ymm1
6071bc3d5698SJohn Baldwin
6072bc3d5698SJohn Baldwin	vpslld	$19,%ymm8,%ymm2
/* T1 += Ch(e,f,g) */
6073bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm5,%ymm5
/* %ymm4 = (a^b) & (b^c) */
6074bc3d5698SJohn Baldwin	vpand	%ymm3,%ymm4,%ymm4
6075bc3d5698SJohn Baldwin
6076bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm15,%ymm7
6077bc3d5698SJohn Baldwin
6078bc3d5698SJohn Baldwin	vpsrld	$22,%ymm8,%ymm1
6079bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6080bc3d5698SJohn Baldwin
6081bc3d5698SJohn Baldwin	vpslld	$10,%ymm8,%ymm2
/* Maj(a,b,c) = b ^ ((a^b) & (b^c)), written to the new-a register */
6082bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm9,%ymm15
/* d += T1 (this register is e in the next round) */
6083bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm11,%ymm11
6084bc3d5698SJohn Baldwin
6085bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
/* %ymm7 = Sigma0(a) = rotr2 ^ rotr13 ^ rotr22 */
6086bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6087bc3d5698SJohn Baldwin
/* new a = Maj + T1 + Sigma0(a) */
6088bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm15,%ymm15
6089bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm15,%ymm15
/*
 * SHA-256 round for message word 9 (byte offset 36 of each input block),
 * eight lanes in parallel.
 * Register roles in this round, as used by the instructions below:
 *   a=%ymm15 b=%ymm8 c=%ymm9 d=%ymm10 e=%ymm11 f=%ymm12 g=%ymm13 h=%ymm14
 *   %ymm5 = W, then T1; %ymm7 = Sigma1(e), then Sigma0(a); %ymm0-%ymm2 scratch.
 * %ymm3 is consumed as b^c; %ymm4 leaves holding a^b.
 * Result: new a in %ymm14 (the old h register), new e in %ymm10 (the old d).
 * The steps are interleaved; each comment labels the instruction right after it.
 */
/* Gather one dword per lane: low 128 bits = r12,r13,r14,r15; high = r8,r9,r10,r11. */
6090bc3d5698SJohn Baldwin	vmovd	36(%r12),%xmm5
6091bc3d5698SJohn Baldwin	vmovd	36(%r8),%xmm0
6092bc3d5698SJohn Baldwin	vmovd	36(%r13),%xmm1
6093bc3d5698SJohn Baldwin	vmovd	36(%r9),%xmm2
6094bc3d5698SJohn Baldwin	vpinsrd	$1,36(%r14),%xmm5,%xmm5
6095bc3d5698SJohn Baldwin	vpinsrd	$1,36(%r10),%xmm0,%xmm0
6096bc3d5698SJohn Baldwin	vpinsrd	$1,36(%r15),%xmm1,%xmm1
6097bc3d5698SJohn Baldwin	vpunpckldq	%ymm1,%ymm5,%ymm5
6098bc3d5698SJohn Baldwin	vpinsrd	$1,36(%r11),%xmm2,%xmm2
6099bc3d5698SJohn Baldwin	vpunpckldq	%ymm2,%ymm0,%ymm0
6100bc3d5698SJohn Baldwin	vinserti128	$1,%xmm0,%ymm5,%ymm5
/* Byte shuffle by the mask in %ymm6 (loaded outside this chunk; presumably the big-endian swap -- confirm). */
6101bc3d5698SJohn Baldwin	vpshufb	%ymm6,%ymm5,%ymm5
6102bc3d5698SJohn Baldwin	vpsrld	$6,%ymm11,%ymm7
6103bc3d5698SJohn Baldwin	vpslld	$26,%ymm11,%ymm2
/* Save W in schedule slot 9; slots 8..15 are addressed off %rbx (presumably %rbx = %rax + 256 -- confirm). */
6104bc3d5698SJohn Baldwin	vmovdqu	%ymm5,288-256-128(%rbx)
/* T1 = W + h */
6105bc3d5698SJohn Baldwin	vpaddd	%ymm14,%ymm5,%ymm5
6106bc3d5698SJohn Baldwin
6107bc3d5698SJohn Baldwin	vpsrld	$11,%ymm11,%ymm1
6108bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6109bc3d5698SJohn Baldwin	vpslld	$21,%ymm11,%ymm2
/* T1 += 32-byte constant entry at %rbp (presumably the K256 round constant; %rbp setup is outside this chunk). */
6110bc3d5698SJohn Baldwin	vpaddd	-96(%rbp),%ymm5,%ymm5
6111bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6112bc3d5698SJohn Baldwin
6113bc3d5698SJohn Baldwin	vpsrld	$25,%ymm11,%ymm1
6114bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6115bc3d5698SJohn Baldwin
6116bc3d5698SJohn Baldwin	vpslld	$7,%ymm11,%ymm2
/* Ch(e,f,g) halves: %ymm0 = ~e & g, %ymm4 = e & f */
6117bc3d5698SJohn Baldwin	vpandn	%ymm13,%ymm11,%ymm0
6118bc3d5698SJohn Baldwin	vpand	%ymm12,%ymm11,%ymm4
6119bc3d5698SJohn Baldwin
6120bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6121bc3d5698SJohn Baldwin
/* h is already folded into T1, so its register starts accumulating rotr2(a). */
6122bc3d5698SJohn Baldwin	vpsrld	$2,%ymm15,%ymm14
/* %ymm7 = Sigma1(e) = rotr6 ^ rotr11 ^ rotr25 */
6123bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6124bc3d5698SJohn Baldwin
6125bc3d5698SJohn Baldwin	vpslld	$30,%ymm15,%ymm1
/* %ymm0 = Ch(e,f,g) */
6126bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm0,%ymm0
/* %ymm4 = a ^ b, used for Maj here and left for the following round */
6127bc3d5698SJohn Baldwin	vpxor	%ymm15,%ymm8,%ymm4
6128bc3d5698SJohn Baldwin
6129bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm14,%ymm14
/* T1 += Sigma1(e) */
6130bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
6131bc3d5698SJohn Baldwin
6132bc3d5698SJohn Baldwin	vpsrld	$13,%ymm15,%ymm1
6133bc3d5698SJohn Baldwin
6134bc3d5698SJohn Baldwin	vpslld	$19,%ymm15,%ymm2
/* T1 += Ch(e,f,g) */
6135bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm5,%ymm5
/* %ymm3 = (a^b) & (b^c) */
6136bc3d5698SJohn Baldwin	vpand	%ymm4,%ymm3,%ymm3
6137bc3d5698SJohn Baldwin
6138bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm14,%ymm7
6139bc3d5698SJohn Baldwin
6140bc3d5698SJohn Baldwin	vpsrld	$22,%ymm15,%ymm1
6141bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6142bc3d5698SJohn Baldwin
6143bc3d5698SJohn Baldwin	vpslld	$10,%ymm15,%ymm2
/* Maj(a,b,c) = b ^ ((a^b) & (b^c)), written to the new-a register */
6144bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm8,%ymm14
/* d += T1 (this register is e in the next round) */
6145bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm10,%ymm10
6146bc3d5698SJohn Baldwin
6147bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
/* %ymm7 = Sigma0(a) = rotr2 ^ rotr13 ^ rotr22 */
6148bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6149bc3d5698SJohn Baldwin
/* new a = Maj + T1 + Sigma0(a) */
6150bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm14,%ymm14
6151bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm14,%ymm14
/*
 * SHA-256 round for message word 10 (byte offset 40 of each input block),
 * eight lanes in parallel.
 * Register roles in this round, as used by the instructions below:
 *   a=%ymm14 b=%ymm15 c=%ymm8 d=%ymm9 e=%ymm10 f=%ymm11 g=%ymm12 h=%ymm13
 *   %ymm5 = W, then T1; %ymm7 = Sigma1(e), then Sigma0(a); %ymm0-%ymm2 scratch.
 * %ymm4 is consumed as b^c; %ymm3 leaves holding a^b.
 * Result: new a in %ymm13 (the old h register), new e in %ymm9 (the old d).
 * The steps are interleaved; each comment labels the instruction right after it.
 */
/* Gather one dword per lane: low 128 bits = r12,r13,r14,r15; high = r8,r9,r10,r11. */
6152bc3d5698SJohn Baldwin	vmovd	40(%r12),%xmm5
6153bc3d5698SJohn Baldwin	vmovd	40(%r8),%xmm0
6154bc3d5698SJohn Baldwin	vmovd	40(%r13),%xmm1
6155bc3d5698SJohn Baldwin	vmovd	40(%r9),%xmm2
6156bc3d5698SJohn Baldwin	vpinsrd	$1,40(%r14),%xmm5,%xmm5
6157bc3d5698SJohn Baldwin	vpinsrd	$1,40(%r10),%xmm0,%xmm0
6158bc3d5698SJohn Baldwin	vpinsrd	$1,40(%r15),%xmm1,%xmm1
6159bc3d5698SJohn Baldwin	vpunpckldq	%ymm1,%ymm5,%ymm5
6160bc3d5698SJohn Baldwin	vpinsrd	$1,40(%r11),%xmm2,%xmm2
6161bc3d5698SJohn Baldwin	vpunpckldq	%ymm2,%ymm0,%ymm0
6162bc3d5698SJohn Baldwin	vinserti128	$1,%xmm0,%ymm5,%ymm5
/* Byte shuffle by the mask in %ymm6 (loaded outside this chunk; presumably the big-endian swap -- confirm). */
6163bc3d5698SJohn Baldwin	vpshufb	%ymm6,%ymm5,%ymm5
6164bc3d5698SJohn Baldwin	vpsrld	$6,%ymm10,%ymm7
6165bc3d5698SJohn Baldwin	vpslld	$26,%ymm10,%ymm2
/* Save W in schedule slot 10; slots 8..15 are addressed off %rbx (presumably %rbx = %rax + 256 -- confirm). */
6166bc3d5698SJohn Baldwin	vmovdqu	%ymm5,320-256-128(%rbx)
/* T1 = W + h */
6167bc3d5698SJohn Baldwin	vpaddd	%ymm13,%ymm5,%ymm5
6168bc3d5698SJohn Baldwin
6169bc3d5698SJohn Baldwin	vpsrld	$11,%ymm10,%ymm1
6170bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6171bc3d5698SJohn Baldwin	vpslld	$21,%ymm10,%ymm2
/* T1 += 32-byte constant entry at %rbp (presumably the K256 round constant; %rbp setup is outside this chunk). */
6172bc3d5698SJohn Baldwin	vpaddd	-64(%rbp),%ymm5,%ymm5
6173bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6174bc3d5698SJohn Baldwin
6175bc3d5698SJohn Baldwin	vpsrld	$25,%ymm10,%ymm1
6176bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6177bc3d5698SJohn Baldwin
6178bc3d5698SJohn Baldwin	vpslld	$7,%ymm10,%ymm2
/* Ch(e,f,g) halves: %ymm0 = ~e & g, %ymm3 = e & f */
6179bc3d5698SJohn Baldwin	vpandn	%ymm12,%ymm10,%ymm0
6180bc3d5698SJohn Baldwin	vpand	%ymm11,%ymm10,%ymm3
6181bc3d5698SJohn Baldwin
6182bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6183bc3d5698SJohn Baldwin
/* h is already folded into T1, so its register starts accumulating rotr2(a). */
6184bc3d5698SJohn Baldwin	vpsrld	$2,%ymm14,%ymm13
/* %ymm7 = Sigma1(e) = rotr6 ^ rotr11 ^ rotr25 */
6185bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6186bc3d5698SJohn Baldwin
6187bc3d5698SJohn Baldwin	vpslld	$30,%ymm14,%ymm1
/* %ymm0 = Ch(e,f,g) */
6188bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm0,%ymm0
/* %ymm3 = a ^ b, used for Maj here and left for the following round */
6189bc3d5698SJohn Baldwin	vpxor	%ymm14,%ymm15,%ymm3
6190bc3d5698SJohn Baldwin
6191bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm13,%ymm13
/* T1 += Sigma1(e) */
6192bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
6193bc3d5698SJohn Baldwin
6194bc3d5698SJohn Baldwin	vpsrld	$13,%ymm14,%ymm1
6195bc3d5698SJohn Baldwin
6196bc3d5698SJohn Baldwin	vpslld	$19,%ymm14,%ymm2
/* T1 += Ch(e,f,g) */
6197bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm5,%ymm5
/* %ymm4 = (a^b) & (b^c) */
6198bc3d5698SJohn Baldwin	vpand	%ymm3,%ymm4,%ymm4
6199bc3d5698SJohn Baldwin
6200bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm13,%ymm7
6201bc3d5698SJohn Baldwin
6202bc3d5698SJohn Baldwin	vpsrld	$22,%ymm14,%ymm1
6203bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6204bc3d5698SJohn Baldwin
6205bc3d5698SJohn Baldwin	vpslld	$10,%ymm14,%ymm2
/* Maj(a,b,c) = b ^ ((a^b) & (b^c)), written to the new-a register */
6206bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm15,%ymm13
/* d += T1 (this register is e in the next round) */
6207bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm9,%ymm9
6208bc3d5698SJohn Baldwin
6209bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
/* %ymm7 = Sigma0(a) = rotr2 ^ rotr13 ^ rotr22 */
6210bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6211bc3d5698SJohn Baldwin
/* new a = Maj + T1 + Sigma0(a) */
6212bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm13,%ymm13
6213bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm13,%ymm13
/*
 * SHA-256 round for message word 11 (byte offset 44 of each input block),
 * eight lanes in parallel.
 * Register roles in this round, as used by the instructions below:
 *   a=%ymm13 b=%ymm14 c=%ymm15 d=%ymm8 e=%ymm9 f=%ymm10 g=%ymm11 h=%ymm12
 *   %ymm5 = W, then T1; %ymm7 = Sigma1(e), then Sigma0(a); %ymm0-%ymm2 scratch.
 * %ymm3 is consumed as b^c; %ymm4 leaves holding a^b.
 * Result: new a in %ymm12 (the old h register), new e in %ymm8 (the old d).
 * The steps are interleaved; each comment labels the instruction right after it.
 */
/* Gather one dword per lane: low 128 bits = r12,r13,r14,r15; high = r8,r9,r10,r11. */
6214bc3d5698SJohn Baldwin	vmovd	44(%r12),%xmm5
6215bc3d5698SJohn Baldwin	vmovd	44(%r8),%xmm0
6216bc3d5698SJohn Baldwin	vmovd	44(%r13),%xmm1
6217bc3d5698SJohn Baldwin	vmovd	44(%r9),%xmm2
6218bc3d5698SJohn Baldwin	vpinsrd	$1,44(%r14),%xmm5,%xmm5
6219bc3d5698SJohn Baldwin	vpinsrd	$1,44(%r10),%xmm0,%xmm0
6220bc3d5698SJohn Baldwin	vpinsrd	$1,44(%r15),%xmm1,%xmm1
6221bc3d5698SJohn Baldwin	vpunpckldq	%ymm1,%ymm5,%ymm5
6222bc3d5698SJohn Baldwin	vpinsrd	$1,44(%r11),%xmm2,%xmm2
6223bc3d5698SJohn Baldwin	vpunpckldq	%ymm2,%ymm0,%ymm0
6224bc3d5698SJohn Baldwin	vinserti128	$1,%xmm0,%ymm5,%ymm5
/* Byte shuffle by the mask in %ymm6 (loaded outside this chunk; presumably the big-endian swap -- confirm). */
6225bc3d5698SJohn Baldwin	vpshufb	%ymm6,%ymm5,%ymm5
6226bc3d5698SJohn Baldwin	vpsrld	$6,%ymm9,%ymm7
6227bc3d5698SJohn Baldwin	vpslld	$26,%ymm9,%ymm2
/* Save W in schedule slot 11; slots 8..15 are addressed off %rbx (presumably %rbx = %rax + 256 -- confirm). */
6228bc3d5698SJohn Baldwin	vmovdqu	%ymm5,352-256-128(%rbx)
/* T1 = W + h */
6229bc3d5698SJohn Baldwin	vpaddd	%ymm12,%ymm5,%ymm5
6230bc3d5698SJohn Baldwin
6231bc3d5698SJohn Baldwin	vpsrld	$11,%ymm9,%ymm1
6232bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6233bc3d5698SJohn Baldwin	vpslld	$21,%ymm9,%ymm2
/* T1 += 32-byte constant entry at %rbp (presumably the K256 round constant; %rbp setup is outside this chunk). */
6234bc3d5698SJohn Baldwin	vpaddd	-32(%rbp),%ymm5,%ymm5
6235bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6236bc3d5698SJohn Baldwin
6237bc3d5698SJohn Baldwin	vpsrld	$25,%ymm9,%ymm1
6238bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6239bc3d5698SJohn Baldwin
6240bc3d5698SJohn Baldwin	vpslld	$7,%ymm9,%ymm2
/* Ch(e,f,g) halves: %ymm0 = ~e & g, %ymm4 = e & f */
6241bc3d5698SJohn Baldwin	vpandn	%ymm11,%ymm9,%ymm0
6242bc3d5698SJohn Baldwin	vpand	%ymm10,%ymm9,%ymm4
6243bc3d5698SJohn Baldwin
6244bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6245bc3d5698SJohn Baldwin
/* h is already folded into T1, so its register starts accumulating rotr2(a). */
6246bc3d5698SJohn Baldwin	vpsrld	$2,%ymm13,%ymm12
/* %ymm7 = Sigma1(e) = rotr6 ^ rotr11 ^ rotr25 */
6247bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6248bc3d5698SJohn Baldwin
6249bc3d5698SJohn Baldwin	vpslld	$30,%ymm13,%ymm1
/* %ymm0 = Ch(e,f,g) */
6250bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm0,%ymm0
/* %ymm4 = a ^ b, used for Maj here and left for the following round */
6251bc3d5698SJohn Baldwin	vpxor	%ymm13,%ymm14,%ymm4
6252bc3d5698SJohn Baldwin
6253bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm12,%ymm12
/* T1 += Sigma1(e) */
6254bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
6255bc3d5698SJohn Baldwin
6256bc3d5698SJohn Baldwin	vpsrld	$13,%ymm13,%ymm1
6257bc3d5698SJohn Baldwin
6258bc3d5698SJohn Baldwin	vpslld	$19,%ymm13,%ymm2
/* T1 += Ch(e,f,g) */
6259bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm5,%ymm5
/* %ymm3 = (a^b) & (b^c) */
6260bc3d5698SJohn Baldwin	vpand	%ymm4,%ymm3,%ymm3
6261bc3d5698SJohn Baldwin
6262bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm12,%ymm7
6263bc3d5698SJohn Baldwin
6264bc3d5698SJohn Baldwin	vpsrld	$22,%ymm13,%ymm1
6265bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6266bc3d5698SJohn Baldwin
6267bc3d5698SJohn Baldwin	vpslld	$10,%ymm13,%ymm2
/* Maj(a,b,c) = b ^ ((a^b) & (b^c)), written to the new-a register */
6268bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm14,%ymm12
/* d += T1 (this register is e in the next round) */
6269bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm8,%ymm8
6270bc3d5698SJohn Baldwin
6271bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
/* %ymm7 = Sigma0(a) = rotr2 ^ rotr13 ^ rotr22 */
6272bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6273bc3d5698SJohn Baldwin
/* new a = Maj + T1 + Sigma0(a) */
6274bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm12,%ymm12
6275bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm12,%ymm12
/*
 * SHA-256 round for message word 12 (byte offset 48 of each input block),
 * eight lanes in parallel.
 * Register roles in this round, as used by the instructions below:
 *   a=%ymm12 b=%ymm13 c=%ymm14 d=%ymm15 e=%ymm8 f=%ymm9 g=%ymm10 h=%ymm11
 *   %ymm5 = W, then T1; %ymm7 = Sigma1(e), then Sigma0(a); %ymm0-%ymm2 scratch.
 * %ymm4 is consumed as b^c; %ymm3 leaves holding a^b.
 * Result: new a in %ymm11 (the old h register), new e in %ymm15 (the old d).
 * The steps are interleaved; each comment labels the instruction right after it.
 */
/* Gather one dword per lane: low 128 bits = r12,r13,r14,r15; high = r8,r9,r10,r11. */
6276bc3d5698SJohn Baldwin	vmovd	48(%r12),%xmm5
6277bc3d5698SJohn Baldwin	vmovd	48(%r8),%xmm0
6278bc3d5698SJohn Baldwin	vmovd	48(%r13),%xmm1
6279bc3d5698SJohn Baldwin	vmovd	48(%r9),%xmm2
6280bc3d5698SJohn Baldwin	vpinsrd	$1,48(%r14),%xmm5,%xmm5
6281bc3d5698SJohn Baldwin	vpinsrd	$1,48(%r10),%xmm0,%xmm0
6282bc3d5698SJohn Baldwin	vpinsrd	$1,48(%r15),%xmm1,%xmm1
6283bc3d5698SJohn Baldwin	vpunpckldq	%ymm1,%ymm5,%ymm5
6284bc3d5698SJohn Baldwin	vpinsrd	$1,48(%r11),%xmm2,%xmm2
6285bc3d5698SJohn Baldwin	vpunpckldq	%ymm2,%ymm0,%ymm0
6286bc3d5698SJohn Baldwin	vinserti128	$1,%xmm0,%ymm5,%ymm5
/* Byte shuffle by the mask in %ymm6 (loaded outside this chunk; presumably the big-endian swap -- confirm). */
6287bc3d5698SJohn Baldwin	vpshufb	%ymm6,%ymm5,%ymm5
6288bc3d5698SJohn Baldwin	vpsrld	$6,%ymm8,%ymm7
6289bc3d5698SJohn Baldwin	vpslld	$26,%ymm8,%ymm2
/* Save W in schedule slot 12; slots 8..15 are addressed off %rbx (presumably %rbx = %rax + 256 -- confirm). */
6290bc3d5698SJohn Baldwin	vmovdqu	%ymm5,384-256-128(%rbx)
/* T1 = W + h */
6291bc3d5698SJohn Baldwin	vpaddd	%ymm11,%ymm5,%ymm5
6292bc3d5698SJohn Baldwin
6293bc3d5698SJohn Baldwin	vpsrld	$11,%ymm8,%ymm1
6294bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6295bc3d5698SJohn Baldwin	vpslld	$21,%ymm8,%ymm2
/* T1 += 32-byte constant entry at %rbp (presumably the K256 round constant; %rbp setup is outside this chunk). */
6296bc3d5698SJohn Baldwin	vpaddd	0(%rbp),%ymm5,%ymm5
6297bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6298bc3d5698SJohn Baldwin
6299bc3d5698SJohn Baldwin	vpsrld	$25,%ymm8,%ymm1
6300bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6301bc3d5698SJohn Baldwin
6302bc3d5698SJohn Baldwin	vpslld	$7,%ymm8,%ymm2
/* Ch(e,f,g) halves: %ymm0 = ~e & g, %ymm3 = e & f */
6303bc3d5698SJohn Baldwin	vpandn	%ymm10,%ymm8,%ymm0
6304bc3d5698SJohn Baldwin	vpand	%ymm9,%ymm8,%ymm3
6305bc3d5698SJohn Baldwin
6306bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6307bc3d5698SJohn Baldwin
/* h is already folded into T1, so its register starts accumulating rotr2(a). */
6308bc3d5698SJohn Baldwin	vpsrld	$2,%ymm12,%ymm11
/* %ymm7 = Sigma1(e) = rotr6 ^ rotr11 ^ rotr25 */
6309bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6310bc3d5698SJohn Baldwin
6311bc3d5698SJohn Baldwin	vpslld	$30,%ymm12,%ymm1
/* %ymm0 = Ch(e,f,g) */
6312bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm0,%ymm0
/* %ymm3 = a ^ b, used for Maj here and left for the following round */
6313bc3d5698SJohn Baldwin	vpxor	%ymm12,%ymm13,%ymm3
6314bc3d5698SJohn Baldwin
6315bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm11,%ymm11
/* T1 += Sigma1(e) */
6316bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
6317bc3d5698SJohn Baldwin
6318bc3d5698SJohn Baldwin	vpsrld	$13,%ymm12,%ymm1
6319bc3d5698SJohn Baldwin
6320bc3d5698SJohn Baldwin	vpslld	$19,%ymm12,%ymm2
/* T1 += Ch(e,f,g) */
6321bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm5,%ymm5
/* %ymm4 = (a^b) & (b^c) */
6322bc3d5698SJohn Baldwin	vpand	%ymm3,%ymm4,%ymm4
6323bc3d5698SJohn Baldwin
6324bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm11,%ymm7
6325bc3d5698SJohn Baldwin
6326bc3d5698SJohn Baldwin	vpsrld	$22,%ymm12,%ymm1
6327bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6328bc3d5698SJohn Baldwin
6329bc3d5698SJohn Baldwin	vpslld	$10,%ymm12,%ymm2
/* Maj(a,b,c) = b ^ ((a^b) & (b^c)), written to the new-a register */
6330bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm13,%ymm11
/* d += T1 (this register is e in the next round) */
6331bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm15,%ymm15
6332bc3d5698SJohn Baldwin
6333bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
/* %ymm7 = Sigma0(a) = rotr2 ^ rotr13 ^ rotr22 */
6334bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6335bc3d5698SJohn Baldwin
/* new a = Maj + T1 + Sigma0(a) */
6336bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm11,%ymm11
6337bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm11,%ymm11
/*
 * SHA-256 round for message word 13 (byte offset 52 of each input block),
 * eight lanes in parallel.
 * Register roles in this round, as used by the instructions below:
 *   a=%ymm11 b=%ymm12 c=%ymm13 d=%ymm14 e=%ymm15 f=%ymm8 g=%ymm9 h=%ymm10
 *   %ymm5 = W, then T1; %ymm7 = Sigma1(e), then Sigma0(a); %ymm0-%ymm2 scratch.
 * %ymm3 is consumed as b^c; %ymm4 leaves holding a^b.
 * Result: new a in %ymm10 (the old h register), new e in %ymm14 (the old d).
 * The steps are interleaved; each comment labels the instruction right after it.
 */
/* Gather one dword per lane: low 128 bits = r12,r13,r14,r15; high = r8,r9,r10,r11. */
6338bc3d5698SJohn Baldwin	vmovd	52(%r12),%xmm5
6339bc3d5698SJohn Baldwin	vmovd	52(%r8),%xmm0
6340bc3d5698SJohn Baldwin	vmovd	52(%r13),%xmm1
6341bc3d5698SJohn Baldwin	vmovd	52(%r9),%xmm2
6342bc3d5698SJohn Baldwin	vpinsrd	$1,52(%r14),%xmm5,%xmm5
6343bc3d5698SJohn Baldwin	vpinsrd	$1,52(%r10),%xmm0,%xmm0
6344bc3d5698SJohn Baldwin	vpinsrd	$1,52(%r15),%xmm1,%xmm1
6345bc3d5698SJohn Baldwin	vpunpckldq	%ymm1,%ymm5,%ymm5
6346bc3d5698SJohn Baldwin	vpinsrd	$1,52(%r11),%xmm2,%xmm2
6347bc3d5698SJohn Baldwin	vpunpckldq	%ymm2,%ymm0,%ymm0
6348bc3d5698SJohn Baldwin	vinserti128	$1,%xmm0,%ymm5,%ymm5
/* Byte shuffle by the mask in %ymm6 (loaded outside this chunk; presumably the big-endian swap -- confirm). */
6349bc3d5698SJohn Baldwin	vpshufb	%ymm6,%ymm5,%ymm5
6350bc3d5698SJohn Baldwin	vpsrld	$6,%ymm15,%ymm7
6351bc3d5698SJohn Baldwin	vpslld	$26,%ymm15,%ymm2
/* Save W in schedule slot 13; slots 8..15 are addressed off %rbx (presumably %rbx = %rax + 256 -- confirm). */
6352bc3d5698SJohn Baldwin	vmovdqu	%ymm5,416-256-128(%rbx)
/* T1 = W + h */
6353bc3d5698SJohn Baldwin	vpaddd	%ymm10,%ymm5,%ymm5
6354bc3d5698SJohn Baldwin
6355bc3d5698SJohn Baldwin	vpsrld	$11,%ymm15,%ymm1
6356bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6357bc3d5698SJohn Baldwin	vpslld	$21,%ymm15,%ymm2
/* T1 += 32-byte constant entry at %rbp (presumably the K256 round constant; %rbp setup is outside this chunk). */
6358bc3d5698SJohn Baldwin	vpaddd	32(%rbp),%ymm5,%ymm5
6359bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6360bc3d5698SJohn Baldwin
6361bc3d5698SJohn Baldwin	vpsrld	$25,%ymm15,%ymm1
6362bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6363bc3d5698SJohn Baldwin
6364bc3d5698SJohn Baldwin	vpslld	$7,%ymm15,%ymm2
/* Ch(e,f,g) halves: %ymm0 = ~e & g, %ymm4 = e & f */
6365bc3d5698SJohn Baldwin	vpandn	%ymm9,%ymm15,%ymm0
6366bc3d5698SJohn Baldwin	vpand	%ymm8,%ymm15,%ymm4
6367bc3d5698SJohn Baldwin
6368bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6369bc3d5698SJohn Baldwin
/* h is already folded into T1, so its register starts accumulating rotr2(a). */
6370bc3d5698SJohn Baldwin	vpsrld	$2,%ymm11,%ymm10
/* %ymm7 = Sigma1(e) = rotr6 ^ rotr11 ^ rotr25 */
6371bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6372bc3d5698SJohn Baldwin
6373bc3d5698SJohn Baldwin	vpslld	$30,%ymm11,%ymm1
/* %ymm0 = Ch(e,f,g) */
6374bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm0,%ymm0
/* %ymm4 = a ^ b, used for Maj here and left for the following round */
6375bc3d5698SJohn Baldwin	vpxor	%ymm11,%ymm12,%ymm4
6376bc3d5698SJohn Baldwin
6377bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm10,%ymm10
/* T1 += Sigma1(e) */
6378bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
6379bc3d5698SJohn Baldwin
6380bc3d5698SJohn Baldwin	vpsrld	$13,%ymm11,%ymm1
6381bc3d5698SJohn Baldwin
6382bc3d5698SJohn Baldwin	vpslld	$19,%ymm11,%ymm2
/* T1 += Ch(e,f,g) */
6383bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm5,%ymm5
/* %ymm3 = (a^b) & (b^c) */
6384bc3d5698SJohn Baldwin	vpand	%ymm4,%ymm3,%ymm3
6385bc3d5698SJohn Baldwin
6386bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm10,%ymm7
6387bc3d5698SJohn Baldwin
6388bc3d5698SJohn Baldwin	vpsrld	$22,%ymm11,%ymm1
6389bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6390bc3d5698SJohn Baldwin
6391bc3d5698SJohn Baldwin	vpslld	$10,%ymm11,%ymm2
/* Maj(a,b,c) = b ^ ((a^b) & (b^c)), written to the new-a register */
6392bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm12,%ymm10
/* d += T1 (this register is e in the next round) */
6393bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm14,%ymm14
6394bc3d5698SJohn Baldwin
6395bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
/* %ymm7 = Sigma0(a) = rotr2 ^ rotr13 ^ rotr22 */
6396bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6397bc3d5698SJohn Baldwin
/* new a = Maj + T1 + Sigma0(a) */
6398bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm10,%ymm10
6399bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm10,%ymm10
/*
 * SHA-256 round for message word 14 (byte offset 56 of each input block),
 * eight lanes in parallel.
 * Register roles in this round, as used by the instructions below:
 *   a=%ymm10 b=%ymm11 c=%ymm12 d=%ymm13 e=%ymm14 f=%ymm15 g=%ymm8 h=%ymm9
 *   %ymm5 = W, then T1; %ymm7 = Sigma1(e), then Sigma0(a); %ymm0-%ymm2 scratch.
 * %ymm4 is consumed as b^c; %ymm3 leaves holding a^b.
 * Result: new a in %ymm9 (the old h register), new e in %ymm13 (the old d).
 * The steps are interleaved; each comment labels the instruction right after it.
 */
/* Gather one dword per lane: low 128 bits = r12,r13,r14,r15; high = r8,r9,r10,r11. */
6400bc3d5698SJohn Baldwin	vmovd	56(%r12),%xmm5
6401bc3d5698SJohn Baldwin	vmovd	56(%r8),%xmm0
6402bc3d5698SJohn Baldwin	vmovd	56(%r13),%xmm1
6403bc3d5698SJohn Baldwin	vmovd	56(%r9),%xmm2
6404bc3d5698SJohn Baldwin	vpinsrd	$1,56(%r14),%xmm5,%xmm5
6405bc3d5698SJohn Baldwin	vpinsrd	$1,56(%r10),%xmm0,%xmm0
6406bc3d5698SJohn Baldwin	vpinsrd	$1,56(%r15),%xmm1,%xmm1
6407bc3d5698SJohn Baldwin	vpunpckldq	%ymm1,%ymm5,%ymm5
6408bc3d5698SJohn Baldwin	vpinsrd	$1,56(%r11),%xmm2,%xmm2
6409bc3d5698SJohn Baldwin	vpunpckldq	%ymm2,%ymm0,%ymm0
6410bc3d5698SJohn Baldwin	vinserti128	$1,%xmm0,%ymm5,%ymm5
/* Byte shuffle by the mask in %ymm6 (loaded outside this chunk; presumably the big-endian swap -- confirm). */
6411bc3d5698SJohn Baldwin	vpshufb	%ymm6,%ymm5,%ymm5
6412bc3d5698SJohn Baldwin	vpsrld	$6,%ymm14,%ymm7
6413bc3d5698SJohn Baldwin	vpslld	$26,%ymm14,%ymm2
/* Save W in schedule slot 14; slots 8..15 are addressed off %rbx (presumably %rbx = %rax + 256 -- confirm). */
6414bc3d5698SJohn Baldwin	vmovdqu	%ymm5,448-256-128(%rbx)
/* T1 = W + h */
6415bc3d5698SJohn Baldwin	vpaddd	%ymm9,%ymm5,%ymm5
6416bc3d5698SJohn Baldwin
6417bc3d5698SJohn Baldwin	vpsrld	$11,%ymm14,%ymm1
6418bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6419bc3d5698SJohn Baldwin	vpslld	$21,%ymm14,%ymm2
/* T1 += 32-byte constant entry at %rbp (presumably the K256 round constant; %rbp setup is outside this chunk). */
6420bc3d5698SJohn Baldwin	vpaddd	64(%rbp),%ymm5,%ymm5
6421bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6422bc3d5698SJohn Baldwin
6423bc3d5698SJohn Baldwin	vpsrld	$25,%ymm14,%ymm1
6424bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6425bc3d5698SJohn Baldwin
6426bc3d5698SJohn Baldwin	vpslld	$7,%ymm14,%ymm2
/* Ch(e,f,g) halves: %ymm0 = ~e & g, %ymm3 = e & f */
6427bc3d5698SJohn Baldwin	vpandn	%ymm8,%ymm14,%ymm0
6428bc3d5698SJohn Baldwin	vpand	%ymm15,%ymm14,%ymm3
6429bc3d5698SJohn Baldwin
6430bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6431bc3d5698SJohn Baldwin
/* h is already folded into T1, so its register starts accumulating rotr2(a). */
6432bc3d5698SJohn Baldwin	vpsrld	$2,%ymm10,%ymm9
/* %ymm7 = Sigma1(e) = rotr6 ^ rotr11 ^ rotr25 */
6433bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6434bc3d5698SJohn Baldwin
6435bc3d5698SJohn Baldwin	vpslld	$30,%ymm10,%ymm1
/* %ymm0 = Ch(e,f,g) */
6436bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm0,%ymm0
/* %ymm3 = a ^ b, used for Maj here and left for the following round */
6437bc3d5698SJohn Baldwin	vpxor	%ymm10,%ymm11,%ymm3
6438bc3d5698SJohn Baldwin
6439bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm9,%ymm9
/* T1 += Sigma1(e) */
6440bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
6441bc3d5698SJohn Baldwin
6442bc3d5698SJohn Baldwin	vpsrld	$13,%ymm10,%ymm1
6443bc3d5698SJohn Baldwin
6444bc3d5698SJohn Baldwin	vpslld	$19,%ymm10,%ymm2
/* T1 += Ch(e,f,g) */
6445bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm5,%ymm5
/* %ymm4 = (a^b) & (b^c) */
6446bc3d5698SJohn Baldwin	vpand	%ymm3,%ymm4,%ymm4
6447bc3d5698SJohn Baldwin
6448bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm9,%ymm7
6449bc3d5698SJohn Baldwin
6450bc3d5698SJohn Baldwin	vpsrld	$22,%ymm10,%ymm1
6451bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6452bc3d5698SJohn Baldwin
6453bc3d5698SJohn Baldwin	vpslld	$10,%ymm10,%ymm2
/* Maj(a,b,c) = b ^ ((a^b) & (b^c)), written to the new-a register */
6454bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm11,%ymm9
/* d += T1 (this register is e in the next round) */
6455bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm13,%ymm13
6456bc3d5698SJohn Baldwin
6457bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
/* %ymm7 = Sigma0(a) = rotr2 ^ rotr13 ^ rotr22 */
6458bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6459bc3d5698SJohn Baldwin
/* new a = Maj + T1 + Sigma0(a) */
6460bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm9,%ymm9
6461bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm9,%ymm9
/*
 * SHA-256 round for message word 15 (byte offset 60, the last dword of each
 * 64-byte input block), eight lanes in parallel.
 * Register roles in this round, as used by the instructions below:
 *   a=%ymm9 b=%ymm10 c=%ymm11 d=%ymm12 e=%ymm13 f=%ymm14 g=%ymm15 h=%ymm8
 *   %ymm5 = W, then T1; %ymm7 = Sigma1(e), then Sigma0(a); %ymm0-%ymm2 scratch.
 * %ymm3 is consumed as b^c; %ymm4 leaves holding a^b.
 * Result: new a in %ymm8 (the old h register), new e in %ymm12 (the old d).
 * Each of the eight input pointers is also advanced by 64 bytes right after
 * its last load, and byte 63 past each advanced pointer is prefetched.
 * The steps are interleaved; each comment labels the instruction right after it.
 */
/* Gather one dword per lane (low 128 bits = r12,r13,r14,r15; high = r8,r9,r10,r11), bumping each pointer by 64 once read. */
6462bc3d5698SJohn Baldwin	vmovd	60(%r12),%xmm5
6463bc3d5698SJohn Baldwin	leaq	64(%r12),%r12
6464bc3d5698SJohn Baldwin	vmovd	60(%r8),%xmm0
6465bc3d5698SJohn Baldwin	leaq	64(%r8),%r8
6466bc3d5698SJohn Baldwin	vmovd	60(%r13),%xmm1
6467bc3d5698SJohn Baldwin	leaq	64(%r13),%r13
6468bc3d5698SJohn Baldwin	vmovd	60(%r9),%xmm2
6469bc3d5698SJohn Baldwin	leaq	64(%r9),%r9
6470bc3d5698SJohn Baldwin	vpinsrd	$1,60(%r14),%xmm5,%xmm5
6471bc3d5698SJohn Baldwin	leaq	64(%r14),%r14
6472bc3d5698SJohn Baldwin	vpinsrd	$1,60(%r10),%xmm0,%xmm0
6473bc3d5698SJohn Baldwin	leaq	64(%r10),%r10
6474bc3d5698SJohn Baldwin	vpinsrd	$1,60(%r15),%xmm1,%xmm1
6475bc3d5698SJohn Baldwin	leaq	64(%r15),%r15
6476bc3d5698SJohn Baldwin	vpunpckldq	%ymm1,%ymm5,%ymm5
6477bc3d5698SJohn Baldwin	vpinsrd	$1,60(%r11),%xmm2,%xmm2
6478bc3d5698SJohn Baldwin	leaq	64(%r11),%r11
6479bc3d5698SJohn Baldwin	vpunpckldq	%ymm2,%ymm0,%ymm0
6480bc3d5698SJohn Baldwin	vinserti128	$1,%xmm0,%ymm5,%ymm5
/* Byte shuffle by the mask in %ymm6 (loaded outside this chunk; presumably the big-endian swap -- confirm). */
6481bc3d5698SJohn Baldwin	vpshufb	%ymm6,%ymm5,%ymm5
6482bc3d5698SJohn Baldwin	vpsrld	$6,%ymm13,%ymm7
6483bc3d5698SJohn Baldwin	vpslld	$26,%ymm13,%ymm2
/* Save W in schedule slot 15; slots 8..15 are addressed off %rbx (presumably %rbx = %rax + 256 -- confirm). */
6484bc3d5698SJohn Baldwin	vmovdqu	%ymm5,480-256-128(%rbx)
/* T1 = W + h */
6485bc3d5698SJohn Baldwin	vpaddd	%ymm8,%ymm5,%ymm5
6486bc3d5698SJohn Baldwin
6487bc3d5698SJohn Baldwin	vpsrld	$11,%ymm13,%ymm1
6488bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6489bc3d5698SJohn Baldwin	vpslld	$21,%ymm13,%ymm2
/* T1 += 32-byte constant entry at %rbp (presumably the K256 round constant; %rbp setup is outside this chunk). */
6490bc3d5698SJohn Baldwin	vpaddd	96(%rbp),%ymm5,%ymm5
6491bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6492bc3d5698SJohn Baldwin
6493bc3d5698SJohn Baldwin	vpsrld	$25,%ymm13,%ymm1
6494bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
/* Prefetch the last byte of the next 64-byte block for each lane (eight prefetches are spread through the rest of this round). */
6495bc3d5698SJohn Baldwin	prefetcht0	63(%r12)
6496bc3d5698SJohn Baldwin	vpslld	$7,%ymm13,%ymm2
/* Ch(e,f,g) halves: %ymm0 = ~e & g, %ymm4 = e & f */
6497bc3d5698SJohn Baldwin	vpandn	%ymm15,%ymm13,%ymm0
6498bc3d5698SJohn Baldwin	vpand	%ymm14,%ymm13,%ymm4
6499bc3d5698SJohn Baldwin	prefetcht0	63(%r13)
6500bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6501bc3d5698SJohn Baldwin
/* h is already folded into T1, so its register starts accumulating rotr2(a). */
6502bc3d5698SJohn Baldwin	vpsrld	$2,%ymm9,%ymm8
/* %ymm7 = Sigma1(e) = rotr6 ^ rotr11 ^ rotr25 */
6503bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6504bc3d5698SJohn Baldwin	prefetcht0	63(%r14)
6505bc3d5698SJohn Baldwin	vpslld	$30,%ymm9,%ymm1
/* %ymm0 = Ch(e,f,g) */
6506bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm0,%ymm0
/* %ymm4 = a ^ b, used for Maj here and left for the following round */
6507bc3d5698SJohn Baldwin	vpxor	%ymm9,%ymm10,%ymm4
6508bc3d5698SJohn Baldwin	prefetcht0	63(%r15)
6509bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm8,%ymm8
/* T1 += Sigma1(e) */
6510bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
6511bc3d5698SJohn Baldwin
6512bc3d5698SJohn Baldwin	vpsrld	$13,%ymm9,%ymm1
6513bc3d5698SJohn Baldwin	prefetcht0	63(%r8)
6514bc3d5698SJohn Baldwin	vpslld	$19,%ymm9,%ymm2
/* T1 += Ch(e,f,g) */
6515bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm5,%ymm5
/* %ymm3 = (a^b) & (b^c) */
6516bc3d5698SJohn Baldwin	vpand	%ymm4,%ymm3,%ymm3
6517bc3d5698SJohn Baldwin	prefetcht0	63(%r9)
6518bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm8,%ymm7
6519bc3d5698SJohn Baldwin
6520bc3d5698SJohn Baldwin	vpsrld	$22,%ymm9,%ymm1
6521bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6522bc3d5698SJohn Baldwin	prefetcht0	63(%r10)
6523bc3d5698SJohn Baldwin	vpslld	$10,%ymm9,%ymm2
/* Maj(a,b,c) = b ^ ((a^b) & (b^c)), written to the new-a register */
6524bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm10,%ymm8
/* d += T1 (this register is e in the next round) */
6525bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm12,%ymm12
6526bc3d5698SJohn Baldwin	prefetcht0	63(%r11)
6527bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
/* %ymm7 = Sigma0(a) = rotr2 ^ rotr13 ^ rotr22 */
6528bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6529bc3d5698SJohn Baldwin
/* new a = Maj + T1 + Sigma0(a) */
6530bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm8,%ymm8
6531bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm8,%ymm8
/*
 * Hand-off from the 16 input-word rounds to the .Loop_16_xx_avx2 loop.
 */
/* Step the constant pointer by another 256 bytes (8 entries of 32 bytes). */
6532bc3d5698SJohn Baldwin	addq	$256,%rbp
/* Preload schedule slot 0 into %ymm5; the loop's first round adds to it and stores it back. */
6533bc3d5698SJohn Baldwin	vmovdqu	0-128(%rax),%ymm5
/* NOTE(review): %ecx = 3 is presumably the loop trip count (3 x 16 rounds would cover rounds 16..63); the decrement and branch are outside this chunk -- confirm. */
6534bc3d5698SJohn Baldwin	movl	$3,%ecx
6535bc3d5698SJohn Baldwin	jmp	.Loop_16_xx_avx2
/* Place the loop entry on a 32-byte boundary. */
6536bc3d5698SJohn Baldwin.align	32
/*
 * Entry of .Loop_16_xx_avx2 and its first round (the loop body continues
 * past this round; only this round is described here).
 *
 * Message-schedule step, eight lanes in parallel, updating slot 0 in place:
 *   slot0 += sigma0(slot1) + slot9 + sigma1(slot14)
 *   sigma0(x) = rotr7 ^ rotr18 ^ shr3,  sigma1(x) = rotr17 ^ rotr19 ^ shr10
 * %ymm5 holds slot 0 on entry (on first entry it is loaded just before the
 * loop); %ymm6 is loaded with slot 1 here and is the word the following
 * round extends.
 *
 * The round itself then uses:
 *   a=%ymm8 b=%ymm9 c=%ymm10 d=%ymm11 e=%ymm12 f=%ymm13 g=%ymm14 h=%ymm15
 * %ymm4 is consumed as b^c; %ymm3 leaves holding a^b.
 * Result: new a in %ymm15 (the old h register), new e in %ymm11 (the old d).
 * The steps are interleaved; each comment labels the instruction right after it.
 */
6537bc3d5698SJohn Baldwin.Loop_16_xx_avx2:
/* %ymm6 = schedule slot 1 */
6538bc3d5698SJohn Baldwin	vmovdqu	32-128(%rax),%ymm6
/* W = slot0 + slot9 (slots 8..15 are addressed off %rbx; presumably %rbx = %rax + 256 -- confirm) */
6539bc3d5698SJohn Baldwin	vpaddd	288-256-128(%rbx),%ymm5,%ymm5
6540bc3d5698SJohn Baldwin
/* Build sigma0(slot1) in %ymm7, starting from shr3. */
6541bc3d5698SJohn Baldwin	vpsrld	$3,%ymm6,%ymm7
6542bc3d5698SJohn Baldwin	vpsrld	$7,%ymm6,%ymm1
6543bc3d5698SJohn Baldwin	vpslld	$25,%ymm6,%ymm2
6544bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6545bc3d5698SJohn Baldwin	vpsrld	$18,%ymm6,%ymm1
6546bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6547bc3d5698SJohn Baldwin	vpslld	$14,%ymm6,%ymm2
/* %ymm0 = schedule slot 14; %ymm3 starts sigma1 with shr10. */
6548bc3d5698SJohn Baldwin	vmovdqu	448-256-128(%rbx),%ymm0
6549bc3d5698SJohn Baldwin	vpsrld	$10,%ymm0,%ymm3
6550bc3d5698SJohn Baldwin
6551bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6552bc3d5698SJohn Baldwin	vpsrld	$17,%ymm0,%ymm1
/* %ymm7 = sigma0(slot1) */
6553bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6554bc3d5698SJohn Baldwin	vpslld	$15,%ymm0,%ymm2
/* W += sigma0(slot1) */
6555bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
6556bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm3,%ymm7
6557bc3d5698SJohn Baldwin	vpsrld	$19,%ymm0,%ymm1
6558bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6559bc3d5698SJohn Baldwin	vpslld	$13,%ymm0,%ymm2
6560bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
/* %ymm7 = sigma1(slot14) */
6561bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
/* W += sigma1(slot14) */
6562bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
6563bc3d5698SJohn Baldwin	vpsrld	$6,%ymm12,%ymm7
6564bc3d5698SJohn Baldwin	vpslld	$26,%ymm12,%ymm2
/* Write the new word back to schedule slot 0. */
6565bc3d5698SJohn Baldwin	vmovdqu	%ymm5,0-128(%rax)
/* T1 = W + h */
6566bc3d5698SJohn Baldwin	vpaddd	%ymm15,%ymm5,%ymm5
6567bc3d5698SJohn Baldwin
6568bc3d5698SJohn Baldwin	vpsrld	$11,%ymm12,%ymm1
6569bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6570bc3d5698SJohn Baldwin	vpslld	$21,%ymm12,%ymm2
/* T1 += 32-byte constant entry at %rbp (presumably the K256 round constant; %rbp setup is outside this chunk). */
6571bc3d5698SJohn Baldwin	vpaddd	-128(%rbp),%ymm5,%ymm5
6572bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6573bc3d5698SJohn Baldwin
6574bc3d5698SJohn Baldwin	vpsrld	$25,%ymm12,%ymm1
6575bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6576bc3d5698SJohn Baldwin
6577bc3d5698SJohn Baldwin	vpslld	$7,%ymm12,%ymm2
/* Ch(e,f,g) halves: %ymm0 = ~e & g, %ymm3 = e & f */
6578bc3d5698SJohn Baldwin	vpandn	%ymm14,%ymm12,%ymm0
6579bc3d5698SJohn Baldwin	vpand	%ymm13,%ymm12,%ymm3
6580bc3d5698SJohn Baldwin
6581bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6582bc3d5698SJohn Baldwin
/* h is already folded into T1, so its register starts accumulating rotr2(a). */
6583bc3d5698SJohn Baldwin	vpsrld	$2,%ymm8,%ymm15
/* %ymm7 = Sigma1(e) = rotr6 ^ rotr11 ^ rotr25 */
6584bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6585bc3d5698SJohn Baldwin
6586bc3d5698SJohn Baldwin	vpslld	$30,%ymm8,%ymm1
/* %ymm0 = Ch(e,f,g) */
6587bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm0,%ymm0
/* %ymm3 = a ^ b, used for Maj here and left for the following round */
6588bc3d5698SJohn Baldwin	vpxor	%ymm8,%ymm9,%ymm3
6589bc3d5698SJohn Baldwin
6590bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm15,%ymm15
/* T1 += Sigma1(e) */
6591bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
6592bc3d5698SJohn Baldwin
6593bc3d5698SJohn Baldwin	vpsrld	$13,%ymm8,%ymm1
6594bc3d5698SJohn Baldwin
6595bc3d5698SJohn Baldwin	vpslld	$19,%ymm8,%ymm2
/* T1 += Ch(e,f,g) */
6596bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm5,%ymm5
/* %ymm4 = (a^b) & (b^c) */
6597bc3d5698SJohn Baldwin	vpand	%ymm3,%ymm4,%ymm4
6598bc3d5698SJohn Baldwin
6599bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm15,%ymm7
6600bc3d5698SJohn Baldwin
6601bc3d5698SJohn Baldwin	vpsrld	$22,%ymm8,%ymm1
6602bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6603bc3d5698SJohn Baldwin
6604bc3d5698SJohn Baldwin	vpslld	$10,%ymm8,%ymm2
/* Maj(a,b,c) = b ^ ((a^b) & (b^c)), written to the new-a register */
6605bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm9,%ymm15
/* d += T1 (this register is e in the next round) */
6606bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm11,%ymm11
6607bc3d5698SJohn Baldwin
6608bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
/* %ymm7 = Sigma0(a) = rotr2 ^ rotr13 ^ rotr22 */
6609bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6610bc3d5698SJohn Baldwin
/* new a = Maj + T1 + Sigma0(a) */
6611bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm15,%ymm15
6612bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm15,%ymm15
6613bc3d5698SJohn Baldwin	vmovdqu	64-128(%rax),%ymm5
6614bc3d5698SJohn Baldwin	vpaddd	320-256-128(%rbx),%ymm6,%ymm6
6615bc3d5698SJohn Baldwin
6616bc3d5698SJohn Baldwin	vpsrld	$3,%ymm5,%ymm7
6617bc3d5698SJohn Baldwin	vpsrld	$7,%ymm5,%ymm1
6618bc3d5698SJohn Baldwin	vpslld	$25,%ymm5,%ymm2
6619bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6620bc3d5698SJohn Baldwin	vpsrld	$18,%ymm5,%ymm1
6621bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6622bc3d5698SJohn Baldwin	vpslld	$14,%ymm5,%ymm2
6623bc3d5698SJohn Baldwin	vmovdqu	480-256-128(%rbx),%ymm0
6624bc3d5698SJohn Baldwin	vpsrld	$10,%ymm0,%ymm4
6625bc3d5698SJohn Baldwin
6626bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6627bc3d5698SJohn Baldwin	vpsrld	$17,%ymm0,%ymm1
6628bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6629bc3d5698SJohn Baldwin	vpslld	$15,%ymm0,%ymm2
6630bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm6,%ymm6
6631bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm4,%ymm7
6632bc3d5698SJohn Baldwin	vpsrld	$19,%ymm0,%ymm1
6633bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6634bc3d5698SJohn Baldwin	vpslld	$13,%ymm0,%ymm2
6635bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6636bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6637bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm6,%ymm6
6638bc3d5698SJohn Baldwin	vpsrld	$6,%ymm11,%ymm7
6639bc3d5698SJohn Baldwin	vpslld	$26,%ymm11,%ymm2
6640bc3d5698SJohn Baldwin	vmovdqu	%ymm6,32-128(%rax)
6641bc3d5698SJohn Baldwin	vpaddd	%ymm14,%ymm6,%ymm6
6642bc3d5698SJohn Baldwin
6643bc3d5698SJohn Baldwin	vpsrld	$11,%ymm11,%ymm1
6644bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6645bc3d5698SJohn Baldwin	vpslld	$21,%ymm11,%ymm2
6646bc3d5698SJohn Baldwin	vpaddd	-96(%rbp),%ymm6,%ymm6
6647bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6648bc3d5698SJohn Baldwin
6649bc3d5698SJohn Baldwin	vpsrld	$25,%ymm11,%ymm1
6650bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6651bc3d5698SJohn Baldwin
6652bc3d5698SJohn Baldwin	vpslld	$7,%ymm11,%ymm2
6653bc3d5698SJohn Baldwin	vpandn	%ymm13,%ymm11,%ymm0
6654bc3d5698SJohn Baldwin	vpand	%ymm12,%ymm11,%ymm4
6655bc3d5698SJohn Baldwin
6656bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6657bc3d5698SJohn Baldwin
6658bc3d5698SJohn Baldwin	vpsrld	$2,%ymm15,%ymm14
6659bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6660bc3d5698SJohn Baldwin
6661bc3d5698SJohn Baldwin	vpslld	$30,%ymm15,%ymm1
6662bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm0,%ymm0
6663bc3d5698SJohn Baldwin	vpxor	%ymm15,%ymm8,%ymm4
6664bc3d5698SJohn Baldwin
6665bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm14,%ymm14
6666bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm6,%ymm6
6667bc3d5698SJohn Baldwin
6668bc3d5698SJohn Baldwin	vpsrld	$13,%ymm15,%ymm1
6669bc3d5698SJohn Baldwin
6670bc3d5698SJohn Baldwin	vpslld	$19,%ymm15,%ymm2
6671bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm6,%ymm6
6672bc3d5698SJohn Baldwin	vpand	%ymm4,%ymm3,%ymm3
6673bc3d5698SJohn Baldwin
6674bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm14,%ymm7
6675bc3d5698SJohn Baldwin
6676bc3d5698SJohn Baldwin	vpsrld	$22,%ymm15,%ymm1
6677bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6678bc3d5698SJohn Baldwin
6679bc3d5698SJohn Baldwin	vpslld	$10,%ymm15,%ymm2
6680bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm8,%ymm14
6681bc3d5698SJohn Baldwin	vpaddd	%ymm6,%ymm10,%ymm10
6682bc3d5698SJohn Baldwin
6683bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6684bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6685bc3d5698SJohn Baldwin
6686bc3d5698SJohn Baldwin	vpaddd	%ymm6,%ymm14,%ymm14
6687bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm14,%ymm14
6688bc3d5698SJohn Baldwin	vmovdqu	96-128(%rax),%ymm6
6689bc3d5698SJohn Baldwin	vpaddd	352-256-128(%rbx),%ymm5,%ymm5
6690bc3d5698SJohn Baldwin
6691bc3d5698SJohn Baldwin	vpsrld	$3,%ymm6,%ymm7
6692bc3d5698SJohn Baldwin	vpsrld	$7,%ymm6,%ymm1
6693bc3d5698SJohn Baldwin	vpslld	$25,%ymm6,%ymm2
6694bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6695bc3d5698SJohn Baldwin	vpsrld	$18,%ymm6,%ymm1
6696bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6697bc3d5698SJohn Baldwin	vpslld	$14,%ymm6,%ymm2
6698bc3d5698SJohn Baldwin	vmovdqu	0-128(%rax),%ymm0
6699bc3d5698SJohn Baldwin	vpsrld	$10,%ymm0,%ymm3
6700bc3d5698SJohn Baldwin
6701bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6702bc3d5698SJohn Baldwin	vpsrld	$17,%ymm0,%ymm1
6703bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6704bc3d5698SJohn Baldwin	vpslld	$15,%ymm0,%ymm2
6705bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
6706bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm3,%ymm7
6707bc3d5698SJohn Baldwin	vpsrld	$19,%ymm0,%ymm1
6708bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6709bc3d5698SJohn Baldwin	vpslld	$13,%ymm0,%ymm2
6710bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6711bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6712bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
6713bc3d5698SJohn Baldwin	vpsrld	$6,%ymm10,%ymm7
6714bc3d5698SJohn Baldwin	vpslld	$26,%ymm10,%ymm2
6715bc3d5698SJohn Baldwin	vmovdqu	%ymm5,64-128(%rax)
6716bc3d5698SJohn Baldwin	vpaddd	%ymm13,%ymm5,%ymm5
6717bc3d5698SJohn Baldwin
6718bc3d5698SJohn Baldwin	vpsrld	$11,%ymm10,%ymm1
6719bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6720bc3d5698SJohn Baldwin	vpslld	$21,%ymm10,%ymm2
6721bc3d5698SJohn Baldwin	vpaddd	-64(%rbp),%ymm5,%ymm5
6722bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6723bc3d5698SJohn Baldwin
6724bc3d5698SJohn Baldwin	vpsrld	$25,%ymm10,%ymm1
6725bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6726bc3d5698SJohn Baldwin
6727bc3d5698SJohn Baldwin	vpslld	$7,%ymm10,%ymm2
6728bc3d5698SJohn Baldwin	vpandn	%ymm12,%ymm10,%ymm0
6729bc3d5698SJohn Baldwin	vpand	%ymm11,%ymm10,%ymm3
6730bc3d5698SJohn Baldwin
6731bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6732bc3d5698SJohn Baldwin
6733bc3d5698SJohn Baldwin	vpsrld	$2,%ymm14,%ymm13
6734bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6735bc3d5698SJohn Baldwin
6736bc3d5698SJohn Baldwin	vpslld	$30,%ymm14,%ymm1
6737bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm0,%ymm0
6738bc3d5698SJohn Baldwin	vpxor	%ymm14,%ymm15,%ymm3
6739bc3d5698SJohn Baldwin
6740bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm13,%ymm13
6741bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
6742bc3d5698SJohn Baldwin
6743bc3d5698SJohn Baldwin	vpsrld	$13,%ymm14,%ymm1
6744bc3d5698SJohn Baldwin
6745bc3d5698SJohn Baldwin	vpslld	$19,%ymm14,%ymm2
6746bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm5,%ymm5
6747bc3d5698SJohn Baldwin	vpand	%ymm3,%ymm4,%ymm4
6748bc3d5698SJohn Baldwin
6749bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm13,%ymm7
6750bc3d5698SJohn Baldwin
6751bc3d5698SJohn Baldwin	vpsrld	$22,%ymm14,%ymm1
6752bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6753bc3d5698SJohn Baldwin
6754bc3d5698SJohn Baldwin	vpslld	$10,%ymm14,%ymm2
6755bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm15,%ymm13
6756bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm9,%ymm9
6757bc3d5698SJohn Baldwin
6758bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6759bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6760bc3d5698SJohn Baldwin
6761bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm13,%ymm13
6762bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm13,%ymm13
6763bc3d5698SJohn Baldwin	vmovdqu	128-128(%rax),%ymm5
6764bc3d5698SJohn Baldwin	vpaddd	384-256-128(%rbx),%ymm6,%ymm6
6765bc3d5698SJohn Baldwin
6766bc3d5698SJohn Baldwin	vpsrld	$3,%ymm5,%ymm7
6767bc3d5698SJohn Baldwin	vpsrld	$7,%ymm5,%ymm1
6768bc3d5698SJohn Baldwin	vpslld	$25,%ymm5,%ymm2
6769bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6770bc3d5698SJohn Baldwin	vpsrld	$18,%ymm5,%ymm1
6771bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6772bc3d5698SJohn Baldwin	vpslld	$14,%ymm5,%ymm2
6773bc3d5698SJohn Baldwin	vmovdqu	32-128(%rax),%ymm0
6774bc3d5698SJohn Baldwin	vpsrld	$10,%ymm0,%ymm4
6775bc3d5698SJohn Baldwin
6776bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6777bc3d5698SJohn Baldwin	vpsrld	$17,%ymm0,%ymm1
6778bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6779bc3d5698SJohn Baldwin	vpslld	$15,%ymm0,%ymm2
6780bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm6,%ymm6
6781bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm4,%ymm7
6782bc3d5698SJohn Baldwin	vpsrld	$19,%ymm0,%ymm1
6783bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6784bc3d5698SJohn Baldwin	vpslld	$13,%ymm0,%ymm2
6785bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6786bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6787bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm6,%ymm6
6788bc3d5698SJohn Baldwin	vpsrld	$6,%ymm9,%ymm7
6789bc3d5698SJohn Baldwin	vpslld	$26,%ymm9,%ymm2
6790bc3d5698SJohn Baldwin	vmovdqu	%ymm6,96-128(%rax)
6791bc3d5698SJohn Baldwin	vpaddd	%ymm12,%ymm6,%ymm6
6792bc3d5698SJohn Baldwin
6793bc3d5698SJohn Baldwin	vpsrld	$11,%ymm9,%ymm1
6794bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6795bc3d5698SJohn Baldwin	vpslld	$21,%ymm9,%ymm2
6796bc3d5698SJohn Baldwin	vpaddd	-32(%rbp),%ymm6,%ymm6
6797bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6798bc3d5698SJohn Baldwin
6799bc3d5698SJohn Baldwin	vpsrld	$25,%ymm9,%ymm1
6800bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6801bc3d5698SJohn Baldwin
6802bc3d5698SJohn Baldwin	vpslld	$7,%ymm9,%ymm2
6803bc3d5698SJohn Baldwin	vpandn	%ymm11,%ymm9,%ymm0
6804bc3d5698SJohn Baldwin	vpand	%ymm10,%ymm9,%ymm4
6805bc3d5698SJohn Baldwin
6806bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6807bc3d5698SJohn Baldwin
6808bc3d5698SJohn Baldwin	vpsrld	$2,%ymm13,%ymm12
6809bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6810bc3d5698SJohn Baldwin
6811bc3d5698SJohn Baldwin	vpslld	$30,%ymm13,%ymm1
6812bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm0,%ymm0
6813bc3d5698SJohn Baldwin	vpxor	%ymm13,%ymm14,%ymm4
6814bc3d5698SJohn Baldwin
6815bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm12,%ymm12
6816bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm6,%ymm6
6817bc3d5698SJohn Baldwin
6818bc3d5698SJohn Baldwin	vpsrld	$13,%ymm13,%ymm1
6819bc3d5698SJohn Baldwin
6820bc3d5698SJohn Baldwin	vpslld	$19,%ymm13,%ymm2
6821bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm6,%ymm6
6822bc3d5698SJohn Baldwin	vpand	%ymm4,%ymm3,%ymm3
6823bc3d5698SJohn Baldwin
6824bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm12,%ymm7
6825bc3d5698SJohn Baldwin
6826bc3d5698SJohn Baldwin	vpsrld	$22,%ymm13,%ymm1
6827bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6828bc3d5698SJohn Baldwin
6829bc3d5698SJohn Baldwin	vpslld	$10,%ymm13,%ymm2
6830bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm14,%ymm12
6831bc3d5698SJohn Baldwin	vpaddd	%ymm6,%ymm8,%ymm8
6832bc3d5698SJohn Baldwin
6833bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6834bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6835bc3d5698SJohn Baldwin
6836bc3d5698SJohn Baldwin	vpaddd	%ymm6,%ymm12,%ymm12
6837bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm12,%ymm12
6838bc3d5698SJohn Baldwin	vmovdqu	160-128(%rax),%ymm6
6839bc3d5698SJohn Baldwin	vpaddd	416-256-128(%rbx),%ymm5,%ymm5
6840bc3d5698SJohn Baldwin
6841bc3d5698SJohn Baldwin	vpsrld	$3,%ymm6,%ymm7
6842bc3d5698SJohn Baldwin	vpsrld	$7,%ymm6,%ymm1
6843bc3d5698SJohn Baldwin	vpslld	$25,%ymm6,%ymm2
6844bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6845bc3d5698SJohn Baldwin	vpsrld	$18,%ymm6,%ymm1
6846bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6847bc3d5698SJohn Baldwin	vpslld	$14,%ymm6,%ymm2
6848bc3d5698SJohn Baldwin	vmovdqu	64-128(%rax),%ymm0
6849bc3d5698SJohn Baldwin	vpsrld	$10,%ymm0,%ymm3
6850bc3d5698SJohn Baldwin
6851bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6852bc3d5698SJohn Baldwin	vpsrld	$17,%ymm0,%ymm1
6853bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6854bc3d5698SJohn Baldwin	vpslld	$15,%ymm0,%ymm2
6855bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
6856bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm3,%ymm7
6857bc3d5698SJohn Baldwin	vpsrld	$19,%ymm0,%ymm1
6858bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6859bc3d5698SJohn Baldwin	vpslld	$13,%ymm0,%ymm2
6860bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6861bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6862bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
6863bc3d5698SJohn Baldwin	vpsrld	$6,%ymm8,%ymm7
6864bc3d5698SJohn Baldwin	vpslld	$26,%ymm8,%ymm2
6865bc3d5698SJohn Baldwin	vmovdqu	%ymm5,128-128(%rax)
6866bc3d5698SJohn Baldwin	vpaddd	%ymm11,%ymm5,%ymm5
6867bc3d5698SJohn Baldwin
6868bc3d5698SJohn Baldwin	vpsrld	$11,%ymm8,%ymm1
6869bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6870bc3d5698SJohn Baldwin	vpslld	$21,%ymm8,%ymm2
6871bc3d5698SJohn Baldwin	vpaddd	0(%rbp),%ymm5,%ymm5
6872bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6873bc3d5698SJohn Baldwin
6874bc3d5698SJohn Baldwin	vpsrld	$25,%ymm8,%ymm1
6875bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6876bc3d5698SJohn Baldwin
6877bc3d5698SJohn Baldwin	vpslld	$7,%ymm8,%ymm2
6878bc3d5698SJohn Baldwin	vpandn	%ymm10,%ymm8,%ymm0
6879bc3d5698SJohn Baldwin	vpand	%ymm9,%ymm8,%ymm3
6880bc3d5698SJohn Baldwin
6881bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6882bc3d5698SJohn Baldwin
6883bc3d5698SJohn Baldwin	vpsrld	$2,%ymm12,%ymm11
6884bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6885bc3d5698SJohn Baldwin
6886bc3d5698SJohn Baldwin	vpslld	$30,%ymm12,%ymm1
6887bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm0,%ymm0
6888bc3d5698SJohn Baldwin	vpxor	%ymm12,%ymm13,%ymm3
6889bc3d5698SJohn Baldwin
6890bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm11,%ymm11
6891bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
6892bc3d5698SJohn Baldwin
6893bc3d5698SJohn Baldwin	vpsrld	$13,%ymm12,%ymm1
6894bc3d5698SJohn Baldwin
6895bc3d5698SJohn Baldwin	vpslld	$19,%ymm12,%ymm2
6896bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm5,%ymm5
6897bc3d5698SJohn Baldwin	vpand	%ymm3,%ymm4,%ymm4
6898bc3d5698SJohn Baldwin
6899bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm11,%ymm7
6900bc3d5698SJohn Baldwin
6901bc3d5698SJohn Baldwin	vpsrld	$22,%ymm12,%ymm1
6902bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6903bc3d5698SJohn Baldwin
6904bc3d5698SJohn Baldwin	vpslld	$10,%ymm12,%ymm2
6905bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm13,%ymm11
6906bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm15,%ymm15
6907bc3d5698SJohn Baldwin
6908bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6909bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6910bc3d5698SJohn Baldwin
6911bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm11,%ymm11
6912bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm11,%ymm11
6913bc3d5698SJohn Baldwin	vmovdqu	192-128(%rax),%ymm5
6914bc3d5698SJohn Baldwin	vpaddd	448-256-128(%rbx),%ymm6,%ymm6
6915bc3d5698SJohn Baldwin
6916bc3d5698SJohn Baldwin	vpsrld	$3,%ymm5,%ymm7
6917bc3d5698SJohn Baldwin	vpsrld	$7,%ymm5,%ymm1
6918bc3d5698SJohn Baldwin	vpslld	$25,%ymm5,%ymm2
6919bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6920bc3d5698SJohn Baldwin	vpsrld	$18,%ymm5,%ymm1
6921bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6922bc3d5698SJohn Baldwin	vpslld	$14,%ymm5,%ymm2
6923bc3d5698SJohn Baldwin	vmovdqu	96-128(%rax),%ymm0
6924bc3d5698SJohn Baldwin	vpsrld	$10,%ymm0,%ymm4
6925bc3d5698SJohn Baldwin
6926bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6927bc3d5698SJohn Baldwin	vpsrld	$17,%ymm0,%ymm1
6928bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6929bc3d5698SJohn Baldwin	vpslld	$15,%ymm0,%ymm2
6930bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm6,%ymm6
6931bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm4,%ymm7
6932bc3d5698SJohn Baldwin	vpsrld	$19,%ymm0,%ymm1
6933bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6934bc3d5698SJohn Baldwin	vpslld	$13,%ymm0,%ymm2
6935bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6936bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6937bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm6,%ymm6
6938bc3d5698SJohn Baldwin	vpsrld	$6,%ymm15,%ymm7
6939bc3d5698SJohn Baldwin	vpslld	$26,%ymm15,%ymm2
6940bc3d5698SJohn Baldwin	vmovdqu	%ymm6,160-128(%rax)
6941bc3d5698SJohn Baldwin	vpaddd	%ymm10,%ymm6,%ymm6
6942bc3d5698SJohn Baldwin
6943bc3d5698SJohn Baldwin	vpsrld	$11,%ymm15,%ymm1
6944bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6945bc3d5698SJohn Baldwin	vpslld	$21,%ymm15,%ymm2
6946bc3d5698SJohn Baldwin	vpaddd	32(%rbp),%ymm6,%ymm6
6947bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6948bc3d5698SJohn Baldwin
6949bc3d5698SJohn Baldwin	vpsrld	$25,%ymm15,%ymm1
6950bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6951bc3d5698SJohn Baldwin
6952bc3d5698SJohn Baldwin	vpslld	$7,%ymm15,%ymm2
6953bc3d5698SJohn Baldwin	vpandn	%ymm9,%ymm15,%ymm0
6954bc3d5698SJohn Baldwin	vpand	%ymm8,%ymm15,%ymm4
6955bc3d5698SJohn Baldwin
6956bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6957bc3d5698SJohn Baldwin
6958bc3d5698SJohn Baldwin	vpsrld	$2,%ymm11,%ymm10
6959bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6960bc3d5698SJohn Baldwin
6961bc3d5698SJohn Baldwin	vpslld	$30,%ymm11,%ymm1
6962bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm0,%ymm0
6963bc3d5698SJohn Baldwin	vpxor	%ymm11,%ymm12,%ymm4
6964bc3d5698SJohn Baldwin
6965bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm10,%ymm10
6966bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm6,%ymm6
6967bc3d5698SJohn Baldwin
6968bc3d5698SJohn Baldwin	vpsrld	$13,%ymm11,%ymm1
6969bc3d5698SJohn Baldwin
6970bc3d5698SJohn Baldwin	vpslld	$19,%ymm11,%ymm2
6971bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm6,%ymm6
6972bc3d5698SJohn Baldwin	vpand	%ymm4,%ymm3,%ymm3
6973bc3d5698SJohn Baldwin
6974bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm10,%ymm7
6975bc3d5698SJohn Baldwin
6976bc3d5698SJohn Baldwin	vpsrld	$22,%ymm11,%ymm1
6977bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6978bc3d5698SJohn Baldwin
6979bc3d5698SJohn Baldwin	vpslld	$10,%ymm11,%ymm2
6980bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm12,%ymm10
6981bc3d5698SJohn Baldwin	vpaddd	%ymm6,%ymm14,%ymm14
6982bc3d5698SJohn Baldwin
6983bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6984bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6985bc3d5698SJohn Baldwin
6986bc3d5698SJohn Baldwin	vpaddd	%ymm6,%ymm10,%ymm10
6987bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm10,%ymm10
6988bc3d5698SJohn Baldwin	vmovdqu	224-128(%rax),%ymm6
6989bc3d5698SJohn Baldwin	vpaddd	480-256-128(%rbx),%ymm5,%ymm5
6990bc3d5698SJohn Baldwin
6991bc3d5698SJohn Baldwin	vpsrld	$3,%ymm6,%ymm7
6992bc3d5698SJohn Baldwin	vpsrld	$7,%ymm6,%ymm1
6993bc3d5698SJohn Baldwin	vpslld	$25,%ymm6,%ymm2
6994bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
6995bc3d5698SJohn Baldwin	vpsrld	$18,%ymm6,%ymm1
6996bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
6997bc3d5698SJohn Baldwin	vpslld	$14,%ymm6,%ymm2
6998bc3d5698SJohn Baldwin	vmovdqu	128-128(%rax),%ymm0
6999bc3d5698SJohn Baldwin	vpsrld	$10,%ymm0,%ymm3
7000bc3d5698SJohn Baldwin
7001bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7002bc3d5698SJohn Baldwin	vpsrld	$17,%ymm0,%ymm1
7003bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7004bc3d5698SJohn Baldwin	vpslld	$15,%ymm0,%ymm2
7005bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
7006bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm3,%ymm7
7007bc3d5698SJohn Baldwin	vpsrld	$19,%ymm0,%ymm1
7008bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7009bc3d5698SJohn Baldwin	vpslld	$13,%ymm0,%ymm2
7010bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7011bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7012bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
7013bc3d5698SJohn Baldwin	vpsrld	$6,%ymm14,%ymm7
7014bc3d5698SJohn Baldwin	vpslld	$26,%ymm14,%ymm2
7015bc3d5698SJohn Baldwin	vmovdqu	%ymm5,192-128(%rax)
7016bc3d5698SJohn Baldwin	vpaddd	%ymm9,%ymm5,%ymm5
7017bc3d5698SJohn Baldwin
7018bc3d5698SJohn Baldwin	vpsrld	$11,%ymm14,%ymm1
7019bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7020bc3d5698SJohn Baldwin	vpslld	$21,%ymm14,%ymm2
7021bc3d5698SJohn Baldwin	vpaddd	64(%rbp),%ymm5,%ymm5
7022bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7023bc3d5698SJohn Baldwin
7024bc3d5698SJohn Baldwin	vpsrld	$25,%ymm14,%ymm1
7025bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7026bc3d5698SJohn Baldwin
7027bc3d5698SJohn Baldwin	vpslld	$7,%ymm14,%ymm2
7028bc3d5698SJohn Baldwin	vpandn	%ymm8,%ymm14,%ymm0
7029bc3d5698SJohn Baldwin	vpand	%ymm15,%ymm14,%ymm3
7030bc3d5698SJohn Baldwin
7031bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7032bc3d5698SJohn Baldwin
7033bc3d5698SJohn Baldwin	vpsrld	$2,%ymm10,%ymm9
7034bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7035bc3d5698SJohn Baldwin
7036bc3d5698SJohn Baldwin	vpslld	$30,%ymm10,%ymm1
7037bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm0,%ymm0
7038bc3d5698SJohn Baldwin	vpxor	%ymm10,%ymm11,%ymm3
7039bc3d5698SJohn Baldwin
7040bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm9,%ymm9
7041bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
7042bc3d5698SJohn Baldwin
7043bc3d5698SJohn Baldwin	vpsrld	$13,%ymm10,%ymm1
7044bc3d5698SJohn Baldwin
7045bc3d5698SJohn Baldwin	vpslld	$19,%ymm10,%ymm2
7046bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm5,%ymm5
7047bc3d5698SJohn Baldwin	vpand	%ymm3,%ymm4,%ymm4
7048bc3d5698SJohn Baldwin
7049bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm9,%ymm7
7050bc3d5698SJohn Baldwin
7051bc3d5698SJohn Baldwin	vpsrld	$22,%ymm10,%ymm1
7052bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7053bc3d5698SJohn Baldwin
7054bc3d5698SJohn Baldwin	vpslld	$10,%ymm10,%ymm2
7055bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm11,%ymm9
7056bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm13,%ymm13
7057bc3d5698SJohn Baldwin
7058bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7059bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7060bc3d5698SJohn Baldwin
7061bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm9,%ymm9
7062bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm9,%ymm9
7063bc3d5698SJohn Baldwin	vmovdqu	256-256-128(%rbx),%ymm5
7064bc3d5698SJohn Baldwin	vpaddd	0-128(%rax),%ymm6,%ymm6
7065bc3d5698SJohn Baldwin
7066bc3d5698SJohn Baldwin	vpsrld	$3,%ymm5,%ymm7
7067bc3d5698SJohn Baldwin	vpsrld	$7,%ymm5,%ymm1
7068bc3d5698SJohn Baldwin	vpslld	$25,%ymm5,%ymm2
7069bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7070bc3d5698SJohn Baldwin	vpsrld	$18,%ymm5,%ymm1
7071bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7072bc3d5698SJohn Baldwin	vpslld	$14,%ymm5,%ymm2
7073bc3d5698SJohn Baldwin	vmovdqu	160-128(%rax),%ymm0
7074bc3d5698SJohn Baldwin	vpsrld	$10,%ymm0,%ymm4
7075bc3d5698SJohn Baldwin
7076bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7077bc3d5698SJohn Baldwin	vpsrld	$17,%ymm0,%ymm1
7078bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7079bc3d5698SJohn Baldwin	vpslld	$15,%ymm0,%ymm2
7080bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm6,%ymm6
7081bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm4,%ymm7
7082bc3d5698SJohn Baldwin	vpsrld	$19,%ymm0,%ymm1
7083bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7084bc3d5698SJohn Baldwin	vpslld	$13,%ymm0,%ymm2
7085bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7086bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7087bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm6,%ymm6
7088bc3d5698SJohn Baldwin	vpsrld	$6,%ymm13,%ymm7
7089bc3d5698SJohn Baldwin	vpslld	$26,%ymm13,%ymm2
7090bc3d5698SJohn Baldwin	vmovdqu	%ymm6,224-128(%rax)
7091bc3d5698SJohn Baldwin	vpaddd	%ymm8,%ymm6,%ymm6
7092bc3d5698SJohn Baldwin
7093bc3d5698SJohn Baldwin	vpsrld	$11,%ymm13,%ymm1
7094bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7095bc3d5698SJohn Baldwin	vpslld	$21,%ymm13,%ymm2
7096bc3d5698SJohn Baldwin	vpaddd	96(%rbp),%ymm6,%ymm6
7097bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7098bc3d5698SJohn Baldwin
7099bc3d5698SJohn Baldwin	vpsrld	$25,%ymm13,%ymm1
7100bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7101bc3d5698SJohn Baldwin
7102bc3d5698SJohn Baldwin	vpslld	$7,%ymm13,%ymm2
7103bc3d5698SJohn Baldwin	vpandn	%ymm15,%ymm13,%ymm0
7104bc3d5698SJohn Baldwin	vpand	%ymm14,%ymm13,%ymm4
7105bc3d5698SJohn Baldwin
7106bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7107bc3d5698SJohn Baldwin
7108bc3d5698SJohn Baldwin	vpsrld	$2,%ymm9,%ymm8
7109bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7110bc3d5698SJohn Baldwin
7111bc3d5698SJohn Baldwin	vpslld	$30,%ymm9,%ymm1
7112bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm0,%ymm0
7113bc3d5698SJohn Baldwin	vpxor	%ymm9,%ymm10,%ymm4
7114bc3d5698SJohn Baldwin
7115bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm8,%ymm8
7116bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm6,%ymm6
7117bc3d5698SJohn Baldwin
7118bc3d5698SJohn Baldwin	vpsrld	$13,%ymm9,%ymm1
7119bc3d5698SJohn Baldwin
7120bc3d5698SJohn Baldwin	vpslld	$19,%ymm9,%ymm2
7121bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm6,%ymm6
7122bc3d5698SJohn Baldwin	vpand	%ymm4,%ymm3,%ymm3
7123bc3d5698SJohn Baldwin
7124bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm8,%ymm7
7125bc3d5698SJohn Baldwin
7126bc3d5698SJohn Baldwin	vpsrld	$22,%ymm9,%ymm1
7127bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7128bc3d5698SJohn Baldwin
7129bc3d5698SJohn Baldwin	vpslld	$10,%ymm9,%ymm2
7130bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm10,%ymm8
7131bc3d5698SJohn Baldwin	vpaddd	%ymm6,%ymm12,%ymm12
7132bc3d5698SJohn Baldwin
7133bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7134bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7135bc3d5698SJohn Baldwin
7136bc3d5698SJohn Baldwin	vpaddd	%ymm6,%ymm8,%ymm8
7137bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm8,%ymm8
7138bc3d5698SJohn Baldwin	addq	$256,%rbp
7139bc3d5698SJohn Baldwin	vmovdqu	288-256-128(%rbx),%ymm6
7140bc3d5698SJohn Baldwin	vpaddd	32-128(%rax),%ymm5,%ymm5
7141bc3d5698SJohn Baldwin
7142bc3d5698SJohn Baldwin	vpsrld	$3,%ymm6,%ymm7
7143bc3d5698SJohn Baldwin	vpsrld	$7,%ymm6,%ymm1
7144bc3d5698SJohn Baldwin	vpslld	$25,%ymm6,%ymm2
7145bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7146bc3d5698SJohn Baldwin	vpsrld	$18,%ymm6,%ymm1
7147bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7148bc3d5698SJohn Baldwin	vpslld	$14,%ymm6,%ymm2
7149bc3d5698SJohn Baldwin	vmovdqu	192-128(%rax),%ymm0
7150bc3d5698SJohn Baldwin	vpsrld	$10,%ymm0,%ymm3
7151bc3d5698SJohn Baldwin
7152bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7153bc3d5698SJohn Baldwin	vpsrld	$17,%ymm0,%ymm1
7154bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7155bc3d5698SJohn Baldwin	vpslld	$15,%ymm0,%ymm2
7156bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
7157bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm3,%ymm7
7158bc3d5698SJohn Baldwin	vpsrld	$19,%ymm0,%ymm1
7159bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7160bc3d5698SJohn Baldwin	vpslld	$13,%ymm0,%ymm2
7161bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7162bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7163bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
7164bc3d5698SJohn Baldwin	vpsrld	$6,%ymm12,%ymm7
7165bc3d5698SJohn Baldwin	vpslld	$26,%ymm12,%ymm2
7166bc3d5698SJohn Baldwin	vmovdqu	%ymm5,256-256-128(%rbx)
7167bc3d5698SJohn Baldwin	vpaddd	%ymm15,%ymm5,%ymm5
7168bc3d5698SJohn Baldwin
7169bc3d5698SJohn Baldwin	vpsrld	$11,%ymm12,%ymm1
7170bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7171bc3d5698SJohn Baldwin	vpslld	$21,%ymm12,%ymm2
7172bc3d5698SJohn Baldwin	vpaddd	-128(%rbp),%ymm5,%ymm5
7173bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7174bc3d5698SJohn Baldwin
7175bc3d5698SJohn Baldwin	vpsrld	$25,%ymm12,%ymm1
7176bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7177bc3d5698SJohn Baldwin
7178bc3d5698SJohn Baldwin	vpslld	$7,%ymm12,%ymm2
7179bc3d5698SJohn Baldwin	vpandn	%ymm14,%ymm12,%ymm0
7180bc3d5698SJohn Baldwin	vpand	%ymm13,%ymm12,%ymm3
7181bc3d5698SJohn Baldwin
7182bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7183bc3d5698SJohn Baldwin
7184bc3d5698SJohn Baldwin	vpsrld	$2,%ymm8,%ymm15
7185bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7186bc3d5698SJohn Baldwin
7187bc3d5698SJohn Baldwin	vpslld	$30,%ymm8,%ymm1
7188bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm0,%ymm0
7189bc3d5698SJohn Baldwin	vpxor	%ymm8,%ymm9,%ymm3
7190bc3d5698SJohn Baldwin
7191bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm15,%ymm15
7192bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
7193bc3d5698SJohn Baldwin
7194bc3d5698SJohn Baldwin	vpsrld	$13,%ymm8,%ymm1
7195bc3d5698SJohn Baldwin
7196bc3d5698SJohn Baldwin	vpslld	$19,%ymm8,%ymm2
7197bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm5,%ymm5
7198bc3d5698SJohn Baldwin	vpand	%ymm3,%ymm4,%ymm4
7199bc3d5698SJohn Baldwin
7200bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm15,%ymm7
7201bc3d5698SJohn Baldwin
7202bc3d5698SJohn Baldwin	vpsrld	$22,%ymm8,%ymm1
7203bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7204bc3d5698SJohn Baldwin
7205bc3d5698SJohn Baldwin	vpslld	$10,%ymm8,%ymm2
7206bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm9,%ymm15
7207bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm11,%ymm11
7208bc3d5698SJohn Baldwin
7209bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7210bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7211bc3d5698SJohn Baldwin
7212bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm15,%ymm15
7213bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm15,%ymm15
7214bc3d5698SJohn Baldwin	vmovdqu	320-256-128(%rbx),%ymm5
7215bc3d5698SJohn Baldwin	vpaddd	64-128(%rax),%ymm6,%ymm6
7216bc3d5698SJohn Baldwin
7217bc3d5698SJohn Baldwin	vpsrld	$3,%ymm5,%ymm7
7218bc3d5698SJohn Baldwin	vpsrld	$7,%ymm5,%ymm1
7219bc3d5698SJohn Baldwin	vpslld	$25,%ymm5,%ymm2
7220bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7221bc3d5698SJohn Baldwin	vpsrld	$18,%ymm5,%ymm1
7222bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7223bc3d5698SJohn Baldwin	vpslld	$14,%ymm5,%ymm2
7224bc3d5698SJohn Baldwin	vmovdqu	224-128(%rax),%ymm0
7225bc3d5698SJohn Baldwin	vpsrld	$10,%ymm0,%ymm4
7226bc3d5698SJohn Baldwin
7227bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7228bc3d5698SJohn Baldwin	vpsrld	$17,%ymm0,%ymm1
7229bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7230bc3d5698SJohn Baldwin	vpslld	$15,%ymm0,%ymm2
7231bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm6,%ymm6
7232bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm4,%ymm7
7233bc3d5698SJohn Baldwin	vpsrld	$19,%ymm0,%ymm1
7234bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7235bc3d5698SJohn Baldwin	vpslld	$13,%ymm0,%ymm2
7236bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7237bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7238bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm6,%ymm6
7239bc3d5698SJohn Baldwin	vpsrld	$6,%ymm11,%ymm7
7240bc3d5698SJohn Baldwin	vpslld	$26,%ymm11,%ymm2
7241bc3d5698SJohn Baldwin	vmovdqu	%ymm6,288-256-128(%rbx)
7242bc3d5698SJohn Baldwin	vpaddd	%ymm14,%ymm6,%ymm6
7243bc3d5698SJohn Baldwin
7244bc3d5698SJohn Baldwin	vpsrld	$11,%ymm11,%ymm1
7245bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7246bc3d5698SJohn Baldwin	vpslld	$21,%ymm11,%ymm2
7247bc3d5698SJohn Baldwin	vpaddd	-96(%rbp),%ymm6,%ymm6
7248bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7249bc3d5698SJohn Baldwin
7250bc3d5698SJohn Baldwin	vpsrld	$25,%ymm11,%ymm1
7251bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7252bc3d5698SJohn Baldwin
7253bc3d5698SJohn Baldwin	vpslld	$7,%ymm11,%ymm2
7254bc3d5698SJohn Baldwin	vpandn	%ymm13,%ymm11,%ymm0
7255bc3d5698SJohn Baldwin	vpand	%ymm12,%ymm11,%ymm4
7256bc3d5698SJohn Baldwin
7257bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7258bc3d5698SJohn Baldwin
7259bc3d5698SJohn Baldwin	vpsrld	$2,%ymm15,%ymm14
7260bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7261bc3d5698SJohn Baldwin
7262bc3d5698SJohn Baldwin	vpslld	$30,%ymm15,%ymm1
7263bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm0,%ymm0
7264bc3d5698SJohn Baldwin	vpxor	%ymm15,%ymm8,%ymm4
7265bc3d5698SJohn Baldwin
7266bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm14,%ymm14
7267bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm6,%ymm6
7268bc3d5698SJohn Baldwin
7269bc3d5698SJohn Baldwin	vpsrld	$13,%ymm15,%ymm1
7270bc3d5698SJohn Baldwin
7271bc3d5698SJohn Baldwin	vpslld	$19,%ymm15,%ymm2
7272bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm6,%ymm6
7273bc3d5698SJohn Baldwin	vpand	%ymm4,%ymm3,%ymm3
7274bc3d5698SJohn Baldwin
7275bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm14,%ymm7
7276bc3d5698SJohn Baldwin
7277bc3d5698SJohn Baldwin	vpsrld	$22,%ymm15,%ymm1
7278bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7279bc3d5698SJohn Baldwin
7280bc3d5698SJohn Baldwin	vpslld	$10,%ymm15,%ymm2
7281bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm8,%ymm14
7282bc3d5698SJohn Baldwin	vpaddd	%ymm6,%ymm10,%ymm10
7283bc3d5698SJohn Baldwin
7284bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7285bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7286bc3d5698SJohn Baldwin
7287bc3d5698SJohn Baldwin	vpaddd	%ymm6,%ymm14,%ymm14
7288bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm14,%ymm14
7289bc3d5698SJohn Baldwin	vmovdqu	352-256-128(%rbx),%ymm6
7290bc3d5698SJohn Baldwin	vpaddd	96-128(%rax),%ymm5,%ymm5
7291bc3d5698SJohn Baldwin
7292bc3d5698SJohn Baldwin	vpsrld	$3,%ymm6,%ymm7
7293bc3d5698SJohn Baldwin	vpsrld	$7,%ymm6,%ymm1
7294bc3d5698SJohn Baldwin	vpslld	$25,%ymm6,%ymm2
7295bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7296bc3d5698SJohn Baldwin	vpsrld	$18,%ymm6,%ymm1
7297bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7298bc3d5698SJohn Baldwin	vpslld	$14,%ymm6,%ymm2
7299bc3d5698SJohn Baldwin	vmovdqu	256-256-128(%rbx),%ymm0
7300bc3d5698SJohn Baldwin	vpsrld	$10,%ymm0,%ymm3
7301bc3d5698SJohn Baldwin
7302bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7303bc3d5698SJohn Baldwin	vpsrld	$17,%ymm0,%ymm1
7304bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7305bc3d5698SJohn Baldwin	vpslld	$15,%ymm0,%ymm2
7306bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
7307bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm3,%ymm7
7308bc3d5698SJohn Baldwin	vpsrld	$19,%ymm0,%ymm1
7309bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7310bc3d5698SJohn Baldwin	vpslld	$13,%ymm0,%ymm2
7311bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7312bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7313bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
7314bc3d5698SJohn Baldwin	vpsrld	$6,%ymm10,%ymm7
7315bc3d5698SJohn Baldwin	vpslld	$26,%ymm10,%ymm2
7316bc3d5698SJohn Baldwin	vmovdqu	%ymm5,320-256-128(%rbx)
7317bc3d5698SJohn Baldwin	vpaddd	%ymm13,%ymm5,%ymm5
7318bc3d5698SJohn Baldwin
7319bc3d5698SJohn Baldwin	vpsrld	$11,%ymm10,%ymm1
7320bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7321bc3d5698SJohn Baldwin	vpslld	$21,%ymm10,%ymm2
7322bc3d5698SJohn Baldwin	vpaddd	-64(%rbp),%ymm5,%ymm5
7323bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7324bc3d5698SJohn Baldwin
7325bc3d5698SJohn Baldwin	vpsrld	$25,%ymm10,%ymm1
7326bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7327bc3d5698SJohn Baldwin
7328bc3d5698SJohn Baldwin	vpslld	$7,%ymm10,%ymm2
7329bc3d5698SJohn Baldwin	vpandn	%ymm12,%ymm10,%ymm0
7330bc3d5698SJohn Baldwin	vpand	%ymm11,%ymm10,%ymm3
7331bc3d5698SJohn Baldwin
7332bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7333bc3d5698SJohn Baldwin
7334bc3d5698SJohn Baldwin	vpsrld	$2,%ymm14,%ymm13
7335bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7336bc3d5698SJohn Baldwin
7337bc3d5698SJohn Baldwin	vpslld	$30,%ymm14,%ymm1
7338bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm0,%ymm0
7339bc3d5698SJohn Baldwin	vpxor	%ymm14,%ymm15,%ymm3
7340bc3d5698SJohn Baldwin
7341bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm13,%ymm13
7342bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
7343bc3d5698SJohn Baldwin
7344bc3d5698SJohn Baldwin	vpsrld	$13,%ymm14,%ymm1
7345bc3d5698SJohn Baldwin
7346bc3d5698SJohn Baldwin	vpslld	$19,%ymm14,%ymm2
7347bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm5,%ymm5
7348bc3d5698SJohn Baldwin	vpand	%ymm3,%ymm4,%ymm4
7349bc3d5698SJohn Baldwin
7350bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm13,%ymm7
7351bc3d5698SJohn Baldwin
7352bc3d5698SJohn Baldwin	vpsrld	$22,%ymm14,%ymm1
7353bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7354bc3d5698SJohn Baldwin
7355bc3d5698SJohn Baldwin	vpslld	$10,%ymm14,%ymm2
7356bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm15,%ymm13
7357bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm9,%ymm9
7358bc3d5698SJohn Baldwin
7359bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7360bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7361bc3d5698SJohn Baldwin
7362bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm13,%ymm13
7363bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm13,%ymm13
7364bc3d5698SJohn Baldwin	vmovdqu	384-256-128(%rbx),%ymm5
7365bc3d5698SJohn Baldwin	vpaddd	128-128(%rax),%ymm6,%ymm6
7366bc3d5698SJohn Baldwin
7367bc3d5698SJohn Baldwin	vpsrld	$3,%ymm5,%ymm7
7368bc3d5698SJohn Baldwin	vpsrld	$7,%ymm5,%ymm1
7369bc3d5698SJohn Baldwin	vpslld	$25,%ymm5,%ymm2
7370bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7371bc3d5698SJohn Baldwin	vpsrld	$18,%ymm5,%ymm1
7372bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7373bc3d5698SJohn Baldwin	vpslld	$14,%ymm5,%ymm2
7374bc3d5698SJohn Baldwin	vmovdqu	288-256-128(%rbx),%ymm0
7375bc3d5698SJohn Baldwin	vpsrld	$10,%ymm0,%ymm4
7376bc3d5698SJohn Baldwin
7377bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7378bc3d5698SJohn Baldwin	vpsrld	$17,%ymm0,%ymm1
7379bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7380bc3d5698SJohn Baldwin	vpslld	$15,%ymm0,%ymm2
7381bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm6,%ymm6
7382bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm4,%ymm7
7383bc3d5698SJohn Baldwin	vpsrld	$19,%ymm0,%ymm1
7384bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7385bc3d5698SJohn Baldwin	vpslld	$13,%ymm0,%ymm2
7386bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7387bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7388bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm6,%ymm6
7389bc3d5698SJohn Baldwin	vpsrld	$6,%ymm9,%ymm7
7390bc3d5698SJohn Baldwin	vpslld	$26,%ymm9,%ymm2
7391bc3d5698SJohn Baldwin	vmovdqu	%ymm6,352-256-128(%rbx)
7392bc3d5698SJohn Baldwin	vpaddd	%ymm12,%ymm6,%ymm6
7393bc3d5698SJohn Baldwin
7394bc3d5698SJohn Baldwin	vpsrld	$11,%ymm9,%ymm1
7395bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7396bc3d5698SJohn Baldwin	vpslld	$21,%ymm9,%ymm2
7397bc3d5698SJohn Baldwin	vpaddd	-32(%rbp),%ymm6,%ymm6
7398bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7399bc3d5698SJohn Baldwin
7400bc3d5698SJohn Baldwin	vpsrld	$25,%ymm9,%ymm1
7401bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7402bc3d5698SJohn Baldwin
7403bc3d5698SJohn Baldwin	vpslld	$7,%ymm9,%ymm2
7404bc3d5698SJohn Baldwin	vpandn	%ymm11,%ymm9,%ymm0
7405bc3d5698SJohn Baldwin	vpand	%ymm10,%ymm9,%ymm4
7406bc3d5698SJohn Baldwin
7407bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7408bc3d5698SJohn Baldwin
7409bc3d5698SJohn Baldwin	vpsrld	$2,%ymm13,%ymm12
7410bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7411bc3d5698SJohn Baldwin
7412bc3d5698SJohn Baldwin	vpslld	$30,%ymm13,%ymm1
7413bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm0,%ymm0
7414bc3d5698SJohn Baldwin	vpxor	%ymm13,%ymm14,%ymm4
7415bc3d5698SJohn Baldwin
7416bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm12,%ymm12
7417bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm6,%ymm6
7418bc3d5698SJohn Baldwin
7419bc3d5698SJohn Baldwin	vpsrld	$13,%ymm13,%ymm1
7420bc3d5698SJohn Baldwin
7421bc3d5698SJohn Baldwin	vpslld	$19,%ymm13,%ymm2
7422bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm6,%ymm6
7423bc3d5698SJohn Baldwin	vpand	%ymm4,%ymm3,%ymm3
7424bc3d5698SJohn Baldwin
7425bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm12,%ymm7
7426bc3d5698SJohn Baldwin
7427bc3d5698SJohn Baldwin	vpsrld	$22,%ymm13,%ymm1
7428bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7429bc3d5698SJohn Baldwin
7430bc3d5698SJohn Baldwin	vpslld	$10,%ymm13,%ymm2
7431bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm14,%ymm12
7432bc3d5698SJohn Baldwin	vpaddd	%ymm6,%ymm8,%ymm8
7433bc3d5698SJohn Baldwin
7434bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7435bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7436bc3d5698SJohn Baldwin
7437bc3d5698SJohn Baldwin	vpaddd	%ymm6,%ymm12,%ymm12
7438bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm12,%ymm12
7439bc3d5698SJohn Baldwin	vmovdqu	416-256-128(%rbx),%ymm6
7440bc3d5698SJohn Baldwin	vpaddd	160-128(%rax),%ymm5,%ymm5
7441bc3d5698SJohn Baldwin
7442bc3d5698SJohn Baldwin	vpsrld	$3,%ymm6,%ymm7
7443bc3d5698SJohn Baldwin	vpsrld	$7,%ymm6,%ymm1
7444bc3d5698SJohn Baldwin	vpslld	$25,%ymm6,%ymm2
7445bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7446bc3d5698SJohn Baldwin	vpsrld	$18,%ymm6,%ymm1
7447bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7448bc3d5698SJohn Baldwin	vpslld	$14,%ymm6,%ymm2
7449bc3d5698SJohn Baldwin	vmovdqu	320-256-128(%rbx),%ymm0
7450bc3d5698SJohn Baldwin	vpsrld	$10,%ymm0,%ymm3
7451bc3d5698SJohn Baldwin
7452bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7453bc3d5698SJohn Baldwin	vpsrld	$17,%ymm0,%ymm1
7454bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7455bc3d5698SJohn Baldwin	vpslld	$15,%ymm0,%ymm2
7456bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
7457bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm3,%ymm7
7458bc3d5698SJohn Baldwin	vpsrld	$19,%ymm0,%ymm1
7459bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7460bc3d5698SJohn Baldwin	vpslld	$13,%ymm0,%ymm2
7461bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7462bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7463bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
7464bc3d5698SJohn Baldwin	vpsrld	$6,%ymm8,%ymm7
7465bc3d5698SJohn Baldwin	vpslld	$26,%ymm8,%ymm2
7466bc3d5698SJohn Baldwin	vmovdqu	%ymm5,384-256-128(%rbx)
7467bc3d5698SJohn Baldwin	vpaddd	%ymm11,%ymm5,%ymm5
7468bc3d5698SJohn Baldwin
7469bc3d5698SJohn Baldwin	vpsrld	$11,%ymm8,%ymm1
7470bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7471bc3d5698SJohn Baldwin	vpslld	$21,%ymm8,%ymm2
7472bc3d5698SJohn Baldwin	vpaddd	0(%rbp),%ymm5,%ymm5
7473bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7474bc3d5698SJohn Baldwin
7475bc3d5698SJohn Baldwin	vpsrld	$25,%ymm8,%ymm1
7476bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7477bc3d5698SJohn Baldwin
7478bc3d5698SJohn Baldwin	vpslld	$7,%ymm8,%ymm2
7479bc3d5698SJohn Baldwin	vpandn	%ymm10,%ymm8,%ymm0
7480bc3d5698SJohn Baldwin	vpand	%ymm9,%ymm8,%ymm3
7481bc3d5698SJohn Baldwin
7482bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7483bc3d5698SJohn Baldwin
7484bc3d5698SJohn Baldwin	vpsrld	$2,%ymm12,%ymm11
7485bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7486bc3d5698SJohn Baldwin
7487bc3d5698SJohn Baldwin	vpslld	$30,%ymm12,%ymm1
7488bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm0,%ymm0
7489bc3d5698SJohn Baldwin	vpxor	%ymm12,%ymm13,%ymm3
7490bc3d5698SJohn Baldwin
7491bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm11,%ymm11
7492bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
7493bc3d5698SJohn Baldwin
7494bc3d5698SJohn Baldwin	vpsrld	$13,%ymm12,%ymm1
7495bc3d5698SJohn Baldwin
7496bc3d5698SJohn Baldwin	vpslld	$19,%ymm12,%ymm2
7497bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm5,%ymm5
7498bc3d5698SJohn Baldwin	vpand	%ymm3,%ymm4,%ymm4
7499bc3d5698SJohn Baldwin
7500bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm11,%ymm7
7501bc3d5698SJohn Baldwin
7502bc3d5698SJohn Baldwin	vpsrld	$22,%ymm12,%ymm1
7503bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7504bc3d5698SJohn Baldwin
7505bc3d5698SJohn Baldwin	vpslld	$10,%ymm12,%ymm2
7506bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm13,%ymm11
7507bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm15,%ymm15
7508bc3d5698SJohn Baldwin
7509bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7510bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7511bc3d5698SJohn Baldwin
7512bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm11,%ymm11
7513bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm11,%ymm11
7514bc3d5698SJohn Baldwin	vmovdqu	448-256-128(%rbx),%ymm5
7515bc3d5698SJohn Baldwin	vpaddd	192-128(%rax),%ymm6,%ymm6
7516bc3d5698SJohn Baldwin
7517bc3d5698SJohn Baldwin	vpsrld	$3,%ymm5,%ymm7
7518bc3d5698SJohn Baldwin	vpsrld	$7,%ymm5,%ymm1
7519bc3d5698SJohn Baldwin	vpslld	$25,%ymm5,%ymm2
7520bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7521bc3d5698SJohn Baldwin	vpsrld	$18,%ymm5,%ymm1
7522bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7523bc3d5698SJohn Baldwin	vpslld	$14,%ymm5,%ymm2
7524bc3d5698SJohn Baldwin	vmovdqu	352-256-128(%rbx),%ymm0
7525bc3d5698SJohn Baldwin	vpsrld	$10,%ymm0,%ymm4
7526bc3d5698SJohn Baldwin
7527bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7528bc3d5698SJohn Baldwin	vpsrld	$17,%ymm0,%ymm1
7529bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7530bc3d5698SJohn Baldwin	vpslld	$15,%ymm0,%ymm2
7531bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm6,%ymm6
7532bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm4,%ymm7
7533bc3d5698SJohn Baldwin	vpsrld	$19,%ymm0,%ymm1
7534bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7535bc3d5698SJohn Baldwin	vpslld	$13,%ymm0,%ymm2
7536bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7537bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7538bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm6,%ymm6
7539bc3d5698SJohn Baldwin	vpsrld	$6,%ymm15,%ymm7
7540bc3d5698SJohn Baldwin	vpslld	$26,%ymm15,%ymm2
7541bc3d5698SJohn Baldwin	vmovdqu	%ymm6,416-256-128(%rbx)
7542bc3d5698SJohn Baldwin	vpaddd	%ymm10,%ymm6,%ymm6
7543bc3d5698SJohn Baldwin
7544bc3d5698SJohn Baldwin	vpsrld	$11,%ymm15,%ymm1
7545bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7546bc3d5698SJohn Baldwin	vpslld	$21,%ymm15,%ymm2
7547bc3d5698SJohn Baldwin	vpaddd	32(%rbp),%ymm6,%ymm6
7548bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7549bc3d5698SJohn Baldwin
7550bc3d5698SJohn Baldwin	vpsrld	$25,%ymm15,%ymm1
7551bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7552bc3d5698SJohn Baldwin
7553bc3d5698SJohn Baldwin	vpslld	$7,%ymm15,%ymm2
7554bc3d5698SJohn Baldwin	vpandn	%ymm9,%ymm15,%ymm0
7555bc3d5698SJohn Baldwin	vpand	%ymm8,%ymm15,%ymm4
7556bc3d5698SJohn Baldwin
7557bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7558bc3d5698SJohn Baldwin
7559bc3d5698SJohn Baldwin	vpsrld	$2,%ymm11,%ymm10
7560bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7561bc3d5698SJohn Baldwin
7562bc3d5698SJohn Baldwin	vpslld	$30,%ymm11,%ymm1
7563bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm0,%ymm0
7564bc3d5698SJohn Baldwin	vpxor	%ymm11,%ymm12,%ymm4
7565bc3d5698SJohn Baldwin
7566bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm10,%ymm10
7567bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm6,%ymm6
7568bc3d5698SJohn Baldwin
7569bc3d5698SJohn Baldwin	vpsrld	$13,%ymm11,%ymm1
7570bc3d5698SJohn Baldwin
7571bc3d5698SJohn Baldwin	vpslld	$19,%ymm11,%ymm2
7572bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm6,%ymm6
7573bc3d5698SJohn Baldwin	vpand	%ymm4,%ymm3,%ymm3
7574bc3d5698SJohn Baldwin
7575bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm10,%ymm7
7576bc3d5698SJohn Baldwin
7577bc3d5698SJohn Baldwin	vpsrld	$22,%ymm11,%ymm1
7578bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7579bc3d5698SJohn Baldwin
7580bc3d5698SJohn Baldwin	vpslld	$10,%ymm11,%ymm2
7581bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm12,%ymm10
7582bc3d5698SJohn Baldwin	vpaddd	%ymm6,%ymm14,%ymm14
7583bc3d5698SJohn Baldwin
7584bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7585bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7586bc3d5698SJohn Baldwin
7587bc3d5698SJohn Baldwin	vpaddd	%ymm6,%ymm10,%ymm10
7588bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm10,%ymm10
7589bc3d5698SJohn Baldwin	vmovdqu	480-256-128(%rbx),%ymm6
7590bc3d5698SJohn Baldwin	vpaddd	224-128(%rax),%ymm5,%ymm5
7591bc3d5698SJohn Baldwin
7592bc3d5698SJohn Baldwin	vpsrld	$3,%ymm6,%ymm7
7593bc3d5698SJohn Baldwin	vpsrld	$7,%ymm6,%ymm1
7594bc3d5698SJohn Baldwin	vpslld	$25,%ymm6,%ymm2
7595bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7596bc3d5698SJohn Baldwin	vpsrld	$18,%ymm6,%ymm1
7597bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7598bc3d5698SJohn Baldwin	vpslld	$14,%ymm6,%ymm2
7599bc3d5698SJohn Baldwin	vmovdqu	384-256-128(%rbx),%ymm0
7600bc3d5698SJohn Baldwin	vpsrld	$10,%ymm0,%ymm3
7601bc3d5698SJohn Baldwin
7602bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7603bc3d5698SJohn Baldwin	vpsrld	$17,%ymm0,%ymm1
7604bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7605bc3d5698SJohn Baldwin	vpslld	$15,%ymm0,%ymm2
7606bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
7607bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm3,%ymm7
7608bc3d5698SJohn Baldwin	vpsrld	$19,%ymm0,%ymm1
7609bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7610bc3d5698SJohn Baldwin	vpslld	$13,%ymm0,%ymm2
7611bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7612bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7613bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
7614bc3d5698SJohn Baldwin	vpsrld	$6,%ymm14,%ymm7
7615bc3d5698SJohn Baldwin	vpslld	$26,%ymm14,%ymm2
7616bc3d5698SJohn Baldwin	vmovdqu	%ymm5,448-256-128(%rbx)
7617bc3d5698SJohn Baldwin	vpaddd	%ymm9,%ymm5,%ymm5
7618bc3d5698SJohn Baldwin
7619bc3d5698SJohn Baldwin	vpsrld	$11,%ymm14,%ymm1
7620bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7621bc3d5698SJohn Baldwin	vpslld	$21,%ymm14,%ymm2
7622bc3d5698SJohn Baldwin	vpaddd	64(%rbp),%ymm5,%ymm5
7623bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7624bc3d5698SJohn Baldwin
7625bc3d5698SJohn Baldwin	vpsrld	$25,%ymm14,%ymm1
7626bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7627bc3d5698SJohn Baldwin
7628bc3d5698SJohn Baldwin	vpslld	$7,%ymm14,%ymm2
7629bc3d5698SJohn Baldwin	vpandn	%ymm8,%ymm14,%ymm0
7630bc3d5698SJohn Baldwin	vpand	%ymm15,%ymm14,%ymm3
7631bc3d5698SJohn Baldwin
7632bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7633bc3d5698SJohn Baldwin
7634bc3d5698SJohn Baldwin	vpsrld	$2,%ymm10,%ymm9
7635bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7636bc3d5698SJohn Baldwin
7637bc3d5698SJohn Baldwin	vpslld	$30,%ymm10,%ymm1
7638bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm0,%ymm0
7639bc3d5698SJohn Baldwin	vpxor	%ymm10,%ymm11,%ymm3
7640bc3d5698SJohn Baldwin
7641bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm9,%ymm9
7642bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm5,%ymm5
7643bc3d5698SJohn Baldwin
7644bc3d5698SJohn Baldwin	vpsrld	$13,%ymm10,%ymm1
7645bc3d5698SJohn Baldwin
7646bc3d5698SJohn Baldwin	vpslld	$19,%ymm10,%ymm2
7647bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm5,%ymm5
7648bc3d5698SJohn Baldwin	vpand	%ymm3,%ymm4,%ymm4
7649bc3d5698SJohn Baldwin
7650bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm9,%ymm7
7651bc3d5698SJohn Baldwin
7652bc3d5698SJohn Baldwin	vpsrld	$22,%ymm10,%ymm1
7653bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7654bc3d5698SJohn Baldwin
7655bc3d5698SJohn Baldwin	vpslld	$10,%ymm10,%ymm2
7656bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm11,%ymm9
7657bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm13,%ymm13
7658bc3d5698SJohn Baldwin
7659bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7660bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7661bc3d5698SJohn Baldwin
7662bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm9,%ymm9
7663bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm9,%ymm9
7664bc3d5698SJohn Baldwin	vmovdqu	0-128(%rax),%ymm5
7665bc3d5698SJohn Baldwin	vpaddd	256-256-128(%rbx),%ymm6,%ymm6
7666bc3d5698SJohn Baldwin
7667bc3d5698SJohn Baldwin	vpsrld	$3,%ymm5,%ymm7
7668bc3d5698SJohn Baldwin	vpsrld	$7,%ymm5,%ymm1
7669bc3d5698SJohn Baldwin	vpslld	$25,%ymm5,%ymm2
7670bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7671bc3d5698SJohn Baldwin	vpsrld	$18,%ymm5,%ymm1
7672bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7673bc3d5698SJohn Baldwin	vpslld	$14,%ymm5,%ymm2
7674bc3d5698SJohn Baldwin	vmovdqu	416-256-128(%rbx),%ymm0
7675bc3d5698SJohn Baldwin	vpsrld	$10,%ymm0,%ymm4
7676bc3d5698SJohn Baldwin
7677bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7678bc3d5698SJohn Baldwin	vpsrld	$17,%ymm0,%ymm1
7679bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7680bc3d5698SJohn Baldwin	vpslld	$15,%ymm0,%ymm2
7681bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm6,%ymm6
7682bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm4,%ymm7
7683bc3d5698SJohn Baldwin	vpsrld	$19,%ymm0,%ymm1
7684bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7685bc3d5698SJohn Baldwin	vpslld	$13,%ymm0,%ymm2
7686bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7687bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7688bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm6,%ymm6
7689bc3d5698SJohn Baldwin	vpsrld	$6,%ymm13,%ymm7
7690bc3d5698SJohn Baldwin	vpslld	$26,%ymm13,%ymm2
7691bc3d5698SJohn Baldwin	vmovdqu	%ymm6,480-256-128(%rbx)
7692bc3d5698SJohn Baldwin	vpaddd	%ymm8,%ymm6,%ymm6
7693bc3d5698SJohn Baldwin
7694bc3d5698SJohn Baldwin	vpsrld	$11,%ymm13,%ymm1
7695bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7696bc3d5698SJohn Baldwin	vpslld	$21,%ymm13,%ymm2
7697bc3d5698SJohn Baldwin	vpaddd	96(%rbp),%ymm6,%ymm6
7698bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7699bc3d5698SJohn Baldwin
7700bc3d5698SJohn Baldwin	vpsrld	$25,%ymm13,%ymm1
7701bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7702bc3d5698SJohn Baldwin
7703bc3d5698SJohn Baldwin	vpslld	$7,%ymm13,%ymm2
7704bc3d5698SJohn Baldwin	vpandn	%ymm15,%ymm13,%ymm0
7705bc3d5698SJohn Baldwin	vpand	%ymm14,%ymm13,%ymm4
7706bc3d5698SJohn Baldwin
7707bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7708bc3d5698SJohn Baldwin
7709bc3d5698SJohn Baldwin	vpsrld	$2,%ymm9,%ymm8
7710bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7711bc3d5698SJohn Baldwin
7712bc3d5698SJohn Baldwin	vpslld	$30,%ymm9,%ymm1
7713bc3d5698SJohn Baldwin	vpxor	%ymm4,%ymm0,%ymm0
7714bc3d5698SJohn Baldwin	vpxor	%ymm9,%ymm10,%ymm4
7715bc3d5698SJohn Baldwin
7716bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm8,%ymm8
7717bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm6,%ymm6
7718bc3d5698SJohn Baldwin
7719bc3d5698SJohn Baldwin	vpsrld	$13,%ymm9,%ymm1
7720bc3d5698SJohn Baldwin
7721bc3d5698SJohn Baldwin	vpslld	$19,%ymm9,%ymm2
7722bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm6,%ymm6
7723bc3d5698SJohn Baldwin	vpand	%ymm4,%ymm3,%ymm3
7724bc3d5698SJohn Baldwin
7725bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm8,%ymm7
7726bc3d5698SJohn Baldwin
7727bc3d5698SJohn Baldwin	vpsrld	$22,%ymm9,%ymm1
7728bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7729bc3d5698SJohn Baldwin
7730bc3d5698SJohn Baldwin	vpslld	$10,%ymm9,%ymm2
7731bc3d5698SJohn Baldwin	vpxor	%ymm3,%ymm10,%ymm8
7732bc3d5698SJohn Baldwin	vpaddd	%ymm6,%ymm12,%ymm12
7733bc3d5698SJohn Baldwin
7734bc3d5698SJohn Baldwin	vpxor	%ymm1,%ymm7,%ymm7
7735bc3d5698SJohn Baldwin	vpxor	%ymm2,%ymm7,%ymm7
7736bc3d5698SJohn Baldwin
7737bc3d5698SJohn Baldwin	vpaddd	%ymm6,%ymm8,%ymm8
7738bc3d5698SJohn Baldwin	vpaddd	%ymm7,%ymm8,%ymm8
7739bc3d5698SJohn Baldwin	addq	$256,%rbp
7740bc3d5698SJohn Baldwin	decl	%ecx
7741bc3d5698SJohn Baldwin	jnz	.Loop_16_xx_avx2
7742bc3d5698SJohn Baldwin
7743bc3d5698SJohn Baldwin	movl	$1,%ecx
7744bc3d5698SJohn Baldwin	leaq	512(%rsp),%rbx
7745bc3d5698SJohn Baldwin	leaq	K256+128(%rip),%rbp
7746bc3d5698SJohn Baldwin	cmpl	0(%rbx),%ecx
7747bc3d5698SJohn Baldwin	cmovgeq	%rbp,%r12
7748bc3d5698SJohn Baldwin	cmpl	4(%rbx),%ecx
7749bc3d5698SJohn Baldwin	cmovgeq	%rbp,%r13
7750bc3d5698SJohn Baldwin	cmpl	8(%rbx),%ecx
7751bc3d5698SJohn Baldwin	cmovgeq	%rbp,%r14
7752bc3d5698SJohn Baldwin	cmpl	12(%rbx),%ecx
7753bc3d5698SJohn Baldwin	cmovgeq	%rbp,%r15
7754bc3d5698SJohn Baldwin	cmpl	16(%rbx),%ecx
7755bc3d5698SJohn Baldwin	cmovgeq	%rbp,%r8
7756bc3d5698SJohn Baldwin	cmpl	20(%rbx),%ecx
7757bc3d5698SJohn Baldwin	cmovgeq	%rbp,%r9
7758bc3d5698SJohn Baldwin	cmpl	24(%rbx),%ecx
7759bc3d5698SJohn Baldwin	cmovgeq	%rbp,%r10
7760bc3d5698SJohn Baldwin	cmpl	28(%rbx),%ecx
7761bc3d5698SJohn Baldwin	cmovgeq	%rbp,%r11
7762bc3d5698SJohn Baldwin	vmovdqa	(%rbx),%ymm7
7763bc3d5698SJohn Baldwin	vpxor	%ymm0,%ymm0,%ymm0
7764bc3d5698SJohn Baldwin	vmovdqa	%ymm7,%ymm6
7765bc3d5698SJohn Baldwin	vpcmpgtd	%ymm0,%ymm6,%ymm6
7766bc3d5698SJohn Baldwin	vpaddd	%ymm6,%ymm7,%ymm7
7767bc3d5698SJohn Baldwin
7768bc3d5698SJohn Baldwin	vmovdqu	0-128(%rdi),%ymm0
7769bc3d5698SJohn Baldwin	vpand	%ymm6,%ymm8,%ymm8
7770bc3d5698SJohn Baldwin	vmovdqu	32-128(%rdi),%ymm1
7771bc3d5698SJohn Baldwin	vpand	%ymm6,%ymm9,%ymm9
7772bc3d5698SJohn Baldwin	vmovdqu	64-128(%rdi),%ymm2
7773bc3d5698SJohn Baldwin	vpand	%ymm6,%ymm10,%ymm10
7774bc3d5698SJohn Baldwin	vmovdqu	96-128(%rdi),%ymm5
7775bc3d5698SJohn Baldwin	vpand	%ymm6,%ymm11,%ymm11
7776bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm8,%ymm8
7777bc3d5698SJohn Baldwin	vmovdqu	128-128(%rdi),%ymm0
7778bc3d5698SJohn Baldwin	vpand	%ymm6,%ymm12,%ymm12
7779bc3d5698SJohn Baldwin	vpaddd	%ymm1,%ymm9,%ymm9
7780bc3d5698SJohn Baldwin	vmovdqu	160-128(%rdi),%ymm1
7781bc3d5698SJohn Baldwin	vpand	%ymm6,%ymm13,%ymm13
7782bc3d5698SJohn Baldwin	vpaddd	%ymm2,%ymm10,%ymm10
7783bc3d5698SJohn Baldwin	vmovdqu	192-128(%rdi),%ymm2
7784bc3d5698SJohn Baldwin	vpand	%ymm6,%ymm14,%ymm14
7785bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm11,%ymm11
7786bc3d5698SJohn Baldwin	vmovdqu	224-128(%rdi),%ymm5
7787bc3d5698SJohn Baldwin	vpand	%ymm6,%ymm15,%ymm15
7788bc3d5698SJohn Baldwin	vpaddd	%ymm0,%ymm12,%ymm12
7789bc3d5698SJohn Baldwin	vpaddd	%ymm1,%ymm13,%ymm13
7790bc3d5698SJohn Baldwin	vmovdqu	%ymm8,0-128(%rdi)
7791bc3d5698SJohn Baldwin	vpaddd	%ymm2,%ymm14,%ymm14
7792bc3d5698SJohn Baldwin	vmovdqu	%ymm9,32-128(%rdi)
7793bc3d5698SJohn Baldwin	vpaddd	%ymm5,%ymm15,%ymm15
7794bc3d5698SJohn Baldwin	vmovdqu	%ymm10,64-128(%rdi)
7795bc3d5698SJohn Baldwin	vmovdqu	%ymm11,96-128(%rdi)
7796bc3d5698SJohn Baldwin	vmovdqu	%ymm12,128-128(%rdi)
7797bc3d5698SJohn Baldwin	vmovdqu	%ymm13,160-128(%rdi)
7798bc3d5698SJohn Baldwin	vmovdqu	%ymm14,192-128(%rdi)
7799bc3d5698SJohn Baldwin	vmovdqu	%ymm15,224-128(%rdi)
7800bc3d5698SJohn Baldwin
7801bc3d5698SJohn Baldwin	vmovdqu	%ymm7,(%rbx)
7802bc3d5698SJohn Baldwin	leaq	256+128(%rsp),%rbx
7803bc3d5698SJohn Baldwin	vmovdqu	.Lpbswap(%rip),%ymm6
7804bc3d5698SJohn Baldwin	decl	%edx
7805bc3d5698SJohn Baldwin	jnz	.Loop_avx2
7806bc3d5698SJohn Baldwin
7807bc3d5698SJohn Baldwin
7808bc3d5698SJohn Baldwin
7809bc3d5698SJohn Baldwin
7810bc3d5698SJohn Baldwin
7811bc3d5698SJohn Baldwin
7812bc3d5698SJohn Baldwin
7813bc3d5698SJohn Baldwin.Ldone_avx2:
7814bc3d5698SJohn Baldwin	movq	544(%rsp),%rax
7815bc3d5698SJohn Baldwin.cfi_def_cfa	%rax,8
7816bc3d5698SJohn Baldwin	vzeroupper
7817bc3d5698SJohn Baldwin	movq	-48(%rax),%r15
7818bc3d5698SJohn Baldwin.cfi_restore	%r15
7819bc3d5698SJohn Baldwin	movq	-40(%rax),%r14
7820bc3d5698SJohn Baldwin.cfi_restore	%r14
7821bc3d5698SJohn Baldwin	movq	-32(%rax),%r13
7822bc3d5698SJohn Baldwin.cfi_restore	%r13
7823bc3d5698SJohn Baldwin	movq	-24(%rax),%r12
7824bc3d5698SJohn Baldwin.cfi_restore	%r12
7825bc3d5698SJohn Baldwin	movq	-16(%rax),%rbp
7826bc3d5698SJohn Baldwin.cfi_restore	%rbp
7827bc3d5698SJohn Baldwin	movq	-8(%rax),%rbx
7828bc3d5698SJohn Baldwin.cfi_restore	%rbx
7829bc3d5698SJohn Baldwin	leaq	(%rax),%rsp
7830bc3d5698SJohn Baldwin.cfi_def_cfa_register	%rsp
7831bc3d5698SJohn Baldwin.Lepilogue_avx2:
7832bc3d5698SJohn Baldwin	.byte	0xf3,0xc3
7833bc3d5698SJohn Baldwin.cfi_endproc
7834bc3d5698SJohn Baldwin.size	sha256_multi_block_avx2,.-sha256_multi_block_avx2
/*
 * K256: table of 64 32-bit constants for the multi-buffer SHA-256 code.
 *
 * Each constant is written eight times in a row (two .long rows of four),
 * so every constant fills one 32-byte slot and can be used directly as a
 * ymm memory operand; the whole table is 64 * 32 = 2048 bytes.
 *
 * The values are the same constants that K256_shaext lists in hex
 * (e.g. 1116352408 = 0x428a2f98, 1899447441 = 0x71374491), here in decimal
 * and replicated per lane.
 *
 * The round code points %rbp at K256+128 and reads slots at 32-byte
 * displacements from it (e.g. -64(%rbp) ... 96(%rbp)), advancing %rbp by
 * 256 with addq; the layout and order of the rows must therefore not change.
 *
 * .align 256 requests a 256-byte boundary for the start of the table.
 */
7835bc3d5698SJohn Baldwin.align	256
7836bc3d5698SJohn BaldwinK256:
/* constants 0..15 */
7837bc3d5698SJohn Baldwin.long	1116352408,1116352408,1116352408,1116352408
7838bc3d5698SJohn Baldwin.long	1116352408,1116352408,1116352408,1116352408
7839bc3d5698SJohn Baldwin.long	1899447441,1899447441,1899447441,1899447441
7840bc3d5698SJohn Baldwin.long	1899447441,1899447441,1899447441,1899447441
7841bc3d5698SJohn Baldwin.long	3049323471,3049323471,3049323471,3049323471
7842bc3d5698SJohn Baldwin.long	3049323471,3049323471,3049323471,3049323471
7843bc3d5698SJohn Baldwin.long	3921009573,3921009573,3921009573,3921009573
7844bc3d5698SJohn Baldwin.long	3921009573,3921009573,3921009573,3921009573
7845bc3d5698SJohn Baldwin.long	961987163,961987163,961987163,961987163
7846bc3d5698SJohn Baldwin.long	961987163,961987163,961987163,961987163
7847bc3d5698SJohn Baldwin.long	1508970993,1508970993,1508970993,1508970993
7848bc3d5698SJohn Baldwin.long	1508970993,1508970993,1508970993,1508970993
7849bc3d5698SJohn Baldwin.long	2453635748,2453635748,2453635748,2453635748
7850bc3d5698SJohn Baldwin.long	2453635748,2453635748,2453635748,2453635748
7851bc3d5698SJohn Baldwin.long	2870763221,2870763221,2870763221,2870763221
7852bc3d5698SJohn Baldwin.long	2870763221,2870763221,2870763221,2870763221
7853bc3d5698SJohn Baldwin.long	3624381080,3624381080,3624381080,3624381080
7854bc3d5698SJohn Baldwin.long	3624381080,3624381080,3624381080,3624381080
7855bc3d5698SJohn Baldwin.long	310598401,310598401,310598401,310598401
7856bc3d5698SJohn Baldwin.long	310598401,310598401,310598401,310598401
7857bc3d5698SJohn Baldwin.long	607225278,607225278,607225278,607225278
7858bc3d5698SJohn Baldwin.long	607225278,607225278,607225278,607225278
7859bc3d5698SJohn Baldwin.long	1426881987,1426881987,1426881987,1426881987
7860bc3d5698SJohn Baldwin.long	1426881987,1426881987,1426881987,1426881987
7861bc3d5698SJohn Baldwin.long	1925078388,1925078388,1925078388,1925078388
7862bc3d5698SJohn Baldwin.long	1925078388,1925078388,1925078388,1925078388
7863bc3d5698SJohn Baldwin.long	2162078206,2162078206,2162078206,2162078206
7864bc3d5698SJohn Baldwin.long	2162078206,2162078206,2162078206,2162078206
7865bc3d5698SJohn Baldwin.long	2614888103,2614888103,2614888103,2614888103
7866bc3d5698SJohn Baldwin.long	2614888103,2614888103,2614888103,2614888103
7867bc3d5698SJohn Baldwin.long	3248222580,3248222580,3248222580,3248222580
7868bc3d5698SJohn Baldwin.long	3248222580,3248222580,3248222580,3248222580
/* constants 16..31 */
7869bc3d5698SJohn Baldwin.long	3835390401,3835390401,3835390401,3835390401
7870bc3d5698SJohn Baldwin.long	3835390401,3835390401,3835390401,3835390401
7871bc3d5698SJohn Baldwin.long	4022224774,4022224774,4022224774,4022224774
7872bc3d5698SJohn Baldwin.long	4022224774,4022224774,4022224774,4022224774
7873bc3d5698SJohn Baldwin.long	264347078,264347078,264347078,264347078
7874bc3d5698SJohn Baldwin.long	264347078,264347078,264347078,264347078
7875bc3d5698SJohn Baldwin.long	604807628,604807628,604807628,604807628
7876bc3d5698SJohn Baldwin.long	604807628,604807628,604807628,604807628
7877bc3d5698SJohn Baldwin.long	770255983,770255983,770255983,770255983
7878bc3d5698SJohn Baldwin.long	770255983,770255983,770255983,770255983
7879bc3d5698SJohn Baldwin.long	1249150122,1249150122,1249150122,1249150122
7880bc3d5698SJohn Baldwin.long	1249150122,1249150122,1249150122,1249150122
7881bc3d5698SJohn Baldwin.long	1555081692,1555081692,1555081692,1555081692
7882bc3d5698SJohn Baldwin.long	1555081692,1555081692,1555081692,1555081692
7883bc3d5698SJohn Baldwin.long	1996064986,1996064986,1996064986,1996064986
7884bc3d5698SJohn Baldwin.long	1996064986,1996064986,1996064986,1996064986
7885bc3d5698SJohn Baldwin.long	2554220882,2554220882,2554220882,2554220882
7886bc3d5698SJohn Baldwin.long	2554220882,2554220882,2554220882,2554220882
7887bc3d5698SJohn Baldwin.long	2821834349,2821834349,2821834349,2821834349
7888bc3d5698SJohn Baldwin.long	2821834349,2821834349,2821834349,2821834349
7889bc3d5698SJohn Baldwin.long	2952996808,2952996808,2952996808,2952996808
7890bc3d5698SJohn Baldwin.long	2952996808,2952996808,2952996808,2952996808
7891bc3d5698SJohn Baldwin.long	3210313671,3210313671,3210313671,3210313671
7892bc3d5698SJohn Baldwin.long	3210313671,3210313671,3210313671,3210313671
7893bc3d5698SJohn Baldwin.long	3336571891,3336571891,3336571891,3336571891
7894bc3d5698SJohn Baldwin.long	3336571891,3336571891,3336571891,3336571891
7895bc3d5698SJohn Baldwin.long	3584528711,3584528711,3584528711,3584528711
7896bc3d5698SJohn Baldwin.long	3584528711,3584528711,3584528711,3584528711
7897bc3d5698SJohn Baldwin.long	113926993,113926993,113926993,113926993
7898bc3d5698SJohn Baldwin.long	113926993,113926993,113926993,113926993
7899bc3d5698SJohn Baldwin.long	338241895,338241895,338241895,338241895
7900bc3d5698SJohn Baldwin.long	338241895,338241895,338241895,338241895
/* constants 32..47 */
7901bc3d5698SJohn Baldwin.long	666307205,666307205,666307205,666307205
7902bc3d5698SJohn Baldwin.long	666307205,666307205,666307205,666307205
7903bc3d5698SJohn Baldwin.long	773529912,773529912,773529912,773529912
7904bc3d5698SJohn Baldwin.long	773529912,773529912,773529912,773529912
7905bc3d5698SJohn Baldwin.long	1294757372,1294757372,1294757372,1294757372
7906bc3d5698SJohn Baldwin.long	1294757372,1294757372,1294757372,1294757372
7907bc3d5698SJohn Baldwin.long	1396182291,1396182291,1396182291,1396182291
7908bc3d5698SJohn Baldwin.long	1396182291,1396182291,1396182291,1396182291
7909bc3d5698SJohn Baldwin.long	1695183700,1695183700,1695183700,1695183700
7910bc3d5698SJohn Baldwin.long	1695183700,1695183700,1695183700,1695183700
7911bc3d5698SJohn Baldwin.long	1986661051,1986661051,1986661051,1986661051
7912bc3d5698SJohn Baldwin.long	1986661051,1986661051,1986661051,1986661051
7913bc3d5698SJohn Baldwin.long	2177026350,2177026350,2177026350,2177026350
7914bc3d5698SJohn Baldwin.long	2177026350,2177026350,2177026350,2177026350
7915bc3d5698SJohn Baldwin.long	2456956037,2456956037,2456956037,2456956037
7916bc3d5698SJohn Baldwin.long	2456956037,2456956037,2456956037,2456956037
7917bc3d5698SJohn Baldwin.long	2730485921,2730485921,2730485921,2730485921
7918bc3d5698SJohn Baldwin.long	2730485921,2730485921,2730485921,2730485921
7919bc3d5698SJohn Baldwin.long	2820302411,2820302411,2820302411,2820302411
7920bc3d5698SJohn Baldwin.long	2820302411,2820302411,2820302411,2820302411
7921bc3d5698SJohn Baldwin.long	3259730800,3259730800,3259730800,3259730800
7922bc3d5698SJohn Baldwin.long	3259730800,3259730800,3259730800,3259730800
7923bc3d5698SJohn Baldwin.long	3345764771,3345764771,3345764771,3345764771
7924bc3d5698SJohn Baldwin.long	3345764771,3345764771,3345764771,3345764771
7925bc3d5698SJohn Baldwin.long	3516065817,3516065817,3516065817,3516065817
7926bc3d5698SJohn Baldwin.long	3516065817,3516065817,3516065817,3516065817
7927bc3d5698SJohn Baldwin.long	3600352804,3600352804,3600352804,3600352804
7928bc3d5698SJohn Baldwin.long	3600352804,3600352804,3600352804,3600352804
7929bc3d5698SJohn Baldwin.long	4094571909,4094571909,4094571909,4094571909
7930bc3d5698SJohn Baldwin.long	4094571909,4094571909,4094571909,4094571909
7931bc3d5698SJohn Baldwin.long	275423344,275423344,275423344,275423344
7932bc3d5698SJohn Baldwin.long	275423344,275423344,275423344,275423344
/* constants 48..63 */
7933bc3d5698SJohn Baldwin.long	430227734,430227734,430227734,430227734
7934bc3d5698SJohn Baldwin.long	430227734,430227734,430227734,430227734
7935bc3d5698SJohn Baldwin.long	506948616,506948616,506948616,506948616
7936bc3d5698SJohn Baldwin.long	506948616,506948616,506948616,506948616
7937bc3d5698SJohn Baldwin.long	659060556,659060556,659060556,659060556
7938bc3d5698SJohn Baldwin.long	659060556,659060556,659060556,659060556
7939bc3d5698SJohn Baldwin.long	883997877,883997877,883997877,883997877
7940bc3d5698SJohn Baldwin.long	883997877,883997877,883997877,883997877
7941bc3d5698SJohn Baldwin.long	958139571,958139571,958139571,958139571
7942bc3d5698SJohn Baldwin.long	958139571,958139571,958139571,958139571
7943bc3d5698SJohn Baldwin.long	1322822218,1322822218,1322822218,1322822218
7944bc3d5698SJohn Baldwin.long	1322822218,1322822218,1322822218,1322822218
7945bc3d5698SJohn Baldwin.long	1537002063,1537002063,1537002063,1537002063
7946bc3d5698SJohn Baldwin.long	1537002063,1537002063,1537002063,1537002063
7947bc3d5698SJohn Baldwin.long	1747873779,1747873779,1747873779,1747873779
7948bc3d5698SJohn Baldwin.long	1747873779,1747873779,1747873779,1747873779
7949bc3d5698SJohn Baldwin.long	1955562222,1955562222,1955562222,1955562222
7950bc3d5698SJohn Baldwin.long	1955562222,1955562222,1955562222,1955562222
7951bc3d5698SJohn Baldwin.long	2024104815,2024104815,2024104815,2024104815
7952bc3d5698SJohn Baldwin.long	2024104815,2024104815,2024104815,2024104815
7953bc3d5698SJohn Baldwin.long	2227730452,2227730452,2227730452,2227730452
7954bc3d5698SJohn Baldwin.long	2227730452,2227730452,2227730452,2227730452
7955bc3d5698SJohn Baldwin.long	2361852424,2361852424,2361852424,2361852424
7956bc3d5698SJohn Baldwin.long	2361852424,2361852424,2361852424,2361852424
7957bc3d5698SJohn Baldwin.long	2428436474,2428436474,2428436474,2428436474
7958bc3d5698SJohn Baldwin.long	2428436474,2428436474,2428436474,2428436474
7959bc3d5698SJohn Baldwin.long	2756734187,2756734187,2756734187,2756734187
7960bc3d5698SJohn Baldwin.long	2756734187,2756734187,2756734187,2756734187
7961bc3d5698SJohn Baldwin.long	3204031479,3204031479,3204031479,3204031479
7962bc3d5698SJohn Baldwin.long	3204031479,3204031479,3204031479,3204031479
7963bc3d5698SJohn Baldwin.long	3329325298,3329325298,3329325298,3329325298
7964bc3d5698SJohn Baldwin.long	3329325298,3329325298,3329325298,3329325298
/*
 * .Lpbswap: 32 bytes of constant data, written as two identical rows of
 * four 32-bit words.  x86 stores each .long little-endian, so the
 * in-memory byte sequence of one row is
 *     03 02 01 00  07 06 05 04  0b 0a 09 08  0f 0e 0d 0c
 * i.e. the byte indices 0..15 with every group of four reversed.
 * NOTE(review): the label name suggests this is a byte-shuffle mask that
 * byte-swaps each 32-bit word; the instructions that load it are not in
 * this part of the file -- confirm against them.
 */
7965bc3d5698SJohn Baldwin.Lpbswap:
7966bc3d5698SJohn Baldwin.long	0x00010203,0x04050607,0x08090a0b,0x0c0d0e0f
7967bc3d5698SJohn Baldwin.long	0x00010203,0x04050607,0x08090a0b,0x0c0d0e0f
/*
 * K256_shaext: 64 32-bit words (16 rows of four), each value stored
 * exactly once.  The values are the SHA-256 round constants K[0]..K[63]
 * in order (FIPS 180-4, section 4.2.2).  By contrast, the table that
 * ends immediately before .Lpbswap repeats every constant eight times
 * (two rows of four identical words).
 * NOTE(review): going by the label name, this compact copy is presumably
 * the one read by the SHA-extension code path; the code that references
 * it is outside this part of the file -- confirm.
 */
7968bc3d5698SJohn BaldwinK256_shaext:
7969bc3d5698SJohn Baldwin.long	0x428a2f98,0x71374491,0xb5c0fbcf,0xe9b5dba5
7970bc3d5698SJohn Baldwin.long	0x3956c25b,0x59f111f1,0x923f82a4,0xab1c5ed5
7971bc3d5698SJohn Baldwin.long	0xd807aa98,0x12835b01,0x243185be,0x550c7dc3
7972bc3d5698SJohn Baldwin.long	0x72be5d74,0x80deb1fe,0x9bdc06a7,0xc19bf174
7973bc3d5698SJohn Baldwin.long	0xe49b69c1,0xefbe4786,0x0fc19dc6,0x240ca1cc
7974bc3d5698SJohn Baldwin.long	0x2de92c6f,0x4a7484aa,0x5cb0a9dc,0x76f988da
7975bc3d5698SJohn Baldwin.long	0x983e5152,0xa831c66d,0xb00327c8,0xbf597fc7
7976bc3d5698SJohn Baldwin.long	0xc6e00bf3,0xd5a79147,0x06ca6351,0x14292967
7977bc3d5698SJohn Baldwin.long	0x27b70a85,0x2e1b2138,0x4d2c6dfc,0x53380d13
7978bc3d5698SJohn Baldwin.long	0x650a7354,0x766a0abb,0x81c2c92e,0x92722c85
7979bc3d5698SJohn Baldwin.long	0xa2bfe8a1,0xa81a664b,0xc24b8b70,0xc76c51a3
7980bc3d5698SJohn Baldwin.long	0xd192e819,0xd6990624,0xf40e3585,0x106aa070
7981bc3d5698SJohn Baldwin.long	0x19a4c116,0x1e376c08,0x2748774c,0x34b0bcb5
7982bc3d5698SJohn Baldwin.long	0x391c0cb3,0x4ed8aa4a,0x5b9cca4f,0x682e6ff3
7983bc3d5698SJohn Baldwin.long	0x748f82ee,0x78a5636f,0x84c87814,0x8cc70208
7984bc3d5698SJohn Baldwin.long	0x90befffa,0xa4506ceb,0xbef9a3f7,0xc67178f2
/*
 * NUL-terminated ASCII identification string, spelled out as decimal
 * byte values.  Decoded it reads:
 *   "SHA256 multi-block transform for x86_64, CRYPTOGAMS by <appro@openssl.org>"
 * It has no label of its own and simply follows the K256_shaext words.
 */
7985bc3d5698SJohn Baldwin.byte	83,72,65,50,53,54,32,109,117,108,116,105,45,98,108,111,99,107,32,116,114,97,110,115,102,111,114,109,32,102,111,114,32,120,56,54,95,54,52,44,32,67,82,89,80,84,79,71,65,77,83,32,98,121,32,60,97,112,112,114,111,64,111,112,101,110,115,115,108,46,111,114,103,62,0
/*
 * ELF note emitted into the allocatable ("a") section .note.gnu.property.
 * Layout: a three-word note header (name size, descriptor size, type),
 * the name, then a descriptor holding one property record.  The sizes are
 * computed by the assembler from the numeric local labels 0..4 below.
 */
7986*c0855eaaSJohn Baldwin	.section ".note.gnu.property", "a"
/* Start the note on an 8-byte boundary. */
7987*c0855eaaSJohn Baldwin	.p2align 3
/* Name size: distance from label 0 to label 1, i.e. the 4 name bytes. */
7988*c0855eaaSJohn Baldwin	.long 1f - 0f
/*
 * Descriptor size: distance from label 1 to label 4, which covers the
 * property record and the alignment padding that follows it.
 */
7989*c0855eaaSJohn Baldwin	.long 4f - 1f
/* Note type 5 (NT_GNU_PROPERTY_TYPE_0 in the GNU property note scheme). */
7990*c0855eaaSJohn Baldwin	.long 5
7991*c0855eaaSJohn Baldwin0:
7992*c0855eaaSJohn Baldwin	# "GNU" encoded with .byte, since .asciz isn't supported
7993*c0855eaaSJohn Baldwin	# on Solaris.
7994*c0855eaaSJohn Baldwin	.byte 0x47
7995*c0855eaaSJohn Baldwin	.byte 0x4e
7996*c0855eaaSJohn Baldwin	.byte 0x55
7997*c0855eaaSJohn Baldwin	.byte 0
7998*c0855eaaSJohn Baldwin1:
/* Descriptor begins here, again 8-byte aligned. */
7999*c0855eaaSJohn Baldwin	.p2align 3
/* Property type 0xc0000002 (GNU_PROPERTY_X86_FEATURE_1_AND). */
8000*c0855eaaSJohn Baldwin	.long 0xc0000002
/* Property data size: distance from label 2 to label 3 (one .long). */
8001*c0855eaaSJohn Baldwin	.long 3f - 2f
8002*c0855eaaSJohn Baldwin2:
/*
 * Property data: value 3 = bits 0 and 1 set, which for this property
 * type are the IBT and SHSTK (Intel CET) feature flags.
 */
8003*c0855eaaSJohn Baldwin	.long 3
8004*c0855eaaSJohn Baldwin3:
/* Pad the property record out to an 8-byte boundary; label 4 ends the descriptor. */
8005*c0855eaaSJohn Baldwin	.p2align 3
8006*c0855eaaSJohn Baldwin4:
8007