xref: /freebsd/sys/crypto/openssl/amd64/sha256-x86_64.S (revision 4543ef516683042d46f3bd3bb8a4f3f746e00499)
1/* Do not modify. This file is auto-generated from sha512-x86_64.pl. */
2.text
3
4
5.globl	sha256_block_data_order
6.type	sha256_block_data_order,@function
7.align	16
8sha256_block_data_order:
9.cfi_startproc
10	leaq	OPENSSL_ia32cap_P(%rip),%r11
11	movl	0(%r11),%r9d
12	movl	4(%r11),%r10d
13	movl	8(%r11),%r11d
14	testl	$536870912,%r11d
15	jnz	_shaext_shortcut
16	andl	$296,%r11d
17	cmpl	$296,%r11d
18	je	.Lavx2_shortcut
19	andl	$1073741824,%r9d
20	andl	$268435968,%r10d
21	orl	%r9d,%r10d
22	cmpl	$1342177792,%r10d
23	je	.Lavx_shortcut
24	testl	$512,%r10d
25	jnz	.Lssse3_shortcut
26	movq	%rsp,%rax
27.cfi_def_cfa_register	%rax
28	pushq	%rbx
29.cfi_offset	%rbx,-16
30	pushq	%rbp
31.cfi_offset	%rbp,-24
32	pushq	%r12
33.cfi_offset	%r12,-32
34	pushq	%r13
35.cfi_offset	%r13,-40
36	pushq	%r14
37.cfi_offset	%r14,-48
38	pushq	%r15
39.cfi_offset	%r15,-56
40	shlq	$4,%rdx
41	subq	$64+32,%rsp
42	leaq	(%rsi,%rdx,4),%rdx
43	andq	$-64,%rsp
44	movq	%rdi,64+0(%rsp)
45	movq	%rsi,64+8(%rsp)
46	movq	%rdx,64+16(%rsp)
47	movq	%rax,88(%rsp)
48.cfi_escape	0x0f,0x06,0x77,0xd8,0x00,0x06,0x23,0x08
49.Lprologue:
50
51	movl	0(%rdi),%eax
52	movl	4(%rdi),%ebx
53	movl	8(%rdi),%ecx
54	movl	12(%rdi),%edx
55	movl	16(%rdi),%r8d
56	movl	20(%rdi),%r9d
57	movl	24(%rdi),%r10d
58	movl	28(%rdi),%r11d
59	jmp	.Lloop
60
61.align	16
62.Lloop:
63	movl	%ebx,%edi
64	leaq	K256(%rip),%rbp
65	xorl	%ecx,%edi
66	movl	0(%rsi),%r12d
67	movl	%r8d,%r13d
68	movl	%eax,%r14d
69	bswapl	%r12d
70	rorl	$14,%r13d
71	movl	%r9d,%r15d
72
73	xorl	%r8d,%r13d
74	rorl	$9,%r14d
75	xorl	%r10d,%r15d
76
77	movl	%r12d,0(%rsp)
78	xorl	%eax,%r14d
79	andl	%r8d,%r15d
80
81	rorl	$5,%r13d
82	addl	%r11d,%r12d
83	xorl	%r10d,%r15d
84
85	rorl	$11,%r14d
86	xorl	%r8d,%r13d
87	addl	%r15d,%r12d
88
89	movl	%eax,%r15d
90	addl	(%rbp),%r12d
91	xorl	%eax,%r14d
92
93	xorl	%ebx,%r15d
94	rorl	$6,%r13d
95	movl	%ebx,%r11d
96
97	andl	%r15d,%edi
98	rorl	$2,%r14d
99	addl	%r13d,%r12d
100
101	xorl	%edi,%r11d
102	addl	%r12d,%edx
103	addl	%r12d,%r11d
104
105	leaq	4(%rbp),%rbp
106	addl	%r14d,%r11d
107	movl	4(%rsi),%r12d
108	movl	%edx,%r13d
109	movl	%r11d,%r14d
110	bswapl	%r12d
111	rorl	$14,%r13d
112	movl	%r8d,%edi
113
114	xorl	%edx,%r13d
115	rorl	$9,%r14d
116	xorl	%r9d,%edi
117
118	movl	%r12d,4(%rsp)
119	xorl	%r11d,%r14d
120	andl	%edx,%edi
121
122	rorl	$5,%r13d
123	addl	%r10d,%r12d
124	xorl	%r9d,%edi
125
126	rorl	$11,%r14d
127	xorl	%edx,%r13d
128	addl	%edi,%r12d
129
130	movl	%r11d,%edi
131	addl	(%rbp),%r12d
132	xorl	%r11d,%r14d
133
134	xorl	%eax,%edi
135	rorl	$6,%r13d
136	movl	%eax,%r10d
137
138	andl	%edi,%r15d
139	rorl	$2,%r14d
140	addl	%r13d,%r12d
141
142	xorl	%r15d,%r10d
143	addl	%r12d,%ecx
144	addl	%r12d,%r10d
145
146	leaq	4(%rbp),%rbp
147	addl	%r14d,%r10d
148	movl	8(%rsi),%r12d
149	movl	%ecx,%r13d
150	movl	%r10d,%r14d
151	bswapl	%r12d
152	rorl	$14,%r13d
153	movl	%edx,%r15d
154
155	xorl	%ecx,%r13d
156	rorl	$9,%r14d
157	xorl	%r8d,%r15d
158
159	movl	%r12d,8(%rsp)
160	xorl	%r10d,%r14d
161	andl	%ecx,%r15d
162
163	rorl	$5,%r13d
164	addl	%r9d,%r12d
165	xorl	%r8d,%r15d
166
167	rorl	$11,%r14d
168	xorl	%ecx,%r13d
169	addl	%r15d,%r12d
170
171	movl	%r10d,%r15d
172	addl	(%rbp),%r12d
173	xorl	%r10d,%r14d
174
175	xorl	%r11d,%r15d
176	rorl	$6,%r13d
177	movl	%r11d,%r9d
178
179	andl	%r15d,%edi
180	rorl	$2,%r14d
181	addl	%r13d,%r12d
182
183	xorl	%edi,%r9d
184	addl	%r12d,%ebx
185	addl	%r12d,%r9d
186
187	leaq	4(%rbp),%rbp
188	addl	%r14d,%r9d
189	movl	12(%rsi),%r12d
190	movl	%ebx,%r13d
191	movl	%r9d,%r14d
192	bswapl	%r12d
193	rorl	$14,%r13d
194	movl	%ecx,%edi
195
196	xorl	%ebx,%r13d
197	rorl	$9,%r14d
198	xorl	%edx,%edi
199
200	movl	%r12d,12(%rsp)
201	xorl	%r9d,%r14d
202	andl	%ebx,%edi
203
204	rorl	$5,%r13d
205	addl	%r8d,%r12d
206	xorl	%edx,%edi
207
208	rorl	$11,%r14d
209	xorl	%ebx,%r13d
210	addl	%edi,%r12d
211
212	movl	%r9d,%edi
213	addl	(%rbp),%r12d
214	xorl	%r9d,%r14d
215
216	xorl	%r10d,%edi
217	rorl	$6,%r13d
218	movl	%r10d,%r8d
219
220	andl	%edi,%r15d
221	rorl	$2,%r14d
222	addl	%r13d,%r12d
223
224	xorl	%r15d,%r8d
225	addl	%r12d,%eax
226	addl	%r12d,%r8d
227
228	leaq	20(%rbp),%rbp
229	addl	%r14d,%r8d
230	movl	16(%rsi),%r12d
231	movl	%eax,%r13d
232	movl	%r8d,%r14d
233	bswapl	%r12d
234	rorl	$14,%r13d
235	movl	%ebx,%r15d
236
237	xorl	%eax,%r13d
238	rorl	$9,%r14d
239	xorl	%ecx,%r15d
240
241	movl	%r12d,16(%rsp)
242	xorl	%r8d,%r14d
243	andl	%eax,%r15d
244
245	rorl	$5,%r13d
246	addl	%edx,%r12d
247	xorl	%ecx,%r15d
248
249	rorl	$11,%r14d
250	xorl	%eax,%r13d
251	addl	%r15d,%r12d
252
253	movl	%r8d,%r15d
254	addl	(%rbp),%r12d
255	xorl	%r8d,%r14d
256
257	xorl	%r9d,%r15d
258	rorl	$6,%r13d
259	movl	%r9d,%edx
260
261	andl	%r15d,%edi
262	rorl	$2,%r14d
263	addl	%r13d,%r12d
264
265	xorl	%edi,%edx
266	addl	%r12d,%r11d
267	addl	%r12d,%edx
268
269	leaq	4(%rbp),%rbp
270	addl	%r14d,%edx
271	movl	20(%rsi),%r12d
272	movl	%r11d,%r13d
273	movl	%edx,%r14d
274	bswapl	%r12d
275	rorl	$14,%r13d
276	movl	%eax,%edi
277
278	xorl	%r11d,%r13d
279	rorl	$9,%r14d
280	xorl	%ebx,%edi
281
282	movl	%r12d,20(%rsp)
283	xorl	%edx,%r14d
284	andl	%r11d,%edi
285
286	rorl	$5,%r13d
287	addl	%ecx,%r12d
288	xorl	%ebx,%edi
289
290	rorl	$11,%r14d
291	xorl	%r11d,%r13d
292	addl	%edi,%r12d
293
294	movl	%edx,%edi
295	addl	(%rbp),%r12d
296	xorl	%edx,%r14d
297
298	xorl	%r8d,%edi
299	rorl	$6,%r13d
300	movl	%r8d,%ecx
301
302	andl	%edi,%r15d
303	rorl	$2,%r14d
304	addl	%r13d,%r12d
305
306	xorl	%r15d,%ecx
307	addl	%r12d,%r10d
308	addl	%r12d,%ecx
309
310	leaq	4(%rbp),%rbp
311	addl	%r14d,%ecx
312	movl	24(%rsi),%r12d
313	movl	%r10d,%r13d
314	movl	%ecx,%r14d
315	bswapl	%r12d
316	rorl	$14,%r13d
317	movl	%r11d,%r15d
318
319	xorl	%r10d,%r13d
320	rorl	$9,%r14d
321	xorl	%eax,%r15d
322
323	movl	%r12d,24(%rsp)
324	xorl	%ecx,%r14d
325	andl	%r10d,%r15d
326
327	rorl	$5,%r13d
328	addl	%ebx,%r12d
329	xorl	%eax,%r15d
330
331	rorl	$11,%r14d
332	xorl	%r10d,%r13d
333	addl	%r15d,%r12d
334
335	movl	%ecx,%r15d
336	addl	(%rbp),%r12d
337	xorl	%ecx,%r14d
338
339	xorl	%edx,%r15d
340	rorl	$6,%r13d
341	movl	%edx,%ebx
342
343	andl	%r15d,%edi
344	rorl	$2,%r14d
345	addl	%r13d,%r12d
346
347	xorl	%edi,%ebx
348	addl	%r12d,%r9d
349	addl	%r12d,%ebx
350
351	leaq	4(%rbp),%rbp
352	addl	%r14d,%ebx
353	movl	28(%rsi),%r12d
354	movl	%r9d,%r13d
355	movl	%ebx,%r14d
356	bswapl	%r12d
357	rorl	$14,%r13d
358	movl	%r10d,%edi
359
360	xorl	%r9d,%r13d
361	rorl	$9,%r14d
362	xorl	%r11d,%edi
363
364	movl	%r12d,28(%rsp)
365	xorl	%ebx,%r14d
366	andl	%r9d,%edi
367
368	rorl	$5,%r13d
369	addl	%eax,%r12d
370	xorl	%r11d,%edi
371
372	rorl	$11,%r14d
373	xorl	%r9d,%r13d
374	addl	%edi,%r12d
375
376	movl	%ebx,%edi
377	addl	(%rbp),%r12d
378	xorl	%ebx,%r14d
379
380	xorl	%ecx,%edi
381	rorl	$6,%r13d
382	movl	%ecx,%eax
383
384	andl	%edi,%r15d
385	rorl	$2,%r14d
386	addl	%r13d,%r12d
387
388	xorl	%r15d,%eax
389	addl	%r12d,%r8d
390	addl	%r12d,%eax
391
392	leaq	20(%rbp),%rbp
393	addl	%r14d,%eax
394	movl	32(%rsi),%r12d
395	movl	%r8d,%r13d
396	movl	%eax,%r14d
397	bswapl	%r12d
398	rorl	$14,%r13d
399	movl	%r9d,%r15d
400
401	xorl	%r8d,%r13d
402	rorl	$9,%r14d
403	xorl	%r10d,%r15d
404
405	movl	%r12d,32(%rsp)
406	xorl	%eax,%r14d
407	andl	%r8d,%r15d
408
409	rorl	$5,%r13d
410	addl	%r11d,%r12d
411	xorl	%r10d,%r15d
412
413	rorl	$11,%r14d
414	xorl	%r8d,%r13d
415	addl	%r15d,%r12d
416
417	movl	%eax,%r15d
418	addl	(%rbp),%r12d
419	xorl	%eax,%r14d
420
421	xorl	%ebx,%r15d
422	rorl	$6,%r13d
423	movl	%ebx,%r11d
424
425	andl	%r15d,%edi
426	rorl	$2,%r14d
427	addl	%r13d,%r12d
428
429	xorl	%edi,%r11d
430	addl	%r12d,%edx
431	addl	%r12d,%r11d
432
433	leaq	4(%rbp),%rbp
434	addl	%r14d,%r11d
435	movl	36(%rsi),%r12d
436	movl	%edx,%r13d
437	movl	%r11d,%r14d
438	bswapl	%r12d
439	rorl	$14,%r13d
440	movl	%r8d,%edi
441
442	xorl	%edx,%r13d
443	rorl	$9,%r14d
444	xorl	%r9d,%edi
445
446	movl	%r12d,36(%rsp)
447	xorl	%r11d,%r14d
448	andl	%edx,%edi
449
450	rorl	$5,%r13d
451	addl	%r10d,%r12d
452	xorl	%r9d,%edi
453
454	rorl	$11,%r14d
455	xorl	%edx,%r13d
456	addl	%edi,%r12d
457
458	movl	%r11d,%edi
459	addl	(%rbp),%r12d
460	xorl	%r11d,%r14d
461
462	xorl	%eax,%edi
463	rorl	$6,%r13d
464	movl	%eax,%r10d
465
466	andl	%edi,%r15d
467	rorl	$2,%r14d
468	addl	%r13d,%r12d
469
470	xorl	%r15d,%r10d
471	addl	%r12d,%ecx
472	addl	%r12d,%r10d
473
474	leaq	4(%rbp),%rbp
475	addl	%r14d,%r10d
476	movl	40(%rsi),%r12d
477	movl	%ecx,%r13d
478	movl	%r10d,%r14d
479	bswapl	%r12d
480	rorl	$14,%r13d
481	movl	%edx,%r15d
482
483	xorl	%ecx,%r13d
484	rorl	$9,%r14d
485	xorl	%r8d,%r15d
486
487	movl	%r12d,40(%rsp)
488	xorl	%r10d,%r14d
489	andl	%ecx,%r15d
490
491	rorl	$5,%r13d
492	addl	%r9d,%r12d
493	xorl	%r8d,%r15d
494
495	rorl	$11,%r14d
496	xorl	%ecx,%r13d
497	addl	%r15d,%r12d
498
499	movl	%r10d,%r15d
500	addl	(%rbp),%r12d
501	xorl	%r10d,%r14d
502
503	xorl	%r11d,%r15d
504	rorl	$6,%r13d
505	movl	%r11d,%r9d
506
507	andl	%r15d,%edi
508	rorl	$2,%r14d
509	addl	%r13d,%r12d
510
511	xorl	%edi,%r9d
512	addl	%r12d,%ebx
513	addl	%r12d,%r9d
514
515	leaq	4(%rbp),%rbp
516	addl	%r14d,%r9d
517	movl	44(%rsi),%r12d
518	movl	%ebx,%r13d
519	movl	%r9d,%r14d
520	bswapl	%r12d
521	rorl	$14,%r13d
522	movl	%ecx,%edi
523
524	xorl	%ebx,%r13d
525	rorl	$9,%r14d
526	xorl	%edx,%edi
527
528	movl	%r12d,44(%rsp)
529	xorl	%r9d,%r14d
530	andl	%ebx,%edi
531
532	rorl	$5,%r13d
533	addl	%r8d,%r12d
534	xorl	%edx,%edi
535
536	rorl	$11,%r14d
537	xorl	%ebx,%r13d
538	addl	%edi,%r12d
539
540	movl	%r9d,%edi
541	addl	(%rbp),%r12d
542	xorl	%r9d,%r14d
543
544	xorl	%r10d,%edi
545	rorl	$6,%r13d
546	movl	%r10d,%r8d
547
548	andl	%edi,%r15d
549	rorl	$2,%r14d
550	addl	%r13d,%r12d
551
552	xorl	%r15d,%r8d
553	addl	%r12d,%eax
554	addl	%r12d,%r8d
555
556	leaq	20(%rbp),%rbp
557	addl	%r14d,%r8d
558	movl	48(%rsi),%r12d
559	movl	%eax,%r13d
560	movl	%r8d,%r14d
561	bswapl	%r12d
562	rorl	$14,%r13d
563	movl	%ebx,%r15d
564
565	xorl	%eax,%r13d
566	rorl	$9,%r14d
567	xorl	%ecx,%r15d
568
569	movl	%r12d,48(%rsp)
570	xorl	%r8d,%r14d
571	andl	%eax,%r15d
572
573	rorl	$5,%r13d
574	addl	%edx,%r12d
575	xorl	%ecx,%r15d
576
577	rorl	$11,%r14d
578	xorl	%eax,%r13d
579	addl	%r15d,%r12d
580
581	movl	%r8d,%r15d
582	addl	(%rbp),%r12d
583	xorl	%r8d,%r14d
584
585	xorl	%r9d,%r15d
586	rorl	$6,%r13d
587	movl	%r9d,%edx
588
589	andl	%r15d,%edi
590	rorl	$2,%r14d
591	addl	%r13d,%r12d
592
593	xorl	%edi,%edx
594	addl	%r12d,%r11d
595	addl	%r12d,%edx
596
597	leaq	4(%rbp),%rbp
598	addl	%r14d,%edx
599	movl	52(%rsi),%r12d
600	movl	%r11d,%r13d
601	movl	%edx,%r14d
602	bswapl	%r12d
603	rorl	$14,%r13d
604	movl	%eax,%edi
605
606	xorl	%r11d,%r13d
607	rorl	$9,%r14d
608	xorl	%ebx,%edi
609
610	movl	%r12d,52(%rsp)
611	xorl	%edx,%r14d
612	andl	%r11d,%edi
613
614	rorl	$5,%r13d
615	addl	%ecx,%r12d
616	xorl	%ebx,%edi
617
618	rorl	$11,%r14d
619	xorl	%r11d,%r13d
620	addl	%edi,%r12d
621
622	movl	%edx,%edi
623	addl	(%rbp),%r12d
624	xorl	%edx,%r14d
625
626	xorl	%r8d,%edi
627	rorl	$6,%r13d
628	movl	%r8d,%ecx
629
630	andl	%edi,%r15d
631	rorl	$2,%r14d
632	addl	%r13d,%r12d
633
634	xorl	%r15d,%ecx
635	addl	%r12d,%r10d
636	addl	%r12d,%ecx
637
638	leaq	4(%rbp),%rbp
639	addl	%r14d,%ecx
640	movl	56(%rsi),%r12d
641	movl	%r10d,%r13d
642	movl	%ecx,%r14d
643	bswapl	%r12d
644	rorl	$14,%r13d
645	movl	%r11d,%r15d
646
647	xorl	%r10d,%r13d
648	rorl	$9,%r14d
649	xorl	%eax,%r15d
650
651	movl	%r12d,56(%rsp)
652	xorl	%ecx,%r14d
653	andl	%r10d,%r15d
654
655	rorl	$5,%r13d
656	addl	%ebx,%r12d
657	xorl	%eax,%r15d
658
659	rorl	$11,%r14d
660	xorl	%r10d,%r13d
661	addl	%r15d,%r12d
662
663	movl	%ecx,%r15d
664	addl	(%rbp),%r12d
665	xorl	%ecx,%r14d
666
667	xorl	%edx,%r15d
668	rorl	$6,%r13d
669	movl	%edx,%ebx
670
671	andl	%r15d,%edi
672	rorl	$2,%r14d
673	addl	%r13d,%r12d
674
675	xorl	%edi,%ebx
676	addl	%r12d,%r9d
677	addl	%r12d,%ebx
678
679	leaq	4(%rbp),%rbp
680	addl	%r14d,%ebx
681	movl	60(%rsi),%r12d
682	movl	%r9d,%r13d
683	movl	%ebx,%r14d
684	bswapl	%r12d
685	rorl	$14,%r13d
686	movl	%r10d,%edi
687
688	xorl	%r9d,%r13d
689	rorl	$9,%r14d
690	xorl	%r11d,%edi
691
692	movl	%r12d,60(%rsp)
693	xorl	%ebx,%r14d
694	andl	%r9d,%edi
695
696	rorl	$5,%r13d
697	addl	%eax,%r12d
698	xorl	%r11d,%edi
699
700	rorl	$11,%r14d
701	xorl	%r9d,%r13d
702	addl	%edi,%r12d
703
704	movl	%ebx,%edi
705	addl	(%rbp),%r12d
706	xorl	%ebx,%r14d
707
708	xorl	%ecx,%edi
709	rorl	$6,%r13d
710	movl	%ecx,%eax
711
712	andl	%edi,%r15d
713	rorl	$2,%r14d
714	addl	%r13d,%r12d
715
716	xorl	%r15d,%eax
717	addl	%r12d,%r8d
718	addl	%r12d,%eax
719
720	leaq	20(%rbp),%rbp
721	jmp	.Lrounds_16_xx
722.align	16
723.Lrounds_16_xx:
724	movl	4(%rsp),%r13d
725	movl	56(%rsp),%r15d
726
727	movl	%r13d,%r12d
728	rorl	$11,%r13d
729	addl	%r14d,%eax
730	movl	%r15d,%r14d
731	rorl	$2,%r15d
732
733	xorl	%r12d,%r13d
734	shrl	$3,%r12d
735	rorl	$7,%r13d
736	xorl	%r14d,%r15d
737	shrl	$10,%r14d
738
739	rorl	$17,%r15d
740	xorl	%r13d,%r12d
741	xorl	%r14d,%r15d
742	addl	36(%rsp),%r12d
743
744	addl	0(%rsp),%r12d
745	movl	%r8d,%r13d
746	addl	%r15d,%r12d
747	movl	%eax,%r14d
748	rorl	$14,%r13d
749	movl	%r9d,%r15d
750
751	xorl	%r8d,%r13d
752	rorl	$9,%r14d
753	xorl	%r10d,%r15d
754
755	movl	%r12d,0(%rsp)
756	xorl	%eax,%r14d
757	andl	%r8d,%r15d
758
759	rorl	$5,%r13d
760	addl	%r11d,%r12d
761	xorl	%r10d,%r15d
762
763	rorl	$11,%r14d
764	xorl	%r8d,%r13d
765	addl	%r15d,%r12d
766
767	movl	%eax,%r15d
768	addl	(%rbp),%r12d
769	xorl	%eax,%r14d
770
771	xorl	%ebx,%r15d
772	rorl	$6,%r13d
773	movl	%ebx,%r11d
774
775	andl	%r15d,%edi
776	rorl	$2,%r14d
777	addl	%r13d,%r12d
778
779	xorl	%edi,%r11d
780	addl	%r12d,%edx
781	addl	%r12d,%r11d
782
783	leaq	4(%rbp),%rbp
784	movl	8(%rsp),%r13d
785	movl	60(%rsp),%edi
786
787	movl	%r13d,%r12d
788	rorl	$11,%r13d
789	addl	%r14d,%r11d
790	movl	%edi,%r14d
791	rorl	$2,%edi
792
793	xorl	%r12d,%r13d
794	shrl	$3,%r12d
795	rorl	$7,%r13d
796	xorl	%r14d,%edi
797	shrl	$10,%r14d
798
799	rorl	$17,%edi
800	xorl	%r13d,%r12d
801	xorl	%r14d,%edi
802	addl	40(%rsp),%r12d
803
804	addl	4(%rsp),%r12d
805	movl	%edx,%r13d
806	addl	%edi,%r12d
807	movl	%r11d,%r14d
808	rorl	$14,%r13d
809	movl	%r8d,%edi
810
811	xorl	%edx,%r13d
812	rorl	$9,%r14d
813	xorl	%r9d,%edi
814
815	movl	%r12d,4(%rsp)
816	xorl	%r11d,%r14d
817	andl	%edx,%edi
818
819	rorl	$5,%r13d
820	addl	%r10d,%r12d
821	xorl	%r9d,%edi
822
823	rorl	$11,%r14d
824	xorl	%edx,%r13d
825	addl	%edi,%r12d
826
827	movl	%r11d,%edi
828	addl	(%rbp),%r12d
829	xorl	%r11d,%r14d
830
831	xorl	%eax,%edi
832	rorl	$6,%r13d
833	movl	%eax,%r10d
834
835	andl	%edi,%r15d
836	rorl	$2,%r14d
837	addl	%r13d,%r12d
838
839	xorl	%r15d,%r10d
840	addl	%r12d,%ecx
841	addl	%r12d,%r10d
842
843	leaq	4(%rbp),%rbp
844	movl	12(%rsp),%r13d
845	movl	0(%rsp),%r15d
846
847	movl	%r13d,%r12d
848	rorl	$11,%r13d
849	addl	%r14d,%r10d
850	movl	%r15d,%r14d
851	rorl	$2,%r15d
852
853	xorl	%r12d,%r13d
854	shrl	$3,%r12d
855	rorl	$7,%r13d
856	xorl	%r14d,%r15d
857	shrl	$10,%r14d
858
859	rorl	$17,%r15d
860	xorl	%r13d,%r12d
861	xorl	%r14d,%r15d
862	addl	44(%rsp),%r12d
863
864	addl	8(%rsp),%r12d
865	movl	%ecx,%r13d
866	addl	%r15d,%r12d
867	movl	%r10d,%r14d
868	rorl	$14,%r13d
869	movl	%edx,%r15d
870
871	xorl	%ecx,%r13d
872	rorl	$9,%r14d
873	xorl	%r8d,%r15d
874
875	movl	%r12d,8(%rsp)
876	xorl	%r10d,%r14d
877	andl	%ecx,%r15d
878
879	rorl	$5,%r13d
880	addl	%r9d,%r12d
881	xorl	%r8d,%r15d
882
883	rorl	$11,%r14d
884	xorl	%ecx,%r13d
885	addl	%r15d,%r12d
886
887	movl	%r10d,%r15d
888	addl	(%rbp),%r12d
889	xorl	%r10d,%r14d
890
891	xorl	%r11d,%r15d
892	rorl	$6,%r13d
893	movl	%r11d,%r9d
894
895	andl	%r15d,%edi
896	rorl	$2,%r14d
897	addl	%r13d,%r12d
898
899	xorl	%edi,%r9d
900	addl	%r12d,%ebx
901	addl	%r12d,%r9d
902
903	leaq	4(%rbp),%rbp
904	movl	16(%rsp),%r13d
905	movl	4(%rsp),%edi
906
907	movl	%r13d,%r12d
908	rorl	$11,%r13d
909	addl	%r14d,%r9d
910	movl	%edi,%r14d
911	rorl	$2,%edi
912
913	xorl	%r12d,%r13d
914	shrl	$3,%r12d
915	rorl	$7,%r13d
916	xorl	%r14d,%edi
917	shrl	$10,%r14d
918
919	rorl	$17,%edi
920	xorl	%r13d,%r12d
921	xorl	%r14d,%edi
922	addl	48(%rsp),%r12d
923
924	addl	12(%rsp),%r12d
925	movl	%ebx,%r13d
926	addl	%edi,%r12d
927	movl	%r9d,%r14d
928	rorl	$14,%r13d
929	movl	%ecx,%edi
930
931	xorl	%ebx,%r13d
932	rorl	$9,%r14d
933	xorl	%edx,%edi
934
935	movl	%r12d,12(%rsp)
936	xorl	%r9d,%r14d
937	andl	%ebx,%edi
938
939	rorl	$5,%r13d
940	addl	%r8d,%r12d
941	xorl	%edx,%edi
942
943	rorl	$11,%r14d
944	xorl	%ebx,%r13d
945	addl	%edi,%r12d
946
947	movl	%r9d,%edi
948	addl	(%rbp),%r12d
949	xorl	%r9d,%r14d
950
951	xorl	%r10d,%edi
952	rorl	$6,%r13d
953	movl	%r10d,%r8d
954
955	andl	%edi,%r15d
956	rorl	$2,%r14d
957	addl	%r13d,%r12d
958
959	xorl	%r15d,%r8d
960	addl	%r12d,%eax
961	addl	%r12d,%r8d
962
963	leaq	20(%rbp),%rbp
964	movl	20(%rsp),%r13d
965	movl	8(%rsp),%r15d
966
967	movl	%r13d,%r12d
968	rorl	$11,%r13d
969	addl	%r14d,%r8d
970	movl	%r15d,%r14d
971	rorl	$2,%r15d
972
973	xorl	%r12d,%r13d
974	shrl	$3,%r12d
975	rorl	$7,%r13d
976	xorl	%r14d,%r15d
977	shrl	$10,%r14d
978
979	rorl	$17,%r15d
980	xorl	%r13d,%r12d
981	xorl	%r14d,%r15d
982	addl	52(%rsp),%r12d
983
984	addl	16(%rsp),%r12d
985	movl	%eax,%r13d
986	addl	%r15d,%r12d
987	movl	%r8d,%r14d
988	rorl	$14,%r13d
989	movl	%ebx,%r15d
990
991	xorl	%eax,%r13d
992	rorl	$9,%r14d
993	xorl	%ecx,%r15d
994
995	movl	%r12d,16(%rsp)
996	xorl	%r8d,%r14d
997	andl	%eax,%r15d
998
999	rorl	$5,%r13d
1000	addl	%edx,%r12d
1001	xorl	%ecx,%r15d
1002
1003	rorl	$11,%r14d
1004	xorl	%eax,%r13d
1005	addl	%r15d,%r12d
1006
1007	movl	%r8d,%r15d
1008	addl	(%rbp),%r12d
1009	xorl	%r8d,%r14d
1010
1011	xorl	%r9d,%r15d
1012	rorl	$6,%r13d
1013	movl	%r9d,%edx
1014
1015	andl	%r15d,%edi
1016	rorl	$2,%r14d
1017	addl	%r13d,%r12d
1018
1019	xorl	%edi,%edx
1020	addl	%r12d,%r11d
1021	addl	%r12d,%edx
1022
1023	leaq	4(%rbp),%rbp
1024	movl	24(%rsp),%r13d
1025	movl	12(%rsp),%edi
1026
1027	movl	%r13d,%r12d
1028	rorl	$11,%r13d
1029	addl	%r14d,%edx
1030	movl	%edi,%r14d
1031	rorl	$2,%edi
1032
1033	xorl	%r12d,%r13d
1034	shrl	$3,%r12d
1035	rorl	$7,%r13d
1036	xorl	%r14d,%edi
1037	shrl	$10,%r14d
1038
1039	rorl	$17,%edi
1040	xorl	%r13d,%r12d
1041	xorl	%r14d,%edi
1042	addl	56(%rsp),%r12d
1043
1044	addl	20(%rsp),%r12d
1045	movl	%r11d,%r13d
1046	addl	%edi,%r12d
1047	movl	%edx,%r14d
1048	rorl	$14,%r13d
1049	movl	%eax,%edi
1050
1051	xorl	%r11d,%r13d
1052	rorl	$9,%r14d
1053	xorl	%ebx,%edi
1054
1055	movl	%r12d,20(%rsp)
1056	xorl	%edx,%r14d
1057	andl	%r11d,%edi
1058
1059	rorl	$5,%r13d
1060	addl	%ecx,%r12d
1061	xorl	%ebx,%edi
1062
1063	rorl	$11,%r14d
1064	xorl	%r11d,%r13d
1065	addl	%edi,%r12d
1066
1067	movl	%edx,%edi
1068	addl	(%rbp),%r12d
1069	xorl	%edx,%r14d
1070
1071	xorl	%r8d,%edi
1072	rorl	$6,%r13d
1073	movl	%r8d,%ecx
1074
1075	andl	%edi,%r15d
1076	rorl	$2,%r14d
1077	addl	%r13d,%r12d
1078
1079	xorl	%r15d,%ecx
1080	addl	%r12d,%r10d
1081	addl	%r12d,%ecx
1082
1083	leaq	4(%rbp),%rbp
1084	movl	28(%rsp),%r13d
1085	movl	16(%rsp),%r15d
1086
1087	movl	%r13d,%r12d
1088	rorl	$11,%r13d
1089	addl	%r14d,%ecx
1090	movl	%r15d,%r14d
1091	rorl	$2,%r15d
1092
1093	xorl	%r12d,%r13d
1094	shrl	$3,%r12d
1095	rorl	$7,%r13d
1096	xorl	%r14d,%r15d
1097	shrl	$10,%r14d
1098
1099	rorl	$17,%r15d
1100	xorl	%r13d,%r12d
1101	xorl	%r14d,%r15d
1102	addl	60(%rsp),%r12d
1103
1104	addl	24(%rsp),%r12d
1105	movl	%r10d,%r13d
1106	addl	%r15d,%r12d
1107	movl	%ecx,%r14d
1108	rorl	$14,%r13d
1109	movl	%r11d,%r15d
1110
1111	xorl	%r10d,%r13d
1112	rorl	$9,%r14d
1113	xorl	%eax,%r15d
1114
1115	movl	%r12d,24(%rsp)
1116	xorl	%ecx,%r14d
1117	andl	%r10d,%r15d
1118
1119	rorl	$5,%r13d
1120	addl	%ebx,%r12d
1121	xorl	%eax,%r15d
1122
1123	rorl	$11,%r14d
1124	xorl	%r10d,%r13d
1125	addl	%r15d,%r12d
1126
1127	movl	%ecx,%r15d
1128	addl	(%rbp),%r12d
1129	xorl	%ecx,%r14d
1130
1131	xorl	%edx,%r15d
1132	rorl	$6,%r13d
1133	movl	%edx,%ebx
1134
1135	andl	%r15d,%edi
1136	rorl	$2,%r14d
1137	addl	%r13d,%r12d
1138
1139	xorl	%edi,%ebx
1140	addl	%r12d,%r9d
1141	addl	%r12d,%ebx
1142
1143	leaq	4(%rbp),%rbp
1144	movl	32(%rsp),%r13d
1145	movl	20(%rsp),%edi
1146
1147	movl	%r13d,%r12d
1148	rorl	$11,%r13d
1149	addl	%r14d,%ebx
1150	movl	%edi,%r14d
1151	rorl	$2,%edi
1152
1153	xorl	%r12d,%r13d
1154	shrl	$3,%r12d
1155	rorl	$7,%r13d
1156	xorl	%r14d,%edi
1157	shrl	$10,%r14d
1158
1159	rorl	$17,%edi
1160	xorl	%r13d,%r12d
1161	xorl	%r14d,%edi
1162	addl	0(%rsp),%r12d
1163
1164	addl	28(%rsp),%r12d
1165	movl	%r9d,%r13d
1166	addl	%edi,%r12d
1167	movl	%ebx,%r14d
1168	rorl	$14,%r13d
1169	movl	%r10d,%edi
1170
1171	xorl	%r9d,%r13d
1172	rorl	$9,%r14d
1173	xorl	%r11d,%edi
1174
1175	movl	%r12d,28(%rsp)
1176	xorl	%ebx,%r14d
1177	andl	%r9d,%edi
1178
1179	rorl	$5,%r13d
1180	addl	%eax,%r12d
1181	xorl	%r11d,%edi
1182
1183	rorl	$11,%r14d
1184	xorl	%r9d,%r13d
1185	addl	%edi,%r12d
1186
1187	movl	%ebx,%edi
1188	addl	(%rbp),%r12d
1189	xorl	%ebx,%r14d
1190
1191	xorl	%ecx,%edi
1192	rorl	$6,%r13d
1193	movl	%ecx,%eax
1194
1195	andl	%edi,%r15d
1196	rorl	$2,%r14d
1197	addl	%r13d,%r12d
1198
1199	xorl	%r15d,%eax
1200	addl	%r12d,%r8d
1201	addl	%r12d,%eax
1202
1203	leaq	20(%rbp),%rbp
1204	movl	36(%rsp),%r13d
1205	movl	24(%rsp),%r15d
1206
1207	movl	%r13d,%r12d
1208	rorl	$11,%r13d
1209	addl	%r14d,%eax
1210	movl	%r15d,%r14d
1211	rorl	$2,%r15d
1212
1213	xorl	%r12d,%r13d
1214	shrl	$3,%r12d
1215	rorl	$7,%r13d
1216	xorl	%r14d,%r15d
1217	shrl	$10,%r14d
1218
1219	rorl	$17,%r15d
1220	xorl	%r13d,%r12d
1221	xorl	%r14d,%r15d
1222	addl	4(%rsp),%r12d
1223
1224	addl	32(%rsp),%r12d
1225	movl	%r8d,%r13d
1226	addl	%r15d,%r12d
1227	movl	%eax,%r14d
1228	rorl	$14,%r13d
1229	movl	%r9d,%r15d
1230
1231	xorl	%r8d,%r13d
1232	rorl	$9,%r14d
1233	xorl	%r10d,%r15d
1234
1235	movl	%r12d,32(%rsp)
1236	xorl	%eax,%r14d
1237	andl	%r8d,%r15d
1238
1239	rorl	$5,%r13d
1240	addl	%r11d,%r12d
1241	xorl	%r10d,%r15d
1242
1243	rorl	$11,%r14d
1244	xorl	%r8d,%r13d
1245	addl	%r15d,%r12d
1246
1247	movl	%eax,%r15d
1248	addl	(%rbp),%r12d
1249	xorl	%eax,%r14d
1250
1251	xorl	%ebx,%r15d
1252	rorl	$6,%r13d
1253	movl	%ebx,%r11d
1254
1255	andl	%r15d,%edi
1256	rorl	$2,%r14d
1257	addl	%r13d,%r12d
1258
1259	xorl	%edi,%r11d
1260	addl	%r12d,%edx
1261	addl	%r12d,%r11d
1262
1263	leaq	4(%rbp),%rbp
1264	movl	40(%rsp),%r13d
1265	movl	28(%rsp),%edi
1266
1267	movl	%r13d,%r12d
1268	rorl	$11,%r13d
1269	addl	%r14d,%r11d
1270	movl	%edi,%r14d
1271	rorl	$2,%edi
1272
1273	xorl	%r12d,%r13d
1274	shrl	$3,%r12d
1275	rorl	$7,%r13d
1276	xorl	%r14d,%edi
1277	shrl	$10,%r14d
1278
1279	rorl	$17,%edi
1280	xorl	%r13d,%r12d
1281	xorl	%r14d,%edi
1282	addl	8(%rsp),%r12d
1283
1284	addl	36(%rsp),%r12d
1285	movl	%edx,%r13d
1286	addl	%edi,%r12d
1287	movl	%r11d,%r14d
1288	rorl	$14,%r13d
1289	movl	%r8d,%edi
1290
1291	xorl	%edx,%r13d
1292	rorl	$9,%r14d
1293	xorl	%r9d,%edi
1294
1295	movl	%r12d,36(%rsp)
1296	xorl	%r11d,%r14d
1297	andl	%edx,%edi
1298
1299	rorl	$5,%r13d
1300	addl	%r10d,%r12d
1301	xorl	%r9d,%edi
1302
1303	rorl	$11,%r14d
1304	xorl	%edx,%r13d
1305	addl	%edi,%r12d
1306
1307	movl	%r11d,%edi
1308	addl	(%rbp),%r12d
1309	xorl	%r11d,%r14d
1310
1311	xorl	%eax,%edi
1312	rorl	$6,%r13d
1313	movl	%eax,%r10d
1314
1315	andl	%edi,%r15d
1316	rorl	$2,%r14d
1317	addl	%r13d,%r12d
1318
1319	xorl	%r15d,%r10d
1320	addl	%r12d,%ecx
1321	addl	%r12d,%r10d
1322
1323	leaq	4(%rbp),%rbp
1324	movl	44(%rsp),%r13d
1325	movl	32(%rsp),%r15d
1326
1327	movl	%r13d,%r12d
1328	rorl	$11,%r13d
1329	addl	%r14d,%r10d
1330	movl	%r15d,%r14d
1331	rorl	$2,%r15d
1332
1333	xorl	%r12d,%r13d
1334	shrl	$3,%r12d
1335	rorl	$7,%r13d
1336	xorl	%r14d,%r15d
1337	shrl	$10,%r14d
1338
1339	rorl	$17,%r15d
1340	xorl	%r13d,%r12d
1341	xorl	%r14d,%r15d
1342	addl	12(%rsp),%r12d
1343
1344	addl	40(%rsp),%r12d
1345	movl	%ecx,%r13d
1346	addl	%r15d,%r12d
1347	movl	%r10d,%r14d
1348	rorl	$14,%r13d
1349	movl	%edx,%r15d
1350
1351	xorl	%ecx,%r13d
1352	rorl	$9,%r14d
1353	xorl	%r8d,%r15d
1354
1355	movl	%r12d,40(%rsp)
1356	xorl	%r10d,%r14d
1357	andl	%ecx,%r15d
1358
1359	rorl	$5,%r13d
1360	addl	%r9d,%r12d
1361	xorl	%r8d,%r15d
1362
1363	rorl	$11,%r14d
1364	xorl	%ecx,%r13d
1365	addl	%r15d,%r12d
1366
1367	movl	%r10d,%r15d
1368	addl	(%rbp),%r12d
1369	xorl	%r10d,%r14d
1370
1371	xorl	%r11d,%r15d
1372	rorl	$6,%r13d
1373	movl	%r11d,%r9d
1374
1375	andl	%r15d,%edi
1376	rorl	$2,%r14d
1377	addl	%r13d,%r12d
1378
1379	xorl	%edi,%r9d
1380	addl	%r12d,%ebx
1381	addl	%r12d,%r9d
1382
1383	leaq	4(%rbp),%rbp
1384	movl	48(%rsp),%r13d
1385	movl	36(%rsp),%edi
1386
1387	movl	%r13d,%r12d
1388	rorl	$11,%r13d
1389	addl	%r14d,%r9d
1390	movl	%edi,%r14d
1391	rorl	$2,%edi
1392
1393	xorl	%r12d,%r13d
1394	shrl	$3,%r12d
1395	rorl	$7,%r13d
1396	xorl	%r14d,%edi
1397	shrl	$10,%r14d
1398
1399	rorl	$17,%edi
1400	xorl	%r13d,%r12d
1401	xorl	%r14d,%edi
1402	addl	16(%rsp),%r12d
1403
1404	addl	44(%rsp),%r12d
1405	movl	%ebx,%r13d
1406	addl	%edi,%r12d
1407	movl	%r9d,%r14d
1408	rorl	$14,%r13d
1409	movl	%ecx,%edi
1410
1411	xorl	%ebx,%r13d
1412	rorl	$9,%r14d
1413	xorl	%edx,%edi
1414
1415	movl	%r12d,44(%rsp)
1416	xorl	%r9d,%r14d
1417	andl	%ebx,%edi
1418
1419	rorl	$5,%r13d
1420	addl	%r8d,%r12d
1421	xorl	%edx,%edi
1422
1423	rorl	$11,%r14d
1424	xorl	%ebx,%r13d
1425	addl	%edi,%r12d
1426
1427	movl	%r9d,%edi
1428	addl	(%rbp),%r12d
1429	xorl	%r9d,%r14d
1430
1431	xorl	%r10d,%edi
1432	rorl	$6,%r13d
1433	movl	%r10d,%r8d
1434
1435	andl	%edi,%r15d
1436	rorl	$2,%r14d
1437	addl	%r13d,%r12d
1438
1439	xorl	%r15d,%r8d
1440	addl	%r12d,%eax
1441	addl	%r12d,%r8d
1442
1443	leaq	20(%rbp),%rbp
1444	movl	52(%rsp),%r13d
1445	movl	40(%rsp),%r15d
1446
1447	movl	%r13d,%r12d
1448	rorl	$11,%r13d
1449	addl	%r14d,%r8d
1450	movl	%r15d,%r14d
1451	rorl	$2,%r15d
1452
1453	xorl	%r12d,%r13d
1454	shrl	$3,%r12d
1455	rorl	$7,%r13d
1456	xorl	%r14d,%r15d
1457	shrl	$10,%r14d
1458
1459	rorl	$17,%r15d
1460	xorl	%r13d,%r12d
1461	xorl	%r14d,%r15d
1462	addl	20(%rsp),%r12d
1463
1464	addl	48(%rsp),%r12d
1465	movl	%eax,%r13d
1466	addl	%r15d,%r12d
1467	movl	%r8d,%r14d
1468	rorl	$14,%r13d
1469	movl	%ebx,%r15d
1470
1471	xorl	%eax,%r13d
1472	rorl	$9,%r14d
1473	xorl	%ecx,%r15d
1474
1475	movl	%r12d,48(%rsp)
1476	xorl	%r8d,%r14d
1477	andl	%eax,%r15d
1478
1479	rorl	$5,%r13d
1480	addl	%edx,%r12d
1481	xorl	%ecx,%r15d
1482
1483	rorl	$11,%r14d
1484	xorl	%eax,%r13d
1485	addl	%r15d,%r12d
1486
1487	movl	%r8d,%r15d
1488	addl	(%rbp),%r12d
1489	xorl	%r8d,%r14d
1490
1491	xorl	%r9d,%r15d
1492	rorl	$6,%r13d
1493	movl	%r9d,%edx
1494
1495	andl	%r15d,%edi
1496	rorl	$2,%r14d
1497	addl	%r13d,%r12d
1498
1499	xorl	%edi,%edx
1500	addl	%r12d,%r11d
1501	addl	%r12d,%edx
1502
1503	leaq	4(%rbp),%rbp
1504	movl	56(%rsp),%r13d
1505	movl	44(%rsp),%edi
1506
1507	movl	%r13d,%r12d
1508	rorl	$11,%r13d
1509	addl	%r14d,%edx
1510	movl	%edi,%r14d
1511	rorl	$2,%edi
1512
1513	xorl	%r12d,%r13d
1514	shrl	$3,%r12d
1515	rorl	$7,%r13d
1516	xorl	%r14d,%edi
1517	shrl	$10,%r14d
1518
1519	rorl	$17,%edi
1520	xorl	%r13d,%r12d
1521	xorl	%r14d,%edi
1522	addl	24(%rsp),%r12d
1523
1524	addl	52(%rsp),%r12d
1525	movl	%r11d,%r13d
1526	addl	%edi,%r12d
1527	movl	%edx,%r14d
1528	rorl	$14,%r13d
1529	movl	%eax,%edi
1530
1531	xorl	%r11d,%r13d
1532	rorl	$9,%r14d
1533	xorl	%ebx,%edi
1534
1535	movl	%r12d,52(%rsp)
1536	xorl	%edx,%r14d
1537	andl	%r11d,%edi
1538
1539	rorl	$5,%r13d
1540	addl	%ecx,%r12d
1541	xorl	%ebx,%edi
1542
1543	rorl	$11,%r14d
1544	xorl	%r11d,%r13d
1545	addl	%edi,%r12d
1546
1547	movl	%edx,%edi
1548	addl	(%rbp),%r12d
1549	xorl	%edx,%r14d
1550
1551	xorl	%r8d,%edi
1552	rorl	$6,%r13d
1553	movl	%r8d,%ecx
1554
1555	andl	%edi,%r15d
1556	rorl	$2,%r14d
1557	addl	%r13d,%r12d
1558
1559	xorl	%r15d,%ecx
1560	addl	%r12d,%r10d
1561	addl	%r12d,%ecx
1562
1563	leaq	4(%rbp),%rbp
1564	movl	60(%rsp),%r13d
1565	movl	48(%rsp),%r15d
1566
1567	movl	%r13d,%r12d
1568	rorl	$11,%r13d
1569	addl	%r14d,%ecx
1570	movl	%r15d,%r14d
1571	rorl	$2,%r15d
1572
1573	xorl	%r12d,%r13d
1574	shrl	$3,%r12d
1575	rorl	$7,%r13d
1576	xorl	%r14d,%r15d
1577	shrl	$10,%r14d
1578
1579	rorl	$17,%r15d
1580	xorl	%r13d,%r12d
1581	xorl	%r14d,%r15d
1582	addl	28(%rsp),%r12d
1583
1584	addl	56(%rsp),%r12d
1585	movl	%r10d,%r13d
1586	addl	%r15d,%r12d
1587	movl	%ecx,%r14d
1588	rorl	$14,%r13d
1589	movl	%r11d,%r15d
1590
1591	xorl	%r10d,%r13d
1592	rorl	$9,%r14d
1593	xorl	%eax,%r15d
1594
1595	movl	%r12d,56(%rsp)
1596	xorl	%ecx,%r14d
1597	andl	%r10d,%r15d
1598
1599	rorl	$5,%r13d
1600	addl	%ebx,%r12d
1601	xorl	%eax,%r15d
1602
1603	rorl	$11,%r14d
1604	xorl	%r10d,%r13d
1605	addl	%r15d,%r12d
1606
1607	movl	%ecx,%r15d
1608	addl	(%rbp),%r12d
1609	xorl	%ecx,%r14d
1610
1611	xorl	%edx,%r15d
1612	rorl	$6,%r13d
1613	movl	%edx,%ebx
1614
1615	andl	%r15d,%edi
1616	rorl	$2,%r14d
1617	addl	%r13d,%r12d
1618
1619	xorl	%edi,%ebx
1620	addl	%r12d,%r9d
1621	addl	%r12d,%ebx
1622
1623	leaq	4(%rbp),%rbp
1624	movl	0(%rsp),%r13d
1625	movl	52(%rsp),%edi
1626
1627	movl	%r13d,%r12d
1628	rorl	$11,%r13d
1629	addl	%r14d,%ebx
1630	movl	%edi,%r14d
1631	rorl	$2,%edi
1632
1633	xorl	%r12d,%r13d
1634	shrl	$3,%r12d
1635	rorl	$7,%r13d
1636	xorl	%r14d,%edi
1637	shrl	$10,%r14d
1638
1639	rorl	$17,%edi
1640	xorl	%r13d,%r12d
1641	xorl	%r14d,%edi
1642	addl	32(%rsp),%r12d
1643
1644	addl	60(%rsp),%r12d
1645	movl	%r9d,%r13d
1646	addl	%edi,%r12d
1647	movl	%ebx,%r14d
1648	rorl	$14,%r13d
1649	movl	%r10d,%edi
1650
1651	xorl	%r9d,%r13d
1652	rorl	$9,%r14d
1653	xorl	%r11d,%edi
1654
1655	movl	%r12d,60(%rsp)
1656	xorl	%ebx,%r14d
1657	andl	%r9d,%edi
1658
1659	rorl	$5,%r13d
1660	addl	%eax,%r12d
1661	xorl	%r11d,%edi
1662
1663	rorl	$11,%r14d
1664	xorl	%r9d,%r13d
1665	addl	%edi,%r12d
1666
1667	movl	%ebx,%edi
1668	addl	(%rbp),%r12d
1669	xorl	%ebx,%r14d
1670
1671	xorl	%ecx,%edi
1672	rorl	$6,%r13d
1673	movl	%ecx,%eax
1674
1675	andl	%edi,%r15d
1676	rorl	$2,%r14d
1677	addl	%r13d,%r12d
1678
1679	xorl	%r15d,%eax
1680	addl	%r12d,%r8d
1681	addl	%r12d,%eax
1682
1683	leaq	20(%rbp),%rbp
1684	cmpb	$0,3(%rbp)
1685	jnz	.Lrounds_16_xx
1686
1687	movq	64+0(%rsp),%rdi
1688	addl	%r14d,%eax
1689	leaq	64(%rsi),%rsi
1690
1691	addl	0(%rdi),%eax
1692	addl	4(%rdi),%ebx
1693	addl	8(%rdi),%ecx
1694	addl	12(%rdi),%edx
1695	addl	16(%rdi),%r8d
1696	addl	20(%rdi),%r9d
1697	addl	24(%rdi),%r10d
1698	addl	28(%rdi),%r11d
1699
1700	cmpq	64+16(%rsp),%rsi
1701
1702	movl	%eax,0(%rdi)
1703	movl	%ebx,4(%rdi)
1704	movl	%ecx,8(%rdi)
1705	movl	%edx,12(%rdi)
1706	movl	%r8d,16(%rdi)
1707	movl	%r9d,20(%rdi)
1708	movl	%r10d,24(%rdi)
1709	movl	%r11d,28(%rdi)
1710	jb	.Lloop
1711
1712	movq	88(%rsp),%rsi
1713.cfi_def_cfa	%rsi,8
1714	movq	-48(%rsi),%r15
1715.cfi_restore	%r15
1716	movq	-40(%rsi),%r14
1717.cfi_restore	%r14
1718	movq	-32(%rsi),%r13
1719.cfi_restore	%r13
1720	movq	-24(%rsi),%r12
1721.cfi_restore	%r12
1722	movq	-16(%rsi),%rbp
1723.cfi_restore	%rbp
1724	movq	-8(%rsi),%rbx
1725.cfi_restore	%rbx
1726	leaq	(%rsi),%rsp
1727.cfi_def_cfa_register	%rsp
1728.Lepilogue:
1729	.byte	0xf3,0xc3
1730.cfi_endproc
1731.size	sha256_block_data_order,.-sha256_block_data_order
1732.align	64
1733.type	K256,@object
1734K256:
1735.long	0x428a2f98,0x71374491,0xb5c0fbcf,0xe9b5dba5
1736.long	0x428a2f98,0x71374491,0xb5c0fbcf,0xe9b5dba5
1737.long	0x3956c25b,0x59f111f1,0x923f82a4,0xab1c5ed5
1738.long	0x3956c25b,0x59f111f1,0x923f82a4,0xab1c5ed5
1739.long	0xd807aa98,0x12835b01,0x243185be,0x550c7dc3
1740.long	0xd807aa98,0x12835b01,0x243185be,0x550c7dc3
1741.long	0x72be5d74,0x80deb1fe,0x9bdc06a7,0xc19bf174
1742.long	0x72be5d74,0x80deb1fe,0x9bdc06a7,0xc19bf174
1743.long	0xe49b69c1,0xefbe4786,0x0fc19dc6,0x240ca1cc
1744.long	0xe49b69c1,0xefbe4786,0x0fc19dc6,0x240ca1cc
1745.long	0x2de92c6f,0x4a7484aa,0x5cb0a9dc,0x76f988da
1746.long	0x2de92c6f,0x4a7484aa,0x5cb0a9dc,0x76f988da
1747.long	0x983e5152,0xa831c66d,0xb00327c8,0xbf597fc7
1748.long	0x983e5152,0xa831c66d,0xb00327c8,0xbf597fc7
1749.long	0xc6e00bf3,0xd5a79147,0x06ca6351,0x14292967
1750.long	0xc6e00bf3,0xd5a79147,0x06ca6351,0x14292967
1751.long	0x27b70a85,0x2e1b2138,0x4d2c6dfc,0x53380d13
1752.long	0x27b70a85,0x2e1b2138,0x4d2c6dfc,0x53380d13
1753.long	0x650a7354,0x766a0abb,0x81c2c92e,0x92722c85
1754.long	0x650a7354,0x766a0abb,0x81c2c92e,0x92722c85
1755.long	0xa2bfe8a1,0xa81a664b,0xc24b8b70,0xc76c51a3
1756.long	0xa2bfe8a1,0xa81a664b,0xc24b8b70,0xc76c51a3
1757.long	0xd192e819,0xd6990624,0xf40e3585,0x106aa070
1758.long	0xd192e819,0xd6990624,0xf40e3585,0x106aa070
1759.long	0x19a4c116,0x1e376c08,0x2748774c,0x34b0bcb5
1760.long	0x19a4c116,0x1e376c08,0x2748774c,0x34b0bcb5
1761.long	0x391c0cb3,0x4ed8aa4a,0x5b9cca4f,0x682e6ff3
1762.long	0x391c0cb3,0x4ed8aa4a,0x5b9cca4f,0x682e6ff3
1763.long	0x748f82ee,0x78a5636f,0x84c87814,0x8cc70208
1764.long	0x748f82ee,0x78a5636f,0x84c87814,0x8cc70208
1765.long	0x90befffa,0xa4506ceb,0xbef9a3f7,0xc67178f2
1766.long	0x90befffa,0xa4506ceb,0xbef9a3f7,0xc67178f2
1767
1768.long	0x00010203,0x04050607,0x08090a0b,0x0c0d0e0f
1769.long	0x00010203,0x04050607,0x08090a0b,0x0c0d0e0f
1770.long	0x03020100,0x0b0a0908,0xffffffff,0xffffffff
1771.long	0x03020100,0x0b0a0908,0xffffffff,0xffffffff
1772.long	0xffffffff,0xffffffff,0x03020100,0x0b0a0908
1773.long	0xffffffff,0xffffffff,0x03020100,0x0b0a0908
1774.byte	83,72,65,50,53,54,32,98,108,111,99,107,32,116,114,97,110,115,102,111,114,109,32,102,111,114,32,120,56,54,95,54,52,44,32,67,82,89,80,84,79,71,65,77,83,32,98,121,32,60,97,112,112,114,111,64,111,112,101,110,115,115,108,46,111,114,103,62,0
1775.type	sha256_block_data_order_shaext,@function
1776.align	64
1777sha256_block_data_order_shaext:
1778_shaext_shortcut:
1779.cfi_startproc
1780	leaq	K256+128(%rip),%rcx
1781	movdqu	(%rdi),%xmm1
1782	movdqu	16(%rdi),%xmm2
1783	movdqa	512-128(%rcx),%xmm7
1784
1785	pshufd	$0x1b,%xmm1,%xmm0
1786	pshufd	$0xb1,%xmm1,%xmm1
1787	pshufd	$0x1b,%xmm2,%xmm2
1788	movdqa	%xmm7,%xmm8
1789.byte	102,15,58,15,202,8
1790	punpcklqdq	%xmm0,%xmm2
1791	jmp	.Loop_shaext
1792
1793.align	16
1794.Loop_shaext:
1795	movdqu	(%rsi),%xmm3
1796	movdqu	16(%rsi),%xmm4
1797	movdqu	32(%rsi),%xmm5
1798.byte	102,15,56,0,223
1799	movdqu	48(%rsi),%xmm6
1800
1801	movdqa	0-128(%rcx),%xmm0
1802	paddd	%xmm3,%xmm0
1803.byte	102,15,56,0,231
1804	movdqa	%xmm2,%xmm10
1805.byte	15,56,203,209
1806	pshufd	$0x0e,%xmm0,%xmm0
1807	nop
1808	movdqa	%xmm1,%xmm9
1809.byte	15,56,203,202
1810
1811	movdqa	32-128(%rcx),%xmm0
1812	paddd	%xmm4,%xmm0
1813.byte	102,15,56,0,239
1814.byte	15,56,203,209
1815	pshufd	$0x0e,%xmm0,%xmm0
1816	leaq	64(%rsi),%rsi
1817.byte	15,56,204,220
1818.byte	15,56,203,202
1819
1820	movdqa	64-128(%rcx),%xmm0
1821	paddd	%xmm5,%xmm0
1822.byte	102,15,56,0,247
1823.byte	15,56,203,209
1824	pshufd	$0x0e,%xmm0,%xmm0
1825	movdqa	%xmm6,%xmm7
1826.byte	102,15,58,15,253,4
1827	nop
1828	paddd	%xmm7,%xmm3
1829.byte	15,56,204,229
1830.byte	15,56,203,202
1831
1832	movdqa	96-128(%rcx),%xmm0
1833	paddd	%xmm6,%xmm0
1834.byte	15,56,205,222
1835.byte	15,56,203,209
1836	pshufd	$0x0e,%xmm0,%xmm0
1837	movdqa	%xmm3,%xmm7
1838.byte	102,15,58,15,254,4
1839	nop
1840	paddd	%xmm7,%xmm4
1841.byte	15,56,204,238
1842.byte	15,56,203,202
1843	movdqa	128-128(%rcx),%xmm0
1844	paddd	%xmm3,%xmm0
1845.byte	15,56,205,227
1846.byte	15,56,203,209
1847	pshufd	$0x0e,%xmm0,%xmm0
1848	movdqa	%xmm4,%xmm7
1849.byte	102,15,58,15,251,4
1850	nop
1851	paddd	%xmm7,%xmm5
1852.byte	15,56,204,243
1853.byte	15,56,203,202
1854	movdqa	160-128(%rcx),%xmm0
1855	paddd	%xmm4,%xmm0
1856.byte	15,56,205,236
1857.byte	15,56,203,209
1858	pshufd	$0x0e,%xmm0,%xmm0
1859	movdqa	%xmm5,%xmm7
1860.byte	102,15,58,15,252,4
1861	nop
1862	paddd	%xmm7,%xmm6
1863.byte	15,56,204,220
1864.byte	15,56,203,202
1865	movdqa	192-128(%rcx),%xmm0
1866	paddd	%xmm5,%xmm0
1867.byte	15,56,205,245
1868.byte	15,56,203,209
1869	pshufd	$0x0e,%xmm0,%xmm0
1870	movdqa	%xmm6,%xmm7
1871.byte	102,15,58,15,253,4
1872	nop
1873	paddd	%xmm7,%xmm3
1874.byte	15,56,204,229
1875.byte	15,56,203,202
1876	movdqa	224-128(%rcx),%xmm0
1877	paddd	%xmm6,%xmm0
1878.byte	15,56,205,222
1879.byte	15,56,203,209
1880	pshufd	$0x0e,%xmm0,%xmm0
1881	movdqa	%xmm3,%xmm7
1882.byte	102,15,58,15,254,4
1883	nop
1884	paddd	%xmm7,%xmm4
1885.byte	15,56,204,238
1886.byte	15,56,203,202
1887	movdqa	256-128(%rcx),%xmm0
1888	paddd	%xmm3,%xmm0
1889.byte	15,56,205,227
1890.byte	15,56,203,209
1891	pshufd	$0x0e,%xmm0,%xmm0
1892	movdqa	%xmm4,%xmm7
1893.byte	102,15,58,15,251,4
1894	nop
1895	paddd	%xmm7,%xmm5
1896.byte	15,56,204,243
1897.byte	15,56,203,202
1898	movdqa	288-128(%rcx),%xmm0
1899	paddd	%xmm4,%xmm0
1900.byte	15,56,205,236
1901.byte	15,56,203,209
1902	pshufd	$0x0e,%xmm0,%xmm0
1903	movdqa	%xmm5,%xmm7
1904.byte	102,15,58,15,252,4
1905	nop
1906	paddd	%xmm7,%xmm6
1907.byte	15,56,204,220
1908.byte	15,56,203,202
1909	movdqa	320-128(%rcx),%xmm0
1910	paddd	%xmm5,%xmm0
1911.byte	15,56,205,245
1912.byte	15,56,203,209
1913	pshufd	$0x0e,%xmm0,%xmm0
1914	movdqa	%xmm6,%xmm7
1915.byte	102,15,58,15,253,4
1916	nop
1917	paddd	%xmm7,%xmm3
1918.byte	15,56,204,229
1919.byte	15,56,203,202
1920	movdqa	352-128(%rcx),%xmm0
1921	paddd	%xmm6,%xmm0
1922.byte	15,56,205,222
1923.byte	15,56,203,209
1924	pshufd	$0x0e,%xmm0,%xmm0
1925	movdqa	%xmm3,%xmm7
1926.byte	102,15,58,15,254,4
1927	nop
1928	paddd	%xmm7,%xmm4
1929.byte	15,56,204,238
1930.byte	15,56,203,202
1931	movdqa	384-128(%rcx),%xmm0
1932	paddd	%xmm3,%xmm0
1933.byte	15,56,205,227
1934.byte	15,56,203,209
1935	pshufd	$0x0e,%xmm0,%xmm0
1936	movdqa	%xmm4,%xmm7
1937.byte	102,15,58,15,251,4
1938	nop
1939	paddd	%xmm7,%xmm5
1940.byte	15,56,204,243
1941.byte	15,56,203,202
1942	movdqa	416-128(%rcx),%xmm0
1943	paddd	%xmm4,%xmm0
1944.byte	15,56,205,236
1945.byte	15,56,203,209
1946	pshufd	$0x0e,%xmm0,%xmm0
1947	movdqa	%xmm5,%xmm7
1948.byte	102,15,58,15,252,4
1949.byte	15,56,203,202
1950	paddd	%xmm7,%xmm6
1951
1952	movdqa	448-128(%rcx),%xmm0
1953	paddd	%xmm5,%xmm0
1954.byte	15,56,203,209
1955	pshufd	$0x0e,%xmm0,%xmm0
1956.byte	15,56,205,245
1957	movdqa	%xmm8,%xmm7
1958.byte	15,56,203,202
1959
1960	movdqa	480-128(%rcx),%xmm0
1961	paddd	%xmm6,%xmm0
1962	nop
1963.byte	15,56,203,209
1964	pshufd	$0x0e,%xmm0,%xmm0
1965	decq	%rdx
1966	nop
1967.byte	15,56,203,202
1968
1969	paddd	%xmm10,%xmm2
1970	paddd	%xmm9,%xmm1
1971	jnz	.Loop_shaext
1972
1973	pshufd	$0xb1,%xmm2,%xmm2
1974	pshufd	$0x1b,%xmm1,%xmm7
1975	pshufd	$0xb1,%xmm1,%xmm1
1976	punpckhqdq	%xmm2,%xmm1
1977.byte	102,15,58,15,215,8
1978
1979	movdqu	%xmm1,(%rdi)
1980	movdqu	%xmm2,16(%rdi)
1981	.byte	0xf3,0xc3
1982.cfi_endproc
1983.size	sha256_block_data_order_shaext,.-sha256_block_data_order_shaext
1984.type	sha256_block_data_order_ssse3,@function
1985.align	64
1986sha256_block_data_order_ssse3:
1987.cfi_startproc
1988.Lssse3_shortcut:
1989	movq	%rsp,%rax
1990.cfi_def_cfa_register	%rax
1991	pushq	%rbx
1992.cfi_offset	%rbx,-16
1993	pushq	%rbp
1994.cfi_offset	%rbp,-24
1995	pushq	%r12
1996.cfi_offset	%r12,-32
1997	pushq	%r13
1998.cfi_offset	%r13,-40
1999	pushq	%r14
2000.cfi_offset	%r14,-48
2001	pushq	%r15
2002.cfi_offset	%r15,-56
2003	shlq	$4,%rdx
2004	subq	$96,%rsp
2005	leaq	(%rsi,%rdx,4),%rdx
2006	andq	$-64,%rsp
2007	movq	%rdi,64+0(%rsp)
2008	movq	%rsi,64+8(%rsp)
2009	movq	%rdx,64+16(%rsp)
2010	movq	%rax,88(%rsp)
2011.cfi_escape	0x0f,0x06,0x77,0xd8,0x00,0x06,0x23,0x08
2012.Lprologue_ssse3:
2013
2014	movl	0(%rdi),%eax
2015	movl	4(%rdi),%ebx
2016	movl	8(%rdi),%ecx
2017	movl	12(%rdi),%edx
2018	movl	16(%rdi),%r8d
2019	movl	20(%rdi),%r9d
2020	movl	24(%rdi),%r10d
2021	movl	28(%rdi),%r11d
2022
2023
2024	jmp	.Lloop_ssse3
2025.align	16
2026.Lloop_ssse3:
2027	movdqa	K256+512(%rip),%xmm7
2028	movdqu	0(%rsi),%xmm0
2029	movdqu	16(%rsi),%xmm1
2030	movdqu	32(%rsi),%xmm2
2031.byte	102,15,56,0,199
2032	movdqu	48(%rsi),%xmm3
2033	leaq	K256(%rip),%rbp
2034.byte	102,15,56,0,207
2035	movdqa	0(%rbp),%xmm4
2036	movdqa	32(%rbp),%xmm5
2037.byte	102,15,56,0,215
2038	paddd	%xmm0,%xmm4
2039	movdqa	64(%rbp),%xmm6
2040.byte	102,15,56,0,223
2041	movdqa	96(%rbp),%xmm7
2042	paddd	%xmm1,%xmm5
2043	paddd	%xmm2,%xmm6
2044	paddd	%xmm3,%xmm7
2045	movdqa	%xmm4,0(%rsp)
2046	movl	%eax,%r14d
2047	movdqa	%xmm5,16(%rsp)
2048	movl	%ebx,%edi
2049	movdqa	%xmm6,32(%rsp)
2050	xorl	%ecx,%edi
2051	movdqa	%xmm7,48(%rsp)
2052	movl	%r8d,%r13d
2053	jmp	.Lssse3_00_47
2054
2055.align	16
2056.Lssse3_00_47:
2057	subq	$-128,%rbp
2058	rorl	$14,%r13d
2059	movdqa	%xmm1,%xmm4
2060	movl	%r14d,%eax
2061	movl	%r9d,%r12d
2062	movdqa	%xmm3,%xmm7
2063	rorl	$9,%r14d
2064	xorl	%r8d,%r13d
2065	xorl	%r10d,%r12d
2066	rorl	$5,%r13d
2067	xorl	%eax,%r14d
2068.byte	102,15,58,15,224,4
2069	andl	%r8d,%r12d
2070	xorl	%r8d,%r13d
2071.byte	102,15,58,15,250,4
2072	addl	0(%rsp),%r11d
2073	movl	%eax,%r15d
2074	xorl	%r10d,%r12d
2075	rorl	$11,%r14d
2076	movdqa	%xmm4,%xmm5
2077	xorl	%ebx,%r15d
2078	addl	%r12d,%r11d
2079	movdqa	%xmm4,%xmm6
2080	rorl	$6,%r13d
2081	andl	%r15d,%edi
2082	psrld	$3,%xmm4
2083	xorl	%eax,%r14d
2084	addl	%r13d,%r11d
2085	xorl	%ebx,%edi
2086	paddd	%xmm7,%xmm0
2087	rorl	$2,%r14d
2088	addl	%r11d,%edx
2089	psrld	$7,%xmm6
2090	addl	%edi,%r11d
2091	movl	%edx,%r13d
2092	pshufd	$250,%xmm3,%xmm7
2093	addl	%r11d,%r14d
2094	rorl	$14,%r13d
2095	pslld	$14,%xmm5
2096	movl	%r14d,%r11d
2097	movl	%r8d,%r12d
2098	pxor	%xmm6,%xmm4
2099	rorl	$9,%r14d
2100	xorl	%edx,%r13d
2101	xorl	%r9d,%r12d
2102	rorl	$5,%r13d
2103	psrld	$11,%xmm6
2104	xorl	%r11d,%r14d
2105	pxor	%xmm5,%xmm4
2106	andl	%edx,%r12d
2107	xorl	%edx,%r13d
2108	pslld	$11,%xmm5
2109	addl	4(%rsp),%r10d
2110	movl	%r11d,%edi
2111	pxor	%xmm6,%xmm4
2112	xorl	%r9d,%r12d
2113	rorl	$11,%r14d
2114	movdqa	%xmm7,%xmm6
2115	xorl	%eax,%edi
2116	addl	%r12d,%r10d
2117	pxor	%xmm5,%xmm4
2118	rorl	$6,%r13d
2119	andl	%edi,%r15d
2120	xorl	%r11d,%r14d
2121	psrld	$10,%xmm7
2122	addl	%r13d,%r10d
2123	xorl	%eax,%r15d
2124	paddd	%xmm4,%xmm0
2125	rorl	$2,%r14d
2126	addl	%r10d,%ecx
2127	psrlq	$17,%xmm6
2128	addl	%r15d,%r10d
2129	movl	%ecx,%r13d
2130	addl	%r10d,%r14d
2131	pxor	%xmm6,%xmm7
2132	rorl	$14,%r13d
2133	movl	%r14d,%r10d
2134	movl	%edx,%r12d
2135	rorl	$9,%r14d
2136	psrlq	$2,%xmm6
2137	xorl	%ecx,%r13d
2138	xorl	%r8d,%r12d
2139	pxor	%xmm6,%xmm7
2140	rorl	$5,%r13d
2141	xorl	%r10d,%r14d
2142	andl	%ecx,%r12d
2143	pshufd	$128,%xmm7,%xmm7
2144	xorl	%ecx,%r13d
2145	addl	8(%rsp),%r9d
2146	movl	%r10d,%r15d
2147	psrldq	$8,%xmm7
2148	xorl	%r8d,%r12d
2149	rorl	$11,%r14d
2150	xorl	%r11d,%r15d
2151	addl	%r12d,%r9d
2152	rorl	$6,%r13d
2153	paddd	%xmm7,%xmm0
2154	andl	%r15d,%edi
2155	xorl	%r10d,%r14d
2156	addl	%r13d,%r9d
2157	pshufd	$80,%xmm0,%xmm7
2158	xorl	%r11d,%edi
2159	rorl	$2,%r14d
2160	addl	%r9d,%ebx
2161	movdqa	%xmm7,%xmm6
2162	addl	%edi,%r9d
2163	movl	%ebx,%r13d
2164	psrld	$10,%xmm7
2165	addl	%r9d,%r14d
2166	rorl	$14,%r13d
2167	psrlq	$17,%xmm6
2168	movl	%r14d,%r9d
2169	movl	%ecx,%r12d
2170	pxor	%xmm6,%xmm7
2171	rorl	$9,%r14d
2172	xorl	%ebx,%r13d
2173	xorl	%edx,%r12d
2174	rorl	$5,%r13d
2175	xorl	%r9d,%r14d
2176	psrlq	$2,%xmm6
2177	andl	%ebx,%r12d
2178	xorl	%ebx,%r13d
2179	addl	12(%rsp),%r8d
2180	pxor	%xmm6,%xmm7
2181	movl	%r9d,%edi
2182	xorl	%edx,%r12d
2183	rorl	$11,%r14d
2184	pshufd	$8,%xmm7,%xmm7
2185	xorl	%r10d,%edi
2186	addl	%r12d,%r8d
2187	movdqa	0(%rbp),%xmm6
2188	rorl	$6,%r13d
2189	andl	%edi,%r15d
2190	pslldq	$8,%xmm7
2191	xorl	%r9d,%r14d
2192	addl	%r13d,%r8d
2193	xorl	%r10d,%r15d
2194	paddd	%xmm7,%xmm0
2195	rorl	$2,%r14d
2196	addl	%r8d,%eax
2197	addl	%r15d,%r8d
2198	paddd	%xmm0,%xmm6
2199	movl	%eax,%r13d
2200	addl	%r8d,%r14d
2201	movdqa	%xmm6,0(%rsp)
2202	rorl	$14,%r13d
2203	movdqa	%xmm2,%xmm4
2204	movl	%r14d,%r8d
2205	movl	%ebx,%r12d
2206	movdqa	%xmm0,%xmm7
2207	rorl	$9,%r14d
2208	xorl	%eax,%r13d
2209	xorl	%ecx,%r12d
2210	rorl	$5,%r13d
2211	xorl	%r8d,%r14d
2212.byte	102,15,58,15,225,4
2213	andl	%eax,%r12d
2214	xorl	%eax,%r13d
2215.byte	102,15,58,15,251,4
2216	addl	16(%rsp),%edx
2217	movl	%r8d,%r15d
2218	xorl	%ecx,%r12d
2219	rorl	$11,%r14d
2220	movdqa	%xmm4,%xmm5
2221	xorl	%r9d,%r15d
2222	addl	%r12d,%edx
2223	movdqa	%xmm4,%xmm6
2224	rorl	$6,%r13d
2225	andl	%r15d,%edi
2226	psrld	$3,%xmm4
2227	xorl	%r8d,%r14d
2228	addl	%r13d,%edx
2229	xorl	%r9d,%edi
2230	paddd	%xmm7,%xmm1
2231	rorl	$2,%r14d
2232	addl	%edx,%r11d
2233	psrld	$7,%xmm6
2234	addl	%edi,%edx
2235	movl	%r11d,%r13d
2236	pshufd	$250,%xmm0,%xmm7
2237	addl	%edx,%r14d
2238	rorl	$14,%r13d
2239	pslld	$14,%xmm5
2240	movl	%r14d,%edx
2241	movl	%eax,%r12d
2242	pxor	%xmm6,%xmm4
2243	rorl	$9,%r14d
2244	xorl	%r11d,%r13d
2245	xorl	%ebx,%r12d
2246	rorl	$5,%r13d
2247	psrld	$11,%xmm6
2248	xorl	%edx,%r14d
2249	pxor	%xmm5,%xmm4
2250	andl	%r11d,%r12d
2251	xorl	%r11d,%r13d
2252	pslld	$11,%xmm5
2253	addl	20(%rsp),%ecx
2254	movl	%edx,%edi
2255	pxor	%xmm6,%xmm4
2256	xorl	%ebx,%r12d
2257	rorl	$11,%r14d
2258	movdqa	%xmm7,%xmm6
2259	xorl	%r8d,%edi
2260	addl	%r12d,%ecx
2261	pxor	%xmm5,%xmm4
2262	rorl	$6,%r13d
2263	andl	%edi,%r15d
2264	xorl	%edx,%r14d
2265	psrld	$10,%xmm7
2266	addl	%r13d,%ecx
2267	xorl	%r8d,%r15d
2268	paddd	%xmm4,%xmm1
2269	rorl	$2,%r14d
2270	addl	%ecx,%r10d
2271	psrlq	$17,%xmm6
2272	addl	%r15d,%ecx
2273	movl	%r10d,%r13d
2274	addl	%ecx,%r14d
2275	pxor	%xmm6,%xmm7
2276	rorl	$14,%r13d
2277	movl	%r14d,%ecx
2278	movl	%r11d,%r12d
2279	rorl	$9,%r14d
2280	psrlq	$2,%xmm6
2281	xorl	%r10d,%r13d
2282	xorl	%eax,%r12d
2283	pxor	%xmm6,%xmm7
2284	rorl	$5,%r13d
2285	xorl	%ecx,%r14d
2286	andl	%r10d,%r12d
2287	pshufd	$128,%xmm7,%xmm7
2288	xorl	%r10d,%r13d
2289	addl	24(%rsp),%ebx
2290	movl	%ecx,%r15d
2291	psrldq	$8,%xmm7
2292	xorl	%eax,%r12d
2293	rorl	$11,%r14d
2294	xorl	%edx,%r15d
2295	addl	%r12d,%ebx
2296	rorl	$6,%r13d
2297	paddd	%xmm7,%xmm1
2298	andl	%r15d,%edi
2299	xorl	%ecx,%r14d
2300	addl	%r13d,%ebx
2301	pshufd	$80,%xmm1,%xmm7
2302	xorl	%edx,%edi
2303	rorl	$2,%r14d
2304	addl	%ebx,%r9d
2305	movdqa	%xmm7,%xmm6
2306	addl	%edi,%ebx
2307	movl	%r9d,%r13d
2308	psrld	$10,%xmm7
2309	addl	%ebx,%r14d
2310	rorl	$14,%r13d
2311	psrlq	$17,%xmm6
2312	movl	%r14d,%ebx
2313	movl	%r10d,%r12d
2314	pxor	%xmm6,%xmm7
2315	rorl	$9,%r14d
2316	xorl	%r9d,%r13d
2317	xorl	%r11d,%r12d
2318	rorl	$5,%r13d
2319	xorl	%ebx,%r14d
2320	psrlq	$2,%xmm6
2321	andl	%r9d,%r12d
2322	xorl	%r9d,%r13d
2323	addl	28(%rsp),%eax
2324	pxor	%xmm6,%xmm7
2325	movl	%ebx,%edi
2326	xorl	%r11d,%r12d
2327	rorl	$11,%r14d
2328	pshufd	$8,%xmm7,%xmm7
2329	xorl	%ecx,%edi
2330	addl	%r12d,%eax
2331	movdqa	32(%rbp),%xmm6
2332	rorl	$6,%r13d
2333	andl	%edi,%r15d
2334	pslldq	$8,%xmm7
2335	xorl	%ebx,%r14d
2336	addl	%r13d,%eax
2337	xorl	%ecx,%r15d
2338	paddd	%xmm7,%xmm1
2339	rorl	$2,%r14d
2340	addl	%eax,%r8d
2341	addl	%r15d,%eax
2342	paddd	%xmm1,%xmm6
2343	movl	%r8d,%r13d
2344	addl	%eax,%r14d
2345	movdqa	%xmm6,16(%rsp)
2346	rorl	$14,%r13d
2347	movdqa	%xmm3,%xmm4
2348	movl	%r14d,%eax
2349	movl	%r9d,%r12d
2350	movdqa	%xmm1,%xmm7
2351	rorl	$9,%r14d
2352	xorl	%r8d,%r13d
2353	xorl	%r10d,%r12d
2354	rorl	$5,%r13d
2355	xorl	%eax,%r14d
2356.byte	102,15,58,15,226,4
2357	andl	%r8d,%r12d
2358	xorl	%r8d,%r13d
2359.byte	102,15,58,15,248,4
2360	addl	32(%rsp),%r11d
2361	movl	%eax,%r15d
2362	xorl	%r10d,%r12d
2363	rorl	$11,%r14d
2364	movdqa	%xmm4,%xmm5
2365	xorl	%ebx,%r15d
2366	addl	%r12d,%r11d
2367	movdqa	%xmm4,%xmm6
2368	rorl	$6,%r13d
2369	andl	%r15d,%edi
2370	psrld	$3,%xmm4
2371	xorl	%eax,%r14d
2372	addl	%r13d,%r11d
2373	xorl	%ebx,%edi
2374	paddd	%xmm7,%xmm2
2375	rorl	$2,%r14d
2376	addl	%r11d,%edx
2377	psrld	$7,%xmm6
2378	addl	%edi,%r11d
2379	movl	%edx,%r13d
2380	pshufd	$250,%xmm1,%xmm7
2381	addl	%r11d,%r14d
2382	rorl	$14,%r13d
2383	pslld	$14,%xmm5
2384	movl	%r14d,%r11d
2385	movl	%r8d,%r12d
2386	pxor	%xmm6,%xmm4
2387	rorl	$9,%r14d
2388	xorl	%edx,%r13d
2389	xorl	%r9d,%r12d
2390	rorl	$5,%r13d
2391	psrld	$11,%xmm6
2392	xorl	%r11d,%r14d
2393	pxor	%xmm5,%xmm4
2394	andl	%edx,%r12d
2395	xorl	%edx,%r13d
2396	pslld	$11,%xmm5
2397	addl	36(%rsp),%r10d
2398	movl	%r11d,%edi
2399	pxor	%xmm6,%xmm4
2400	xorl	%r9d,%r12d
2401	rorl	$11,%r14d
2402	movdqa	%xmm7,%xmm6
2403	xorl	%eax,%edi
2404	addl	%r12d,%r10d
2405	pxor	%xmm5,%xmm4
2406	rorl	$6,%r13d
2407	andl	%edi,%r15d
2408	xorl	%r11d,%r14d
2409	psrld	$10,%xmm7
2410	addl	%r13d,%r10d
2411	xorl	%eax,%r15d
2412	paddd	%xmm4,%xmm2
2413	rorl	$2,%r14d
2414	addl	%r10d,%ecx
2415	psrlq	$17,%xmm6
2416	addl	%r15d,%r10d
2417	movl	%ecx,%r13d
2418	addl	%r10d,%r14d
2419	pxor	%xmm6,%xmm7
2420	rorl	$14,%r13d
2421	movl	%r14d,%r10d
2422	movl	%edx,%r12d
2423	rorl	$9,%r14d
2424	psrlq	$2,%xmm6
2425	xorl	%ecx,%r13d
2426	xorl	%r8d,%r12d
2427	pxor	%xmm6,%xmm7
2428	rorl	$5,%r13d
2429	xorl	%r10d,%r14d
2430	andl	%ecx,%r12d
2431	pshufd	$128,%xmm7,%xmm7
2432	xorl	%ecx,%r13d
2433	addl	40(%rsp),%r9d
2434	movl	%r10d,%r15d
2435	psrldq	$8,%xmm7
2436	xorl	%r8d,%r12d
2437	rorl	$11,%r14d
2438	xorl	%r11d,%r15d
2439	addl	%r12d,%r9d
2440	rorl	$6,%r13d
2441	paddd	%xmm7,%xmm2
2442	andl	%r15d,%edi
2443	xorl	%r10d,%r14d
2444	addl	%r13d,%r9d
2445	pshufd	$80,%xmm2,%xmm7
2446	xorl	%r11d,%edi
2447	rorl	$2,%r14d
2448	addl	%r9d,%ebx
2449	movdqa	%xmm7,%xmm6
2450	addl	%edi,%r9d
2451	movl	%ebx,%r13d
2452	psrld	$10,%xmm7
2453	addl	%r9d,%r14d
2454	rorl	$14,%r13d
2455	psrlq	$17,%xmm6
2456	movl	%r14d,%r9d
2457	movl	%ecx,%r12d
2458	pxor	%xmm6,%xmm7
2459	rorl	$9,%r14d
2460	xorl	%ebx,%r13d
2461	xorl	%edx,%r12d
2462	rorl	$5,%r13d
2463	xorl	%r9d,%r14d
2464	psrlq	$2,%xmm6
2465	andl	%ebx,%r12d
2466	xorl	%ebx,%r13d
2467	addl	44(%rsp),%r8d
2468	pxor	%xmm6,%xmm7
2469	movl	%r9d,%edi
2470	xorl	%edx,%r12d
2471	rorl	$11,%r14d
2472	pshufd	$8,%xmm7,%xmm7
2473	xorl	%r10d,%edi
2474	addl	%r12d,%r8d
2475	movdqa	64(%rbp),%xmm6
2476	rorl	$6,%r13d
2477	andl	%edi,%r15d
2478	pslldq	$8,%xmm7
2479	xorl	%r9d,%r14d
2480	addl	%r13d,%r8d
2481	xorl	%r10d,%r15d
2482	paddd	%xmm7,%xmm2
2483	rorl	$2,%r14d
2484	addl	%r8d,%eax
2485	addl	%r15d,%r8d
2486	paddd	%xmm2,%xmm6
2487	movl	%eax,%r13d
2488	addl	%r8d,%r14d
2489	movdqa	%xmm6,32(%rsp)
2490	rorl	$14,%r13d
2491	movdqa	%xmm0,%xmm4
2492	movl	%r14d,%r8d
2493	movl	%ebx,%r12d
2494	movdqa	%xmm2,%xmm7
2495	rorl	$9,%r14d
2496	xorl	%eax,%r13d
2497	xorl	%ecx,%r12d
2498	rorl	$5,%r13d
2499	xorl	%r8d,%r14d
2500.byte	102,15,58,15,227,4
2501	andl	%eax,%r12d
2502	xorl	%eax,%r13d
2503.byte	102,15,58,15,249,4
2504	addl	48(%rsp),%edx
2505	movl	%r8d,%r15d
2506	xorl	%ecx,%r12d
2507	rorl	$11,%r14d
2508	movdqa	%xmm4,%xmm5
2509	xorl	%r9d,%r15d
2510	addl	%r12d,%edx
2511	movdqa	%xmm4,%xmm6
2512	rorl	$6,%r13d
2513	andl	%r15d,%edi
2514	psrld	$3,%xmm4
2515	xorl	%r8d,%r14d
2516	addl	%r13d,%edx
2517	xorl	%r9d,%edi
2518	paddd	%xmm7,%xmm3
2519	rorl	$2,%r14d
2520	addl	%edx,%r11d
2521	psrld	$7,%xmm6
2522	addl	%edi,%edx
2523	movl	%r11d,%r13d
2524	pshufd	$250,%xmm2,%xmm7
2525	addl	%edx,%r14d
2526	rorl	$14,%r13d
2527	pslld	$14,%xmm5
2528	movl	%r14d,%edx
2529	movl	%eax,%r12d
2530	pxor	%xmm6,%xmm4
2531	rorl	$9,%r14d
2532	xorl	%r11d,%r13d
2533	xorl	%ebx,%r12d
2534	rorl	$5,%r13d
2535	psrld	$11,%xmm6
2536	xorl	%edx,%r14d
2537	pxor	%xmm5,%xmm4
2538	andl	%r11d,%r12d
2539	xorl	%r11d,%r13d
2540	pslld	$11,%xmm5
2541	addl	52(%rsp),%ecx
2542	movl	%edx,%edi
2543	pxor	%xmm6,%xmm4
2544	xorl	%ebx,%r12d
2545	rorl	$11,%r14d
2546	movdqa	%xmm7,%xmm6
2547	xorl	%r8d,%edi
2548	addl	%r12d,%ecx
2549	pxor	%xmm5,%xmm4
2550	rorl	$6,%r13d
2551	andl	%edi,%r15d
2552	xorl	%edx,%r14d
2553	psrld	$10,%xmm7
2554	addl	%r13d,%ecx
2555	xorl	%r8d,%r15d
2556	paddd	%xmm4,%xmm3
2557	rorl	$2,%r14d
2558	addl	%ecx,%r10d
2559	psrlq	$17,%xmm6
2560	addl	%r15d,%ecx
2561	movl	%r10d,%r13d
2562	addl	%ecx,%r14d
2563	pxor	%xmm6,%xmm7
2564	rorl	$14,%r13d
2565	movl	%r14d,%ecx
2566	movl	%r11d,%r12d
2567	rorl	$9,%r14d
2568	psrlq	$2,%xmm6
2569	xorl	%r10d,%r13d
2570	xorl	%eax,%r12d
2571	pxor	%xmm6,%xmm7
2572	rorl	$5,%r13d
2573	xorl	%ecx,%r14d
2574	andl	%r10d,%r12d
2575	pshufd	$128,%xmm7,%xmm7
2576	xorl	%r10d,%r13d
2577	addl	56(%rsp),%ebx
2578	movl	%ecx,%r15d
2579	psrldq	$8,%xmm7
2580	xorl	%eax,%r12d
2581	rorl	$11,%r14d
2582	xorl	%edx,%r15d
2583	addl	%r12d,%ebx
2584	rorl	$6,%r13d
2585	paddd	%xmm7,%xmm3
2586	andl	%r15d,%edi
2587	xorl	%ecx,%r14d
2588	addl	%r13d,%ebx
2589	pshufd	$80,%xmm3,%xmm7
2590	xorl	%edx,%edi
2591	rorl	$2,%r14d
2592	addl	%ebx,%r9d
2593	movdqa	%xmm7,%xmm6
2594	addl	%edi,%ebx
2595	movl	%r9d,%r13d
2596	psrld	$10,%xmm7
2597	addl	%ebx,%r14d
2598	rorl	$14,%r13d
2599	psrlq	$17,%xmm6
2600	movl	%r14d,%ebx
2601	movl	%r10d,%r12d
2602	pxor	%xmm6,%xmm7
2603	rorl	$9,%r14d
2604	xorl	%r9d,%r13d
2605	xorl	%r11d,%r12d
2606	rorl	$5,%r13d
2607	xorl	%ebx,%r14d
2608	psrlq	$2,%xmm6
2609	andl	%r9d,%r12d
2610	xorl	%r9d,%r13d
2611	addl	60(%rsp),%eax
2612	pxor	%xmm6,%xmm7
2613	movl	%ebx,%edi
2614	xorl	%r11d,%r12d
2615	rorl	$11,%r14d
2616	pshufd	$8,%xmm7,%xmm7
2617	xorl	%ecx,%edi
2618	addl	%r12d,%eax
2619	movdqa	96(%rbp),%xmm6
2620	rorl	$6,%r13d
2621	andl	%edi,%r15d
2622	pslldq	$8,%xmm7
2623	xorl	%ebx,%r14d
2624	addl	%r13d,%eax
2625	xorl	%ecx,%r15d
2626	paddd	%xmm7,%xmm3
2627	rorl	$2,%r14d
2628	addl	%eax,%r8d
2629	addl	%r15d,%eax
2630	paddd	%xmm3,%xmm6
2631	movl	%r8d,%r13d
2632	addl	%eax,%r14d
2633	movdqa	%xmm6,48(%rsp)
2634	cmpb	$0,131(%rbp)
2635	jne	.Lssse3_00_47
2636	rorl	$14,%r13d
2637	movl	%r14d,%eax
2638	movl	%r9d,%r12d
2639	rorl	$9,%r14d
2640	xorl	%r8d,%r13d
2641	xorl	%r10d,%r12d
2642	rorl	$5,%r13d
2643	xorl	%eax,%r14d
2644	andl	%r8d,%r12d
2645	xorl	%r8d,%r13d
2646	addl	0(%rsp),%r11d
2647	movl	%eax,%r15d
2648	xorl	%r10d,%r12d
2649	rorl	$11,%r14d
2650	xorl	%ebx,%r15d
2651	addl	%r12d,%r11d
2652	rorl	$6,%r13d
2653	andl	%r15d,%edi
2654	xorl	%eax,%r14d
2655	addl	%r13d,%r11d
2656	xorl	%ebx,%edi
2657	rorl	$2,%r14d
2658	addl	%r11d,%edx
2659	addl	%edi,%r11d
2660	movl	%edx,%r13d
2661	addl	%r11d,%r14d
2662	rorl	$14,%r13d
2663	movl	%r14d,%r11d
2664	movl	%r8d,%r12d
2665	rorl	$9,%r14d
2666	xorl	%edx,%r13d
2667	xorl	%r9d,%r12d
2668	rorl	$5,%r13d
2669	xorl	%r11d,%r14d
2670	andl	%edx,%r12d
2671	xorl	%edx,%r13d
2672	addl	4(%rsp),%r10d
2673	movl	%r11d,%edi
2674	xorl	%r9d,%r12d
2675	rorl	$11,%r14d
2676	xorl	%eax,%edi
2677	addl	%r12d,%r10d
2678	rorl	$6,%r13d
2679	andl	%edi,%r15d
2680	xorl	%r11d,%r14d
2681	addl	%r13d,%r10d
2682	xorl	%eax,%r15d
2683	rorl	$2,%r14d
2684	addl	%r10d,%ecx
2685	addl	%r15d,%r10d
2686	movl	%ecx,%r13d
2687	addl	%r10d,%r14d
2688	rorl	$14,%r13d
2689	movl	%r14d,%r10d
2690	movl	%edx,%r12d
2691	rorl	$9,%r14d
2692	xorl	%ecx,%r13d
2693	xorl	%r8d,%r12d
2694	rorl	$5,%r13d
2695	xorl	%r10d,%r14d
2696	andl	%ecx,%r12d
2697	xorl	%ecx,%r13d
2698	addl	8(%rsp),%r9d
2699	movl	%r10d,%r15d
2700	xorl	%r8d,%r12d
2701	rorl	$11,%r14d
2702	xorl	%r11d,%r15d
2703	addl	%r12d,%r9d
2704	rorl	$6,%r13d
2705	andl	%r15d,%edi
2706	xorl	%r10d,%r14d
2707	addl	%r13d,%r9d
2708	xorl	%r11d,%edi
2709	rorl	$2,%r14d
2710	addl	%r9d,%ebx
2711	addl	%edi,%r9d
2712	movl	%ebx,%r13d
2713	addl	%r9d,%r14d
2714	rorl	$14,%r13d
2715	movl	%r14d,%r9d
2716	movl	%ecx,%r12d
2717	rorl	$9,%r14d
2718	xorl	%ebx,%r13d
2719	xorl	%edx,%r12d
2720	rorl	$5,%r13d
2721	xorl	%r9d,%r14d
2722	andl	%ebx,%r12d
2723	xorl	%ebx,%r13d
2724	addl	12(%rsp),%r8d
2725	movl	%r9d,%edi
2726	xorl	%edx,%r12d
2727	rorl	$11,%r14d
2728	xorl	%r10d,%edi
2729	addl	%r12d,%r8d
2730	rorl	$6,%r13d
2731	andl	%edi,%r15d
2732	xorl	%r9d,%r14d
2733	addl	%r13d,%r8d
2734	xorl	%r10d,%r15d
2735	rorl	$2,%r14d
2736	addl	%r8d,%eax
2737	addl	%r15d,%r8d
2738	movl	%eax,%r13d
2739	addl	%r8d,%r14d
2740	rorl	$14,%r13d
2741	movl	%r14d,%r8d
2742	movl	%ebx,%r12d
2743	rorl	$9,%r14d
2744	xorl	%eax,%r13d
2745	xorl	%ecx,%r12d
2746	rorl	$5,%r13d
2747	xorl	%r8d,%r14d
2748	andl	%eax,%r12d
2749	xorl	%eax,%r13d
2750	addl	16(%rsp),%edx
2751	movl	%r8d,%r15d
2752	xorl	%ecx,%r12d
2753	rorl	$11,%r14d
2754	xorl	%r9d,%r15d
2755	addl	%r12d,%edx
2756	rorl	$6,%r13d
2757	andl	%r15d,%edi
2758	xorl	%r8d,%r14d
2759	addl	%r13d,%edx
2760	xorl	%r9d,%edi
2761	rorl	$2,%r14d
2762	addl	%edx,%r11d
2763	addl	%edi,%edx
2764	movl	%r11d,%r13d
2765	addl	%edx,%r14d
2766	rorl	$14,%r13d
2767	movl	%r14d,%edx
2768	movl	%eax,%r12d
2769	rorl	$9,%r14d
2770	xorl	%r11d,%r13d
2771	xorl	%ebx,%r12d
2772	rorl	$5,%r13d
2773	xorl	%edx,%r14d
2774	andl	%r11d,%r12d
2775	xorl	%r11d,%r13d
2776	addl	20(%rsp),%ecx
2777	movl	%edx,%edi
2778	xorl	%ebx,%r12d
2779	rorl	$11,%r14d
2780	xorl	%r8d,%edi
2781	addl	%r12d,%ecx
2782	rorl	$6,%r13d
2783	andl	%edi,%r15d
2784	xorl	%edx,%r14d
2785	addl	%r13d,%ecx
2786	xorl	%r8d,%r15d
2787	rorl	$2,%r14d
2788	addl	%ecx,%r10d
2789	addl	%r15d,%ecx
2790	movl	%r10d,%r13d
2791	addl	%ecx,%r14d
2792	rorl	$14,%r13d
2793	movl	%r14d,%ecx
2794	movl	%r11d,%r12d
2795	rorl	$9,%r14d
2796	xorl	%r10d,%r13d
2797	xorl	%eax,%r12d
2798	rorl	$5,%r13d
2799	xorl	%ecx,%r14d
2800	andl	%r10d,%r12d
2801	xorl	%r10d,%r13d
2802	addl	24(%rsp),%ebx
2803	movl	%ecx,%r15d
2804	xorl	%eax,%r12d
2805	rorl	$11,%r14d
2806	xorl	%edx,%r15d
2807	addl	%r12d,%ebx
2808	rorl	$6,%r13d
2809	andl	%r15d,%edi
2810	xorl	%ecx,%r14d
2811	addl	%r13d,%ebx
2812	xorl	%edx,%edi
2813	rorl	$2,%r14d
2814	addl	%ebx,%r9d
2815	addl	%edi,%ebx
2816	movl	%r9d,%r13d
2817	addl	%ebx,%r14d
2818	rorl	$14,%r13d
2819	movl	%r14d,%ebx
2820	movl	%r10d,%r12d
2821	rorl	$9,%r14d
2822	xorl	%r9d,%r13d
2823	xorl	%r11d,%r12d
2824	rorl	$5,%r13d
2825	xorl	%ebx,%r14d
2826	andl	%r9d,%r12d
2827	xorl	%r9d,%r13d
2828	addl	28(%rsp),%eax
2829	movl	%ebx,%edi
2830	xorl	%r11d,%r12d
2831	rorl	$11,%r14d
2832	xorl	%ecx,%edi
2833	addl	%r12d,%eax
2834	rorl	$6,%r13d
2835	andl	%edi,%r15d
2836	xorl	%ebx,%r14d
2837	addl	%r13d,%eax
2838	xorl	%ecx,%r15d
2839	rorl	$2,%r14d
2840	addl	%eax,%r8d
2841	addl	%r15d,%eax
2842	movl	%r8d,%r13d
2843	addl	%eax,%r14d
2844	rorl	$14,%r13d
2845	movl	%r14d,%eax
2846	movl	%r9d,%r12d
2847	rorl	$9,%r14d
2848	xorl	%r8d,%r13d
2849	xorl	%r10d,%r12d
2850	rorl	$5,%r13d
2851	xorl	%eax,%r14d
2852	andl	%r8d,%r12d
2853	xorl	%r8d,%r13d
2854	addl	32(%rsp),%r11d
2855	movl	%eax,%r15d
2856	xorl	%r10d,%r12d
2857	rorl	$11,%r14d
2858	xorl	%ebx,%r15d
2859	addl	%r12d,%r11d
2860	rorl	$6,%r13d
2861	andl	%r15d,%edi
2862	xorl	%eax,%r14d
2863	addl	%r13d,%r11d
2864	xorl	%ebx,%edi
2865	rorl	$2,%r14d
2866	addl	%r11d,%edx
2867	addl	%edi,%r11d
2868	movl	%edx,%r13d
2869	addl	%r11d,%r14d
2870	rorl	$14,%r13d
2871	movl	%r14d,%r11d
2872	movl	%r8d,%r12d
2873	rorl	$9,%r14d
2874	xorl	%edx,%r13d
2875	xorl	%r9d,%r12d
2876	rorl	$5,%r13d
2877	xorl	%r11d,%r14d
2878	andl	%edx,%r12d
2879	xorl	%edx,%r13d
2880	addl	36(%rsp),%r10d
2881	movl	%r11d,%edi
2882	xorl	%r9d,%r12d
2883	rorl	$11,%r14d
2884	xorl	%eax,%edi
2885	addl	%r12d,%r10d
2886	rorl	$6,%r13d
2887	andl	%edi,%r15d
2888	xorl	%r11d,%r14d
2889	addl	%r13d,%r10d
2890	xorl	%eax,%r15d
2891	rorl	$2,%r14d
2892	addl	%r10d,%ecx
2893	addl	%r15d,%r10d
2894	movl	%ecx,%r13d
2895	addl	%r10d,%r14d
2896	rorl	$14,%r13d
2897	movl	%r14d,%r10d
2898	movl	%edx,%r12d
2899	rorl	$9,%r14d
2900	xorl	%ecx,%r13d
2901	xorl	%r8d,%r12d
2902	rorl	$5,%r13d
2903	xorl	%r10d,%r14d
2904	andl	%ecx,%r12d
2905	xorl	%ecx,%r13d
2906	addl	40(%rsp),%r9d
2907	movl	%r10d,%r15d
2908	xorl	%r8d,%r12d
2909	rorl	$11,%r14d
2910	xorl	%r11d,%r15d
2911	addl	%r12d,%r9d
2912	rorl	$6,%r13d
2913	andl	%r15d,%edi
2914	xorl	%r10d,%r14d
2915	addl	%r13d,%r9d
2916	xorl	%r11d,%edi
2917	rorl	$2,%r14d
2918	addl	%r9d,%ebx
2919	addl	%edi,%r9d
2920	movl	%ebx,%r13d
2921	addl	%r9d,%r14d
2922	rorl	$14,%r13d
2923	movl	%r14d,%r9d
2924	movl	%ecx,%r12d
2925	rorl	$9,%r14d
2926	xorl	%ebx,%r13d
2927	xorl	%edx,%r12d
2928	rorl	$5,%r13d
2929	xorl	%r9d,%r14d
2930	andl	%ebx,%r12d
2931	xorl	%ebx,%r13d
2932	addl	44(%rsp),%r8d
2933	movl	%r9d,%edi
2934	xorl	%edx,%r12d
2935	rorl	$11,%r14d
2936	xorl	%r10d,%edi
2937	addl	%r12d,%r8d
2938	rorl	$6,%r13d
2939	andl	%edi,%r15d
2940	xorl	%r9d,%r14d
2941	addl	%r13d,%r8d
2942	xorl	%r10d,%r15d
2943	rorl	$2,%r14d
2944	addl	%r8d,%eax
2945	addl	%r15d,%r8d
2946	movl	%eax,%r13d
2947	addl	%r8d,%r14d
2948	rorl	$14,%r13d
2949	movl	%r14d,%r8d
2950	movl	%ebx,%r12d
2951	rorl	$9,%r14d
2952	xorl	%eax,%r13d
2953	xorl	%ecx,%r12d
2954	rorl	$5,%r13d
2955	xorl	%r8d,%r14d
2956	andl	%eax,%r12d
2957	xorl	%eax,%r13d
2958	addl	48(%rsp),%edx
2959	movl	%r8d,%r15d
2960	xorl	%ecx,%r12d
2961	rorl	$11,%r14d
2962	xorl	%r9d,%r15d
2963	addl	%r12d,%edx
2964	rorl	$6,%r13d
2965	andl	%r15d,%edi
2966	xorl	%r8d,%r14d
2967	addl	%r13d,%edx
2968	xorl	%r9d,%edi
2969	rorl	$2,%r14d
2970	addl	%edx,%r11d
2971	addl	%edi,%edx
2972	movl	%r11d,%r13d
2973	addl	%edx,%r14d
2974	rorl	$14,%r13d
2975	movl	%r14d,%edx
2976	movl	%eax,%r12d
2977	rorl	$9,%r14d
2978	xorl	%r11d,%r13d
2979	xorl	%ebx,%r12d
2980	rorl	$5,%r13d
2981	xorl	%edx,%r14d
2982	andl	%r11d,%r12d
2983	xorl	%r11d,%r13d
2984	addl	52(%rsp),%ecx
2985	movl	%edx,%edi
2986	xorl	%ebx,%r12d
2987	rorl	$11,%r14d
2988	xorl	%r8d,%edi
2989	addl	%r12d,%ecx
2990	rorl	$6,%r13d
2991	andl	%edi,%r15d
2992	xorl	%edx,%r14d
2993	addl	%r13d,%ecx
2994	xorl	%r8d,%r15d
2995	rorl	$2,%r14d
2996	addl	%ecx,%r10d
2997	addl	%r15d,%ecx
2998	movl	%r10d,%r13d
2999	addl	%ecx,%r14d
3000	rorl	$14,%r13d
3001	movl	%r14d,%ecx
3002	movl	%r11d,%r12d
3003	rorl	$9,%r14d
3004	xorl	%r10d,%r13d
3005	xorl	%eax,%r12d
3006	rorl	$5,%r13d
3007	xorl	%ecx,%r14d
3008	andl	%r10d,%r12d
3009	xorl	%r10d,%r13d
3010	addl	56(%rsp),%ebx
3011	movl	%ecx,%r15d
3012	xorl	%eax,%r12d
3013	rorl	$11,%r14d
3014	xorl	%edx,%r15d
3015	addl	%r12d,%ebx
3016	rorl	$6,%r13d
3017	andl	%r15d,%edi
3018	xorl	%ecx,%r14d
3019	addl	%r13d,%ebx
3020	xorl	%edx,%edi
3021	rorl	$2,%r14d
3022	addl	%ebx,%r9d
3023	addl	%edi,%ebx
3024	movl	%r9d,%r13d
3025	addl	%ebx,%r14d
3026	rorl	$14,%r13d
3027	movl	%r14d,%ebx
3028	movl	%r10d,%r12d
3029	rorl	$9,%r14d
3030	xorl	%r9d,%r13d
3031	xorl	%r11d,%r12d
3032	rorl	$5,%r13d
3033	xorl	%ebx,%r14d
3034	andl	%r9d,%r12d
3035	xorl	%r9d,%r13d
3036	addl	60(%rsp),%eax
3037	movl	%ebx,%edi
3038	xorl	%r11d,%r12d
3039	rorl	$11,%r14d
3040	xorl	%ecx,%edi
3041	addl	%r12d,%eax
3042	rorl	$6,%r13d
3043	andl	%edi,%r15d
3044	xorl	%ebx,%r14d
3045	addl	%r13d,%eax
3046	xorl	%ecx,%r15d
3047	rorl	$2,%r14d
3048	addl	%eax,%r8d
3049	addl	%r15d,%eax
3050	movl	%r8d,%r13d
3051	addl	%eax,%r14d
3052	movq	64+0(%rsp),%rdi
3053	movl	%r14d,%eax
3054
3055	addl	0(%rdi),%eax
3056	leaq	64(%rsi),%rsi
3057	addl	4(%rdi),%ebx
3058	addl	8(%rdi),%ecx
3059	addl	12(%rdi),%edx
3060	addl	16(%rdi),%r8d
3061	addl	20(%rdi),%r9d
3062	addl	24(%rdi),%r10d
3063	addl	28(%rdi),%r11d
3064
3065	cmpq	64+16(%rsp),%rsi
3066
3067	movl	%eax,0(%rdi)
3068	movl	%ebx,4(%rdi)
3069	movl	%ecx,8(%rdi)
3070	movl	%edx,12(%rdi)
3071	movl	%r8d,16(%rdi)
3072	movl	%r9d,20(%rdi)
3073	movl	%r10d,24(%rdi)
3074	movl	%r11d,28(%rdi)
3075	jb	.Lloop_ssse3
3076
3077	movq	88(%rsp),%rsi
3078.cfi_def_cfa	%rsi,8
3079	movq	-48(%rsi),%r15
3080.cfi_restore	%r15
3081	movq	-40(%rsi),%r14
3082.cfi_restore	%r14
3083	movq	-32(%rsi),%r13
3084.cfi_restore	%r13
3085	movq	-24(%rsi),%r12
3086.cfi_restore	%r12
3087	movq	-16(%rsi),%rbp
3088.cfi_restore	%rbp
3089	movq	-8(%rsi),%rbx
3090.cfi_restore	%rbx
3091	leaq	(%rsi),%rsp
3092.cfi_def_cfa_register	%rsp
3093.Lepilogue_ssse3:
3094	.byte	0xf3,0xc3
3095.cfi_endproc
3096.size	sha256_block_data_order_ssse3,.-sha256_block_data_order_ssse3
3097.type	sha256_block_data_order_avx,@function
3098.align	64
3099sha256_block_data_order_avx:
3100.cfi_startproc
3101.Lavx_shortcut:
3102	movq	%rsp,%rax
3103.cfi_def_cfa_register	%rax
3104	pushq	%rbx
3105.cfi_offset	%rbx,-16
3106	pushq	%rbp
3107.cfi_offset	%rbp,-24
3108	pushq	%r12
3109.cfi_offset	%r12,-32
3110	pushq	%r13
3111.cfi_offset	%r13,-40
3112	pushq	%r14
3113.cfi_offset	%r14,-48
3114	pushq	%r15
3115.cfi_offset	%r15,-56
3116	shlq	$4,%rdx
3117	subq	$96,%rsp
3118	leaq	(%rsi,%rdx,4),%rdx
3119	andq	$-64,%rsp
3120	movq	%rdi,64+0(%rsp)
3121	movq	%rsi,64+8(%rsp)
3122	movq	%rdx,64+16(%rsp)
3123	movq	%rax,88(%rsp)
3124.cfi_escape	0x0f,0x06,0x77,0xd8,0x00,0x06,0x23,0x08
3125.Lprologue_avx:
3126
3127	vzeroupper
3128	movl	0(%rdi),%eax
3129	movl	4(%rdi),%ebx
3130	movl	8(%rdi),%ecx
3131	movl	12(%rdi),%edx
3132	movl	16(%rdi),%r8d
3133	movl	20(%rdi),%r9d
3134	movl	24(%rdi),%r10d
3135	movl	28(%rdi),%r11d
3136	vmovdqa	K256+512+32(%rip),%xmm8
3137	vmovdqa	K256+512+64(%rip),%xmm9
3138	jmp	.Lloop_avx
3139.align	16
3140.Lloop_avx:
3141	vmovdqa	K256+512(%rip),%xmm7
3142	vmovdqu	0(%rsi),%xmm0
3143	vmovdqu	16(%rsi),%xmm1
3144	vmovdqu	32(%rsi),%xmm2
3145	vmovdqu	48(%rsi),%xmm3
3146	vpshufb	%xmm7,%xmm0,%xmm0
3147	leaq	K256(%rip),%rbp
3148	vpshufb	%xmm7,%xmm1,%xmm1
3149	vpshufb	%xmm7,%xmm2,%xmm2
3150	vpaddd	0(%rbp),%xmm0,%xmm4
3151	vpshufb	%xmm7,%xmm3,%xmm3
3152	vpaddd	32(%rbp),%xmm1,%xmm5
3153	vpaddd	64(%rbp),%xmm2,%xmm6
3154	vpaddd	96(%rbp),%xmm3,%xmm7
3155	vmovdqa	%xmm4,0(%rsp)
3156	movl	%eax,%r14d
3157	vmovdqa	%xmm5,16(%rsp)
3158	movl	%ebx,%edi
3159	vmovdqa	%xmm6,32(%rsp)
3160	xorl	%ecx,%edi
3161	vmovdqa	%xmm7,48(%rsp)
3162	movl	%r8d,%r13d
3163	jmp	.Lavx_00_47
3164
3165.align	16
3166.Lavx_00_47:
3167	subq	$-128,%rbp
3168	vpalignr	$4,%xmm0,%xmm1,%xmm4
3169	shrdl	$14,%r13d,%r13d
3170	movl	%r14d,%eax
3171	movl	%r9d,%r12d
3172	vpalignr	$4,%xmm2,%xmm3,%xmm7
3173	shrdl	$9,%r14d,%r14d
3174	xorl	%r8d,%r13d
3175	xorl	%r10d,%r12d
3176	vpsrld	$7,%xmm4,%xmm6
3177	shrdl	$5,%r13d,%r13d
3178	xorl	%eax,%r14d
3179	andl	%r8d,%r12d
3180	vpaddd	%xmm7,%xmm0,%xmm0
3181	xorl	%r8d,%r13d
3182	addl	0(%rsp),%r11d
3183	movl	%eax,%r15d
3184	vpsrld	$3,%xmm4,%xmm7
3185	xorl	%r10d,%r12d
3186	shrdl	$11,%r14d,%r14d
3187	xorl	%ebx,%r15d
3188	vpslld	$14,%xmm4,%xmm5
3189	addl	%r12d,%r11d
3190	shrdl	$6,%r13d,%r13d
3191	andl	%r15d,%edi
3192	vpxor	%xmm6,%xmm7,%xmm4
3193	xorl	%eax,%r14d
3194	addl	%r13d,%r11d
3195	xorl	%ebx,%edi
3196	vpshufd	$250,%xmm3,%xmm7
3197	shrdl	$2,%r14d,%r14d
3198	addl	%r11d,%edx
3199	addl	%edi,%r11d
3200	vpsrld	$11,%xmm6,%xmm6
3201	movl	%edx,%r13d
3202	addl	%r11d,%r14d
3203	shrdl	$14,%r13d,%r13d
3204	vpxor	%xmm5,%xmm4,%xmm4
3205	movl	%r14d,%r11d
3206	movl	%r8d,%r12d
3207	shrdl	$9,%r14d,%r14d
3208	vpslld	$11,%xmm5,%xmm5
3209	xorl	%edx,%r13d
3210	xorl	%r9d,%r12d
3211	shrdl	$5,%r13d,%r13d
3212	vpxor	%xmm6,%xmm4,%xmm4
3213	xorl	%r11d,%r14d
3214	andl	%edx,%r12d
3215	xorl	%edx,%r13d
3216	vpsrld	$10,%xmm7,%xmm6
3217	addl	4(%rsp),%r10d
3218	movl	%r11d,%edi
3219	xorl	%r9d,%r12d
3220	vpxor	%xmm5,%xmm4,%xmm4
3221	shrdl	$11,%r14d,%r14d
3222	xorl	%eax,%edi
3223	addl	%r12d,%r10d
3224	vpsrlq	$17,%xmm7,%xmm7
3225	shrdl	$6,%r13d,%r13d
3226	andl	%edi,%r15d
3227	xorl	%r11d,%r14d
3228	vpaddd	%xmm4,%xmm0,%xmm0
3229	addl	%r13d,%r10d
3230	xorl	%eax,%r15d
3231	shrdl	$2,%r14d,%r14d
3232	vpxor	%xmm7,%xmm6,%xmm6
3233	addl	%r10d,%ecx
3234	addl	%r15d,%r10d
3235	movl	%ecx,%r13d
3236	vpsrlq	$2,%xmm7,%xmm7
3237	addl	%r10d,%r14d
3238	shrdl	$14,%r13d,%r13d
3239	movl	%r14d,%r10d
3240	vpxor	%xmm7,%xmm6,%xmm6
3241	movl	%edx,%r12d
3242	shrdl	$9,%r14d,%r14d
3243	xorl	%ecx,%r13d
3244	vpshufb	%xmm8,%xmm6,%xmm6
3245	xorl	%r8d,%r12d
3246	shrdl	$5,%r13d,%r13d
3247	xorl	%r10d,%r14d
3248	vpaddd	%xmm6,%xmm0,%xmm0
3249	andl	%ecx,%r12d
3250	xorl	%ecx,%r13d
3251	addl	8(%rsp),%r9d
3252	vpshufd	$80,%xmm0,%xmm7
3253	movl	%r10d,%r15d
3254	xorl	%r8d,%r12d
3255	shrdl	$11,%r14d,%r14d
3256	vpsrld	$10,%xmm7,%xmm6
3257	xorl	%r11d,%r15d
3258	addl	%r12d,%r9d
3259	shrdl	$6,%r13d,%r13d
3260	vpsrlq	$17,%xmm7,%xmm7
3261	andl	%r15d,%edi
3262	xorl	%r10d,%r14d
3263	addl	%r13d,%r9d
3264	vpxor	%xmm7,%xmm6,%xmm6
3265	xorl	%r11d,%edi
3266	shrdl	$2,%r14d,%r14d
3267	addl	%r9d,%ebx
3268	vpsrlq	$2,%xmm7,%xmm7
3269	addl	%edi,%r9d
3270	movl	%ebx,%r13d
3271	addl	%r9d,%r14d
3272	vpxor	%xmm7,%xmm6,%xmm6
3273	shrdl	$14,%r13d,%r13d
3274	movl	%r14d,%r9d
3275	movl	%ecx,%r12d
3276	vpshufb	%xmm9,%xmm6,%xmm6
3277	shrdl	$9,%r14d,%r14d
3278	xorl	%ebx,%r13d
3279	xorl	%edx,%r12d
3280	vpaddd	%xmm6,%xmm0,%xmm0
3281	shrdl	$5,%r13d,%r13d
3282	xorl	%r9d,%r14d
3283	andl	%ebx,%r12d
3284	vpaddd	0(%rbp),%xmm0,%xmm6
3285	xorl	%ebx,%r13d
3286	addl	12(%rsp),%r8d
3287	movl	%r9d,%edi
3288	xorl	%edx,%r12d
3289	shrdl	$11,%r14d,%r14d
3290	xorl	%r10d,%edi
3291	addl	%r12d,%r8d
3292	shrdl	$6,%r13d,%r13d
3293	andl	%edi,%r15d
3294	xorl	%r9d,%r14d
3295	addl	%r13d,%r8d
3296	xorl	%r10d,%r15d
3297	shrdl	$2,%r14d,%r14d
3298	addl	%r8d,%eax
3299	addl	%r15d,%r8d
3300	movl	%eax,%r13d
3301	addl	%r8d,%r14d
3302	vmovdqa	%xmm6,0(%rsp)
3303	vpalignr	$4,%xmm1,%xmm2,%xmm4
3304	shrdl	$14,%r13d,%r13d
3305	movl	%r14d,%r8d
3306	movl	%ebx,%r12d
3307	vpalignr	$4,%xmm3,%xmm0,%xmm7
3308	shrdl	$9,%r14d,%r14d
3309	xorl	%eax,%r13d
3310	xorl	%ecx,%r12d
3311	vpsrld	$7,%xmm4,%xmm6
3312	shrdl	$5,%r13d,%r13d
3313	xorl	%r8d,%r14d
3314	andl	%eax,%r12d
3315	vpaddd	%xmm7,%xmm1,%xmm1
3316	xorl	%eax,%r13d
3317	addl	16(%rsp),%edx
3318	movl	%r8d,%r15d
3319	vpsrld	$3,%xmm4,%xmm7
3320	xorl	%ecx,%r12d
3321	shrdl	$11,%r14d,%r14d
3322	xorl	%r9d,%r15d
3323	vpslld	$14,%xmm4,%xmm5
3324	addl	%r12d,%edx
3325	shrdl	$6,%r13d,%r13d
3326	andl	%r15d,%edi
3327	vpxor	%xmm6,%xmm7,%xmm4
3328	xorl	%r8d,%r14d
3329	addl	%r13d,%edx
3330	xorl	%r9d,%edi
3331	vpshufd	$250,%xmm0,%xmm7
3332	shrdl	$2,%r14d,%r14d
3333	addl	%edx,%r11d
3334	addl	%edi,%edx
3335	vpsrld	$11,%xmm6,%xmm6
3336	movl	%r11d,%r13d
3337	addl	%edx,%r14d
3338	shrdl	$14,%r13d,%r13d
3339	vpxor	%xmm5,%xmm4,%xmm4
3340	movl	%r14d,%edx
3341	movl	%eax,%r12d
3342	shrdl	$9,%r14d,%r14d
3343	vpslld	$11,%xmm5,%xmm5
3344	xorl	%r11d,%r13d
3345	xorl	%ebx,%r12d
3346	shrdl	$5,%r13d,%r13d
3347	vpxor	%xmm6,%xmm4,%xmm4
3348	xorl	%edx,%r14d
3349	andl	%r11d,%r12d
3350	xorl	%r11d,%r13d
3351	vpsrld	$10,%xmm7,%xmm6
3352	addl	20(%rsp),%ecx
3353	movl	%edx,%edi
3354	xorl	%ebx,%r12d
3355	vpxor	%xmm5,%xmm4,%xmm4
3356	shrdl	$11,%r14d,%r14d
3357	xorl	%r8d,%edi
3358	addl	%r12d,%ecx
3359	vpsrlq	$17,%xmm7,%xmm7
3360	shrdl	$6,%r13d,%r13d
3361	andl	%edi,%r15d
3362	xorl	%edx,%r14d
3363	vpaddd	%xmm4,%xmm1,%xmm1
3364	addl	%r13d,%ecx
3365	xorl	%r8d,%r15d
3366	shrdl	$2,%r14d,%r14d
3367	vpxor	%xmm7,%xmm6,%xmm6
3368	addl	%ecx,%r10d
3369	addl	%r15d,%ecx
3370	movl	%r10d,%r13d
3371	vpsrlq	$2,%xmm7,%xmm7
3372	addl	%ecx,%r14d
3373	shrdl	$14,%r13d,%r13d
3374	movl	%r14d,%ecx
3375	vpxor	%xmm7,%xmm6,%xmm6
3376	movl	%r11d,%r12d
3377	shrdl	$9,%r14d,%r14d
3378	xorl	%r10d,%r13d
3379	vpshufb	%xmm8,%xmm6,%xmm6
3380	xorl	%eax,%r12d
3381	shrdl	$5,%r13d,%r13d
3382	xorl	%ecx,%r14d
3383	vpaddd	%xmm6,%xmm1,%xmm1
3384	andl	%r10d,%r12d
3385	xorl	%r10d,%r13d
3386	addl	24(%rsp),%ebx
3387	vpshufd	$80,%xmm1,%xmm7
3388	movl	%ecx,%r15d
3389	xorl	%eax,%r12d
3390	shrdl	$11,%r14d,%r14d
3391	vpsrld	$10,%xmm7,%xmm6
3392	xorl	%edx,%r15d
3393	addl	%r12d,%ebx
3394	shrdl	$6,%r13d,%r13d
3395	vpsrlq	$17,%xmm7,%xmm7
3396	andl	%r15d,%edi
3397	xorl	%ecx,%r14d
3398	addl	%r13d,%ebx
3399	vpxor	%xmm7,%xmm6,%xmm6
3400	xorl	%edx,%edi
3401	shrdl	$2,%r14d,%r14d
3402	addl	%ebx,%r9d
3403	vpsrlq	$2,%xmm7,%xmm7
3404	addl	%edi,%ebx
3405	movl	%r9d,%r13d
3406	addl	%ebx,%r14d
3407	vpxor	%xmm7,%xmm6,%xmm6
3408	shrdl	$14,%r13d,%r13d
3409	movl	%r14d,%ebx
3410	movl	%r10d,%r12d
3411	vpshufb	%xmm9,%xmm6,%xmm6
3412	shrdl	$9,%r14d,%r14d
3413	xorl	%r9d,%r13d
3414	xorl	%r11d,%r12d
3415	vpaddd	%xmm6,%xmm1,%xmm1
3416	shrdl	$5,%r13d,%r13d
3417	xorl	%ebx,%r14d
3418	andl	%r9d,%r12d
3419	vpaddd	32(%rbp),%xmm1,%xmm6
3420	xorl	%r9d,%r13d
3421	addl	28(%rsp),%eax
3422	movl	%ebx,%edi
3423	xorl	%r11d,%r12d
3424	shrdl	$11,%r14d,%r14d
3425	xorl	%ecx,%edi
3426	addl	%r12d,%eax
3427	shrdl	$6,%r13d,%r13d
3428	andl	%edi,%r15d
3429	xorl	%ebx,%r14d
3430	addl	%r13d,%eax
3431	xorl	%ecx,%r15d
3432	shrdl	$2,%r14d,%r14d
3433	addl	%eax,%r8d
3434	addl	%r15d,%eax
3435	movl	%r8d,%r13d
3436	addl	%eax,%r14d
3437	vmovdqa	%xmm6,16(%rsp)
3438	vpalignr	$4,%xmm2,%xmm3,%xmm4
3439	shrdl	$14,%r13d,%r13d
3440	movl	%r14d,%eax
3441	movl	%r9d,%r12d
3442	vpalignr	$4,%xmm0,%xmm1,%xmm7
3443	shrdl	$9,%r14d,%r14d
3444	xorl	%r8d,%r13d
3445	xorl	%r10d,%r12d
3446	vpsrld	$7,%xmm4,%xmm6
3447	shrdl	$5,%r13d,%r13d
3448	xorl	%eax,%r14d
3449	andl	%r8d,%r12d
3450	vpaddd	%xmm7,%xmm2,%xmm2
3451	xorl	%r8d,%r13d
3452	addl	32(%rsp),%r11d
3453	movl	%eax,%r15d
3454	vpsrld	$3,%xmm4,%xmm7
3455	xorl	%r10d,%r12d
3456	shrdl	$11,%r14d,%r14d
3457	xorl	%ebx,%r15d
3458	vpslld	$14,%xmm4,%xmm5
3459	addl	%r12d,%r11d
3460	shrdl	$6,%r13d,%r13d
3461	andl	%r15d,%edi
3462	vpxor	%xmm6,%xmm7,%xmm4
3463	xorl	%eax,%r14d
3464	addl	%r13d,%r11d
3465	xorl	%ebx,%edi
3466	vpshufd	$250,%xmm1,%xmm7
3467	shrdl	$2,%r14d,%r14d
3468	addl	%r11d,%edx
3469	addl	%edi,%r11d
3470	vpsrld	$11,%xmm6,%xmm6
3471	movl	%edx,%r13d
3472	addl	%r11d,%r14d
3473	shrdl	$14,%r13d,%r13d
3474	vpxor	%xmm5,%xmm4,%xmm4
3475	movl	%r14d,%r11d
3476	movl	%r8d,%r12d
3477	shrdl	$9,%r14d,%r14d
3478	vpslld	$11,%xmm5,%xmm5
3479	xorl	%edx,%r13d
3480	xorl	%r9d,%r12d
3481	shrdl	$5,%r13d,%r13d
3482	vpxor	%xmm6,%xmm4,%xmm4
3483	xorl	%r11d,%r14d
3484	andl	%edx,%r12d
3485	xorl	%edx,%r13d
3486	vpsrld	$10,%xmm7,%xmm6
3487	addl	36(%rsp),%r10d
3488	movl	%r11d,%edi
3489	xorl	%r9d,%r12d
3490	vpxor	%xmm5,%xmm4,%xmm4
3491	shrdl	$11,%r14d,%r14d
3492	xorl	%eax,%edi
3493	addl	%r12d,%r10d
3494	vpsrlq	$17,%xmm7,%xmm7
3495	shrdl	$6,%r13d,%r13d
3496	andl	%edi,%r15d
3497	xorl	%r11d,%r14d
3498	vpaddd	%xmm4,%xmm2,%xmm2
3499	addl	%r13d,%r10d
3500	xorl	%eax,%r15d
3501	shrdl	$2,%r14d,%r14d
3502	vpxor	%xmm7,%xmm6,%xmm6
3503	addl	%r10d,%ecx
3504	addl	%r15d,%r10d
3505	movl	%ecx,%r13d
3506	vpsrlq	$2,%xmm7,%xmm7
3507	addl	%r10d,%r14d
3508	shrdl	$14,%r13d,%r13d
3509	movl	%r14d,%r10d
3510	vpxor	%xmm7,%xmm6,%xmm6
3511	movl	%edx,%r12d
3512	shrdl	$9,%r14d,%r14d
3513	xorl	%ecx,%r13d
3514	vpshufb	%xmm8,%xmm6,%xmm6
3515	xorl	%r8d,%r12d
3516	shrdl	$5,%r13d,%r13d
3517	xorl	%r10d,%r14d
3518	vpaddd	%xmm6,%xmm2,%xmm2
3519	andl	%ecx,%r12d
3520	xorl	%ecx,%r13d
3521	addl	40(%rsp),%r9d
3522	vpshufd	$80,%xmm2,%xmm7
3523	movl	%r10d,%r15d
3524	xorl	%r8d,%r12d
3525	shrdl	$11,%r14d,%r14d
3526	vpsrld	$10,%xmm7,%xmm6
3527	xorl	%r11d,%r15d
3528	addl	%r12d,%r9d
3529	shrdl	$6,%r13d,%r13d
3530	vpsrlq	$17,%xmm7,%xmm7
3531	andl	%r15d,%edi
3532	xorl	%r10d,%r14d
3533	addl	%r13d,%r9d
3534	vpxor	%xmm7,%xmm6,%xmm6
3535	xorl	%r11d,%edi
3536	shrdl	$2,%r14d,%r14d
3537	addl	%r9d,%ebx
3538	vpsrlq	$2,%xmm7,%xmm7
3539	addl	%edi,%r9d
3540	movl	%ebx,%r13d
3541	addl	%r9d,%r14d
3542	vpxor	%xmm7,%xmm6,%xmm6
3543	shrdl	$14,%r13d,%r13d
3544	movl	%r14d,%r9d
3545	movl	%ecx,%r12d
3546	vpshufb	%xmm9,%xmm6,%xmm6
3547	shrdl	$9,%r14d,%r14d
3548	xorl	%ebx,%r13d
3549	xorl	%edx,%r12d
3550	vpaddd	%xmm6,%xmm2,%xmm2
3551	shrdl	$5,%r13d,%r13d
3552	xorl	%r9d,%r14d
3553	andl	%ebx,%r12d
3554	vpaddd	64(%rbp),%xmm2,%xmm6
3555	xorl	%ebx,%r13d
3556	addl	44(%rsp),%r8d
3557	movl	%r9d,%edi
3558	xorl	%edx,%r12d
3559	shrdl	$11,%r14d,%r14d
3560	xorl	%r10d,%edi
3561	addl	%r12d,%r8d
3562	shrdl	$6,%r13d,%r13d
3563	andl	%edi,%r15d
3564	xorl	%r9d,%r14d
3565	addl	%r13d,%r8d
3566	xorl	%r10d,%r15d
3567	shrdl	$2,%r14d,%r14d
3568	addl	%r8d,%eax
3569	addl	%r15d,%r8d
3570	movl	%eax,%r13d
3571	addl	%r8d,%r14d
3572	vmovdqa	%xmm6,32(%rsp)
3573	vpalignr	$4,%xmm3,%xmm0,%xmm4
3574	shrdl	$14,%r13d,%r13d
3575	movl	%r14d,%r8d
3576	movl	%ebx,%r12d
3577	vpalignr	$4,%xmm1,%xmm2,%xmm7
3578	shrdl	$9,%r14d,%r14d
3579	xorl	%eax,%r13d
3580	xorl	%ecx,%r12d
3581	vpsrld	$7,%xmm4,%xmm6
3582	shrdl	$5,%r13d,%r13d
3583	xorl	%r8d,%r14d
3584	andl	%eax,%r12d
3585	vpaddd	%xmm7,%xmm3,%xmm3
3586	xorl	%eax,%r13d
3587	addl	48(%rsp),%edx
3588	movl	%r8d,%r15d
3589	vpsrld	$3,%xmm4,%xmm7
3590	xorl	%ecx,%r12d
3591	shrdl	$11,%r14d,%r14d
3592	xorl	%r9d,%r15d
3593	vpslld	$14,%xmm4,%xmm5
3594	addl	%r12d,%edx
3595	shrdl	$6,%r13d,%r13d
3596	andl	%r15d,%edi
3597	vpxor	%xmm6,%xmm7,%xmm4
3598	xorl	%r8d,%r14d
3599	addl	%r13d,%edx
3600	xorl	%r9d,%edi
3601	vpshufd	$250,%xmm2,%xmm7
3602	shrdl	$2,%r14d,%r14d
3603	addl	%edx,%r11d
3604	addl	%edi,%edx
3605	vpsrld	$11,%xmm6,%xmm6
3606	movl	%r11d,%r13d
3607	addl	%edx,%r14d
3608	shrdl	$14,%r13d,%r13d
3609	vpxor	%xmm5,%xmm4,%xmm4
3610	movl	%r14d,%edx
3611	movl	%eax,%r12d
3612	shrdl	$9,%r14d,%r14d
3613	vpslld	$11,%xmm5,%xmm5
3614	xorl	%r11d,%r13d
3615	xorl	%ebx,%r12d
3616	shrdl	$5,%r13d,%r13d
3617	vpxor	%xmm6,%xmm4,%xmm4
3618	xorl	%edx,%r14d
3619	andl	%r11d,%r12d
3620	xorl	%r11d,%r13d
3621	vpsrld	$10,%xmm7,%xmm6
3622	addl	52(%rsp),%ecx
3623	movl	%edx,%edi
3624	xorl	%ebx,%r12d
3625	vpxor	%xmm5,%xmm4,%xmm4
3626	shrdl	$11,%r14d,%r14d
3627	xorl	%r8d,%edi
3628	addl	%r12d,%ecx
3629	vpsrlq	$17,%xmm7,%xmm7
3630	shrdl	$6,%r13d,%r13d
3631	andl	%edi,%r15d
3632	xorl	%edx,%r14d
3633	vpaddd	%xmm4,%xmm3,%xmm3
3634	addl	%r13d,%ecx
3635	xorl	%r8d,%r15d
3636	shrdl	$2,%r14d,%r14d
3637	vpxor	%xmm7,%xmm6,%xmm6
3638	addl	%ecx,%r10d
3639	addl	%r15d,%ecx
3640	movl	%r10d,%r13d
3641	vpsrlq	$2,%xmm7,%xmm7
3642	addl	%ecx,%r14d
3643	shrdl	$14,%r13d,%r13d
3644	movl	%r14d,%ecx
3645	vpxor	%xmm7,%xmm6,%xmm6
3646	movl	%r11d,%r12d
3647	shrdl	$9,%r14d,%r14d
3648	xorl	%r10d,%r13d
3649	vpshufb	%xmm8,%xmm6,%xmm6
3650	xorl	%eax,%r12d
3651	shrdl	$5,%r13d,%r13d
3652	xorl	%ecx,%r14d
3653	vpaddd	%xmm6,%xmm3,%xmm3
3654	andl	%r10d,%r12d
3655	xorl	%r10d,%r13d
3656	addl	56(%rsp),%ebx
3657	vpshufd	$80,%xmm3,%xmm7
3658	movl	%ecx,%r15d
3659	xorl	%eax,%r12d
3660	shrdl	$11,%r14d,%r14d
3661	vpsrld	$10,%xmm7,%xmm6
3662	xorl	%edx,%r15d
3663	addl	%r12d,%ebx
3664	shrdl	$6,%r13d,%r13d
3665	vpsrlq	$17,%xmm7,%xmm7
3666	andl	%r15d,%edi
3667	xorl	%ecx,%r14d
3668	addl	%r13d,%ebx
3669	vpxor	%xmm7,%xmm6,%xmm6
3670	xorl	%edx,%edi
3671	shrdl	$2,%r14d,%r14d
3672	addl	%ebx,%r9d
3673	vpsrlq	$2,%xmm7,%xmm7
3674	addl	%edi,%ebx
3675	movl	%r9d,%r13d
3676	addl	%ebx,%r14d
3677	vpxor	%xmm7,%xmm6,%xmm6
3678	shrdl	$14,%r13d,%r13d
3679	movl	%r14d,%ebx
3680	movl	%r10d,%r12d
3681	vpshufb	%xmm9,%xmm6,%xmm6
3682	shrdl	$9,%r14d,%r14d
3683	xorl	%r9d,%r13d
3684	xorl	%r11d,%r12d
3685	vpaddd	%xmm6,%xmm3,%xmm3
3686	shrdl	$5,%r13d,%r13d
3687	xorl	%ebx,%r14d
3688	andl	%r9d,%r12d
3689	vpaddd	96(%rbp),%xmm3,%xmm6
3690	xorl	%r9d,%r13d
3691	addl	60(%rsp),%eax
3692	movl	%ebx,%edi
3693	xorl	%r11d,%r12d
3694	shrdl	$11,%r14d,%r14d
3695	xorl	%ecx,%edi
3696	addl	%r12d,%eax
3697	shrdl	$6,%r13d,%r13d
3698	andl	%edi,%r15d
3699	xorl	%ebx,%r14d
3700	addl	%r13d,%eax
3701	xorl	%ecx,%r15d
3702	shrdl	$2,%r14d,%r14d
3703	addl	%eax,%r8d
3704	addl	%r15d,%eax
3705	movl	%r8d,%r13d
3706	addl	%eax,%r14d
3707	vmovdqa	%xmm6,48(%rsp)
3708	cmpb	$0,131(%rbp)
3709	jne	.Lavx_00_47
3710	shrdl	$14,%r13d,%r13d
3711	movl	%r14d,%eax
3712	movl	%r9d,%r12d
3713	shrdl	$9,%r14d,%r14d
3714	xorl	%r8d,%r13d
3715	xorl	%r10d,%r12d
3716	shrdl	$5,%r13d,%r13d
3717	xorl	%eax,%r14d
3718	andl	%r8d,%r12d
3719	xorl	%r8d,%r13d
3720	addl	0(%rsp),%r11d
3721	movl	%eax,%r15d
3722	xorl	%r10d,%r12d
3723	shrdl	$11,%r14d,%r14d
3724	xorl	%ebx,%r15d
3725	addl	%r12d,%r11d
3726	shrdl	$6,%r13d,%r13d
3727	andl	%r15d,%edi
3728	xorl	%eax,%r14d
3729	addl	%r13d,%r11d
3730	xorl	%ebx,%edi
3731	shrdl	$2,%r14d,%r14d
3732	addl	%r11d,%edx
3733	addl	%edi,%r11d
3734	movl	%edx,%r13d
3735	addl	%r11d,%r14d
3736	shrdl	$14,%r13d,%r13d
3737	movl	%r14d,%r11d
3738	movl	%r8d,%r12d
3739	shrdl	$9,%r14d,%r14d
3740	xorl	%edx,%r13d
3741	xorl	%r9d,%r12d
3742	shrdl	$5,%r13d,%r13d
3743	xorl	%r11d,%r14d
3744	andl	%edx,%r12d
3745	xorl	%edx,%r13d
3746	addl	4(%rsp),%r10d
3747	movl	%r11d,%edi
3748	xorl	%r9d,%r12d
3749	shrdl	$11,%r14d,%r14d
3750	xorl	%eax,%edi
3751	addl	%r12d,%r10d
3752	shrdl	$6,%r13d,%r13d
3753	andl	%edi,%r15d
3754	xorl	%r11d,%r14d
3755	addl	%r13d,%r10d
3756	xorl	%eax,%r15d
3757	shrdl	$2,%r14d,%r14d
3758	addl	%r10d,%ecx
3759	addl	%r15d,%r10d
3760	movl	%ecx,%r13d
3761	addl	%r10d,%r14d
3762	shrdl	$14,%r13d,%r13d
3763	movl	%r14d,%r10d
3764	movl	%edx,%r12d
3765	shrdl	$9,%r14d,%r14d
3766	xorl	%ecx,%r13d
3767	xorl	%r8d,%r12d
3768	shrdl	$5,%r13d,%r13d
3769	xorl	%r10d,%r14d
3770	andl	%ecx,%r12d
3771	xorl	%ecx,%r13d
3772	addl	8(%rsp),%r9d
3773	movl	%r10d,%r15d
3774	xorl	%r8d,%r12d
3775	shrdl	$11,%r14d,%r14d
3776	xorl	%r11d,%r15d
3777	addl	%r12d,%r9d
3778	shrdl	$6,%r13d,%r13d
3779	andl	%r15d,%edi
3780	xorl	%r10d,%r14d
3781	addl	%r13d,%r9d
3782	xorl	%r11d,%edi
3783	shrdl	$2,%r14d,%r14d
3784	addl	%r9d,%ebx
3785	addl	%edi,%r9d
3786	movl	%ebx,%r13d
3787	addl	%r9d,%r14d
3788	shrdl	$14,%r13d,%r13d
3789	movl	%r14d,%r9d
3790	movl	%ecx,%r12d
3791	shrdl	$9,%r14d,%r14d
3792	xorl	%ebx,%r13d
3793	xorl	%edx,%r12d
3794	shrdl	$5,%r13d,%r13d
3795	xorl	%r9d,%r14d
3796	andl	%ebx,%r12d
3797	xorl	%ebx,%r13d
3798	addl	12(%rsp),%r8d
3799	movl	%r9d,%edi
3800	xorl	%edx,%r12d
3801	shrdl	$11,%r14d,%r14d
3802	xorl	%r10d,%edi
3803	addl	%r12d,%r8d
3804	shrdl	$6,%r13d,%r13d
3805	andl	%edi,%r15d
3806	xorl	%r9d,%r14d
3807	addl	%r13d,%r8d
3808	xorl	%r10d,%r15d
3809	shrdl	$2,%r14d,%r14d
3810	addl	%r8d,%eax
3811	addl	%r15d,%r8d
3812	movl	%eax,%r13d
3813	addl	%r8d,%r14d
3814	shrdl	$14,%r13d,%r13d
3815	movl	%r14d,%r8d
3816	movl	%ebx,%r12d
3817	shrdl	$9,%r14d,%r14d
3818	xorl	%eax,%r13d
3819	xorl	%ecx,%r12d
3820	shrdl	$5,%r13d,%r13d
3821	xorl	%r8d,%r14d
3822	andl	%eax,%r12d
3823	xorl	%eax,%r13d
3824	addl	16(%rsp),%edx
3825	movl	%r8d,%r15d
3826	xorl	%ecx,%r12d
3827	shrdl	$11,%r14d,%r14d
3828	xorl	%r9d,%r15d
3829	addl	%r12d,%edx
3830	shrdl	$6,%r13d,%r13d
3831	andl	%r15d,%edi
3832	xorl	%r8d,%r14d
3833	addl	%r13d,%edx
3834	xorl	%r9d,%edi
3835	shrdl	$2,%r14d,%r14d
3836	addl	%edx,%r11d
3837	addl	%edi,%edx
3838	movl	%r11d,%r13d
3839	addl	%edx,%r14d
3840	shrdl	$14,%r13d,%r13d
3841	movl	%r14d,%edx
3842	movl	%eax,%r12d
3843	shrdl	$9,%r14d,%r14d
3844	xorl	%r11d,%r13d
3845	xorl	%ebx,%r12d
3846	shrdl	$5,%r13d,%r13d
3847	xorl	%edx,%r14d
3848	andl	%r11d,%r12d
3849	xorl	%r11d,%r13d
3850	addl	20(%rsp),%ecx
3851	movl	%edx,%edi
3852	xorl	%ebx,%r12d
3853	shrdl	$11,%r14d,%r14d
3854	xorl	%r8d,%edi
3855	addl	%r12d,%ecx
3856	shrdl	$6,%r13d,%r13d
3857	andl	%edi,%r15d
3858	xorl	%edx,%r14d
3859	addl	%r13d,%ecx
3860	xorl	%r8d,%r15d
3861	shrdl	$2,%r14d,%r14d
3862	addl	%ecx,%r10d
3863	addl	%r15d,%ecx
3864	movl	%r10d,%r13d
3865	addl	%ecx,%r14d
3866	shrdl	$14,%r13d,%r13d
3867	movl	%r14d,%ecx
3868	movl	%r11d,%r12d
3869	shrdl	$9,%r14d,%r14d
3870	xorl	%r10d,%r13d
3871	xorl	%eax,%r12d
3872	shrdl	$5,%r13d,%r13d
3873	xorl	%ecx,%r14d
3874	andl	%r10d,%r12d
3875	xorl	%r10d,%r13d
3876	addl	24(%rsp),%ebx
3877	movl	%ecx,%r15d
3878	xorl	%eax,%r12d
3879	shrdl	$11,%r14d,%r14d
3880	xorl	%edx,%r15d
3881	addl	%r12d,%ebx
3882	shrdl	$6,%r13d,%r13d
3883	andl	%r15d,%edi
3884	xorl	%ecx,%r14d
3885	addl	%r13d,%ebx
3886	xorl	%edx,%edi
3887	shrdl	$2,%r14d,%r14d
3888	addl	%ebx,%r9d
3889	addl	%edi,%ebx
3890	movl	%r9d,%r13d
3891	addl	%ebx,%r14d
3892	shrdl	$14,%r13d,%r13d
3893	movl	%r14d,%ebx
3894	movl	%r10d,%r12d
3895	shrdl	$9,%r14d,%r14d
3896	xorl	%r9d,%r13d
3897	xorl	%r11d,%r12d
3898	shrdl	$5,%r13d,%r13d
3899	xorl	%ebx,%r14d
3900	andl	%r9d,%r12d
3901	xorl	%r9d,%r13d
3902	addl	28(%rsp),%eax
3903	movl	%ebx,%edi
3904	xorl	%r11d,%r12d
3905	shrdl	$11,%r14d,%r14d
3906	xorl	%ecx,%edi
3907	addl	%r12d,%eax
3908	shrdl	$6,%r13d,%r13d
3909	andl	%edi,%r15d
3910	xorl	%ebx,%r14d
3911	addl	%r13d,%eax
3912	xorl	%ecx,%r15d
3913	shrdl	$2,%r14d,%r14d
3914	addl	%eax,%r8d
3915	addl	%r15d,%eax
3916	movl	%r8d,%r13d
3917	addl	%eax,%r14d
3918	shrdl	$14,%r13d,%r13d
3919	movl	%r14d,%eax
3920	movl	%r9d,%r12d
3921	shrdl	$9,%r14d,%r14d
3922	xorl	%r8d,%r13d
3923	xorl	%r10d,%r12d
3924	shrdl	$5,%r13d,%r13d
3925	xorl	%eax,%r14d
3926	andl	%r8d,%r12d
3927	xorl	%r8d,%r13d
3928	addl	32(%rsp),%r11d
3929	movl	%eax,%r15d
3930	xorl	%r10d,%r12d
3931	shrdl	$11,%r14d,%r14d
3932	xorl	%ebx,%r15d
3933	addl	%r12d,%r11d
3934	shrdl	$6,%r13d,%r13d
3935	andl	%r15d,%edi
3936	xorl	%eax,%r14d
3937	addl	%r13d,%r11d
3938	xorl	%ebx,%edi
3939	shrdl	$2,%r14d,%r14d
3940	addl	%r11d,%edx
3941	addl	%edi,%r11d
3942	movl	%edx,%r13d
3943	addl	%r11d,%r14d
3944	shrdl	$14,%r13d,%r13d
3945	movl	%r14d,%r11d
3946	movl	%r8d,%r12d
3947	shrdl	$9,%r14d,%r14d
3948	xorl	%edx,%r13d
3949	xorl	%r9d,%r12d
3950	shrdl	$5,%r13d,%r13d
3951	xorl	%r11d,%r14d
3952	andl	%edx,%r12d
3953	xorl	%edx,%r13d
3954	addl	36(%rsp),%r10d
3955	movl	%r11d,%edi
3956	xorl	%r9d,%r12d
3957	shrdl	$11,%r14d,%r14d
3958	xorl	%eax,%edi
3959	addl	%r12d,%r10d
3960	shrdl	$6,%r13d,%r13d
3961	andl	%edi,%r15d
3962	xorl	%r11d,%r14d
3963	addl	%r13d,%r10d
3964	xorl	%eax,%r15d
3965	shrdl	$2,%r14d,%r14d
3966	addl	%r10d,%ecx
3967	addl	%r15d,%r10d
3968	movl	%ecx,%r13d
3969	addl	%r10d,%r14d
3970	shrdl	$14,%r13d,%r13d
3971	movl	%r14d,%r10d
3972	movl	%edx,%r12d
3973	shrdl	$9,%r14d,%r14d
3974	xorl	%ecx,%r13d
3975	xorl	%r8d,%r12d
3976	shrdl	$5,%r13d,%r13d
3977	xorl	%r10d,%r14d
3978	andl	%ecx,%r12d
3979	xorl	%ecx,%r13d
3980	addl	40(%rsp),%r9d
3981	movl	%r10d,%r15d
3982	xorl	%r8d,%r12d
3983	shrdl	$11,%r14d,%r14d
3984	xorl	%r11d,%r15d
3985	addl	%r12d,%r9d
3986	shrdl	$6,%r13d,%r13d
3987	andl	%r15d,%edi
3988	xorl	%r10d,%r14d
3989	addl	%r13d,%r9d
3990	xorl	%r11d,%edi
3991	shrdl	$2,%r14d,%r14d
3992	addl	%r9d,%ebx
3993	addl	%edi,%r9d
3994	movl	%ebx,%r13d
3995	addl	%r9d,%r14d
3996	shrdl	$14,%r13d,%r13d
3997	movl	%r14d,%r9d
3998	movl	%ecx,%r12d
3999	shrdl	$9,%r14d,%r14d
4000	xorl	%ebx,%r13d
4001	xorl	%edx,%r12d
4002	shrdl	$5,%r13d,%r13d
4003	xorl	%r9d,%r14d
4004	andl	%ebx,%r12d
4005	xorl	%ebx,%r13d
4006	addl	44(%rsp),%r8d
4007	movl	%r9d,%edi
4008	xorl	%edx,%r12d
4009	shrdl	$11,%r14d,%r14d
4010	xorl	%r10d,%edi
4011	addl	%r12d,%r8d
4012	shrdl	$6,%r13d,%r13d
4013	andl	%edi,%r15d
4014	xorl	%r9d,%r14d
4015	addl	%r13d,%r8d
4016	xorl	%r10d,%r15d
4017	shrdl	$2,%r14d,%r14d
4018	addl	%r8d,%eax
4019	addl	%r15d,%r8d
4020	movl	%eax,%r13d
4021	addl	%r8d,%r14d
4022	shrdl	$14,%r13d,%r13d
4023	movl	%r14d,%r8d
4024	movl	%ebx,%r12d
4025	shrdl	$9,%r14d,%r14d
4026	xorl	%eax,%r13d
4027	xorl	%ecx,%r12d
4028	shrdl	$5,%r13d,%r13d
4029	xorl	%r8d,%r14d
4030	andl	%eax,%r12d
4031	xorl	%eax,%r13d
4032	addl	48(%rsp),%edx
4033	movl	%r8d,%r15d
4034	xorl	%ecx,%r12d
4035	shrdl	$11,%r14d,%r14d
4036	xorl	%r9d,%r15d
4037	addl	%r12d,%edx
4038	shrdl	$6,%r13d,%r13d
4039	andl	%r15d,%edi
4040	xorl	%r8d,%r14d
4041	addl	%r13d,%edx
4042	xorl	%r9d,%edi
4043	shrdl	$2,%r14d,%r14d
4044	addl	%edx,%r11d
4045	addl	%edi,%edx
4046	movl	%r11d,%r13d
4047	addl	%edx,%r14d
4048	shrdl	$14,%r13d,%r13d
4049	movl	%r14d,%edx
4050	movl	%eax,%r12d
4051	shrdl	$9,%r14d,%r14d
4052	xorl	%r11d,%r13d
4053	xorl	%ebx,%r12d
4054	shrdl	$5,%r13d,%r13d
4055	xorl	%edx,%r14d
4056	andl	%r11d,%r12d
4057	xorl	%r11d,%r13d
4058	addl	52(%rsp),%ecx
4059	movl	%edx,%edi
4060	xorl	%ebx,%r12d
4061	shrdl	$11,%r14d,%r14d
4062	xorl	%r8d,%edi
4063	addl	%r12d,%ecx
4064	shrdl	$6,%r13d,%r13d
4065	andl	%edi,%r15d
4066	xorl	%edx,%r14d
4067	addl	%r13d,%ecx
4068	xorl	%r8d,%r15d
4069	shrdl	$2,%r14d,%r14d
4070	addl	%ecx,%r10d
4071	addl	%r15d,%ecx
4072	movl	%r10d,%r13d
4073	addl	%ecx,%r14d
4074	shrdl	$14,%r13d,%r13d
4075	movl	%r14d,%ecx
4076	movl	%r11d,%r12d
4077	shrdl	$9,%r14d,%r14d
4078	xorl	%r10d,%r13d
4079	xorl	%eax,%r12d
4080	shrdl	$5,%r13d,%r13d
4081	xorl	%ecx,%r14d
4082	andl	%r10d,%r12d
4083	xorl	%r10d,%r13d
4084	addl	56(%rsp),%ebx
4085	movl	%ecx,%r15d
4086	xorl	%eax,%r12d
4087	shrdl	$11,%r14d,%r14d
4088	xorl	%edx,%r15d
4089	addl	%r12d,%ebx
4090	shrdl	$6,%r13d,%r13d
4091	andl	%r15d,%edi
4092	xorl	%ecx,%r14d
4093	addl	%r13d,%ebx
4094	xorl	%edx,%edi
4095	shrdl	$2,%r14d,%r14d
4096	addl	%ebx,%r9d
4097	addl	%edi,%ebx
4098	movl	%r9d,%r13d
4099	addl	%ebx,%r14d
4100	shrdl	$14,%r13d,%r13d
4101	movl	%r14d,%ebx
4102	movl	%r10d,%r12d
4103	shrdl	$9,%r14d,%r14d
4104	xorl	%r9d,%r13d
4105	xorl	%r11d,%r12d
4106	shrdl	$5,%r13d,%r13d
4107	xorl	%ebx,%r14d
4108	andl	%r9d,%r12d
4109	xorl	%r9d,%r13d
4110	addl	60(%rsp),%eax
4111	movl	%ebx,%edi
4112	xorl	%r11d,%r12d
4113	shrdl	$11,%r14d,%r14d
4114	xorl	%ecx,%edi
4115	addl	%r12d,%eax
4116	shrdl	$6,%r13d,%r13d
4117	andl	%edi,%r15d
4118	xorl	%ebx,%r14d
4119	addl	%r13d,%eax
4120	xorl	%ecx,%r15d
4121	shrdl	$2,%r14d,%r14d
4122	addl	%eax,%r8d
4123	addl	%r15d,%eax
4124	movl	%r8d,%r13d
4125	addl	%eax,%r14d
4126	movq	64+0(%rsp),%rdi
4127	movl	%r14d,%eax
4128
4129	addl	0(%rdi),%eax
4130	leaq	64(%rsi),%rsi
4131	addl	4(%rdi),%ebx
4132	addl	8(%rdi),%ecx
4133	addl	12(%rdi),%edx
4134	addl	16(%rdi),%r8d
4135	addl	20(%rdi),%r9d
4136	addl	24(%rdi),%r10d
4137	addl	28(%rdi),%r11d
4138
4139	cmpq	64+16(%rsp),%rsi
4140
4141	movl	%eax,0(%rdi)
4142	movl	%ebx,4(%rdi)
4143	movl	%ecx,8(%rdi)
4144	movl	%edx,12(%rdi)
4145	movl	%r8d,16(%rdi)
4146	movl	%r9d,20(%rdi)
4147	movl	%r10d,24(%rdi)
4148	movl	%r11d,28(%rdi)
4149	jb	.Lloop_avx
4150
4151	movq	88(%rsp),%rsi
4152.cfi_def_cfa	%rsi,8
4153	vzeroupper
4154	movq	-48(%rsi),%r15
4155.cfi_restore	%r15
4156	movq	-40(%rsi),%r14
4157.cfi_restore	%r14
4158	movq	-32(%rsi),%r13
4159.cfi_restore	%r13
4160	movq	-24(%rsi),%r12
4161.cfi_restore	%r12
4162	movq	-16(%rsi),%rbp
4163.cfi_restore	%rbp
4164	movq	-8(%rsi),%rbx
4165.cfi_restore	%rbx
4166	leaq	(%rsi),%rsp
4167.cfi_def_cfa_register	%rsp
4168.Lepilogue_avx:
4169	.byte	0xf3,0xc3
4170.cfi_endproc
4171.size	sha256_block_data_order_avx,.-sha256_block_data_order_avx
4172.type	sha256_block_data_order_avx2,@function
4173.align	64
4174sha256_block_data_order_avx2:
4175.cfi_startproc
4176.Lavx2_shortcut:
4177	movq	%rsp,%rax
4178.cfi_def_cfa_register	%rax
4179	pushq	%rbx
4180.cfi_offset	%rbx,-16
4181	pushq	%rbp
4182.cfi_offset	%rbp,-24
4183	pushq	%r12
4184.cfi_offset	%r12,-32
4185	pushq	%r13
4186.cfi_offset	%r13,-40
4187	pushq	%r14
4188.cfi_offset	%r14,-48
4189	pushq	%r15
4190.cfi_offset	%r15,-56
4191	subq	$544,%rsp
4192	shlq	$4,%rdx
4193	andq	$-1024,%rsp
4194	leaq	(%rsi,%rdx,4),%rdx
4195	addq	$448,%rsp
4196	movq	%rdi,64+0(%rsp)
4197	movq	%rsi,64+8(%rsp)
4198	movq	%rdx,64+16(%rsp)
4199	movq	%rax,88(%rsp)
4200.cfi_escape	0x0f,0x06,0x77,0xd8,0x00,0x06,0x23,0x08
4201.Lprologue_avx2:
4202
4203	vzeroupper
4204	subq	$-64,%rsi
4205	movl	0(%rdi),%eax
4206	movq	%rsi,%r12
4207	movl	4(%rdi),%ebx
4208	cmpq	%rdx,%rsi
4209	movl	8(%rdi),%ecx
4210	cmoveq	%rsp,%r12
4211	movl	12(%rdi),%edx
4212	movl	16(%rdi),%r8d
4213	movl	20(%rdi),%r9d
4214	movl	24(%rdi),%r10d
4215	movl	28(%rdi),%r11d
4216	vmovdqa	K256+512+32(%rip),%ymm8
4217	vmovdqa	K256+512+64(%rip),%ymm9
4218	jmp	.Loop_avx2
4219.align	16
4220.Loop_avx2:
4221	vmovdqa	K256+512(%rip),%ymm7
4222	vmovdqu	-64+0(%rsi),%xmm0
4223	vmovdqu	-64+16(%rsi),%xmm1
4224	vmovdqu	-64+32(%rsi),%xmm2
4225	vmovdqu	-64+48(%rsi),%xmm3
4226
4227	vinserti128	$1,(%r12),%ymm0,%ymm0
4228	vinserti128	$1,16(%r12),%ymm1,%ymm1
4229	vpshufb	%ymm7,%ymm0,%ymm0
4230	vinserti128	$1,32(%r12),%ymm2,%ymm2
4231	vpshufb	%ymm7,%ymm1,%ymm1
4232	vinserti128	$1,48(%r12),%ymm3,%ymm3
4233
4234	leaq	K256(%rip),%rbp
4235	vpshufb	%ymm7,%ymm2,%ymm2
4236	vpaddd	0(%rbp),%ymm0,%ymm4
4237	vpshufb	%ymm7,%ymm3,%ymm3
4238	vpaddd	32(%rbp),%ymm1,%ymm5
4239	vpaddd	64(%rbp),%ymm2,%ymm6
4240	vpaddd	96(%rbp),%ymm3,%ymm7
4241	vmovdqa	%ymm4,0(%rsp)
4242	xorl	%r14d,%r14d
4243	vmovdqa	%ymm5,32(%rsp)
4244
4245	movq	88(%rsp),%rdi
4246.cfi_def_cfa	%rdi,8
4247	leaq	-64(%rsp),%rsp
4248
4249
4250
4251	movq	%rdi,-8(%rsp)
4252.cfi_escape	0x0f,0x05,0x77,0x78,0x06,0x23,0x08
4253	movl	%ebx,%edi
4254	vmovdqa	%ymm6,0(%rsp)
4255	xorl	%ecx,%edi
4256	vmovdqa	%ymm7,32(%rsp)
4257	movl	%r9d,%r12d
4258	subq	$-32*4,%rbp
4259	jmp	.Lavx2_00_47
4260
4261.align	16
4262.Lavx2_00_47:
4263	leaq	-64(%rsp),%rsp
4264.cfi_escape	0x0f,0x05,0x77,0x38,0x06,0x23,0x08
4265
4266	pushq	64-8(%rsp)
4267.cfi_escape	0x0f,0x05,0x77,0x00,0x06,0x23,0x08
4268	leaq	8(%rsp),%rsp
4269.cfi_escape	0x0f,0x05,0x77,0x78,0x06,0x23,0x08
4270	vpalignr	$4,%ymm0,%ymm1,%ymm4
4271	addl	0+128(%rsp),%r11d
4272	andl	%r8d,%r12d
4273	rorxl	$25,%r8d,%r13d
4274	vpalignr	$4,%ymm2,%ymm3,%ymm7
4275	rorxl	$11,%r8d,%r15d
4276	leal	(%rax,%r14,1),%eax
4277	leal	(%r11,%r12,1),%r11d
4278	vpsrld	$7,%ymm4,%ymm6
4279	andnl	%r10d,%r8d,%r12d
4280	xorl	%r15d,%r13d
4281	rorxl	$6,%r8d,%r14d
4282	vpaddd	%ymm7,%ymm0,%ymm0
4283	leal	(%r11,%r12,1),%r11d
4284	xorl	%r14d,%r13d
4285	movl	%eax,%r15d
4286	vpsrld	$3,%ymm4,%ymm7
4287	rorxl	$22,%eax,%r12d
4288	leal	(%r11,%r13,1),%r11d
4289	xorl	%ebx,%r15d
4290	vpslld	$14,%ymm4,%ymm5
4291	rorxl	$13,%eax,%r14d
4292	rorxl	$2,%eax,%r13d
4293	leal	(%rdx,%r11,1),%edx
4294	vpxor	%ymm6,%ymm7,%ymm4
4295	andl	%r15d,%edi
4296	xorl	%r12d,%r14d
4297	xorl	%ebx,%edi
4298	vpshufd	$250,%ymm3,%ymm7
4299	xorl	%r13d,%r14d
4300	leal	(%r11,%rdi,1),%r11d
4301	movl	%r8d,%r12d
4302	vpsrld	$11,%ymm6,%ymm6
4303	addl	4+128(%rsp),%r10d
4304	andl	%edx,%r12d
4305	rorxl	$25,%edx,%r13d
4306	vpxor	%ymm5,%ymm4,%ymm4
4307	rorxl	$11,%edx,%edi
4308	leal	(%r11,%r14,1),%r11d
4309	leal	(%r10,%r12,1),%r10d
4310	vpslld	$11,%ymm5,%ymm5
4311	andnl	%r9d,%edx,%r12d
4312	xorl	%edi,%r13d
4313	rorxl	$6,%edx,%r14d
4314	vpxor	%ymm6,%ymm4,%ymm4
4315	leal	(%r10,%r12,1),%r10d
4316	xorl	%r14d,%r13d
4317	movl	%r11d,%edi
4318	vpsrld	$10,%ymm7,%ymm6
4319	rorxl	$22,%r11d,%r12d
4320	leal	(%r10,%r13,1),%r10d
4321	xorl	%eax,%edi
4322	vpxor	%ymm5,%ymm4,%ymm4
4323	rorxl	$13,%r11d,%r14d
4324	rorxl	$2,%r11d,%r13d
4325	leal	(%rcx,%r10,1),%ecx
4326	vpsrlq	$17,%ymm7,%ymm7
4327	andl	%edi,%r15d
4328	xorl	%r12d,%r14d
4329	xorl	%eax,%r15d
4330	vpaddd	%ymm4,%ymm0,%ymm0
4331	xorl	%r13d,%r14d
4332	leal	(%r10,%r15,1),%r10d
4333	movl	%edx,%r12d
4334	vpxor	%ymm7,%ymm6,%ymm6
4335	addl	8+128(%rsp),%r9d
4336	andl	%ecx,%r12d
4337	rorxl	$25,%ecx,%r13d
4338	vpsrlq	$2,%ymm7,%ymm7
4339	rorxl	$11,%ecx,%r15d
4340	leal	(%r10,%r14,1),%r10d
4341	leal	(%r9,%r12,1),%r9d
4342	vpxor	%ymm7,%ymm6,%ymm6
4343	andnl	%r8d,%ecx,%r12d
4344	xorl	%r15d,%r13d
4345	rorxl	$6,%ecx,%r14d
4346	vpshufb	%ymm8,%ymm6,%ymm6
4347	leal	(%r9,%r12,1),%r9d
4348	xorl	%r14d,%r13d
4349	movl	%r10d,%r15d
4350	vpaddd	%ymm6,%ymm0,%ymm0
4351	rorxl	$22,%r10d,%r12d
4352	leal	(%r9,%r13,1),%r9d
4353	xorl	%r11d,%r15d
4354	vpshufd	$80,%ymm0,%ymm7
4355	rorxl	$13,%r10d,%r14d
4356	rorxl	$2,%r10d,%r13d
4357	leal	(%rbx,%r9,1),%ebx
4358	vpsrld	$10,%ymm7,%ymm6
4359	andl	%r15d,%edi
4360	xorl	%r12d,%r14d
4361	xorl	%r11d,%edi
4362	vpsrlq	$17,%ymm7,%ymm7
4363	xorl	%r13d,%r14d
4364	leal	(%r9,%rdi,1),%r9d
4365	movl	%ecx,%r12d
4366	vpxor	%ymm7,%ymm6,%ymm6
4367	addl	12+128(%rsp),%r8d
4368	andl	%ebx,%r12d
4369	rorxl	$25,%ebx,%r13d
4370	vpsrlq	$2,%ymm7,%ymm7
4371	rorxl	$11,%ebx,%edi
4372	leal	(%r9,%r14,1),%r9d
4373	leal	(%r8,%r12,1),%r8d
4374	vpxor	%ymm7,%ymm6,%ymm6
4375	andnl	%edx,%ebx,%r12d
4376	xorl	%edi,%r13d
4377	rorxl	$6,%ebx,%r14d
4378	vpshufb	%ymm9,%ymm6,%ymm6
4379	leal	(%r8,%r12,1),%r8d
4380	xorl	%r14d,%r13d
4381	movl	%r9d,%edi
4382	vpaddd	%ymm6,%ymm0,%ymm0
4383	rorxl	$22,%r9d,%r12d
4384	leal	(%r8,%r13,1),%r8d
4385	xorl	%r10d,%edi
4386	vpaddd	0(%rbp),%ymm0,%ymm6
4387	rorxl	$13,%r9d,%r14d
4388	rorxl	$2,%r9d,%r13d
4389	leal	(%rax,%r8,1),%eax
4390	andl	%edi,%r15d
4391	xorl	%r12d,%r14d
4392	xorl	%r10d,%r15d
4393	xorl	%r13d,%r14d
4394	leal	(%r8,%r15,1),%r8d
4395	movl	%ebx,%r12d
4396	vmovdqa	%ymm6,0(%rsp)
4397	vpalignr	$4,%ymm1,%ymm2,%ymm4
4398	addl	32+128(%rsp),%edx
4399	andl	%eax,%r12d
4400	rorxl	$25,%eax,%r13d
4401	vpalignr	$4,%ymm3,%ymm0,%ymm7
4402	rorxl	$11,%eax,%r15d
4403	leal	(%r8,%r14,1),%r8d
4404	leal	(%rdx,%r12,1),%edx
4405	vpsrld	$7,%ymm4,%ymm6
4406	andnl	%ecx,%eax,%r12d
4407	xorl	%r15d,%r13d
4408	rorxl	$6,%eax,%r14d
4409	vpaddd	%ymm7,%ymm1,%ymm1
4410	leal	(%rdx,%r12,1),%edx
4411	xorl	%r14d,%r13d
4412	movl	%r8d,%r15d
4413	vpsrld	$3,%ymm4,%ymm7
4414	rorxl	$22,%r8d,%r12d
4415	leal	(%rdx,%r13,1),%edx
4416	xorl	%r9d,%r15d
4417	vpslld	$14,%ymm4,%ymm5
4418	rorxl	$13,%r8d,%r14d
4419	rorxl	$2,%r8d,%r13d
4420	leal	(%r11,%rdx,1),%r11d
4421	vpxor	%ymm6,%ymm7,%ymm4
4422	andl	%r15d,%edi
4423	xorl	%r12d,%r14d
4424	xorl	%r9d,%edi
4425	vpshufd	$250,%ymm0,%ymm7
4426	xorl	%r13d,%r14d
4427	leal	(%rdx,%rdi,1),%edx
4428	movl	%eax,%r12d
4429	vpsrld	$11,%ymm6,%ymm6
4430	addl	36+128(%rsp),%ecx
4431	andl	%r11d,%r12d
4432	rorxl	$25,%r11d,%r13d
4433	vpxor	%ymm5,%ymm4,%ymm4
4434	rorxl	$11,%r11d,%edi
4435	leal	(%rdx,%r14,1),%edx
4436	leal	(%rcx,%r12,1),%ecx
4437	vpslld	$11,%ymm5,%ymm5
4438	andnl	%ebx,%r11d,%r12d
4439	xorl	%edi,%r13d
4440	rorxl	$6,%r11d,%r14d
4441	vpxor	%ymm6,%ymm4,%ymm4
4442	leal	(%rcx,%r12,1),%ecx
4443	xorl	%r14d,%r13d
4444	movl	%edx,%edi
4445	vpsrld	$10,%ymm7,%ymm6
4446	rorxl	$22,%edx,%r12d
4447	leal	(%rcx,%r13,1),%ecx
4448	xorl	%r8d,%edi
4449	vpxor	%ymm5,%ymm4,%ymm4
4450	rorxl	$13,%edx,%r14d
4451	rorxl	$2,%edx,%r13d
4452	leal	(%r10,%rcx,1),%r10d
4453	vpsrlq	$17,%ymm7,%ymm7
4454	andl	%edi,%r15d
4455	xorl	%r12d,%r14d
4456	xorl	%r8d,%r15d
4457	vpaddd	%ymm4,%ymm1,%ymm1
4458	xorl	%r13d,%r14d
4459	leal	(%rcx,%r15,1),%ecx
4460	movl	%r11d,%r12d
4461	vpxor	%ymm7,%ymm6,%ymm6
4462	addl	40+128(%rsp),%ebx
4463	andl	%r10d,%r12d
4464	rorxl	$25,%r10d,%r13d
4465	vpsrlq	$2,%ymm7,%ymm7
4466	rorxl	$11,%r10d,%r15d
4467	leal	(%rcx,%r14,1),%ecx
4468	leal	(%rbx,%r12,1),%ebx
4469	vpxor	%ymm7,%ymm6,%ymm6
4470	andnl	%eax,%r10d,%r12d
4471	xorl	%r15d,%r13d
4472	rorxl	$6,%r10d,%r14d
4473	vpshufb	%ymm8,%ymm6,%ymm6
4474	leal	(%rbx,%r12,1),%ebx
4475	xorl	%r14d,%r13d
4476	movl	%ecx,%r15d
4477	vpaddd	%ymm6,%ymm1,%ymm1
4478	rorxl	$22,%ecx,%r12d
4479	leal	(%rbx,%r13,1),%ebx
4480	xorl	%edx,%r15d
4481	vpshufd	$80,%ymm1,%ymm7
4482	rorxl	$13,%ecx,%r14d
4483	rorxl	$2,%ecx,%r13d
4484	leal	(%r9,%rbx,1),%r9d
4485	vpsrld	$10,%ymm7,%ymm6
4486	andl	%r15d,%edi
4487	xorl	%r12d,%r14d
4488	xorl	%edx,%edi
4489	vpsrlq	$17,%ymm7,%ymm7
4490	xorl	%r13d,%r14d
4491	leal	(%rbx,%rdi,1),%ebx
4492	movl	%r10d,%r12d
4493	vpxor	%ymm7,%ymm6,%ymm6
4494	addl	44+128(%rsp),%eax
4495	andl	%r9d,%r12d
4496	rorxl	$25,%r9d,%r13d
4497	vpsrlq	$2,%ymm7,%ymm7
4498	rorxl	$11,%r9d,%edi
4499	leal	(%rbx,%r14,1),%ebx
4500	leal	(%rax,%r12,1),%eax
4501	vpxor	%ymm7,%ymm6,%ymm6
4502	andnl	%r11d,%r9d,%r12d
4503	xorl	%edi,%r13d
4504	rorxl	$6,%r9d,%r14d
4505	vpshufb	%ymm9,%ymm6,%ymm6
4506	leal	(%rax,%r12,1),%eax
4507	xorl	%r14d,%r13d
4508	movl	%ebx,%edi
4509	vpaddd	%ymm6,%ymm1,%ymm1
4510	rorxl	$22,%ebx,%r12d
4511	leal	(%rax,%r13,1),%eax
4512	xorl	%ecx,%edi
4513	vpaddd	32(%rbp),%ymm1,%ymm6
4514	rorxl	$13,%ebx,%r14d
4515	rorxl	$2,%ebx,%r13d
4516	leal	(%r8,%rax,1),%r8d
4517	andl	%edi,%r15d
4518	xorl	%r12d,%r14d
4519	xorl	%ecx,%r15d
4520	xorl	%r13d,%r14d
4521	leal	(%rax,%r15,1),%eax
4522	movl	%r9d,%r12d
4523	vmovdqa	%ymm6,32(%rsp)
4524	leaq	-64(%rsp),%rsp
4525.cfi_escape	0x0f,0x05,0x77,0x38,0x06,0x23,0x08
4526
4527	pushq	64-8(%rsp)
4528.cfi_escape	0x0f,0x05,0x77,0x00,0x06,0x23,0x08
4529	leaq	8(%rsp),%rsp
4530.cfi_escape	0x0f,0x05,0x77,0x78,0x06,0x23,0x08
4531	vpalignr	$4,%ymm2,%ymm3,%ymm4
4532	addl	0+128(%rsp),%r11d
4533	andl	%r8d,%r12d
4534	rorxl	$25,%r8d,%r13d
4535	vpalignr	$4,%ymm0,%ymm1,%ymm7
4536	rorxl	$11,%r8d,%r15d
4537	leal	(%rax,%r14,1),%eax
4538	leal	(%r11,%r12,1),%r11d
4539	vpsrld	$7,%ymm4,%ymm6
4540	andnl	%r10d,%r8d,%r12d
4541	xorl	%r15d,%r13d
4542	rorxl	$6,%r8d,%r14d
4543	vpaddd	%ymm7,%ymm2,%ymm2
4544	leal	(%r11,%r12,1),%r11d
4545	xorl	%r14d,%r13d
4546	movl	%eax,%r15d
4547	vpsrld	$3,%ymm4,%ymm7
4548	rorxl	$22,%eax,%r12d
4549	leal	(%r11,%r13,1),%r11d
4550	xorl	%ebx,%r15d
4551	vpslld	$14,%ymm4,%ymm5
4552	rorxl	$13,%eax,%r14d
4553	rorxl	$2,%eax,%r13d
4554	leal	(%rdx,%r11,1),%edx
4555	vpxor	%ymm6,%ymm7,%ymm4
4556	andl	%r15d,%edi
4557	xorl	%r12d,%r14d
4558	xorl	%ebx,%edi
4559	vpshufd	$250,%ymm1,%ymm7
4560	xorl	%r13d,%r14d
4561	leal	(%r11,%rdi,1),%r11d
4562	movl	%r8d,%r12d
4563	vpsrld	$11,%ymm6,%ymm6
4564	addl	4+128(%rsp),%r10d
4565	andl	%edx,%r12d
4566	rorxl	$25,%edx,%r13d
4567	vpxor	%ymm5,%ymm4,%ymm4
4568	rorxl	$11,%edx,%edi
4569	leal	(%r11,%r14,1),%r11d
4570	leal	(%r10,%r12,1),%r10d
4571	vpslld	$11,%ymm5,%ymm5
4572	andnl	%r9d,%edx,%r12d
4573	xorl	%edi,%r13d
4574	rorxl	$6,%edx,%r14d
4575	vpxor	%ymm6,%ymm4,%ymm4
4576	leal	(%r10,%r12,1),%r10d
4577	xorl	%r14d,%r13d
4578	movl	%r11d,%edi
4579	vpsrld	$10,%ymm7,%ymm6
4580	rorxl	$22,%r11d,%r12d
4581	leal	(%r10,%r13,1),%r10d
4582	xorl	%eax,%edi
4583	vpxor	%ymm5,%ymm4,%ymm4
4584	rorxl	$13,%r11d,%r14d
4585	rorxl	$2,%r11d,%r13d
4586	leal	(%rcx,%r10,1),%ecx
4587	vpsrlq	$17,%ymm7,%ymm7
4588	andl	%edi,%r15d
4589	xorl	%r12d,%r14d
4590	xorl	%eax,%r15d
4591	vpaddd	%ymm4,%ymm2,%ymm2
4592	xorl	%r13d,%r14d
4593	leal	(%r10,%r15,1),%r10d
4594	movl	%edx,%r12d
4595	vpxor	%ymm7,%ymm6,%ymm6
4596	addl	8+128(%rsp),%r9d
4597	andl	%ecx,%r12d
4598	rorxl	$25,%ecx,%r13d
4599	vpsrlq	$2,%ymm7,%ymm7
4600	rorxl	$11,%ecx,%r15d
4601	leal	(%r10,%r14,1),%r10d
4602	leal	(%r9,%r12,1),%r9d
4603	vpxor	%ymm7,%ymm6,%ymm6
4604	andnl	%r8d,%ecx,%r12d
4605	xorl	%r15d,%r13d
4606	rorxl	$6,%ecx,%r14d
4607	vpshufb	%ymm8,%ymm6,%ymm6
4608	leal	(%r9,%r12,1),%r9d
4609	xorl	%r14d,%r13d
4610	movl	%r10d,%r15d
4611	vpaddd	%ymm6,%ymm2,%ymm2
4612	rorxl	$22,%r10d,%r12d
4613	leal	(%r9,%r13,1),%r9d
4614	xorl	%r11d,%r15d
4615	vpshufd	$80,%ymm2,%ymm7
4616	rorxl	$13,%r10d,%r14d
4617	rorxl	$2,%r10d,%r13d
4618	leal	(%rbx,%r9,1),%ebx
4619	vpsrld	$10,%ymm7,%ymm6
4620	andl	%r15d,%edi
4621	xorl	%r12d,%r14d
4622	xorl	%r11d,%edi
4623	vpsrlq	$17,%ymm7,%ymm7
4624	xorl	%r13d,%r14d
4625	leal	(%r9,%rdi,1),%r9d
4626	movl	%ecx,%r12d
4627	vpxor	%ymm7,%ymm6,%ymm6
4628	addl	12+128(%rsp),%r8d
4629	andl	%ebx,%r12d
4630	rorxl	$25,%ebx,%r13d
4631	vpsrlq	$2,%ymm7,%ymm7
4632	rorxl	$11,%ebx,%edi
4633	leal	(%r9,%r14,1),%r9d
4634	leal	(%r8,%r12,1),%r8d
4635	vpxor	%ymm7,%ymm6,%ymm6
4636	andnl	%edx,%ebx,%r12d
4637	xorl	%edi,%r13d
4638	rorxl	$6,%ebx,%r14d
4639	vpshufb	%ymm9,%ymm6,%ymm6
4640	leal	(%r8,%r12,1),%r8d
4641	xorl	%r14d,%r13d
4642	movl	%r9d,%edi
4643	vpaddd	%ymm6,%ymm2,%ymm2
4644	rorxl	$22,%r9d,%r12d
4645	leal	(%r8,%r13,1),%r8d
4646	xorl	%r10d,%edi
4647	vpaddd	64(%rbp),%ymm2,%ymm6
4648	rorxl	$13,%r9d,%r14d
4649	rorxl	$2,%r9d,%r13d
4650	leal	(%rax,%r8,1),%eax
4651	andl	%edi,%r15d
4652	xorl	%r12d,%r14d
4653	xorl	%r10d,%r15d
4654	xorl	%r13d,%r14d
4655	leal	(%r8,%r15,1),%r8d
4656	movl	%ebx,%r12d
4657	vmovdqa	%ymm6,0(%rsp)
4658	vpalignr	$4,%ymm3,%ymm0,%ymm4
4659	addl	32+128(%rsp),%edx
4660	andl	%eax,%r12d
4661	rorxl	$25,%eax,%r13d
4662	vpalignr	$4,%ymm1,%ymm2,%ymm7
4663	rorxl	$11,%eax,%r15d
4664	leal	(%r8,%r14,1),%r8d
4665	leal	(%rdx,%r12,1),%edx
4666	vpsrld	$7,%ymm4,%ymm6
4667	andnl	%ecx,%eax,%r12d
4668	xorl	%r15d,%r13d
4669	rorxl	$6,%eax,%r14d
4670	vpaddd	%ymm7,%ymm3,%ymm3
4671	leal	(%rdx,%r12,1),%edx
4672	xorl	%r14d,%r13d
4673	movl	%r8d,%r15d
4674	vpsrld	$3,%ymm4,%ymm7
4675	rorxl	$22,%r8d,%r12d
4676	leal	(%rdx,%r13,1),%edx
4677	xorl	%r9d,%r15d
4678	vpslld	$14,%ymm4,%ymm5
4679	rorxl	$13,%r8d,%r14d
4680	rorxl	$2,%r8d,%r13d
4681	leal	(%r11,%rdx,1),%r11d
4682	vpxor	%ymm6,%ymm7,%ymm4
4683	andl	%r15d,%edi
4684	xorl	%r12d,%r14d
4685	xorl	%r9d,%edi
4686	vpshufd	$250,%ymm2,%ymm7
4687	xorl	%r13d,%r14d
4688	leal	(%rdx,%rdi,1),%edx
4689	movl	%eax,%r12d
4690	vpsrld	$11,%ymm6,%ymm6
4691	addl	36+128(%rsp),%ecx
4692	andl	%r11d,%r12d
4693	rorxl	$25,%r11d,%r13d
4694	vpxor	%ymm5,%ymm4,%ymm4
4695	rorxl	$11,%r11d,%edi
4696	leal	(%rdx,%r14,1),%edx
4697	leal	(%rcx,%r12,1),%ecx
4698	vpslld	$11,%ymm5,%ymm5
4699	andnl	%ebx,%r11d,%r12d
4700	xorl	%edi,%r13d
4701	rorxl	$6,%r11d,%r14d
4702	vpxor	%ymm6,%ymm4,%ymm4
4703	leal	(%rcx,%r12,1),%ecx
4704	xorl	%r14d,%r13d
4705	movl	%edx,%edi
4706	vpsrld	$10,%ymm7,%ymm6
4707	rorxl	$22,%edx,%r12d
4708	leal	(%rcx,%r13,1),%ecx
4709	xorl	%r8d,%edi
4710	vpxor	%ymm5,%ymm4,%ymm4
4711	rorxl	$13,%edx,%r14d
4712	rorxl	$2,%edx,%r13d
4713	leal	(%r10,%rcx,1),%r10d
4714	vpsrlq	$17,%ymm7,%ymm7
4715	andl	%edi,%r15d
4716	xorl	%r12d,%r14d
4717	xorl	%r8d,%r15d
4718	vpaddd	%ymm4,%ymm3,%ymm3
4719	xorl	%r13d,%r14d
4720	leal	(%rcx,%r15,1),%ecx
4721	movl	%r11d,%r12d
4722	vpxor	%ymm7,%ymm6,%ymm6
4723	addl	40+128(%rsp),%ebx
4724	andl	%r10d,%r12d
4725	rorxl	$25,%r10d,%r13d
4726	vpsrlq	$2,%ymm7,%ymm7
4727	rorxl	$11,%r10d,%r15d
4728	leal	(%rcx,%r14,1),%ecx
4729	leal	(%rbx,%r12,1),%ebx
4730	vpxor	%ymm7,%ymm6,%ymm6
4731	andnl	%eax,%r10d,%r12d
4732	xorl	%r15d,%r13d
4733	rorxl	$6,%r10d,%r14d
4734	vpshufb	%ymm8,%ymm6,%ymm6
4735	leal	(%rbx,%r12,1),%ebx
4736	xorl	%r14d,%r13d
4737	movl	%ecx,%r15d
4738	vpaddd	%ymm6,%ymm3,%ymm3
4739	rorxl	$22,%ecx,%r12d
4740	leal	(%rbx,%r13,1),%ebx
4741	xorl	%edx,%r15d
4742	vpshufd	$80,%ymm3,%ymm7
4743	rorxl	$13,%ecx,%r14d
4744	rorxl	$2,%ecx,%r13d
4745	leal	(%r9,%rbx,1),%r9d
4746	vpsrld	$10,%ymm7,%ymm6
4747	andl	%r15d,%edi
4748	xorl	%r12d,%r14d
4749	xorl	%edx,%edi
4750	vpsrlq	$17,%ymm7,%ymm7
4751	xorl	%r13d,%r14d
4752	leal	(%rbx,%rdi,1),%ebx
4753	movl	%r10d,%r12d
4754	vpxor	%ymm7,%ymm6,%ymm6
4755	addl	44+128(%rsp),%eax
4756	andl	%r9d,%r12d
4757	rorxl	$25,%r9d,%r13d
4758	vpsrlq	$2,%ymm7,%ymm7
4759	rorxl	$11,%r9d,%edi
4760	leal	(%rbx,%r14,1),%ebx
4761	leal	(%rax,%r12,1),%eax
4762	vpxor	%ymm7,%ymm6,%ymm6
4763	andnl	%r11d,%r9d,%r12d
4764	xorl	%edi,%r13d
4765	rorxl	$6,%r9d,%r14d
4766	vpshufb	%ymm9,%ymm6,%ymm6
4767	leal	(%rax,%r12,1),%eax
4768	xorl	%r14d,%r13d
4769	movl	%ebx,%edi
4770	vpaddd	%ymm6,%ymm3,%ymm3
4771	rorxl	$22,%ebx,%r12d
4772	leal	(%rax,%r13,1),%eax
4773	xorl	%ecx,%edi
4774	vpaddd	96(%rbp),%ymm3,%ymm6
4775	rorxl	$13,%ebx,%r14d
4776	rorxl	$2,%ebx,%r13d
4777	leal	(%r8,%rax,1),%r8d
4778	andl	%edi,%r15d
4779	xorl	%r12d,%r14d
4780	xorl	%ecx,%r15d
4781	xorl	%r13d,%r14d
4782	leal	(%rax,%r15,1),%eax
4783	movl	%r9d,%r12d
4784	vmovdqa	%ymm6,32(%rsp)
4785	leaq	128(%rbp),%rbp
4786	cmpb	$0,3(%rbp)
4787	jne	.Lavx2_00_47
4788	addl	0+64(%rsp),%r11d
4789	andl	%r8d,%r12d
4790	rorxl	$25,%r8d,%r13d
4791	rorxl	$11,%r8d,%r15d
4792	leal	(%rax,%r14,1),%eax
4793	leal	(%r11,%r12,1),%r11d
4794	andnl	%r10d,%r8d,%r12d
4795	xorl	%r15d,%r13d
4796	rorxl	$6,%r8d,%r14d
4797	leal	(%r11,%r12,1),%r11d
4798	xorl	%r14d,%r13d
4799	movl	%eax,%r15d
4800	rorxl	$22,%eax,%r12d
4801	leal	(%r11,%r13,1),%r11d
4802	xorl	%ebx,%r15d
4803	rorxl	$13,%eax,%r14d
4804	rorxl	$2,%eax,%r13d
4805	leal	(%rdx,%r11,1),%edx
4806	andl	%r15d,%edi
4807	xorl	%r12d,%r14d
4808	xorl	%ebx,%edi
4809	xorl	%r13d,%r14d
4810	leal	(%r11,%rdi,1),%r11d
4811	movl	%r8d,%r12d
4812	addl	4+64(%rsp),%r10d
4813	andl	%edx,%r12d
4814	rorxl	$25,%edx,%r13d
4815	rorxl	$11,%edx,%edi
4816	leal	(%r11,%r14,1),%r11d
4817	leal	(%r10,%r12,1),%r10d
4818	andnl	%r9d,%edx,%r12d
4819	xorl	%edi,%r13d
4820	rorxl	$6,%edx,%r14d
4821	leal	(%r10,%r12,1),%r10d
4822	xorl	%r14d,%r13d
4823	movl	%r11d,%edi
4824	rorxl	$22,%r11d,%r12d
4825	leal	(%r10,%r13,1),%r10d
4826	xorl	%eax,%edi
4827	rorxl	$13,%r11d,%r14d
4828	rorxl	$2,%r11d,%r13d
4829	leal	(%rcx,%r10,1),%ecx
4830	andl	%edi,%r15d
4831	xorl	%r12d,%r14d
4832	xorl	%eax,%r15d
4833	xorl	%r13d,%r14d
4834	leal	(%r10,%r15,1),%r10d
4835	movl	%edx,%r12d
4836	addl	8+64(%rsp),%r9d
4837	andl	%ecx,%r12d
4838	rorxl	$25,%ecx,%r13d
4839	rorxl	$11,%ecx,%r15d
4840	leal	(%r10,%r14,1),%r10d
4841	leal	(%r9,%r12,1),%r9d
4842	andnl	%r8d,%ecx,%r12d
4843	xorl	%r15d,%r13d
4844	rorxl	$6,%ecx,%r14d
4845	leal	(%r9,%r12,1),%r9d
4846	xorl	%r14d,%r13d
4847	movl	%r10d,%r15d
4848	rorxl	$22,%r10d,%r12d
4849	leal	(%r9,%r13,1),%r9d
4850	xorl	%r11d,%r15d
4851	rorxl	$13,%r10d,%r14d
4852	rorxl	$2,%r10d,%r13d
4853	leal	(%rbx,%r9,1),%ebx
4854	andl	%r15d,%edi
4855	xorl	%r12d,%r14d
4856	xorl	%r11d,%edi
4857	xorl	%r13d,%r14d
4858	leal	(%r9,%rdi,1),%r9d
4859	movl	%ecx,%r12d
4860	addl	12+64(%rsp),%r8d
4861	andl	%ebx,%r12d
4862	rorxl	$25,%ebx,%r13d
4863	rorxl	$11,%ebx,%edi
4864	leal	(%r9,%r14,1),%r9d
4865	leal	(%r8,%r12,1),%r8d
4866	andnl	%edx,%ebx,%r12d
4867	xorl	%edi,%r13d
4868	rorxl	$6,%ebx,%r14d
4869	leal	(%r8,%r12,1),%r8d
4870	xorl	%r14d,%r13d
4871	movl	%r9d,%edi
4872	rorxl	$22,%r9d,%r12d
4873	leal	(%r8,%r13,1),%r8d
4874	xorl	%r10d,%edi
4875	rorxl	$13,%r9d,%r14d
4876	rorxl	$2,%r9d,%r13d
4877	leal	(%rax,%r8,1),%eax
4878	andl	%edi,%r15d
4879	xorl	%r12d,%r14d
4880	xorl	%r10d,%r15d
4881	xorl	%r13d,%r14d
4882	leal	(%r8,%r15,1),%r8d
4883	movl	%ebx,%r12d
4884	addl	32+64(%rsp),%edx
4885	andl	%eax,%r12d
4886	rorxl	$25,%eax,%r13d
4887	rorxl	$11,%eax,%r15d
4888	leal	(%r8,%r14,1),%r8d
4889	leal	(%rdx,%r12,1),%edx
4890	andnl	%ecx,%eax,%r12d
4891	xorl	%r15d,%r13d
4892	rorxl	$6,%eax,%r14d
4893	leal	(%rdx,%r12,1),%edx
4894	xorl	%r14d,%r13d
4895	movl	%r8d,%r15d
4896	rorxl	$22,%r8d,%r12d
4897	leal	(%rdx,%r13,1),%edx
4898	xorl	%r9d,%r15d
4899	rorxl	$13,%r8d,%r14d
4900	rorxl	$2,%r8d,%r13d
4901	leal	(%r11,%rdx,1),%r11d
4902	andl	%r15d,%edi
4903	xorl	%r12d,%r14d
4904	xorl	%r9d,%edi
4905	xorl	%r13d,%r14d
4906	leal	(%rdx,%rdi,1),%edx
4907	movl	%eax,%r12d
4908	addl	36+64(%rsp),%ecx
4909	andl	%r11d,%r12d
4910	rorxl	$25,%r11d,%r13d
4911	rorxl	$11,%r11d,%edi
4912	leal	(%rdx,%r14,1),%edx
4913	leal	(%rcx,%r12,1),%ecx
4914	andnl	%ebx,%r11d,%r12d
4915	xorl	%edi,%r13d
4916	rorxl	$6,%r11d,%r14d
4917	leal	(%rcx,%r12,1),%ecx
4918	xorl	%r14d,%r13d
4919	movl	%edx,%edi
4920	rorxl	$22,%edx,%r12d
4921	leal	(%rcx,%r13,1),%ecx
4922	xorl	%r8d,%edi
4923	rorxl	$13,%edx,%r14d
4924	rorxl	$2,%edx,%r13d
4925	leal	(%r10,%rcx,1),%r10d
4926	andl	%edi,%r15d
4927	xorl	%r12d,%r14d
4928	xorl	%r8d,%r15d
4929	xorl	%r13d,%r14d
4930	leal	(%rcx,%r15,1),%ecx
4931	movl	%r11d,%r12d
4932	addl	40+64(%rsp),%ebx
4933	andl	%r10d,%r12d
4934	rorxl	$25,%r10d,%r13d
4935	rorxl	$11,%r10d,%r15d
4936	leal	(%rcx,%r14,1),%ecx
4937	leal	(%rbx,%r12,1),%ebx
4938	andnl	%eax,%r10d,%r12d
4939	xorl	%r15d,%r13d
4940	rorxl	$6,%r10d,%r14d
4941	leal	(%rbx,%r12,1),%ebx
4942	xorl	%r14d,%r13d
4943	movl	%ecx,%r15d
4944	rorxl	$22,%ecx,%r12d
4945	leal	(%rbx,%r13,1),%ebx
4946	xorl	%edx,%r15d
4947	rorxl	$13,%ecx,%r14d
4948	rorxl	$2,%ecx,%r13d
4949	leal	(%r9,%rbx,1),%r9d
4950	andl	%r15d,%edi
4951	xorl	%r12d,%r14d
4952	xorl	%edx,%edi
4953	xorl	%r13d,%r14d
4954	leal	(%rbx,%rdi,1),%ebx
4955	movl	%r10d,%r12d
4956	addl	44+64(%rsp),%eax
4957	andl	%r9d,%r12d
4958	rorxl	$25,%r9d,%r13d
4959	rorxl	$11,%r9d,%edi
4960	leal	(%rbx,%r14,1),%ebx
4961	leal	(%rax,%r12,1),%eax
4962	andnl	%r11d,%r9d,%r12d
4963	xorl	%edi,%r13d
4964	rorxl	$6,%r9d,%r14d
4965	leal	(%rax,%r12,1),%eax
4966	xorl	%r14d,%r13d
4967	movl	%ebx,%edi
4968	rorxl	$22,%ebx,%r12d
4969	leal	(%rax,%r13,1),%eax
4970	xorl	%ecx,%edi
4971	rorxl	$13,%ebx,%r14d
4972	rorxl	$2,%ebx,%r13d
4973	leal	(%r8,%rax,1),%r8d
4974	andl	%edi,%r15d
4975	xorl	%r12d,%r14d
4976	xorl	%ecx,%r15d
4977	xorl	%r13d,%r14d
4978	leal	(%rax,%r15,1),%eax
4979	movl	%r9d,%r12d
4980	addl	0(%rsp),%r11d
4981	andl	%r8d,%r12d
4982	rorxl	$25,%r8d,%r13d
4983	rorxl	$11,%r8d,%r15d
4984	leal	(%rax,%r14,1),%eax
4985	leal	(%r11,%r12,1),%r11d
4986	andnl	%r10d,%r8d,%r12d
4987	xorl	%r15d,%r13d
4988	rorxl	$6,%r8d,%r14d
4989	leal	(%r11,%r12,1),%r11d
4990	xorl	%r14d,%r13d
4991	movl	%eax,%r15d
4992	rorxl	$22,%eax,%r12d
4993	leal	(%r11,%r13,1),%r11d
4994	xorl	%ebx,%r15d
4995	rorxl	$13,%eax,%r14d
4996	rorxl	$2,%eax,%r13d
4997	leal	(%rdx,%r11,1),%edx
4998	andl	%r15d,%edi
4999	xorl	%r12d,%r14d
5000	xorl	%ebx,%edi
5001	xorl	%r13d,%r14d
5002	leal	(%r11,%rdi,1),%r11d
5003	movl	%r8d,%r12d
5004	addl	4(%rsp),%r10d
5005	andl	%edx,%r12d
5006	rorxl	$25,%edx,%r13d
5007	rorxl	$11,%edx,%edi
5008	leal	(%r11,%r14,1),%r11d
5009	leal	(%r10,%r12,1),%r10d
5010	andnl	%r9d,%edx,%r12d
5011	xorl	%edi,%r13d
5012	rorxl	$6,%edx,%r14d
5013	leal	(%r10,%r12,1),%r10d
5014	xorl	%r14d,%r13d
5015	movl	%r11d,%edi
5016	rorxl	$22,%r11d,%r12d
5017	leal	(%r10,%r13,1),%r10d
5018	xorl	%eax,%edi
5019	rorxl	$13,%r11d,%r14d
5020	rorxl	$2,%r11d,%r13d
5021	leal	(%rcx,%r10,1),%ecx
5022	andl	%edi,%r15d
5023	xorl	%r12d,%r14d
5024	xorl	%eax,%r15d
5025	xorl	%r13d,%r14d
5026	leal	(%r10,%r15,1),%r10d
5027	movl	%edx,%r12d
5028	addl	8(%rsp),%r9d
5029	andl	%ecx,%r12d
5030	rorxl	$25,%ecx,%r13d
5031	rorxl	$11,%ecx,%r15d
5032	leal	(%r10,%r14,1),%r10d
5033	leal	(%r9,%r12,1),%r9d
5034	andnl	%r8d,%ecx,%r12d
5035	xorl	%r15d,%r13d
5036	rorxl	$6,%ecx,%r14d
5037	leal	(%r9,%r12,1),%r9d
5038	xorl	%r14d,%r13d
5039	movl	%r10d,%r15d
5040	rorxl	$22,%r10d,%r12d
5041	leal	(%r9,%r13,1),%r9d
5042	xorl	%r11d,%r15d
5043	rorxl	$13,%r10d,%r14d
5044	rorxl	$2,%r10d,%r13d
5045	leal	(%rbx,%r9,1),%ebx
5046	andl	%r15d,%edi
5047	xorl	%r12d,%r14d
5048	xorl	%r11d,%edi
5049	xorl	%r13d,%r14d
5050	leal	(%r9,%rdi,1),%r9d
5051	movl	%ecx,%r12d
5052	addl	12(%rsp),%r8d
5053	andl	%ebx,%r12d
5054	rorxl	$25,%ebx,%r13d
5055	rorxl	$11,%ebx,%edi
5056	leal	(%r9,%r14,1),%r9d
5057	leal	(%r8,%r12,1),%r8d
5058	andnl	%edx,%ebx,%r12d
5059	xorl	%edi,%r13d
5060	rorxl	$6,%ebx,%r14d
5061	leal	(%r8,%r12,1),%r8d
5062	xorl	%r14d,%r13d
5063	movl	%r9d,%edi
5064	rorxl	$22,%r9d,%r12d
5065	leal	(%r8,%r13,1),%r8d
5066	xorl	%r10d,%edi
5067	rorxl	$13,%r9d,%r14d
5068	rorxl	$2,%r9d,%r13d
5069	leal	(%rax,%r8,1),%eax
5070	andl	%edi,%r15d
5071	xorl	%r12d,%r14d
5072	xorl	%r10d,%r15d
5073	xorl	%r13d,%r14d
5074	leal	(%r8,%r15,1),%r8d
5075	movl	%ebx,%r12d
5076	addl	32(%rsp),%edx
5077	andl	%eax,%r12d
5078	rorxl	$25,%eax,%r13d
5079	rorxl	$11,%eax,%r15d
5080	leal	(%r8,%r14,1),%r8d
5081	leal	(%rdx,%r12,1),%edx
5082	andnl	%ecx,%eax,%r12d
5083	xorl	%r15d,%r13d
5084	rorxl	$6,%eax,%r14d
5085	leal	(%rdx,%r12,1),%edx
5086	xorl	%r14d,%r13d
5087	movl	%r8d,%r15d
5088	rorxl	$22,%r8d,%r12d
5089	leal	(%rdx,%r13,1),%edx
5090	xorl	%r9d,%r15d
5091	rorxl	$13,%r8d,%r14d
5092	rorxl	$2,%r8d,%r13d
5093	leal	(%r11,%rdx,1),%r11d
5094	andl	%r15d,%edi
5095	xorl	%r12d,%r14d
5096	xorl	%r9d,%edi
5097	xorl	%r13d,%r14d
5098	leal	(%rdx,%rdi,1),%edx
5099	movl	%eax,%r12d
5100	addl	36(%rsp),%ecx
5101	andl	%r11d,%r12d
5102	rorxl	$25,%r11d,%r13d
5103	rorxl	$11,%r11d,%edi
5104	leal	(%rdx,%r14,1),%edx
5105	leal	(%rcx,%r12,1),%ecx
5106	andnl	%ebx,%r11d,%r12d
5107	xorl	%edi,%r13d
5108	rorxl	$6,%r11d,%r14d
5109	leal	(%rcx,%r12,1),%ecx
5110	xorl	%r14d,%r13d
5111	movl	%edx,%edi
5112	rorxl	$22,%edx,%r12d
5113	leal	(%rcx,%r13,1),%ecx
5114	xorl	%r8d,%edi
5115	rorxl	$13,%edx,%r14d
5116	rorxl	$2,%edx,%r13d
5117	leal	(%r10,%rcx,1),%r10d
5118	andl	%edi,%r15d
5119	xorl	%r12d,%r14d
5120	xorl	%r8d,%r15d
5121	xorl	%r13d,%r14d
5122	leal	(%rcx,%r15,1),%ecx
5123	movl	%r11d,%r12d
5124	addl	40(%rsp),%ebx
5125	andl	%r10d,%r12d
5126	rorxl	$25,%r10d,%r13d
5127	rorxl	$11,%r10d,%r15d
5128	leal	(%rcx,%r14,1),%ecx
5129	leal	(%rbx,%r12,1),%ebx
5130	andnl	%eax,%r10d,%r12d
5131	xorl	%r15d,%r13d
5132	rorxl	$6,%r10d,%r14d
5133	leal	(%rbx,%r12,1),%ebx
5134	xorl	%r14d,%r13d
5135	movl	%ecx,%r15d
5136	rorxl	$22,%ecx,%r12d
5137	leal	(%rbx,%r13,1),%ebx
5138	xorl	%edx,%r15d
5139	rorxl	$13,%ecx,%r14d
5140	rorxl	$2,%ecx,%r13d
5141	leal	(%r9,%rbx,1),%r9d
5142	andl	%r15d,%edi
5143	xorl	%r12d,%r14d
5144	xorl	%edx,%edi
5145	xorl	%r13d,%r14d
5146	leal	(%rbx,%rdi,1),%ebx
5147	movl	%r10d,%r12d
5148	addl	44(%rsp),%eax
5149	andl	%r9d,%r12d
5150	rorxl	$25,%r9d,%r13d
5151	rorxl	$11,%r9d,%edi
5152	leal	(%rbx,%r14,1),%ebx
5153	leal	(%rax,%r12,1),%eax
5154	andnl	%r11d,%r9d,%r12d
5155	xorl	%edi,%r13d
5156	rorxl	$6,%r9d,%r14d
5157	leal	(%rax,%r12,1),%eax
5158	xorl	%r14d,%r13d
5159	movl	%ebx,%edi
5160	rorxl	$22,%ebx,%r12d
5161	leal	(%rax,%r13,1),%eax
5162	xorl	%ecx,%edi
5163	rorxl	$13,%ebx,%r14d
5164	rorxl	$2,%ebx,%r13d
5165	leal	(%r8,%rax,1),%r8d
5166	andl	%edi,%r15d
5167	xorl	%r12d,%r14d
5168	xorl	%ecx,%r15d
5169	xorl	%r13d,%r14d
5170	leal	(%rax,%r15,1),%eax
5171	movl	%r9d,%r12d
5172	movq	512(%rsp),%rdi
5173	addl	%r14d,%eax
5174
5175	leaq	448(%rsp),%rbp
5176
5177	addl	0(%rdi),%eax
5178	addl	4(%rdi),%ebx
5179	addl	8(%rdi),%ecx
5180	addl	12(%rdi),%edx
5181	addl	16(%rdi),%r8d
5182	addl	20(%rdi),%r9d
5183	addl	24(%rdi),%r10d
5184	addl	28(%rdi),%r11d
5185
5186	movl	%eax,0(%rdi)
5187	movl	%ebx,4(%rdi)
5188	movl	%ecx,8(%rdi)
5189	movl	%edx,12(%rdi)
5190	movl	%r8d,16(%rdi)
5191	movl	%r9d,20(%rdi)
5192	movl	%r10d,24(%rdi)
5193	movl	%r11d,28(%rdi)
5194
5195	cmpq	80(%rbp),%rsi
5196	je	.Ldone_avx2
5197
5198	xorl	%r14d,%r14d
5199	movl	%ebx,%edi
5200	xorl	%ecx,%edi
5201	movl	%r9d,%r12d
5202	jmp	.Lower_avx2
5203.align	16
5204.Lower_avx2:
5205	addl	0+16(%rbp),%r11d
5206	andl	%r8d,%r12d
5207	rorxl	$25,%r8d,%r13d
5208	rorxl	$11,%r8d,%r15d
5209	leal	(%rax,%r14,1),%eax
5210	leal	(%r11,%r12,1),%r11d
5211	andnl	%r10d,%r8d,%r12d
5212	xorl	%r15d,%r13d
5213	rorxl	$6,%r8d,%r14d
5214	leal	(%r11,%r12,1),%r11d
5215	xorl	%r14d,%r13d
5216	movl	%eax,%r15d
5217	rorxl	$22,%eax,%r12d
5218	leal	(%r11,%r13,1),%r11d
5219	xorl	%ebx,%r15d
5220	rorxl	$13,%eax,%r14d
5221	rorxl	$2,%eax,%r13d
5222	leal	(%rdx,%r11,1),%edx
5223	andl	%r15d,%edi
5224	xorl	%r12d,%r14d
5225	xorl	%ebx,%edi
5226	xorl	%r13d,%r14d
5227	leal	(%r11,%rdi,1),%r11d
5228	movl	%r8d,%r12d
5229	addl	4+16(%rbp),%r10d
5230	andl	%edx,%r12d
5231	rorxl	$25,%edx,%r13d
5232	rorxl	$11,%edx,%edi
5233	leal	(%r11,%r14,1),%r11d
5234	leal	(%r10,%r12,1),%r10d
5235	andnl	%r9d,%edx,%r12d
5236	xorl	%edi,%r13d
5237	rorxl	$6,%edx,%r14d
5238	leal	(%r10,%r12,1),%r10d
5239	xorl	%r14d,%r13d
5240	movl	%r11d,%edi
5241	rorxl	$22,%r11d,%r12d
5242	leal	(%r10,%r13,1),%r10d
5243	xorl	%eax,%edi
5244	rorxl	$13,%r11d,%r14d
5245	rorxl	$2,%r11d,%r13d
5246	leal	(%rcx,%r10,1),%ecx
5247	andl	%edi,%r15d
5248	xorl	%r12d,%r14d
5249	xorl	%eax,%r15d
5250	xorl	%r13d,%r14d
5251	leal	(%r10,%r15,1),%r10d
5252	movl	%edx,%r12d
5253	addl	8+16(%rbp),%r9d
5254	andl	%ecx,%r12d
5255	rorxl	$25,%ecx,%r13d
5256	rorxl	$11,%ecx,%r15d
5257	leal	(%r10,%r14,1),%r10d
5258	leal	(%r9,%r12,1),%r9d
5259	andnl	%r8d,%ecx,%r12d
5260	xorl	%r15d,%r13d
5261	rorxl	$6,%ecx,%r14d
5262	leal	(%r9,%r12,1),%r9d
5263	xorl	%r14d,%r13d
5264	movl	%r10d,%r15d
5265	rorxl	$22,%r10d,%r12d
5266	leal	(%r9,%r13,1),%r9d
5267	xorl	%r11d,%r15d
5268	rorxl	$13,%r10d,%r14d
5269	rorxl	$2,%r10d,%r13d
5270	leal	(%rbx,%r9,1),%ebx
5271	andl	%r15d,%edi
5272	xorl	%r12d,%r14d
5273	xorl	%r11d,%edi
5274	xorl	%r13d,%r14d
5275	leal	(%r9,%rdi,1),%r9d
5276	movl	%ecx,%r12d
5277	addl	12+16(%rbp),%r8d
5278	andl	%ebx,%r12d
5279	rorxl	$25,%ebx,%r13d
5280	rorxl	$11,%ebx,%edi
5281	leal	(%r9,%r14,1),%r9d
5282	leal	(%r8,%r12,1),%r8d
5283	andnl	%edx,%ebx,%r12d
5284	xorl	%edi,%r13d
5285	rorxl	$6,%ebx,%r14d
5286	leal	(%r8,%r12,1),%r8d
5287	xorl	%r14d,%r13d
5288	movl	%r9d,%edi
5289	rorxl	$22,%r9d,%r12d
5290	leal	(%r8,%r13,1),%r8d
5291	xorl	%r10d,%edi
5292	rorxl	$13,%r9d,%r14d
5293	rorxl	$2,%r9d,%r13d
5294	leal	(%rax,%r8,1),%eax
5295	andl	%edi,%r15d
5296	xorl	%r12d,%r14d
5297	xorl	%r10d,%r15d
5298	xorl	%r13d,%r14d
5299	leal	(%r8,%r15,1),%r8d
5300	movl	%ebx,%r12d
5301	addl	32+16(%rbp),%edx
5302	andl	%eax,%r12d
5303	rorxl	$25,%eax,%r13d
5304	rorxl	$11,%eax,%r15d
5305	leal	(%r8,%r14,1),%r8d
5306	leal	(%rdx,%r12,1),%edx
5307	andnl	%ecx,%eax,%r12d
5308	xorl	%r15d,%r13d
5309	rorxl	$6,%eax,%r14d
5310	leal	(%rdx,%r12,1),%edx
5311	xorl	%r14d,%r13d
5312	movl	%r8d,%r15d
5313	rorxl	$22,%r8d,%r12d
5314	leal	(%rdx,%r13,1),%edx
5315	xorl	%r9d,%r15d
5316	rorxl	$13,%r8d,%r14d
5317	rorxl	$2,%r8d,%r13d
5318	leal	(%r11,%rdx,1),%r11d
5319	andl	%r15d,%edi
5320	xorl	%r12d,%r14d
5321	xorl	%r9d,%edi
5322	xorl	%r13d,%r14d
5323	leal	(%rdx,%rdi,1),%edx
5324	movl	%eax,%r12d
5325	addl	36+16(%rbp),%ecx
5326	andl	%r11d,%r12d
5327	rorxl	$25,%r11d,%r13d
5328	rorxl	$11,%r11d,%edi
5329	leal	(%rdx,%r14,1),%edx
5330	leal	(%rcx,%r12,1),%ecx
5331	andnl	%ebx,%r11d,%r12d
5332	xorl	%edi,%r13d
5333	rorxl	$6,%r11d,%r14d
5334	leal	(%rcx,%r12,1),%ecx
5335	xorl	%r14d,%r13d
5336	movl	%edx,%edi
5337	rorxl	$22,%edx,%r12d
5338	leal	(%rcx,%r13,1),%ecx
5339	xorl	%r8d,%edi
5340	rorxl	$13,%edx,%r14d
5341	rorxl	$2,%edx,%r13d
5342	leal	(%r10,%rcx,1),%r10d
5343	andl	%edi,%r15d
5344	xorl	%r12d,%r14d
5345	xorl	%r8d,%r15d
5346	xorl	%r13d,%r14d
5347	leal	(%rcx,%r15,1),%ecx
5348	movl	%r11d,%r12d
5349	addl	40+16(%rbp),%ebx
5350	andl	%r10d,%r12d
5351	rorxl	$25,%r10d,%r13d
5352	rorxl	$11,%r10d,%r15d
5353	leal	(%rcx,%r14,1),%ecx
5354	leal	(%rbx,%r12,1),%ebx
5355	andnl	%eax,%r10d,%r12d
5356	xorl	%r15d,%r13d
5357	rorxl	$6,%r10d,%r14d
5358	leal	(%rbx,%r12,1),%ebx
5359	xorl	%r14d,%r13d
5360	movl	%ecx,%r15d
5361	rorxl	$22,%ecx,%r12d
5362	leal	(%rbx,%r13,1),%ebx
5363	xorl	%edx,%r15d
5364	rorxl	$13,%ecx,%r14d
5365	rorxl	$2,%ecx,%r13d
5366	leal	(%r9,%rbx,1),%r9d
5367	andl	%r15d,%edi
5368	xorl	%r12d,%r14d
5369	xorl	%edx,%edi
5370	xorl	%r13d,%r14d
5371	leal	(%rbx,%rdi,1),%ebx
5372	movl	%r10d,%r12d
5373	addl	44+16(%rbp),%eax
5374	andl	%r9d,%r12d
5375	rorxl	$25,%r9d,%r13d
5376	rorxl	$11,%r9d,%edi
5377	leal	(%rbx,%r14,1),%ebx
5378	leal	(%rax,%r12,1),%eax
5379	andnl	%r11d,%r9d,%r12d
5380	xorl	%edi,%r13d
5381	rorxl	$6,%r9d,%r14d
5382	leal	(%rax,%r12,1),%eax
5383	xorl	%r14d,%r13d
5384	movl	%ebx,%edi
5385	rorxl	$22,%ebx,%r12d
5386	leal	(%rax,%r13,1),%eax
5387	xorl	%ecx,%edi
5388	rorxl	$13,%ebx,%r14d
5389	rorxl	$2,%ebx,%r13d
5390	leal	(%r8,%rax,1),%r8d
5391	andl	%edi,%r15d
5392	xorl	%r12d,%r14d
5393	xorl	%ecx,%r15d
5394	xorl	%r13d,%r14d
5395	leal	(%rax,%r15,1),%eax
5396	movl	%r9d,%r12d
5397	leaq	-64(%rbp),%rbp
5398	cmpq	%rsp,%rbp
5399	jae	.Lower_avx2
5400
5401	movq	512(%rsp),%rdi
5402	addl	%r14d,%eax
5403
5404	leaq	448(%rsp),%rsp
5405
5406.cfi_escape	0x0f,0x06,0x77,0xd8,0x00,0x06,0x23,0x08
5407
5408	addl	0(%rdi),%eax
5409	addl	4(%rdi),%ebx
5410	addl	8(%rdi),%ecx
5411	addl	12(%rdi),%edx
5412	addl	16(%rdi),%r8d
5413	addl	20(%rdi),%r9d
5414	leaq	128(%rsi),%rsi
5415	addl	24(%rdi),%r10d
5416	movq	%rsi,%r12
5417	addl	28(%rdi),%r11d
5418	cmpq	64+16(%rsp),%rsi
5419
5420	movl	%eax,0(%rdi)
5421	cmoveq	%rsp,%r12
5422	movl	%ebx,4(%rdi)
5423	movl	%ecx,8(%rdi)
5424	movl	%edx,12(%rdi)
5425	movl	%r8d,16(%rdi)
5426	movl	%r9d,20(%rdi)
5427	movl	%r10d,24(%rdi)
5428	movl	%r11d,28(%rdi)
5429
5430	jbe	.Loop_avx2
5431	leaq	(%rsp),%rbp
5432
5433
5434.cfi_escape	0x0f,0x06,0x76,0xd8,0x00,0x06,0x23,0x08
5435
5436.Ldone_avx2:
5437	movq	88(%rbp),%rsi
5438.cfi_def_cfa	%rsi,8
5439	vzeroupper
5440	movq	-48(%rsi),%r15
5441.cfi_restore	%r15
5442	movq	-40(%rsi),%r14
5443.cfi_restore	%r14
5444	movq	-32(%rsi),%r13
5445.cfi_restore	%r13
5446	movq	-24(%rsi),%r12
5447.cfi_restore	%r12
5448	movq	-16(%rsi),%rbp
5449.cfi_restore	%rbp
5450	movq	-8(%rsi),%rbx
5451.cfi_restore	%rbx
5452	leaq	(%rsi),%rsp
5453.cfi_def_cfa_register	%rsp
5454.Lepilogue_avx2:
5455	.byte	0xf3,0xc3
5456.cfi_endproc
5457.size	sha256_block_data_order_avx2,.-sha256_block_data_order_avx2
5458	.section ".note.gnu.property", "a"
5459	.p2align 3
5460	.long 1f - 0f
5461	.long 4f - 1f
5462	.long 5
54630:
5464	# "GNU" encoded with .byte, since .asciz isn't supported
5465	# on Solaris.
5466	.byte 0x47
5467	.byte 0x4e
5468	.byte 0x55
5469	.byte 0
54701:
5471	.p2align 3
5472	.long 0xc0000002
5473	.long 3f - 2f
54742:
5475	.long 3
54763:
5477	.p2align 3
54784:
5479