xref: /freebsd/sys/crypto/aesni/aesencdec.h (revision b78ee15e9f04ae15c3e1200df974473167524d17)
1 /*-
2  * Copyright 2013 John-Mark Gurney <jmg@FreeBSD.org>
3  * All rights reserved.
4  *
5  * Redistribution and use in source and binary forms, with or without
6  * modification, are permitted provided that the following conditions
7  * are met:
8  * 1. Redistributions of source code must retain the above copyright
9  *    notice, this list of conditions and the following disclaimer.
10  * 2. Redistributions in binary form must reproduce the above copyright
11  *    notice, this list of conditions and the following disclaimer in the
12  *    documentation and/or other materials provided with the distribution.
13  *
14  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
15  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
16  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
17  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
18  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
19  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
20  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
21  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
22  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
23  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
24  * SUCH DAMAGE.
25  *
26  * $FreeBSD$
27  *
28  */
29 
30 #include <crypto/aesni/aesni_os.h>
31 
32 #include <wmmintrin.h>
33 
/*
 * Encrypt eight independent 128-bit blocks (a..h) under one key schedule and
 * store the results in out[0..7], in argument order.
 *
 * Every block is XORed with keysched[0], put through `rounds' AESENC steps
 * keyed by keysched[1..rounds], and finished with AESENCLAST keyed by
 * keysched[rounds + 1].  The schedule must therefore provide at least
 * rounds + 2 round keys.  A non-positive `rounds' skips the AESENC steps and
 * finishes with keysched[1].
 *
 * NOTE(review): this means `rounds' counts only the full (non-final) rounds;
 * presumably callers pass the AES round count minus one -- confirm at the
 * call sites.
 *
 * The eight blocks are advanced in lock step, one round at a time; presumably
 * this is so the independent AES instructions can overlap in the pipeline.
 */
static inline void
aesni_enc8(int rounds, const __m128i *keysched, __m128i a,
    __m128i b, __m128i c, __m128i d, __m128i e, __m128i f, __m128i g,
    __m128i h, __m128i out[8])
{
	const __m128i *rk = keysched;	/* next round key to consume */
	__m128i key;
	int left;

	/* Initial key addition with round key 0. */
	key = *rk++;
	a = _mm_xor_si128(a, key);
	b = _mm_xor_si128(b, key);
	c = _mm_xor_si128(c, key);
	d = _mm_xor_si128(d, key);
	e = _mm_xor_si128(e, key);
	f = _mm_xor_si128(f, key);
	g = _mm_xor_si128(g, key);
	h = _mm_xor_si128(h, key);

	/* One round key per full round, shared by all eight blocks. */
	for (left = rounds; left > 0; left--) {
		key = *rk++;
		a = _mm_aesenc_si128(a, key);
		b = _mm_aesenc_si128(b, key);
		c = _mm_aesenc_si128(c, key);
		d = _mm_aesenc_si128(d, key);
		e = _mm_aesenc_si128(e, key);
		f = _mm_aesenc_si128(f, key);
		g = _mm_aesenc_si128(g, key);
		h = _mm_aesenc_si128(h, key);
	}

	/* Final round: rk points just past the last key the loop consumed. */
	out[0] = _mm_aesenclast_si128(a, *rk);
	out[1] = _mm_aesenclast_si128(b, *rk);
	out[2] = _mm_aesenclast_si128(c, *rk);
	out[3] = _mm_aesenclast_si128(d, *rk);
	out[4] = _mm_aesenclast_si128(e, *rk);
	out[5] = _mm_aesenclast_si128(f, *rk);
	out[6] = _mm_aesenclast_si128(g, *rk);
	out[7] = _mm_aesenclast_si128(h, *rk);
}
70 
/*
 * Decrypt eight independent 128-bit blocks (a..h) under one key schedule and
 * store the results in out[0..7], in argument order.
 *
 * Every block is XORed with keysched[0], put through `rounds' AESDEC steps
 * keyed by keysched[1..rounds], and finished with AESDECLAST keyed by
 * keysched[rounds + 1].  The schedule must therefore provide at least
 * rounds + 2 round keys.  A non-positive `rounds' skips the AESDEC steps and
 * finishes with keysched[1].
 *
 * The schedule is consumed in ascending index order exactly as supplied.
 * NOTE(review): it presumably has to be a decryption schedule already in the
 * form AESDEC expects -- confirm against the key setup code.
 */
static inline void
aesni_dec8(int rounds, const __m128i *keysched, __m128i a,
    __m128i b, __m128i c, __m128i d, __m128i e, __m128i f, __m128i g,
    __m128i h, __m128i out[8])
{
	const __m128i *rk = keysched;	/* next round key to consume */
	__m128i key;
	int left;

	/* Initial key addition with round key 0. */
	key = *rk++;
	a = _mm_xor_si128(a, key);
	b = _mm_xor_si128(b, key);
	c = _mm_xor_si128(c, key);
	d = _mm_xor_si128(d, key);
	e = _mm_xor_si128(e, key);
	f = _mm_xor_si128(f, key);
	g = _mm_xor_si128(g, key);
	h = _mm_xor_si128(h, key);

	/* One round key per full round, shared by all eight blocks. */
	for (left = rounds; left > 0; left--) {
		key = *rk++;
		a = _mm_aesdec_si128(a, key);
		b = _mm_aesdec_si128(b, key);
		c = _mm_aesdec_si128(c, key);
		d = _mm_aesdec_si128(d, key);
		e = _mm_aesdec_si128(e, key);
		f = _mm_aesdec_si128(f, key);
		g = _mm_aesdec_si128(g, key);
		h = _mm_aesdec_si128(h, key);
	}

	/* Final round: rk points just past the last key the loop consumed. */
	out[0] = _mm_aesdeclast_si128(a, *rk);
	out[1] = _mm_aesdeclast_si128(b, *rk);
	out[2] = _mm_aesdeclast_si128(c, *rk);
	out[3] = _mm_aesdeclast_si128(d, *rk);
	out[4] = _mm_aesdeclast_si128(e, *rk);
	out[5] = _mm_aesdeclast_si128(f, *rk);
	out[6] = _mm_aesdeclast_si128(g, *rk);
	out[7] = _mm_aesdeclast_si128(h, *rk);
}
107 
/*
 * Encrypt a single 128-bit block and return the result.
 *
 * `from' is XORed with keysched[0], put through `rounds' AESENC steps keyed
 * by keysched[1..rounds], and finished with AESENCLAST keyed by
 * keysched[rounds + 1].  The schedule must therefore provide at least
 * rounds + 2 round keys.  A non-positive `rounds' skips the AESENC steps and
 * finishes with keysched[1].
 *
 * NOTE(review): this means `rounds' counts only the full (non-final) rounds;
 * presumably callers pass the AES round count minus one -- confirm at the
 * call sites.
 */
static inline __m128i
aesni_enc(int rounds, const __m128i *keysched, const __m128i from)
{
	const __m128i *rk = keysched;	/* next round key to consume */
	__m128i state;
	int left;

	/* Initial key addition with round key 0. */
	state = _mm_xor_si128(from, *rk++);

	for (left = rounds; left > 0; left--)
		state = _mm_aesenc_si128(state, *rk++);

	/* rk now points just past the last key the loop consumed. */
	return (_mm_aesenclast_si128(state, *rk));
}
121 
/*
 * Decrypt a single 128-bit block and return the result.
 *
 * `from' is XORed with keysched[0], put through `rounds' AESDEC steps keyed
 * by keysched[1..rounds], and finished with AESDECLAST keyed by
 * keysched[rounds + 1].  The schedule must therefore provide at least
 * rounds + 2 round keys.  A non-positive `rounds' skips the AESDEC steps and
 * finishes with keysched[1].
 *
 * The schedule is consumed in ascending index order exactly as supplied.
 * NOTE(review): it presumably has to be a decryption schedule already in the
 * form AESDEC expects -- confirm against the key setup code.
 */
static inline __m128i
aesni_dec(int rounds, const __m128i *keysched, const __m128i from)
{
	const __m128i *rk = keysched;	/* next round key to consume */
	__m128i state;
	int left;

	/* Initial key addition with round key 0. */
	state = _mm_xor_si128(from, *rk++);

	for (left = rounds; left > 0; left--)
		state = _mm_aesdec_si128(state, *rk++);

	/* rk now points just past the last key the loop consumed. */
	return (_mm_aesdeclast_si128(state, *rk));
}
135