/* SPDX-License-Identifier: GPL-2.0 */
#ifndef __SPARC_CHECKSUM_H
#define __SPARC_CHECKSUM_H

/*  checksum.h:  IP/UDP/TCP checksum routines on the Sparc.
 *
 *  Copyright(C) 1995 Linus Torvalds
 *  Copyright(C) 1995 Miguel de Icaza
 *  Copyright(C) 1996 David S. Miller
 *  Copyright(C) 1996 Eddie C. Dost
 *  Copyright(C) 1997 Jakub Jelinek
 *
 * derived from:
 *	Alpha checksum c-code
 *      ix86 inline assembly
 *      RFC1071 Computing the Internet Checksum
 */

#include <linux/in6.h>
#include <linux/uaccess.h>

/* computes the checksum of a memory block at buff, length len,
 * and adds in "sum" (32-bit)
 *
 * returns a 32-bit number suitable for feeding into itself
 * or csum_tcpudp_magic
 *
 * this function must be called with even lengths, except
 * for the last fragment, which may be odd
 *
 * it's best to have buff aligned on a 32-bit boundary
 */
__wsum csum_partial(const void *buff, int len, __wsum sum);
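
/* Illustrative usage sketch (not part of the original interface notes,
 * frag1/frag2 are hypothetical buffers): partial sums can be chained
 * across fragments and folded at the end, e.g.
 *
 *	__wsum s = csum_partial(frag1, len1, 0);
 *	s = csum_partial(frag2, len2, s);
 *	__sum16 final = csum_fold(s);
 *
 * per the comment above, only the last fragment may have an odd length.
 */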

/* the same as csum_partial, but copies from src while it
 * checksums
 *
 * here even more important to align src and dst on a 32-bit (or even
 * better 64-bit) boundary
 */

unsigned int __csum_partial_copy_sparc_generic (const unsigned char *, unsigned char *);

static inline __wsum
csum_partial_copy_nocheck(const void *src, void *dst, int len)
{
	register unsigned int ret asm("o0") = (unsigned int)src;
	register char *d asm("o1") = dst;
	register int l asm("g1") = len;

	__asm__ __volatile__ (
		"call __csum_partial_copy_sparc_generic\n\t"
		" mov -1, %%g7\n"
	: "=&r" (ret), "=&r" (d), "=&r" (l)
	: "0" (ret), "1" (d), "2" (l)
	: "o2", "o3", "o4", "o5", "o7",
	  "g2", "g3", "g4", "g5", "g7",
	  "memory", "cc");
	return (__force __wsum)ret;
}
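
/* Conceptually (a hedged sketch, not the real implementation), the
 * wrapper above behaves like the generic fallback:
 *
 *	memcpy(dst, src, len);
 *	return csum_partial(dst, len, 0);
 *
 * except that the assembly helper folds the copy and the checksum into
 * a single pass over the data.
 */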

static inline __wsum
csum_and_copy_from_user(const void __user *src, void *dst, int len)
{
	if (unlikely(!access_ok(src, len)))
		return 0;
	return csum_partial_copy_nocheck((__force void *)src, dst, len);
}

static inline __wsum
csum_and_copy_to_user(const void *src, void __user *dst, int len)
{
	if (!access_ok(dst, len))
		return 0;
	return csum_partial_copy_nocheck(src, (__force void *)dst, len);
}
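
/* Note (editorial, hedged): both helpers above follow the calling
 * convention where a return value of 0 tells the caller that the
 * user-space access failed; the "mov -1, %%g7" in the call's delay slot
 * appears to seed the helper's running sum with ~0 so a successful copy
 * never legitimately yields 0.
 */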

/* ihl is always 5 or greater, almost always is 5, and iph is word aligned
 * the majority of the time.
 */
static inline __sum16 ip_fast_csum(const void *iph, unsigned int ihl)
{
	__sum16 sum;

	/* Note: We must read %2 before we touch %0 for the first time,
	 *       because GCC can legitimately use the same register for
	 *       both operands.
	 */
	__asm__ __volatile__("sub\t%2, 4, %%g4\n\t"
			     "ld\t[%1 + 0x00], %0\n\t"
			     "ld\t[%1 + 0x04], %%g2\n\t"
			     "ld\t[%1 + 0x08], %%g3\n\t"
			     "addcc\t%%g2, %0, %0\n\t"
			     "addxcc\t%%g3, %0, %0\n\t"
			     "ld\t[%1 + 0x0c], %%g2\n\t"
			     "ld\t[%1 + 0x10], %%g3\n\t"
			     "addxcc\t%%g2, %0, %0\n\t"
			     "addx\t%0, %%g0, %0\n"
			     "1:\taddcc\t%%g3, %0, %0\n\t"
			     "add\t%1, 4, %1\n\t"
			     "addxcc\t%0, %%g0, %0\n\t"
			     "subcc\t%%g4, 1, %%g4\n\t"
			     "be,a\t2f\n\t"
			     "sll\t%0, 16, %%g2\n\t"
			     "b\t1b\n\t"
			     "ld\t[%1 + 0x10], %%g3\n"
			     "2:\taddcc\t%0, %%g2, %%g2\n\t"
			     "srl\t%%g2, 16, %0\n\t"
			     "addx\t%0, %%g0, %0\n\t"
			     "xnor\t%%g0, %0, %0"
			     : "=r" (sum), "=&r" (iph)
			     : "r" (ihl), "1" (iph)
			     : "g2", "g3", "g4", "cc", "memory");
	return sum;
}
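
/* Illustrative use (sketch with a hypothetical iph pointer): fill in or
 * verify an IPv4 header checksum, where ihl is the header length in
 * 32-bit words:
 *
 *	iph->check = 0;
 *	iph->check = ip_fast_csum(iph, iph->ihl);
 *
 * A received header checks out when ip_fast_csum() over it returns 0.
 */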

/* Fold a partial checksum without adding pseudo headers. */
static inline __sum16 csum_fold(__wsum sum)
{
	unsigned int tmp;

	__asm__ __volatile__("addcc\t%0, %1, %1\n\t"
			     "srl\t%1, 16, %1\n\t"
			     "addx\t%1, %%g0, %1\n\t"
			     "xnor\t%%g0, %1, %0"
			     : "=&r" (sum), "=r" (tmp)
			     : "0" (sum), "1" ((__force u32)sum<<16)
			     : "cc");
	return (__force __sum16)sum;
}
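
/* A rough C equivalent of the fold above (a sketch mirroring the
 * generic csum_fold(), not the exact instruction sequence):
 *
 *	u32 s = (__force u32)sum;
 *	s = (s & 0xffff) + (s >> 16);	// fold upper half into lower
 *	s = (s & 0xffff) + (s >> 16);	// absorb a possible carry
 *	return (__force __sum16)~s;	// one's complement of the result
 */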

static inline __wsum csum_tcpudp_nofold(__be32 saddr, __be32 daddr,
					__u32 len, __u8 proto,
					__wsum sum)
{
	__asm__ __volatile__("addcc\t%1, %0, %0\n\t"
			     "addxcc\t%2, %0, %0\n\t"
			     "addxcc\t%3, %0, %0\n\t"
			     "addx\t%0, %%g0, %0\n\t"
			     : "=r" (sum), "=r" (saddr)
			     : "r" (daddr), "r" (proto + len), "0" (sum),
			       "1" (saddr)
			     : "cc");
	return sum;
}

/*
 * computes the checksum of the TCP/UDP pseudo-header
 * returns a 16-bit checksum, already complemented
 */
static inline __sum16 csum_tcpudp_magic(__be32 saddr, __be32 daddr,
					__u32 len, __u8 proto,
					__wsum sum)
{
	return csum_fold(csum_tcpudp_nofold(saddr,daddr,len,proto,sum));
}
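
/* Illustrative sketch of filling in a UDP checksum with the helpers
 * above (uh, saddr, daddr and len are hypothetical variables, not part
 * of this header):
 *
 *	__wsum csum = csum_partial(udp_header_and_payload, len, 0);
 *	uh->check = csum_tcpudp_magic(saddr, daddr, len,
 *				      IPPROTO_UDP, csum);
 *	if (uh->check == 0)
 *		uh->check = CSUM_MANGLED_0;	// 0 means "no checksum" for UDP
 */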

#define _HAVE_ARCH_IPV6_CSUM

static inline __sum16 csum_ipv6_magic(const struct in6_addr *saddr,
				      const struct in6_addr *daddr,
				      __u32 len, __u8 proto, __wsum sum)
{
	__asm__ __volatile__ (
		"addcc	%3, %4, %%g4\n\t"
		"addxcc	%5, %%g4, %%g4\n\t"
		"ld	[%2 + 0x0c], %%g2\n\t"
		"ld	[%2 + 0x08], %%g3\n\t"
		"addxcc	%%g2, %%g4, %%g4\n\t"
		"ld	[%2 + 0x04], %%g2\n\t"
		"addxcc	%%g3, %%g4, %%g4\n\t"
		"ld	[%2 + 0x00], %%g3\n\t"
		"addxcc	%%g2, %%g4, %%g4\n\t"
		"ld	[%1 + 0x0c], %%g2\n\t"
		"addxcc	%%g3, %%g4, %%g4\n\t"
		"ld	[%1 + 0x08], %%g3\n\t"
		"addxcc	%%g2, %%g4, %%g4\n\t"
		"ld	[%1 + 0x04], %%g2\n\t"
		"addxcc	%%g3, %%g4, %%g4\n\t"
		"ld	[%1 + 0x00], %%g3\n\t"
		"addxcc	%%g2, %%g4, %%g4\n\t"
		"addxcc	%%g3, %%g4, %0\n\t"
		"addx	0, %0, %0\n"
		: "=&r" (sum)
		: "r" (saddr), "r" (daddr),
		  "r"(htonl(len)), "r"(htonl(proto)), "r"(sum)
		: "g2", "g3", "g4", "cc");

	return csum_fold(sum);
}
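
/* The block above sums the two 128-bit addresses together with the
 * length and protocol, i.e. the IPv6 pseudo-header of RFC 8200; the
 * usual callers are the wrappers in include/net/ip6_checksum.h (e.g.
 * tcp_v6_check()), which pass the payload checksum as @sum.
 */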

/* this routine is used for miscellaneous IP-like checksums, mainly in icmp.c */
static inline __sum16 ip_compute_csum(const void *buff, int len)
{
	return csum_fold(csum_partial(buff, len, 0));
}

#define HAVE_ARCH_CSUM_ADD
static inline __wsum csum_add(__wsum csum, __wsum addend)
{
	__asm__ __volatile__(
		"addcc   %0, %1, %0\n"
		"addx    %0, %%g0, %0"
		: "=r" (csum)
		: "r" (addend), "0" (csum));

	return csum;
}
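
/* Conceptually (a sketch similar to the generic csum_add() in
 * include/net/checksum.h): add the two partial sums and fold the carry
 * back in, i.e.
 *
 *	u32 res = (__force u32)csum + (__force u32)addend;
 *	return (__force __wsum)(res + (res < (__force u32)addend));
 */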

#endif /* !(__SPARC_CHECKSUM_H) */