1b2441318SGreg Kroah-Hartman // SPDX-License-Identifier: GPL-2.0 21da177e4SLinus Torvalds /* 31da177e4SLinus Torvalds * arch/alpha/lib/checksum.c 41da177e4SLinus Torvalds * 51da177e4SLinus Torvalds * This file contains network checksum routines that are better done 61da177e4SLinus Torvalds * in an architecture-specific manner due to speed.. 71da177e4SLinus Torvalds * Comments in other versions indicate that the algorithms are from RFC1071 81da177e4SLinus Torvalds * 9c3a2ddeeSSimon Arlott * accelerated versions (and 21264 assembly versions ) contributed by 101da177e4SLinus Torvalds * Rick Gorton <rick.gorton@alpha-processor.com> 111da177e4SLinus Torvalds */ 121da177e4SLinus Torvalds 131da177e4SLinus Torvalds #include <linux/module.h> 141da177e4SLinus Torvalds #include <linux/string.h> 156e8d0237SAl Viro #include <net/checksum.h> 161da177e4SLinus Torvalds 171da177e4SLinus Torvalds #include <asm/byteorder.h> 18*0069455bSKent Overstreet #include <asm/checksum.h> 191da177e4SLinus Torvalds 201da177e4SLinus Torvalds static inline unsigned short from64to16(unsigned long x) 211da177e4SLinus Torvalds { 221da177e4SLinus Torvalds /* Using extract instructions is a bit more efficient 231da177e4SLinus Torvalds than the original shift/bitmask version. */ 241da177e4SLinus Torvalds 251da177e4SLinus Torvalds union { 261da177e4SLinus Torvalds unsigned long ul; 271da177e4SLinus Torvalds unsigned int ui[2]; 281da177e4SLinus Torvalds unsigned short us[4]; 291da177e4SLinus Torvalds } in_v, tmp_v, out_v; 301da177e4SLinus Torvalds 311da177e4SLinus Torvalds in_v.ul = x; 321da177e4SLinus Torvalds tmp_v.ul = (unsigned long) in_v.ui[0] + (unsigned long) in_v.ui[1]; 331da177e4SLinus Torvalds 341da177e4SLinus Torvalds /* Since the bits of tmp_v.sh[3] are going to always be zero, 351da177e4SLinus Torvalds we don't have to bother to add that in. */ 361da177e4SLinus Torvalds out_v.ul = (unsigned long) tmp_v.us[0] + (unsigned long) tmp_v.us[1] 371da177e4SLinus Torvalds + (unsigned long) tmp_v.us[2]; 381da177e4SLinus Torvalds 391da177e4SLinus Torvalds /* Similarly, out_v.us[2] is always zero for the final add. */ 401da177e4SLinus Torvalds return out_v.us[0] + out_v.us[1]; 411da177e4SLinus Torvalds } 421da177e4SLinus Torvalds 431da177e4SLinus Torvalds /* 441da177e4SLinus Torvalds * computes the checksum of the TCP/UDP pseudo-header 451da177e4SLinus Torvalds * returns a 16-bit checksum, already complemented. 461da177e4SLinus Torvalds */ 479be259aaSAl Viro __sum16 csum_tcpudp_magic(__be32 saddr, __be32 daddr, 4801cfbad7SAlexander Duyck __u32 len, __u8 proto, __wsum sum) 491da177e4SLinus Torvalds { 509be259aaSAl Viro return (__force __sum16)~from64to16( 519be259aaSAl Viro (__force u64)saddr + (__force u64)daddr + 529be259aaSAl Viro (__force u64)sum + ((len + proto) << 8)); 531da177e4SLinus Torvalds } 5400fc0e0dSAl Viro EXPORT_SYMBOL(csum_tcpudp_magic); 551da177e4SLinus Torvalds 569be259aaSAl Viro __wsum csum_tcpudp_nofold(__be32 saddr, __be32 daddr, 5701cfbad7SAlexander Duyck __u32 len, __u8 proto, __wsum sum) 581da177e4SLinus Torvalds { 591da177e4SLinus Torvalds unsigned long result; 601da177e4SLinus Torvalds 619be259aaSAl Viro result = (__force u64)saddr + (__force u64)daddr + 629be259aaSAl Viro (__force u64)sum + ((len + proto) << 8); 631da177e4SLinus Torvalds 641da177e4SLinus Torvalds /* Fold down to 32-bits so we don't lose in the typedef-less 651da177e4SLinus Torvalds network stack. */ 661da177e4SLinus Torvalds /* 64 to 33 */ 671da177e4SLinus Torvalds result = (result & 0xffffffff) + (result >> 32); 681da177e4SLinus Torvalds /* 33 to 32 */ 691da177e4SLinus Torvalds result = (result & 0xffffffff) + (result >> 32); 709be259aaSAl Viro return (__force __wsum)result; 711da177e4SLinus Torvalds } 72547c178bSAl Viro EXPORT_SYMBOL(csum_tcpudp_nofold); 731da177e4SLinus Torvalds 741da177e4SLinus Torvalds /* 751da177e4SLinus Torvalds * Do a 64-bit checksum on an arbitrary memory area.. 761da177e4SLinus Torvalds * 771da177e4SLinus Torvalds * This isn't a great routine, but it's not _horrible_ either. The 781da177e4SLinus Torvalds * inner loop could be unrolled a bit further, and there are better 791da177e4SLinus Torvalds * ways to do the carry, but this is reasonable. 801da177e4SLinus Torvalds */ 811da177e4SLinus Torvalds static inline unsigned long do_csum(const unsigned char * buff, int len) 821da177e4SLinus Torvalds { 831da177e4SLinus Torvalds int odd, count; 841da177e4SLinus Torvalds unsigned long result = 0; 851da177e4SLinus Torvalds 861da177e4SLinus Torvalds if (len <= 0) 871da177e4SLinus Torvalds goto out; 881da177e4SLinus Torvalds odd = 1 & (unsigned long) buff; 891da177e4SLinus Torvalds if (odd) { 901da177e4SLinus Torvalds result = *buff << 8; 911da177e4SLinus Torvalds len--; 921da177e4SLinus Torvalds buff++; 931da177e4SLinus Torvalds } 941da177e4SLinus Torvalds count = len >> 1; /* nr of 16-bit words.. */ 951da177e4SLinus Torvalds if (count) { 961da177e4SLinus Torvalds if (2 & (unsigned long) buff) { 971da177e4SLinus Torvalds result += *(unsigned short *) buff; 981da177e4SLinus Torvalds count--; 991da177e4SLinus Torvalds len -= 2; 1001da177e4SLinus Torvalds buff += 2; 1011da177e4SLinus Torvalds } 1021da177e4SLinus Torvalds count >>= 1; /* nr of 32-bit words.. */ 1031da177e4SLinus Torvalds if (count) { 1041da177e4SLinus Torvalds if (4 & (unsigned long) buff) { 1051da177e4SLinus Torvalds result += *(unsigned int *) buff; 1061da177e4SLinus Torvalds count--; 1071da177e4SLinus Torvalds len -= 4; 1081da177e4SLinus Torvalds buff += 4; 1091da177e4SLinus Torvalds } 1101da177e4SLinus Torvalds count >>= 1; /* nr of 64-bit words.. */ 1111da177e4SLinus Torvalds if (count) { 1121da177e4SLinus Torvalds unsigned long carry = 0; 1131da177e4SLinus Torvalds do { 1141da177e4SLinus Torvalds unsigned long w = *(unsigned long *) buff; 1151da177e4SLinus Torvalds count--; 1161da177e4SLinus Torvalds buff += 8; 1171da177e4SLinus Torvalds result += carry; 1181da177e4SLinus Torvalds result += w; 1191da177e4SLinus Torvalds carry = (w > result); 1201da177e4SLinus Torvalds } while (count); 1211da177e4SLinus Torvalds result += carry; 1221da177e4SLinus Torvalds result = (result & 0xffffffff) + (result >> 32); 1231da177e4SLinus Torvalds } 1241da177e4SLinus Torvalds if (len & 4) { 1251da177e4SLinus Torvalds result += *(unsigned int *) buff; 1261da177e4SLinus Torvalds buff += 4; 1271da177e4SLinus Torvalds } 1281da177e4SLinus Torvalds } 1291da177e4SLinus Torvalds if (len & 2) { 1301da177e4SLinus Torvalds result += *(unsigned short *) buff; 1311da177e4SLinus Torvalds buff += 2; 1321da177e4SLinus Torvalds } 1331da177e4SLinus Torvalds } 1341da177e4SLinus Torvalds if (len & 1) 1351da177e4SLinus Torvalds result += *buff; 1361da177e4SLinus Torvalds result = from64to16(result); 1371da177e4SLinus Torvalds if (odd) 1381da177e4SLinus Torvalds result = ((result >> 8) & 0xff) | ((result & 0xff) << 8); 1391da177e4SLinus Torvalds out: 1401da177e4SLinus Torvalds return result; 1411da177e4SLinus Torvalds } 1421da177e4SLinus Torvalds 1431da177e4SLinus Torvalds /* 1441da177e4SLinus Torvalds * This is a version of ip_compute_csum() optimized for IP headers, 1451da177e4SLinus Torvalds * which always checksum on 4 octet boundaries. 1461da177e4SLinus Torvalds */ 1479be259aaSAl Viro __sum16 ip_fast_csum(const void *iph, unsigned int ihl) 1481da177e4SLinus Torvalds { 1499be259aaSAl Viro return (__force __sum16)~do_csum(iph,ihl*4); 1501da177e4SLinus Torvalds } 15100fc0e0dSAl Viro EXPORT_SYMBOL(ip_fast_csum); 1521da177e4SLinus Torvalds 1531da177e4SLinus Torvalds /* 1541da177e4SLinus Torvalds * computes the checksum of a memory block at buff, length len, 1551da177e4SLinus Torvalds * and adds in "sum" (32-bit) 1561da177e4SLinus Torvalds * 1571da177e4SLinus Torvalds * returns a 32-bit number suitable for feeding into itself 1581da177e4SLinus Torvalds * or csum_tcpudp_magic 1591da177e4SLinus Torvalds * 1601da177e4SLinus Torvalds * this function must be called with even lengths, except 1611da177e4SLinus Torvalds * for the last fragment, which may be odd 1621da177e4SLinus Torvalds * 1631da177e4SLinus Torvalds * it's best to have buff aligned on a 32-bit boundary 1641da177e4SLinus Torvalds */ 1659be259aaSAl Viro __wsum csum_partial(const void *buff, int len, __wsum sum) 1661da177e4SLinus Torvalds { 1671da177e4SLinus Torvalds unsigned long result = do_csum(buff, len); 1681da177e4SLinus Torvalds 1691da177e4SLinus Torvalds /* add in old sum, and carry.. */ 1709be259aaSAl Viro result += (__force u32)sum; 1711da177e4SLinus Torvalds /* 32+c bits -> 32 bits */ 1721da177e4SLinus Torvalds result = (result & 0xffffffff) + (result >> 32); 1739be259aaSAl Viro return (__force __wsum)result; 1741da177e4SLinus Torvalds } 1751da177e4SLinus Torvalds 1761da177e4SLinus Torvalds EXPORT_SYMBOL(csum_partial); 1771da177e4SLinus Torvalds 1781da177e4SLinus Torvalds /* 1791da177e4SLinus Torvalds * this routine is used for miscellaneous IP-like checksums, mainly 1801da177e4SLinus Torvalds * in icmp.c 1811da177e4SLinus Torvalds */ 1829be259aaSAl Viro __sum16 ip_compute_csum(const void *buff, int len) 1831da177e4SLinus Torvalds { 1849be259aaSAl Viro return (__force __sum16)~from64to16(do_csum(buff,len)); 1851da177e4SLinus Torvalds } 18600fc0e0dSAl Viro EXPORT_SYMBOL(ip_compute_csum); 187