// SPDX-License-Identifier: GPL-2.0
/*
 * arch/alpha/lib/checksum.c
 *
 * This file contains network checksum routines that are better done
 * in an architecture-specific manner due to speed..
 * Comments in other versions indicate that the algorithms are from RFC1071
 *
 * accelerated versions (and 21264 assembly versions ) contributed by
 *	Rick Gorton	<rick.gorton@alpha-processor.com>
 */
121da177e4SLinus Torvalds
131da177e4SLinus Torvalds #include <linux/module.h>
141da177e4SLinus Torvalds #include <linux/string.h>
151da177e4SLinus Torvalds
161da177e4SLinus Torvalds #include <asm/byteorder.h>
171da177e4SLinus Torvalds
/*
 * Fold a 64-bit partial sum down to 16 bits by repeatedly adding the
 * narrower lanes of the value together (end-around carry).
 *
 * The union views below rely on unsigned long being 64 bits wide,
 * unsigned int 32 bits and unsigned short 16 bits.
 */
static inline unsigned short from64to16(unsigned long x)
{
	/* Using extract instructions is a bit more efficient
	   than the original shift/bitmask version.  */

	union {
		unsigned long	ul;
		unsigned int	ui[2];
		unsigned short	us[4];
	} in_v, tmp_v, out_v;

	in_v.ul = x;
	/* 64 -> 33 bits: add the two 32-bit halves. */
	tmp_v.ul = (unsigned long) in_v.ui[0] + (unsigned long) in_v.ui[1];

	/* Since the bits of tmp_v.us[3] are going to always be zero,
	   we don't have to bother to add that in.  */
	out_v.ul = (unsigned long) tmp_v.us[0] + (unsigned long) tmp_v.us[1]
			+ (unsigned long) tmp_v.us[2];

	/* Similarly, out_v.us[2] is always zero for the final add.  */
	return out_v.us[0] + out_v.us[1];
}
401da177e4SLinus Torvalds
411da177e4SLinus Torvalds /*
421da177e4SLinus Torvalds * computes the checksum of the TCP/UDP pseudo-header
431da177e4SLinus Torvalds * returns a 16-bit checksum, already complemented.
441da177e4SLinus Torvalds */
csum_tcpudp_magic(__be32 saddr,__be32 daddr,__u32 len,__u8 proto,__wsum sum)459be259aaSAl Viro __sum16 csum_tcpudp_magic(__be32 saddr, __be32 daddr,
4601cfbad7SAlexander Duyck __u32 len, __u8 proto, __wsum sum)
471da177e4SLinus Torvalds {
489be259aaSAl Viro return (__force __sum16)~from64to16(
499be259aaSAl Viro (__force u64)saddr + (__force u64)daddr +
509be259aaSAl Viro (__force u64)sum + ((len + proto) << 8));
511da177e4SLinus Torvalds }
5200fc0e0dSAl Viro EXPORT_SYMBOL(csum_tcpudp_magic);
531da177e4SLinus Torvalds
/*
 * Same pseudo-header sum as csum_tcpudp_magic(), but the result is only
 * folded down to 32 bits and is not complemented.
 */
__wsum csum_tcpudp_nofold(__be32 saddr, __be32 daddr,
			  __u32 len, __u8 proto, __wsum sum)
{
	unsigned long result;

	result = (__force u64)saddr + (__force u64)daddr +
		 (__force u64)sum + ((len + proto) << 8);

	/* Fold down to 32-bits so we don't lose in the typedef-less
	   network stack.  */
	/* 64 to 33 */
	result = (result & 0xffffffff) + (result >> 32);
	/* 33 to 32 */
	result = (result & 0xffffffff) + (result >> 32);
	return (__force __wsum)result;
}
EXPORT_SYMBOL(csum_tcpudp_nofold);
711da177e4SLinus Torvalds
/*
 * Do a 64-bit checksum on an arbitrary memory area..
 *
 * This isn't a great routine, but it's not _horrible_ either. The
 * inner loop could be unrolled a bit further, and there are better
 * ways to do the carry, but this is reasonable.
 *
 * buff: start of the area to sum
 * len:  number of bytes to sum; len <= 0 yields 0
 *
 * The pointer is stepped up to 2-, 4- and then 8-byte alignment by
 * consuming one byte, one 16-bit word and one 32-bit word as needed,
 * the bulk is added as 64-bit words, and the 4/2/1 byte tail is added
 * last.  The return value has already been folded to 16 bits by
 * from64to16().
 */
static inline unsigned long do_csum(const unsigned char * buff, int len)
{
	int odd, count;
	unsigned long result = 0;

	if (len <= 0)
		goto out;
	odd = 1 & (unsigned long) buff;
	if (odd) {
		/* Leading byte at an odd address: add it shifted up by
		   one byte; the folded result is byte-swapped below.  */
		result = *buff << 8;
		len--;
		buff++;
	}
	count = len >> 1;		/* nr of 16-bit words.. */
	if (count) {
		if (2 & (unsigned long) buff) {
			result += *(unsigned short *) buff;
			count--;
			len -= 2;
			buff += 2;
		}
		count >>= 1;		/* nr of 32-bit words.. */
		if (count) {
			if (4 & (unsigned long) buff) {
				result += *(unsigned int *) buff;
				count--;
				len -= 4;
				buff += 4;
			}
			count >>= 1;	/* nr of 64-bit words.. */
			if (count) {
				unsigned long carry = 0;
				do {
					unsigned long w = *(unsigned long *) buff;
					count--;
					buff += 8;
					/* Add the carry from the previous
					   round, then this word; the sum
					   wrapped if it ended up below w.  */
					result += carry;
					result += w;
					carry = (w > result);
				} while (count);
				result += carry;
				/* 64 -> 33 bits, leaving headroom for the
				   tail additions below.  */
				result = (result & 0xffffffff) + (result >> 32);
			}
			if (len & 4) {
				result += *(unsigned int *) buff;
				buff += 4;
			}
		}
		if (len & 2) {
			result += *(unsigned short *) buff;
			buff += 2;
		}
	}
	if (len & 1)
		result += *buff;
	result = from64to16(result);
	/* Undo the one-byte shift introduced by the odd start address. */
	if (odd)
		result = ((result >> 8) & 0xff) | ((result & 0xff) << 8);
out:
	return result;
}
1401da177e4SLinus Torvalds
1411da177e4SLinus Torvalds /*
1421da177e4SLinus Torvalds * This is a version of ip_compute_csum() optimized for IP headers,
1431da177e4SLinus Torvalds * which always checksum on 4 octet boundaries.
1441da177e4SLinus Torvalds */
ip_fast_csum(const void * iph,unsigned int ihl)1459be259aaSAl Viro __sum16 ip_fast_csum(const void *iph, unsigned int ihl)
1461da177e4SLinus Torvalds {
1479be259aaSAl Viro return (__force __sum16)~do_csum(iph,ihl*4);
1481da177e4SLinus Torvalds }
14900fc0e0dSAl Viro EXPORT_SYMBOL(ip_fast_csum);
1501da177e4SLinus Torvalds
1511da177e4SLinus Torvalds /*
1521da177e4SLinus Torvalds * computes the checksum of a memory block at buff, length len,
1531da177e4SLinus Torvalds * and adds in "sum" (32-bit)
1541da177e4SLinus Torvalds *
1551da177e4SLinus Torvalds * returns a 32-bit number suitable for feeding into itself
1561da177e4SLinus Torvalds * or csum_tcpudp_magic
1571da177e4SLinus Torvalds *
1581da177e4SLinus Torvalds * this function must be called with even lengths, except
1591da177e4SLinus Torvalds * for the last fragment, which may be odd
1601da177e4SLinus Torvalds *
1611da177e4SLinus Torvalds * it's best to have buff aligned on a 32-bit boundary
1621da177e4SLinus Torvalds */
csum_partial(const void * buff,int len,__wsum sum)1639be259aaSAl Viro __wsum csum_partial(const void *buff, int len, __wsum sum)
1641da177e4SLinus Torvalds {
1651da177e4SLinus Torvalds unsigned long result = do_csum(buff, len);
1661da177e4SLinus Torvalds
1671da177e4SLinus Torvalds /* add in old sum, and carry.. */
1689be259aaSAl Viro result += (__force u32)sum;
1691da177e4SLinus Torvalds /* 32+c bits -> 32 bits */
1701da177e4SLinus Torvalds result = (result & 0xffffffff) + (result >> 32);
1719be259aaSAl Viro return (__force __wsum)result;
1721da177e4SLinus Torvalds }
1731da177e4SLinus Torvalds
1741da177e4SLinus Torvalds EXPORT_SYMBOL(csum_partial);
1751da177e4SLinus Torvalds
1761da177e4SLinus Torvalds /*
1771da177e4SLinus Torvalds * this routine is used for miscellaneous IP-like checksums, mainly
1781da177e4SLinus Torvalds * in icmp.c
1791da177e4SLinus Torvalds */
ip_compute_csum(const void * buff,int len)1809be259aaSAl Viro __sum16 ip_compute_csum(const void *buff, int len)
1811da177e4SLinus Torvalds {
1829be259aaSAl Viro return (__force __sum16)~from64to16(do_csum(buff,len));
1831da177e4SLinus Torvalds }
18400fc0e0dSAl Viro EXPORT_SYMBOL(ip_compute_csum);
185