// SPDX-License-Identifier: GPL-2.0
/*
 * arch/alpha/lib/checksum.c
 *
 * This file contains network checksum routines that are better done
 * in an architecture-specific manner for speed.
 * Comments in other versions indicate that the algorithms are from RFC1071.
 *
 * Accelerated versions (and 21264 assembly versions) contributed by
 *	Rick Gorton	<rick.gorton@alpha-processor.com>
 */
128c2ecf20Sopenharmony_ci
138c2ecf20Sopenharmony_ci#include <linux/module.h>
148c2ecf20Sopenharmony_ci#include <linux/string.h>
158c2ecf20Sopenharmony_ci
168c2ecf20Sopenharmony_ci#include <asm/byteorder.h>
178c2ecf20Sopenharmony_ci
static inline unsigned short from64to16(unsigned long x)
{
	/*
	 * Fold a 64-bit accumulator down to 16 bits with end-around
	 * carry, in three narrowing steps.  Written with shifts and
	 * masks; assumes unsigned long is 64 bits wide.
	 */
	unsigned long sum33, sum17;

	/* Low 32 bits plus high 32 bits: the result needs at most 33 bits. */
	sum33 = (x & 0xffffffffUL) + (x >> 32);

	/*
	 * Add the three 16-bit pieces of that value.  Bits 48-63 are
	 * always zero at this point, so there is no fourth piece to add.
	 */
	sum17 = (sum33 & 0xffff) + ((sum33 >> 16) & 0xffff)
			+ ((sum33 >> 32) & 0xffff);

	/*
	 * Only bits 0-16 can be set now, so one more add of the low
	 * 16 bits and the single carry bit finishes the fold.
	 */
	return (sum17 & 0xffff) + ((sum17 >> 16) & 0xffff);
}
408c2ecf20Sopenharmony_ci
418c2ecf20Sopenharmony_ci/*
428c2ecf20Sopenharmony_ci * computes the checksum of the TCP/UDP pseudo-header
438c2ecf20Sopenharmony_ci * returns a 16-bit checksum, already complemented.
448c2ecf20Sopenharmony_ci */
458c2ecf20Sopenharmony_ci__sum16 csum_tcpudp_magic(__be32 saddr, __be32 daddr,
468c2ecf20Sopenharmony_ci			  __u32 len, __u8 proto, __wsum sum)
478c2ecf20Sopenharmony_ci{
488c2ecf20Sopenharmony_ci	return (__force __sum16)~from64to16(
498c2ecf20Sopenharmony_ci		(__force u64)saddr + (__force u64)daddr +
508c2ecf20Sopenharmony_ci		(__force u64)sum + ((len + proto) << 8));
518c2ecf20Sopenharmony_ci}
528c2ecf20Sopenharmony_ciEXPORT_SYMBOL(csum_tcpudp_magic);
538c2ecf20Sopenharmony_ci
548c2ecf20Sopenharmony_ci__wsum csum_tcpudp_nofold(__be32 saddr, __be32 daddr,
558c2ecf20Sopenharmony_ci			  __u32 len, __u8 proto, __wsum sum)
568c2ecf20Sopenharmony_ci{
578c2ecf20Sopenharmony_ci	unsigned long result;
588c2ecf20Sopenharmony_ci
598c2ecf20Sopenharmony_ci	result = (__force u64)saddr + (__force u64)daddr +
608c2ecf20Sopenharmony_ci		 (__force u64)sum + ((len + proto) << 8);
618c2ecf20Sopenharmony_ci
628c2ecf20Sopenharmony_ci	/* Fold down to 32-bits so we don't lose in the typedef-less
638c2ecf20Sopenharmony_ci	   network stack.  */
648c2ecf20Sopenharmony_ci	/* 64 to 33 */
658c2ecf20Sopenharmony_ci	result = (result & 0xffffffff) + (result >> 32);
668c2ecf20Sopenharmony_ci	/* 33 to 32 */
678c2ecf20Sopenharmony_ci	result = (result & 0xffffffff) + (result >> 32);
688c2ecf20Sopenharmony_ci	return (__force __wsum)result;
698c2ecf20Sopenharmony_ci}
708c2ecf20Sopenharmony_ciEXPORT_SYMBOL(csum_tcpudp_nofold);
718c2ecf20Sopenharmony_ci
/*
 * Checksum an arbitrary memory area using 64-bit accumulation.
 *
 * The buffer is consumed in stages: a leading byte, 16-bit word and
 * 32-bit word as needed to reach 8-byte alignment, then a run of
 * 64-bit words, then whatever 4/2/1-byte tail is left.  The inner
 * loop could be unrolled further and the carry could be handled more
 * cleverly, but this is reasonable.
 *
 * Returns the sum folded to 16 bits (not complemented), or 0 when
 * len <= 0.
 */
static inline unsigned long do_csum(const unsigned char * buff, int len)
{
	unsigned long sum = 0;
	int start_odd, units;

	if (len <= 0)
		return 0;

	/* Odd start address: take one byte so the rest is 2-byte aligned. */
	start_odd = 1 & (unsigned long) buff;
	if (start_odd) {
		sum = *buff << 8;
		buff++;
		len--;
	}

	/* Number of 16-bit words left; take one if not 4-byte aligned. */
	units = len >> 1;
	if (units && (2 & (unsigned long) buff)) {
		sum += *(unsigned short *) buff;
		buff += 2;
		len -= 2;
		units--;
	}

	/* Number of 32-bit words left; take one if not 8-byte aligned. */
	units >>= 1;
	if (units && (4 & (unsigned long) buff)) {
		sum += *(unsigned int *) buff;
		buff += 4;
		len -= 4;
		units--;
	}

	/* Number of 64-bit words left. */
	units >>= 1;
	if (units) {
		unsigned long carry = 0;

		for (; units; units--) {
			unsigned long quad = *(unsigned long *) buff;

			buff += 8;
			/* Feed back the carry out of the previous add. */
			sum += carry;
			sum += quad;
			/* The add wrapped iff the sum is now below the addend. */
			carry = (quad > sum);
		}
		sum += carry;
		/* Make room for the tail adds below. */
		sum = (sum & 0xffffffff) + (sum >> 32);
	}

	/*
	 * Tail.  The 64-bit loop does not update len, but it only
	 * consumes multiples of 8, so the low three bits of len still
	 * describe the bytes that remain.
	 */
	if (len & 4) {
		sum += *(unsigned int *) buff;
		buff += 4;
	}
	if (len & 2) {
		sum += *(unsigned short *) buff;
		buff += 2;
	}
	if (len & 1)
		sum += *buff;

	sum = from64to16(sum);

	/*
	 * An odd start address means every byte was added in the
	 * opposite half of its 16-bit word; swap the two bytes of the
	 * folded sum to compensate.
	 */
	if (start_odd)
		sum = ((sum >> 8) & 0xff) | ((sum & 0xff) << 8);
	return sum;
}
1408c2ecf20Sopenharmony_ci
1418c2ecf20Sopenharmony_ci/*
1428c2ecf20Sopenharmony_ci *	This is a version of ip_compute_csum() optimized for IP headers,
1438c2ecf20Sopenharmony_ci *	which always checksum on 4 octet boundaries.
1448c2ecf20Sopenharmony_ci */
1458c2ecf20Sopenharmony_ci__sum16 ip_fast_csum(const void *iph, unsigned int ihl)
1468c2ecf20Sopenharmony_ci{
1478c2ecf20Sopenharmony_ci	return (__force __sum16)~do_csum(iph,ihl*4);
1488c2ecf20Sopenharmony_ci}
1498c2ecf20Sopenharmony_ciEXPORT_SYMBOL(ip_fast_csum);
1508c2ecf20Sopenharmony_ci
1518c2ecf20Sopenharmony_ci/*
1528c2ecf20Sopenharmony_ci * computes the checksum of a memory block at buff, length len,
1538c2ecf20Sopenharmony_ci * and adds in "sum" (32-bit)
1548c2ecf20Sopenharmony_ci *
1558c2ecf20Sopenharmony_ci * returns a 32-bit number suitable for feeding into itself
1568c2ecf20Sopenharmony_ci * or csum_tcpudp_magic
1578c2ecf20Sopenharmony_ci *
1588c2ecf20Sopenharmony_ci * this function must be called with even lengths, except
1598c2ecf20Sopenharmony_ci * for the last fragment, which may be odd
1608c2ecf20Sopenharmony_ci *
1618c2ecf20Sopenharmony_ci * it's best to have buff aligned on a 32-bit boundary
1628c2ecf20Sopenharmony_ci */
1638c2ecf20Sopenharmony_ci__wsum csum_partial(const void *buff, int len, __wsum sum)
1648c2ecf20Sopenharmony_ci{
1658c2ecf20Sopenharmony_ci	unsigned long result = do_csum(buff, len);
1668c2ecf20Sopenharmony_ci
1678c2ecf20Sopenharmony_ci	/* add in old sum, and carry.. */
1688c2ecf20Sopenharmony_ci	result += (__force u32)sum;
1698c2ecf20Sopenharmony_ci	/* 32+c bits -> 32 bits */
1708c2ecf20Sopenharmony_ci	result = (result & 0xffffffff) + (result >> 32);
1718c2ecf20Sopenharmony_ci	return (__force __wsum)result;
1728c2ecf20Sopenharmony_ci}
1738c2ecf20Sopenharmony_ci
1748c2ecf20Sopenharmony_ciEXPORT_SYMBOL(csum_partial);
1758c2ecf20Sopenharmony_ci
1768c2ecf20Sopenharmony_ci/*
1778c2ecf20Sopenharmony_ci * this routine is used for miscellaneous IP-like checksums, mainly
1788c2ecf20Sopenharmony_ci * in icmp.c
1798c2ecf20Sopenharmony_ci */
1808c2ecf20Sopenharmony_ci__sum16 ip_compute_csum(const void *buff, int len)
1818c2ecf20Sopenharmony_ci{
1828c2ecf20Sopenharmony_ci	return (__force __sum16)~from64to16(do_csum(buff,len));
1838c2ecf20Sopenharmony_ci}
1848c2ecf20Sopenharmony_ciEXPORT_SYMBOL(ip_compute_csum);
185