/* SPDX-License-Identifier: GPL-2.0-or-later */
#ifndef _ASM_POWERPC_CHECKSUM_H
#define _ASM_POWERPC_CHECKSUM_H
#ifdef __KERNEL__

#include <linux/bitops.h>
#include <linux/in6.h>
/*
 * Computes the checksum of a memory block at src, length len,
 * while copying the block to dst.
 *
 * Like csum_partial, this must be called with even lengths,
 * except for the last fragment.
 */
extern __wsum csum_partial_copy_generic(const void *src, void *dst, int len);

#define _HAVE_ARCH_COPY_AND_CSUM_FROM_USER
extern __wsum csum_and_copy_from_user(const void __user *src, void *dst,
				      int len);
#define HAVE_CSUM_COPY_USER
extern __wsum csum_and_copy_to_user(const void *src, void __user *dst,
				    int len);

#define _HAVE_ARCH_CSUM_AND_COPY
#define csum_partial_copy_nocheck(src, dst, len) \
	csum_partial_copy_generic((src), (dst), (len))

/*
 * Turns a 32-bit partial checksum (e.g. from csum_partial) into a
 * 1's complement 16-bit checksum.
 */
static inline __sum16 csum_fold(__wsum sum)
{
	unsigned int tmp;

	/* swap the two 16-bit halves of sum */
	__asm__("rlwinm %0,%1,16,0,31" : "=r" (tmp) : "r" (sum));
	/*
	 * If there is a carry from adding the two 16-bit halves,
	 * it will carry from the lower half into the upper half,
	 * giving us the correct sum in the upper half.
	 */
	return (__force __sum16)(~((__force u32)sum + tmp) >> 16);
}
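
/*
 * Worked example (editorial, not in the original source): for
 * sum = 0x12345678 the rotate gives tmp = 0x56781234, the 32-bit add
 * gives 0x68ac68ac, and ~0x68ac68ac >> 16 = 0x9753, i.e. the one's
 * complement of the 16-bit halves' sum 0x1234 + 0x5678 = 0x68ac.
 */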

/*
 * Fold a 64-bit sum down to 32 bits with end-around carry: adding x to
 * itself rotated by 32 bits leaves hi + lo (plus the carry between the
 * halves) in the upper word.
 */
static inline u32 from64to32(u64 x)
{
	return (x + ror64(x, 32)) >> 32;
}
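
/*
 * Worked example (editorial): x = 0xffffffff00000001 rotated by 32 is
 * 0x00000001ffffffff; their 64-bit sum is 0x0000000100000000, whose
 * upper word is 1, matching 0xffffffff + 0x00000001 with the carry
 * wrapped around.
 */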

static inline __wsum csum_tcpudp_nofold(__be32 saddr, __be32 daddr, __u32 len,
					__u8 proto, __wsum sum)
{
#ifdef __powerpc64__
	u64 s = (__force u32)sum;

	s += (__force u32)saddr;
	s += (__force u32)daddr;
#ifdef __BIG_ENDIAN__
	s += proto + len;
#else
	s += (proto + len) << 8;
#endif
	return (__force __wsum) from64to32(s);
#else
    __asm__("\n\
	addc %0,%0,%1 \n\
	adde %0,%0,%2 \n\
	adde %0,%0,%3 \n\
	addze %0,%0 \n\
	"
	: "=r" (sum)
	: "r" (daddr), "r"(saddr), "r"(proto + len), "0"(sum));
	return sum;
#endif
}
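
/*
 * Editorial note: checksum words are accumulated in memory (network) byte
 * order. One's complement sums are taken mod 0xffff, where a left shift
 * by 8 is equivalent to byte-swapping a 16-bit value, so on little-endian
 * the host-order (proto + len) is shifted to match the byte lanes the
 * big-endian pseudo-header fields occupy.
 */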

/*
 * computes the checksum of the TCP/UDP pseudo-header
 * returns a 16-bit checksum, already complemented
 */
static inline __sum16 csum_tcpudp_magic(__be32 saddr, __be32 daddr, __u32 len,
					__u8 proto, __wsum sum)
{
	return csum_fold(csum_tcpudp_nofold(saddr, daddr, len, proto, sum));
}
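
/*
 * Usage sketch (editorial; the locals are hypothetical): a received TCP
 * segment checks out when the payload sum fed through the pseudo-header
 * folds to zero:
 *
 *	__wsum csum = csum_partial(tcph, len, 0);
 *	if (csum_tcpudp_magic(saddr, daddr, len, IPPROTO_TCP, csum))
 *		goto csum_error;
 */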

#define HAVE_ARCH_CSUM_ADD
static inline __wsum csum_add(__wsum csum, __wsum addend)
{
#ifdef __powerpc64__
	u64 res = (__force u64)csum;
#endif
	if (__builtin_constant_p(csum) && csum == 0)
		return addend;
	if (__builtin_constant_p(addend) && addend == 0)
		return csum;

#ifdef __powerpc64__
	res += (__force u64)addend;
	return (__force __wsum)((u32)res + (res >> 32));
#else
	asm("addc %0,%0,%1;"
	    "addze %0,%0;"
	    : "+r" (csum) : "r" (addend) : "xer");
	return csum;
#endif
}
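
/*
 * Worked example (editorial): csum_add(0xffffffff, 0x2) overflows to
 * 0x100000001; both the 64-bit fold ((u32)res + (res >> 32)) and the
 * addc/addze pair wrap the carry back in, yielding 0x2.
 */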

/*
 * This is a version of ip_compute_csum() optimized for IP headers,
 * which are always checksummed on 4-octet boundaries. ihl is the
 * number of 32-bit words and is always >= 5.
 */
static inline __wsum ip_fast_csum_nofold(const void *iph, unsigned int ihl)
{
	const u32 *ptr = (const u32 *)iph + 1;
#ifdef __powerpc64__
	unsigned int i;
	u64 s = *(const u32 *)iph;

	for (i = 0; i < ihl - 1; i++, ptr++)
		s += *ptr;
	return (__force __wsum)from64to32(s);
#else
	__wsum sum, tmp;

	asm("mtctr %3;"
	    "addc %0,%4,%5;"
	    "1: lwzu %1, 4(%2);"
	    "adde %0,%0,%1;"
	    "bdnz 1b;"
	    "addze %0,%0;"
	    : "=r" (sum), "=r" (tmp), "+b" (ptr)
	    : "r" (ihl - 2), "r" (*(const u32 *)iph), "r" (*ptr)
	    : "ctr", "xer", "memory");

	return sum;
#endif
}
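
/*
 * Editorial note on the 32-bit path: addc sums the first two header
 * words, the CTR loop (ihl - 2 iterations) folds in the rest via
 * lwzu/adde, and addze absorbs the final carry.
 */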

static inline __sum16 ip_fast_csum(const void *iph, unsigned int ihl)
{
	return csum_fold(ip_fast_csum_nofold(iph, ihl));
}
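
/*
 * Usage sketch (editorial): a received IPv4 header is intact when the
 * checksum over the whole header, including its checksum field, folds
 * to zero:
 *
 *	if (ip_fast_csum(iph, iph->ihl))
 *		goto drop;
 */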

/*
 * computes the checksum of a memory block at buff, length len,
 * and adds in "sum" (32-bit)
 *
 * returns a 32-bit number suitable for feeding into itself
 * or csum_tcpudp_magic
 *
 * this function must be called with even lengths, except
 * for the last fragment, which may be odd
 *
 * it's best to have buff aligned on a 32-bit boundary
 */
__wsum __csum_partial(const void *buff, int len, __wsum sum);

static inline __wsum csum_partial(const void *buff, int len, __wsum sum)
{
	if (__builtin_constant_p(len) && len <= 16 && (len & 1) == 0) {
		if (len == 2)
			sum = csum_add(sum, (__force __wsum)*(const u16 *)buff);
		if (len >= 4)
			sum = csum_add(sum, (__force __wsum)*(const u32 *)buff);
		if (len == 6)
			sum = csum_add(sum, (__force __wsum)
					    *(const u16 *)(buff + 4));
		if (len >= 8)
			sum = csum_add(sum, (__force __wsum)
					    *(const u32 *)(buff + 4));
		if (len == 10)
			sum = csum_add(sum, (__force __wsum)
					    *(const u16 *)(buff + 8));
		if (len >= 12)
			sum = csum_add(sum, (__force __wsum)
					    *(const u32 *)(buff + 8));
		if (len == 14)
			sum = csum_add(sum, (__force __wsum)
					    *(const u16 *)(buff + 12));
		if (len >= 16)
			sum = csum_add(sum, (__force __wsum)
					    *(const u32 *)(buff + 12));
	} else if (__builtin_constant_p(len) && (len & 3) == 0) {
		sum = csum_add(sum, ip_fast_csum_nofold(buff, len >> 2));
	} else {
		sum = __csum_partial(buff, len, sum);
	}
	return sum;
}
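
/*
 * Editorial note: for a constant even len <= 16 the sum unrolls into
 * csum_add() calls on 32-bit words plus one trailing 16-bit word (e.g.
 * len == 6 reads the word at buff and the halfword at buff + 4); other
 * constant multiples of 4 reuse the IP-header loop; anything else goes
 * through the out-of-line __csum_partial().
 */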

/*
 * this routine is used for miscellaneous IP-like checksums, mainly
 * in icmp.c
 */
static inline __sum16 ip_compute_csum(const void *buff, int len)
{
	return csum_fold(csum_partial(buff, len, 0));
}
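
/*
 * Usage sketch (editorial; icmph and len are hypothetical): fill in an
 * ICMP checksum by summing the message with the field zeroed first:
 *
 *	icmph->checksum = 0;
 *	icmph->checksum = ip_compute_csum(icmph, len);
 */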

#define _HAVE_ARCH_IPV6_CSUM
__sum16 csum_ipv6_magic(const struct in6_addr *saddr,
			const struct in6_addr *daddr,
			__u32 len, __u8 proto, __wsum sum);

#endif /* __KERNEL__ */
#endif