/*
 * arch/alpha/lib/checksum.c
 *
 * This file contains network checksum routines that are better done
 * in an architecture-specific manner due to speed.
 * Comments in other versions indicate that the algorithms are from RFC1071.
 *
 * Accelerated versions (and 21264 assembly versions) contributed by
 *	Rick Gorton	<rick.gorton@alpha-processor.com>
 */
12 #include <linux/module.h>
13 #include <linux/string.h>
15 #include <asm/byteorder.h>
/*
 * Fold a 64-bit accumulated sum down to 16 bits by repeatedly adding its
 * narrower pieces together: two 32-bit halves first, then the resulting
 * 16-bit pieces, then once more to absorb the last carry.
 *
 * x: the 64-bit running sum.
 * Returns the folded 16-bit sum (not complemented).
 *
 * NOTE(review): the union declaration and the initial store of x into it
 * were missing from the copy of this file this block was restored from.
 * Member names and sizes are taken from the surviving uses (.ul,
 * .ui[0..1], .us[0..2]) -- confirm against upstream.
 *
 * NOTE(review): the "always zero" remarks below hold only when us[0] is
 * the least significant 16 bits of ul (little-endian layout) -- presumably
 * guaranteed for this architecture; confirm.
 */
static inline unsigned short from64to16(unsigned long x)
{
	/* Using extract instructions is a bit more efficient
	   than the original shift/bitmask version.  */
	union {
		unsigned long	ul;
		unsigned int	ui[2];
		unsigned short	us[4];
	} in_v, tmp_v, out_v;

	in_v.ul = x;

	/* 64 -> 33 bits: add the two 32-bit halves. */
	tmp_v.ul = (unsigned long) in_v.ui[0] + (unsigned long) in_v.ui[1];

	/* Since the bits of tmp_v.us[3] are going to always be zero,
	   we don't have to bother to add that in.  */
	out_v.ul = (unsigned long) tmp_v.us[0] + (unsigned long) tmp_v.us[1]
			+ (unsigned long) tmp_v.us[2];

	/* Similarly, out_v.us[2] is always zero for the final add.  */
	return out_v.us[0] + out_v.us[1];
}
41 * computes the checksum of the TCP/UDP pseudo-header
42 * returns a 16-bit checksum, already complemented.
44 __sum16
csum_tcpudp_magic(__be32 saddr
, __be32 daddr
,
49 return (__force __sum16
)~from64to16(
50 (__force u64
)saddr
+ (__force u64
)daddr
+
51 (__force u64
)sum
+ ((len
+ proto
) << 8));
54 __wsum
csum_tcpudp_nofold(__be32 saddr
, __be32 daddr
,
61 result
= (__force u64
)saddr
+ (__force u64
)daddr
+
62 (__force u64
)sum
+ ((len
+ proto
) << 8);
64 /* Fold down to 32-bits so we don't lose in the typedef-less
67 result
= (result
& 0xffffffff) + (result
>> 32);
69 result
= (result
& 0xffffffff) + (result
>> 32);
70 return (__force __wsum
)result
;
/*
 * Do a 64-bit checksum on an arbitrary memory area..
 *
 * This isn't a great routine, but it's not _horrible_ either. The
 * inner loop could be unrolled a bit further, and there are better
 * ways to do the carry, but this is reasonable.
 *
 * buff: start of the area to sum (any alignment).
 * len:  number of bytes; a value <= 0 yields 0.
 * Returns the sum folded to 16 bits (not complemented).
 *
 * The head of the buffer is consumed in 1-, 2- and 4-byte steps until the
 * pointer is 8-byte aligned, the bulk is summed 64 bits at a time, and the
 * tail is consumed in 4-, 2- and 1-byte steps.
 *
 * NOTE(review): the copy of this file this block was restored from had
 * lost the declarations of 'odd' and 'count', all braces and conditionals,
 * the pointer/length bookkeeping, the carry accumulation and the final
 * return.  They are restored here to fit the surviving statements and
 * comments -- verify against upstream before relying on this.
 */
static inline unsigned long do_csum(const unsigned char * buff, int len)
{
	int odd, count;
	unsigned long result = 0;

	if (len <= 0)
		goto out;

	/*
	 * Starting on an odd address puts every byte in the opposite half
	 * of its 16-bit word; sum it that way and swap the result at the end.
	 */
	odd = 1 & (unsigned long) buff;
	if (odd) {
		result = *buff << 8;
		len--;
		buff++;
	}
	count = len >> 1;		/* nr of 16-bit words.. */
	if (count) {
		if (2 & (unsigned long) buff) {
			result += *(unsigned short *) buff;
			count--;
			len -= 2;
			buff += 2;
		}
		count >>= 1;		/* nr of 32-bit words.. */
		if (count) {
			if (4 & (unsigned long) buff) {
				result += *(unsigned int *) buff;
				count--;
				len -= 4;
				buff += 4;
			}
			count >>= 1;	/* nr of 64-bit words.. */
			if (count) {
				unsigned long carry = 0;
				do {
					unsigned long w = *(unsigned long *) buff;
					count--;
					buff += 8;
					result += carry;
					result += w;
					/* unsigned wrap-around means a carry out */
					carry = (w > result);
				} while (count);
				result += carry;
				/* 64 -> 33 bits so the tail adds cannot overflow */
				result = (result & 0xffffffff) + (result >> 32);
			}
			if (len & 4) {
				result += *(unsigned int *) buff;
				buff += 4;
			}
		}
		if (len & 2) {
			result += *(unsigned short *) buff;
			buff += 2;
		}
	}
	if (len & 1)
		result += *buff;
	result = from64to16(result);
	if (odd)
		result = ((result >> 8) & 0xff) | ((result & 0xff) << 8);
out:
	return result;
}
143 * This is a version of ip_compute_csum() optimized for IP headers,
144 * which always checksum on 4 octet boundaries.
146 __sum16
ip_fast_csum(const void *iph
, unsigned int ihl
)
148 return (__force __sum16
)~do_csum(iph
,ihl
*4);
152 * computes the checksum of a memory block at buff, length len,
153 * and adds in "sum" (32-bit)
155 * returns a 32-bit number suitable for feeding into itself
156 * or csum_tcpudp_magic
158 * this function must be called with even lengths, except
159 * for the last fragment, which may be odd
161 * it's best to have buff aligned on a 32-bit boundary
163 __wsum
csum_partial(const void *buff
, int len
, __wsum sum
)
165 unsigned long result
= do_csum(buff
, len
);
167 /* add in old sum, and carry.. */
168 result
+= (__force u32
)sum
;
169 /* 32+c bits -> 32 bits */
170 result
= (result
& 0xffffffff) + (result
>> 32);
171 return (__force __wsum
)result
;
174 EXPORT_SYMBOL(csum_partial
);
177 * this routine is used for miscellaneous IP-like checksums, mainly
180 __sum16
ip_compute_csum(const void *buff
, int len
)
182 return (__force __sum16
)~from64to16(do_csum(buff
,len
));