Merge git://git.kernel.org/pub/scm/linux/kernel/git/mason/btrfs-unstable
[deliverable/linux.git] / arch / alpha / lib / checksum.c
CommitLineData
1da177e4
LT
/*
 * arch/alpha/lib/checksum.c
 *
 * This file contains network checksum routines that are better done
 * in an architecture-specific manner due to speed.
 * Comments in other versions indicate that the algorithms are from RFC1071
 *
 * accelerated versions (and 21264 assembly versions) contributed by
 *        Rick Gorton	<rick.gorton@alpha-processor.com>
 */
11
12#include <linux/module.h>
13#include <linux/string.h>
14
15#include <asm/byteorder.h>
16
/*
 * Fold a 64-bit accumulated sum down to 16 bits, adding the carries
 * back in at every step.
 *
 * The union is used to pick the 32-bit and 16-bit pieces out of a
 * 64-bit word by array index.  Indices [0]..[2] are treated as the
 * low-order pieces, which matches a little-endian layout.
 */
static inline unsigned short from64to16(unsigned long x)
{
	/* Using extract instructions is a bit more efficient
	   than the original shift/bitmask version.  */

	union {
		unsigned long	ul;
		unsigned int	ui[2];
		unsigned short	us[4];
	} in_v, tmp_v, out_v;

	/* 64 -> 33 bits: add the two 32-bit halves.  */
	in_v.ul = x;
	tmp_v.ul = (unsigned long) in_v.ui[0] + (unsigned long) in_v.ui[1];

	/* Since the bits of tmp_v.us[3] are going to always be zero,
	   we don't have to bother to add that in.  */
	out_v.ul = (unsigned long) tmp_v.us[0] + (unsigned long) tmp_v.us[1]
			+ (unsigned long) tmp_v.us[2];

	/* Similarly, out_v.us[2] is always zero for the final add.  */
	return out_v.us[0] + out_v.us[1];
}
39
40/*
41 * computes the checksum of the TCP/UDP pseudo-header
42 * returns a 16-bit checksum, already complemented.
43 */
9be259aa 44__sum16 csum_tcpudp_magic(__be32 saddr, __be32 daddr,
1da177e4
LT
45 unsigned short len,
46 unsigned short proto,
9be259aa 47 __wsum sum)
1da177e4 48{
9be259aa
AV
49 return (__force __sum16)~from64to16(
50 (__force u64)saddr + (__force u64)daddr +
51 (__force u64)sum + ((len + proto) << 8));
1da177e4
LT
52}
53
9be259aa 54__wsum csum_tcpudp_nofold(__be32 saddr, __be32 daddr,
1da177e4
LT
55 unsigned short len,
56 unsigned short proto,
9be259aa 57 __wsum sum)
1da177e4
LT
58{
59 unsigned long result;
60
9be259aa
AV
61 result = (__force u64)saddr + (__force u64)daddr +
62 (__force u64)sum + ((len + proto) << 8);
1da177e4
LT
63
64 /* Fold down to 32-bits so we don't lose in the typedef-less
65 network stack. */
66 /* 64 to 33 */
67 result = (result & 0xffffffff) + (result >> 32);
68 /* 33 to 32 */
69 result = (result & 0xffffffff) + (result >> 32);
9be259aa 70 return (__force __wsum)result;
1da177e4 71}
547c178b 72EXPORT_SYMBOL(csum_tcpudp_nofold);
1da177e4
LT
73
/*
 * Do a 64-bit checksum on an arbitrary memory area..
 *
 * This isn't a great routine, but it's not _horrible_ either. The
 * inner loop could be unrolled a bit further, and there are better
 * ways to do the carry, but this is reasonable.
 *
 * Returns the sum of the len bytes at buff folded to 16 bits by
 * from64to16(); the value is not complemented.  Returns 0 when
 * len <= 0.
 *
 * The buffer is consumed in steps of 1, 2 and 4 bytes until the
 * pointer is 8-byte aligned, then in 64-bit words, and finally the
 * 4-, 2- and 1-byte tail is added.
 */
static inline unsigned long do_csum(const unsigned char * buff, int len)
{
	int odd, count;
	unsigned long result = 0;

	if (len <= 0)
		goto out;
	odd = 1 & (unsigned long) buff;
	if (odd) {
		/* Odd start address: take the first byte as the high
		   byte; the folded result is byte-swapped at the end.  */
		result = *buff << 8;
		len--;
		buff++;
	}
	count = len >> 1;		/* nr of 16-bit words.. */
	if (count) {
		if (2 & (unsigned long) buff) {
			result += *(unsigned short *) buff;
			count--;
			len -= 2;
			buff += 2;
		}
		count >>= 1;		/* nr of 32-bit words.. */
		if (count) {
			if (4 & (unsigned long) buff) {
				result += *(unsigned int *) buff;
				count--;
				len -= 4;
				buff += 4;
			}
			count >>= 1;	/* nr of 64-bit words.. */
			if (count) {
				unsigned long carry = 0;
				do {
					unsigned long w = *(unsigned long *) buff;
					count--;
					buff += 8;
					/* Add the carry of the previous
					   step, then detect wrap-around
					   of this one: the sum wrapped
					   iff it is now smaller than w.  */
					result += carry;
					result += w;
					carry = (w > result);
				} while (count);
				result += carry;
				/* 64 -> 33 bits, leaving headroom for
				   the tail additions below.  */
				result = (result & 0xffffffff) + (result >> 32);
			}
			if (len & 4) {
				result += *(unsigned int *) buff;
				buff += 4;
			}
		}
		if (len & 2) {
			result += *(unsigned short *) buff;
			buff += 2;
		}
	}
	if (len & 1)
		result += *buff;
	result = from64to16(result);
	if (odd)
		result = ((result >> 8) & 0xff) | ((result & 0xff) << 8);
out:
	return result;
}
142
143/*
144 * This is a version of ip_compute_csum() optimized for IP headers,
145 * which always checksum on 4 octet boundaries.
146 */
9be259aa 147__sum16 ip_fast_csum(const void *iph, unsigned int ihl)
1da177e4 148{
9be259aa 149 return (__force __sum16)~do_csum(iph,ihl*4);
1da177e4
LT
150}
151
152/*
153 * computes the checksum of a memory block at buff, length len,
154 * and adds in "sum" (32-bit)
155 *
156 * returns a 32-bit number suitable for feeding into itself
157 * or csum_tcpudp_magic
158 *
159 * this function must be called with even lengths, except
160 * for the last fragment, which may be odd
161 *
162 * it's best to have buff aligned on a 32-bit boundary
163 */
9be259aa 164__wsum csum_partial(const void *buff, int len, __wsum sum)
1da177e4
LT
165{
166 unsigned long result = do_csum(buff, len);
167
168 /* add in old sum, and carry.. */
9be259aa 169 result += (__force u32)sum;
1da177e4
LT
170 /* 32+c bits -> 32 bits */
171 result = (result & 0xffffffff) + (result >> 32);
9be259aa 172 return (__force __wsum)result;
1da177e4
LT
173}
174
175EXPORT_SYMBOL(csum_partial);
176
177/*
178 * this routine is used for miscellaneous IP-like checksums, mainly
179 * in icmp.c
180 */
9be259aa 181__sum16 ip_compute_csum(const void *buff, int len)
1da177e4 182{
9be259aa 183 return (__force __sum16)~from64to16(do_csum(buff,len));
1da177e4 184}
This page took 0.570075 seconds and 5 git commands to generate.