Merge branch 'for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/tiwai/sound-2.6
[linux-2.6] / arch / alpha / lib / csum_partial_copy.c
1 /*
2  * csum_partial_copy - do IP checksumming and copy
3  *
4  * (C) Copyright 1996 Linus Torvalds
5  * accelerated versions (and 21264 assembly versions ) contributed by
6  *      Rick Gorton     <rick.gorton@alpha-processor.com>
7  *
8  * Don't look at this too closely - you'll go mad. The things
9  * we do for performance..
10  */
11
12 #include <linux/types.h>
13 #include <linux/string.h>
14 #include <asm/uaccess.h>
15
16
17 #define ldq_u(x,y) \
18 __asm__ __volatile__("ldq_u %0,%1":"=r" (x):"m" (*(const unsigned long *)(y)))
19
20 #define stq_u(x,y) \
21 __asm__ __volatile__("stq_u %1,%0":"=m" (*(unsigned long *)(y)):"r" (x))
22
23 #define extql(x,y,z) \
24 __asm__ __volatile__("extql %1,%2,%0":"=r" (z):"r" (x),"r" (y))
25
26 #define extqh(x,y,z) \
27 __asm__ __volatile__("extqh %1,%2,%0":"=r" (z):"r" (x),"r" (y))
28
29 #define mskql(x,y,z) \
30 __asm__ __volatile__("mskql %1,%2,%0":"=r" (z):"r" (x),"r" (y))
31
32 #define mskqh(x,y,z) \
33 __asm__ __volatile__("mskqh %1,%2,%0":"=r" (z):"r" (x),"r" (y))
34
35 #define insql(x,y,z) \
36 __asm__ __volatile__("insql %1,%2,%0":"=r" (z):"r" (x),"r" (y))
37
38 #define insqh(x,y,z) \
39 __asm__ __volatile__("insqh %1,%2,%0":"=r" (z):"r" (x),"r" (y))
40
41
42 #define __get_user_u(x,ptr)                             \
43 ({                                                      \
44         long __guu_err;                                 \
45         __asm__ __volatile__(                           \
46         "1:     ldq_u %0,%2\n"                          \
47         "2:\n"                                          \
48         ".section __ex_table,\"a\"\n"                   \
49         "       .long 1b - .\n"                         \
50         "       lda %0,2b-1b(%1)\n"                     \
51         ".previous"                                     \
52                 : "=r"(x), "=r"(__guu_err)              \
53                 : "m"(__m(ptr)), "1"(0));               \
54         __guu_err;                                      \
55 })
56
57 #define __put_user_u(x,ptr)                             \
58 ({                                                      \
59         long __puu_err;                                 \
60         __asm__ __volatile__(                           \
61         "1:     stq_u %2,%1\n"                          \
62         "2:\n"                                          \
63         ".section __ex_table,\"a\"\n"                   \
64         "       .long 1b - ."                           \
65         "       lda $31,2b-1b(%0)\n"                    \
66         ".previous"                                     \
67                 : "=r"(__puu_err)                       \
68                 : "m"(__m(addr)), "rJ"(x), "0"(0));     \
69         __puu_err;                                      \
70 })
71
72
73 static inline unsigned short from64to16(unsigned long x)
74 {
75         /* Using extract instructions is a bit more efficient
76            than the original shift/bitmask version.  */
77
78         union {
79                 unsigned long   ul;
80                 unsigned int    ui[2];
81                 unsigned short  us[4];
82         } in_v, tmp_v, out_v;
83
84         in_v.ul = x;
85         tmp_v.ul = (unsigned long) in_v.ui[0] + (unsigned long) in_v.ui[1];
86
87         /* Since the bits of tmp_v.sh[3] are going to always be zero,
88            we don't have to bother to add that in.  */
89         out_v.ul = (unsigned long) tmp_v.us[0] + (unsigned long) tmp_v.us[1]
90                         + (unsigned long) tmp_v.us[2];
91
92         /* Similarly, out_v.us[2] is always zero for the final add.  */
93         return out_v.us[0] + out_v.us[1];
94 }
95
96
97
98 /*
99  * Ok. This isn't fun, but this is the EASY case.
100  */
101 static inline unsigned long
102 csum_partial_cfu_aligned(const unsigned long __user *src, unsigned long *dst,
103                          long len, unsigned long checksum,
104                          int *errp)
105 {
106         unsigned long carry = 0;
107         int err = 0;
108
109         while (len >= 0) {
110                 unsigned long word;
111                 err |= __get_user(word, src);
112                 checksum += carry;
113                 src++;
114                 checksum += word;
115                 len -= 8;
116                 carry = checksum < word;
117                 *dst = word;
118                 dst++;
119         }
120         len += 8;
121         checksum += carry;
122         if (len) {
123                 unsigned long word, tmp;
124                 err |= __get_user(word, src);
125                 tmp = *dst;
126                 mskql(word, len, word);
127                 checksum += word;
128                 mskqh(tmp, len, tmp);
129                 carry = checksum < word;
130                 *dst = word | tmp;
131                 checksum += carry;
132         }
133         if (err) *errp = err;
134         return checksum;
135 }
136
137 /*
138  * This is even less fun, but this is still reasonably
139  * easy.
140  */
141 static inline unsigned long
142 csum_partial_cfu_dest_aligned(const unsigned long __user *src,
143                               unsigned long *dst,
144                               unsigned long soff,
145                               long len, unsigned long checksum,
146                               int *errp)
147 {
148         unsigned long first;
149         unsigned long word, carry;
150         unsigned long lastsrc = 7+len+(unsigned long)src;
151         int err = 0;
152
153         err |= __get_user_u(first,src);
154         carry = 0;
155         while (len >= 0) {
156                 unsigned long second;
157
158                 err |= __get_user_u(second, src+1);
159                 extql(first, soff, word);
160                 len -= 8;
161                 src++;
162                 extqh(second, soff, first);
163                 checksum += carry;
164                 word |= first;
165                 first = second;
166                 checksum += word;
167                 *dst = word;
168                 dst++;
169                 carry = checksum < word;
170         }
171         len += 8;
172         checksum += carry;
173         if (len) {
174                 unsigned long tmp;
175                 unsigned long second;
176                 err |= __get_user_u(second, lastsrc);
177                 tmp = *dst;
178                 extql(first, soff, word);
179                 extqh(second, soff, first);
180                 word |= first;
181                 mskql(word, len, word);
182                 checksum += word;
183                 mskqh(tmp, len, tmp);
184                 carry = checksum < word;
185                 *dst = word | tmp;
186                 checksum += carry;
187         }
188         if (err) *errp = err;
189         return checksum;
190 }
191
192 /*
193  * This is slightly less fun than the above..
194  */
195 static inline unsigned long
196 csum_partial_cfu_src_aligned(const unsigned long __user *src,
197                              unsigned long *dst,
198                              unsigned long doff,
199                              long len, unsigned long checksum,
200                              unsigned long partial_dest,
201                              int *errp)
202 {
203         unsigned long carry = 0;
204         unsigned long word;
205         unsigned long second_dest;
206         int err = 0;
207
208         mskql(partial_dest, doff, partial_dest);
209         while (len >= 0) {
210                 err |= __get_user(word, src);
211                 len -= 8;
212                 insql(word, doff, second_dest);
213                 checksum += carry;
214                 stq_u(partial_dest | second_dest, dst);
215                 src++;
216                 checksum += word;
217                 insqh(word, doff, partial_dest);
218                 carry = checksum < word;
219                 dst++;
220         }
221         len += 8;
222         if (len) {
223                 checksum += carry;
224                 err |= __get_user(word, src);
225                 mskql(word, len, word);
226                 len -= 8;
227                 checksum += word;
228                 insql(word, doff, second_dest);
229                 len += doff;
230                 carry = checksum < word;
231                 partial_dest |= second_dest;
232                 if (len >= 0) {
233                         stq_u(partial_dest, dst);
234                         if (!len) goto out;
235                         dst++;
236                         insqh(word, doff, partial_dest);
237                 }
238                 doff = len;
239         }
240         ldq_u(second_dest, dst);
241         mskqh(second_dest, doff, second_dest);
242         stq_u(partial_dest | second_dest, dst);
243 out:
244         checksum += carry;
245         if (err) *errp = err;
246         return checksum;
247 }
248
249 /*
250  * This is so totally un-fun that it's frightening. Don't
251  * look at this too closely, you'll go blind.
252  */
253 static inline unsigned long
254 csum_partial_cfu_unaligned(const unsigned long __user * src,
255                            unsigned long * dst,
256                            unsigned long soff, unsigned long doff,
257                            long len, unsigned long checksum,
258                            unsigned long partial_dest,
259                            int *errp)
260 {
261         unsigned long carry = 0;
262         unsigned long first;
263         unsigned long lastsrc;
264         int err = 0;
265
266         err |= __get_user_u(first, src);
267         lastsrc = 7+len+(unsigned long)src;
268         mskql(partial_dest, doff, partial_dest);
269         while (len >= 0) {
270                 unsigned long second, word;
271                 unsigned long second_dest;
272
273                 err |= __get_user_u(second, src+1);
274                 extql(first, soff, word);
275                 checksum += carry;
276                 len -= 8;
277                 extqh(second, soff, first);
278                 src++;
279                 word |= first;
280                 first = second;
281                 insql(word, doff, second_dest);
282                 checksum += word;
283                 stq_u(partial_dest | second_dest, dst);
284                 carry = checksum < word;
285                 insqh(word, doff, partial_dest);
286                 dst++;
287         }
288         len += doff;
289         checksum += carry;
290         if (len >= 0) {
291                 unsigned long second, word;
292                 unsigned long second_dest;
293
294                 err |= __get_user_u(second, lastsrc);
295                 extql(first, soff, word);
296                 extqh(second, soff, first);
297                 word |= first;
298                 first = second;
299                 mskql(word, len-doff, word);
300                 checksum += word;
301                 insql(word, doff, second_dest);
302                 carry = checksum < word;
303                 stq_u(partial_dest | second_dest, dst);
304                 if (len) {
305                         ldq_u(second_dest, dst+1);
306                         insqh(word, doff, partial_dest);
307                         mskqh(second_dest, len, second_dest);
308                         stq_u(partial_dest | second_dest, dst+1);
309                 }
310                 checksum += carry;
311         } else {
312                 unsigned long second, word;
313                 unsigned long second_dest;
314
315                 err |= __get_user_u(second, lastsrc);
316                 extql(first, soff, word);
317                 extqh(second, soff, first);
318                 word |= first;
319                 ldq_u(second_dest, dst);
320                 mskql(word, len-doff, word);
321                 checksum += word;
322                 mskqh(second_dest, len, second_dest);
323                 carry = checksum < word;
324                 insql(word, doff, word);
325                 stq_u(partial_dest | word | second_dest, dst);
326                 checksum += carry;
327         }
328         if (err) *errp = err;
329         return checksum;
330 }
331
332 __wsum
333 csum_partial_copy_from_user(const void __user *src, void *dst, int len,
334                                __wsum sum, int *errp)
335 {
336         unsigned long checksum = (__force u32) sum;
337         unsigned long soff = 7 & (unsigned long) src;
338         unsigned long doff = 7 & (unsigned long) dst;
339
340         if (len) {
341                 if (!doff) {
342                         if (!soff)
343                                 checksum = csum_partial_cfu_aligned(
344                                         (const unsigned long __user *) src,
345                                         (unsigned long *) dst,
346                                         len-8, checksum, errp);
347                         else
348                                 checksum = csum_partial_cfu_dest_aligned(
349                                         (const unsigned long __user *) src,
350                                         (unsigned long *) dst,
351                                         soff, len-8, checksum, errp);
352                 } else {
353                         unsigned long partial_dest;
354                         ldq_u(partial_dest, dst);
355                         if (!soff)
356                                 checksum = csum_partial_cfu_src_aligned(
357                                         (const unsigned long __user *) src,
358                                         (unsigned long *) dst,
359                                         doff, len-8, checksum,
360                                         partial_dest, errp);
361                         else
362                                 checksum = csum_partial_cfu_unaligned(
363                                         (const unsigned long __user *) src,
364                                         (unsigned long *) dst,
365                                         soff, doff, len-8, checksum,
366                                         partial_dest, errp);
367                 }
368                 checksum = from64to16 (checksum);
369         }
370         return (__force __wsum)checksum;
371 }
372
373 __wsum
374 csum_partial_copy_nocheck(const void *src, void *dst, int len, __wsum sum)
375 {
376         return csum_partial_copy_from_user((__force const void __user *)src,
377                         dst, len, sum, NULL);
378 }