Merge branch 'io_uring/io_uring-5.19' of https://github.com/isilence/linux into io_ur...
[platform/kernel/linux-starfive.git] / arch / alpha / lib / csum_partial_copy.c
1 // SPDX-License-Identifier: GPL-2.0
2 /*
3  * csum_partial_copy - do IP checksumming and copy
4  *
5  * (C) Copyright 1996 Linus Torvalds
6  * accelerated versions (and 21264 assembly versions ) contributed by
7  *      Rick Gorton     <rick.gorton@alpha-processor.com>
8  *
9  * Don't look at this too closely - you'll go mad. The things
10  * we do for performance..
11  */
12
13 #include <linux/types.h>
14 #include <linux/string.h>
15 #include <linux/uaccess.h>
16 #include <net/checksum.h>
17
18
19 #define ldq_u(x,y) \
20 __asm__ __volatile__("ldq_u %0,%1":"=r" (x):"m" (*(const unsigned long *)(y)))
21
22 #define stq_u(x,y) \
23 __asm__ __volatile__("stq_u %1,%0":"=m" (*(unsigned long *)(y)):"r" (x))
24
25 #define extql(x,y,z) \
26 __asm__ __volatile__("extql %1,%2,%0":"=r" (z):"r" (x),"r" (y))
27
28 #define extqh(x,y,z) \
29 __asm__ __volatile__("extqh %1,%2,%0":"=r" (z):"r" (x),"r" (y))
30
31 #define mskql(x,y,z) \
32 __asm__ __volatile__("mskql %1,%2,%0":"=r" (z):"r" (x),"r" (y))
33
34 #define mskqh(x,y,z) \
35 __asm__ __volatile__("mskqh %1,%2,%0":"=r" (z):"r" (x),"r" (y))
36
37 #define insql(x,y,z) \
38 __asm__ __volatile__("insql %1,%2,%0":"=r" (z):"r" (x),"r" (y))
39
40 #define insqh(x,y,z) \
41 __asm__ __volatile__("insqh %1,%2,%0":"=r" (z):"r" (x),"r" (y))
42
43 #define __get_word(insn,x,ptr)                          \
44 ({                                                      \
45         long __guu_err;                                 \
46         __asm__ __volatile__(                           \
47         "1:     "#insn" %0,%2\n"                        \
48         "2:\n"                                          \
49         EXC(1b,2b,%0,%1)                                \
50                 : "=r"(x), "=r"(__guu_err)              \
51                 : "m"(__m(ptr)), "1"(0));               \
52         __guu_err;                                      \
53 })
54
55 static inline unsigned short from64to16(unsigned long x)
56 {
57         /* Using extract instructions is a bit more efficient
58            than the original shift/bitmask version.  */
59
60         union {
61                 unsigned long   ul;
62                 unsigned int    ui[2];
63                 unsigned short  us[4];
64         } in_v, tmp_v, out_v;
65
66         in_v.ul = x;
67         tmp_v.ul = (unsigned long) in_v.ui[0] + (unsigned long) in_v.ui[1];
68
69         /* Since the bits of tmp_v.sh[3] are going to always be zero,
70            we don't have to bother to add that in.  */
71         out_v.ul = (unsigned long) tmp_v.us[0] + (unsigned long) tmp_v.us[1]
72                         + (unsigned long) tmp_v.us[2];
73
74         /* Similarly, out_v.us[2] is always zero for the final add.  */
75         return out_v.us[0] + out_v.us[1];
76 }
77
78
79
80 /*
81  * Ok. This isn't fun, but this is the EASY case.
82  */
83 static inline unsigned long
84 csum_partial_cfu_aligned(const unsigned long __user *src, unsigned long *dst,
85                          long len)
86 {
87         unsigned long checksum = ~0U;
88         unsigned long carry = 0;
89
90         while (len >= 0) {
91                 unsigned long word;
92                 if (__get_word(ldq, word, src))
93                         return 0;
94                 checksum += carry;
95                 src++;
96                 checksum += word;
97                 len -= 8;
98                 carry = checksum < word;
99                 *dst = word;
100                 dst++;
101         }
102         len += 8;
103         checksum += carry;
104         if (len) {
105                 unsigned long word, tmp;
106                 if (__get_word(ldq, word, src))
107                         return 0;
108                 tmp = *dst;
109                 mskql(word, len, word);
110                 checksum += word;
111                 mskqh(tmp, len, tmp);
112                 carry = checksum < word;
113                 *dst = word | tmp;
114                 checksum += carry;
115         }
116         return checksum;
117 }
118
119 /*
120  * This is even less fun, but this is still reasonably
121  * easy.
122  */
123 static inline unsigned long
124 csum_partial_cfu_dest_aligned(const unsigned long __user *src,
125                               unsigned long *dst,
126                               unsigned long soff,
127                               long len)
128 {
129         unsigned long first;
130         unsigned long word, carry;
131         unsigned long lastsrc = 7+len+(unsigned long)src;
132         unsigned long checksum = ~0U;
133
134         if (__get_word(ldq_u, first,src))
135                 return 0;
136         carry = 0;
137         while (len >= 0) {
138                 unsigned long second;
139
140                 if (__get_word(ldq_u, second, src+1))
141                         return 0;
142                 extql(first, soff, word);
143                 len -= 8;
144                 src++;
145                 extqh(second, soff, first);
146                 checksum += carry;
147                 word |= first;
148                 first = second;
149                 checksum += word;
150                 *dst = word;
151                 dst++;
152                 carry = checksum < word;
153         }
154         len += 8;
155         checksum += carry;
156         if (len) {
157                 unsigned long tmp;
158                 unsigned long second;
159                 if (__get_word(ldq_u, second, lastsrc))
160                         return 0;
161                 tmp = *dst;
162                 extql(first, soff, word);
163                 extqh(second, soff, first);
164                 word |= first;
165                 mskql(word, len, word);
166                 checksum += word;
167                 mskqh(tmp, len, tmp);
168                 carry = checksum < word;
169                 *dst = word | tmp;
170                 checksum += carry;
171         }
172         return checksum;
173 }
174
175 /*
176  * This is slightly less fun than the above..
177  */
178 static inline unsigned long
179 csum_partial_cfu_src_aligned(const unsigned long __user *src,
180                              unsigned long *dst,
181                              unsigned long doff,
182                              long len,
183                              unsigned long partial_dest)
184 {
185         unsigned long carry = 0;
186         unsigned long word;
187         unsigned long second_dest;
188         unsigned long checksum = ~0U;
189
190         mskql(partial_dest, doff, partial_dest);
191         while (len >= 0) {
192                 if (__get_word(ldq, word, src))
193                         return 0;
194                 len -= 8;
195                 insql(word, doff, second_dest);
196                 checksum += carry;
197                 stq_u(partial_dest | second_dest, dst);
198                 src++;
199                 checksum += word;
200                 insqh(word, doff, partial_dest);
201                 carry = checksum < word;
202                 dst++;
203         }
204         len += 8;
205         if (len) {
206                 checksum += carry;
207                 if (__get_word(ldq, word, src))
208                         return 0;
209                 mskql(word, len, word);
210                 len -= 8;
211                 checksum += word;
212                 insql(word, doff, second_dest);
213                 len += doff;
214                 carry = checksum < word;
215                 partial_dest |= second_dest;
216                 if (len >= 0) {
217                         stq_u(partial_dest, dst);
218                         if (!len) goto out;
219                         dst++;
220                         insqh(word, doff, partial_dest);
221                 }
222                 doff = len;
223         }
224         ldq_u(second_dest, dst);
225         mskqh(second_dest, doff, second_dest);
226         stq_u(partial_dest | second_dest, dst);
227 out:
228         checksum += carry;
229         return checksum;
230 }
231
232 /*
233  * This is so totally un-fun that it's frightening. Don't
234  * look at this too closely, you'll go blind.
235  */
236 static inline unsigned long
237 csum_partial_cfu_unaligned(const unsigned long __user * src,
238                            unsigned long * dst,
239                            unsigned long soff, unsigned long doff,
240                            long len, unsigned long partial_dest)
241 {
242         unsigned long carry = 0;
243         unsigned long first;
244         unsigned long lastsrc;
245         unsigned long checksum = ~0U;
246
247         if (__get_word(ldq_u, first, src))
248                 return 0;
249         lastsrc = 7+len+(unsigned long)src;
250         mskql(partial_dest, doff, partial_dest);
251         while (len >= 0) {
252                 unsigned long second, word;
253                 unsigned long second_dest;
254
255                 if (__get_word(ldq_u, second, src+1))
256                         return 0;
257                 extql(first, soff, word);
258                 checksum += carry;
259                 len -= 8;
260                 extqh(second, soff, first);
261                 src++;
262                 word |= first;
263                 first = second;
264                 insql(word, doff, second_dest);
265                 checksum += word;
266                 stq_u(partial_dest | second_dest, dst);
267                 carry = checksum < word;
268                 insqh(word, doff, partial_dest);
269                 dst++;
270         }
271         len += doff;
272         checksum += carry;
273         if (len >= 0) {
274                 unsigned long second, word;
275                 unsigned long second_dest;
276
277                 if (__get_word(ldq_u, second, lastsrc))
278                         return 0;
279                 extql(first, soff, word);
280                 extqh(second, soff, first);
281                 word |= first;
282                 first = second;
283                 mskql(word, len-doff, word);
284                 checksum += word;
285                 insql(word, doff, second_dest);
286                 carry = checksum < word;
287                 stq_u(partial_dest | second_dest, dst);
288                 if (len) {
289                         ldq_u(second_dest, dst+1);
290                         insqh(word, doff, partial_dest);
291                         mskqh(second_dest, len, second_dest);
292                         stq_u(partial_dest | second_dest, dst+1);
293                 }
294                 checksum += carry;
295         } else {
296                 unsigned long second, word;
297                 unsigned long second_dest;
298
299                 if (__get_word(ldq_u, second, lastsrc))
300                         return 0;
301                 extql(first, soff, word);
302                 extqh(second, soff, first);
303                 word |= first;
304                 ldq_u(second_dest, dst);
305                 mskql(word, len-doff, word);
306                 checksum += word;
307                 mskqh(second_dest, len, second_dest);
308                 carry = checksum < word;
309                 insql(word, doff, word);
310                 stq_u(partial_dest | word | second_dest, dst);
311                 checksum += carry;
312         }
313         return checksum;
314 }
315
316 static __wsum __csum_and_copy(const void __user *src, void *dst, int len)
317 {
318         unsigned long soff = 7 & (unsigned long) src;
319         unsigned long doff = 7 & (unsigned long) dst;
320         unsigned long checksum;
321
322         if (!doff) {
323                 if (!soff)
324                         checksum = csum_partial_cfu_aligned(
325                                 (const unsigned long __user *) src,
326                                 (unsigned long *) dst, len-8);
327                 else
328                         checksum = csum_partial_cfu_dest_aligned(
329                                 (const unsigned long __user *) src,
330                                 (unsigned long *) dst,
331                                 soff, len-8);
332         } else {
333                 unsigned long partial_dest;
334                 ldq_u(partial_dest, dst);
335                 if (!soff)
336                         checksum = csum_partial_cfu_src_aligned(
337                                 (const unsigned long __user *) src,
338                                 (unsigned long *) dst,
339                                 doff, len-8, partial_dest);
340                 else
341                         checksum = csum_partial_cfu_unaligned(
342                                 (const unsigned long __user *) src,
343                                 (unsigned long *) dst,
344                                 soff, doff, len-8, partial_dest);
345         }
346         return (__force __wsum)from64to16 (checksum);
347 }
348
349 __wsum
350 csum_and_copy_from_user(const void __user *src, void *dst, int len)
351 {
352         if (!access_ok(src, len))
353                 return 0;
354         return __csum_and_copy(src, dst, len);
355 }
356
357 __wsum
358 csum_partial_copy_nocheck(const void *src, void *dst, int len)
359 {
360         return __csum_and_copy((__force const void __user *)src,
361                                                 dst, len);
362 }
363 EXPORT_SYMBOL(csum_partial_copy_nocheck);