blob: 0b706a39a6770296034c4421a7c7cf4f483949ba [file] [log] [blame]
/* SPDX-License-Identifier: GPL-2.0-only */
/*
 *  linux/arch/arm/lib/csumpartialcopygeneric.S
 *
 *  Copyright (C) 1995-2001 Russell King
 */
Russell King6ebbf2c2014-06-30 16:29:12 +01007#include <asm/assembler.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -07008
/*
 * unsigned int
 * csum_partial_copy_xxx(const char *src, char *dst, int len, int sum, )
 *  r0 = src, r1 = dst, r2 = len, r3 = sum
 *  Returns : r0 = checksum
 *
 * Note that 'tst' and 'teq' preserve the carry flag.
 */

/*
 * Symbolic names for the four argument registers used throughout
 * this file: r0 = src, r1 = dst, r2 = len, r3 = sum.
 */
src	.req	r0		@ source pointer
dst	.req	r1		@ destination pointer
len	.req	r2		@ number of bytes still to copy
sum	.req	r3		@ running checksum accumulator

/*
 * Zero-length exit, reached from .Lless8 when len == 0: the incoming
 * checksum is handed back unchanged in r0.
 *
 * NOTE(review): load_regs is defined outside this file; it is presumably
 * the counterpart of save_regs and also returns to the caller -- confirm
 * against the macro definition.
 */
.Lzero:		mov	r0, sum
		load_regs

/*
 * Align an unaligned destination pointer.  We know that
 * we have >= 8 bytes here, so we don't need to check
 * the length.  Note that the source pointer hasn't been
 * aligned yet.
 *
 * Entered with 'blne' from the function entry path and left through
 * lr.  On return dst is 32-bit aligned, len has been reduced by the
 * number of bytes copied (1, 2 or 3) and the carry flag still holds
 * the carry out of the last 'adcs' ('sub', 'strb' and 'tst' do not
 * change it).
 *
 * NOTE(review): load1b/load2b and put_byte_0/put_byte_1 are macros
 * defined outside this file; presumably the loads fetch bytes from src
 * with post-increment and put_byte_N places a byte in lane N of the
 * sum -- confirm.
 */
.Ldst_unaligned:
		tst	dst, #1
		beq	.Ldst_16bit		@ dst already 16-bit aligned

		load1b	ip
		sub	len, len, #1
		adcs	sum, sum, ip, put_byte_1	@ update checksum
		strb	ip, [dst], #1
		tst	dst, #2
		reteq	lr			@ dst is now 32bit aligned

.Ldst_16bit:	load2b	r8, ip
		sub	len, len, #2
		adcs	sum, sum, r8, put_byte_0
		strb	r8, [dst], #1
		adcs	sum, sum, ip, put_byte_1
		strb	ip, [dst], #1
		ret	lr			@ dst is now 32bit aligned

/*
 * Handle 0 to 7 bytes, with any alignment of source and
 * destination pointers.  Note that when we get here, C = 0
 *
 * (The only way in is the 'blo' that follows 'cmp len, #8' at function
 * entry, and 'blo' is taken only when the carry flag is clear.)
 *
 * The copy is done purely with byte loads and stores:
 *   - one byte first if dst is odd,
 *   - then byte pairs while (len & 6) is non-zero,
 *   - then one last byte if (len & 1) is set.
 * Every path ends at .Lzero (len == 0) or .Ldone.
 */
.Lless8:	teq	len, #0			@ check for zero count
		beq	.Lzero

		/* we must have at least one byte. */
		tst	dst, #1			@ dst 16-bit aligned
		beq	.Lless8_aligned

		/* Align dst */
		load1b	ip
		sub	len, len, #1
		adcs	sum, sum, ip, put_byte_1	@ update checksum
		strb	ip, [dst], #1
		tst	len, #6
		beq	.Lless8_byteonly	@ no byte pair left

1:		load2b	r8, ip
		sub	len, len, #2
		adcs	sum, sum, r8, put_byte_0
		strb	r8, [dst], #1
		adcs	sum, sum, ip, put_byte_1
		strb	ip, [dst], #1
.Lless8_aligned:
		tst	len, #6
		bne	1b			@ another byte pair to copy
.Lless8_byteonly:
		tst	len, #1
		beq	.Ldone
		load1b	r8
		adcs	sum, sum, r8, put_byte_0	@ update checksum
		strb	r8, [dst], #1
		b	.Ldone

/*
 * Function entry and the path for a word-aligned source.
 *
 * In:  src (r0), dst (r1), len (r2), sum (r3)
 * Out: r0 = checksum, produced at .Ldone
 *
 * Fewer than 8 bytes are handed to .Lless8.  Otherwise dst is brought
 * to a 32-bit boundary by .Ldst_unaligned, and the copy continues here
 * when src is word aligned as well, or at .Lsrc_not_aligned when not.
 *
 * The checksum is accumulated with a chain of 'adcs' instructions, so
 * the carry flag is live between them.  That is why the loop counter
 * is maintained with 'sub' followed by 'teq' rather than 'subs'.
 *
 * NOTE(review): FN_ENTRY, save_regs, load_regs and the load1l/load2l/
 * load4l macros are defined outside this file; the loads presumably
 * fetch 1/2/4 words from src with post-increment -- confirm.
 */
FN_ENTRY
		save_regs

		cmp	len, #8			@ Ensure that we have at least
		blo	.Lless8			@ 8 bytes to copy.

		adds	sum, sum, #0		@ C = 0
		tst	dst, #3			@ Test destination alignment
		blne	.Ldst_unaligned		@ align destination, return here

		/*
		 * Ok, the dst pointer is now 32bit aligned, and we know
		 * that we must have more than 4 bytes to copy.  Note
		 * that C contains the carry from the dst alignment above.
		 */

		tst	src, #3			@ Test source alignment
		bne	.Lsrc_not_aligned

		/* Routine for src & dst aligned */

		bics	ip, len, #15		@ ip = bytes in whole 16-byte chunks
		beq	2f

1:		load4l	r4, r5, r6, r7
		stmia	dst!, {r4, r5, r6, r7}
		adcs	sum, sum, r4
		adcs	sum, sum, r5
		adcs	sum, sum, r6
		adcs	sum, sum, r7
		sub	ip, ip, #16
		teq	ip, #0
		bne	1b

2:		ands	ip, len, #12		@ 0, 1, 2 or 3 whole words left
		beq	4f
		tst	ip, #8
		beq	3f
		load2l	r4, r5
		stmia	dst!, {r4, r5}
		adcs	sum, sum, r4
		adcs	sum, sum, r5
		tst	ip, #4
		beq	4f

3:		load1l	r4
		str	r4, [dst], #4
		adcs	sum, sum, r4

4:		ands	len, len, #3		@ 0 to 3 trailing bytes
		beq	.Ldone
		load1l	r4
		tst	len, #2
		mov	r5, r4, get_byte_0
		beq	.Lexit			@ exactly one byte left
		adcs	sum, sum, r4, lspush #16
		strb	r5, [dst], #1
		mov	r5, r4, get_byte_1
		strb	r5, [dst], #1
		mov	r5, r4, get_byte_2

		/*
		 * Common tail, also used by the .Lsrc*_aligned variants:
		 * when len is odd, r5 holds the final byte, which is
		 * stored and added to the checksum.
		 */
.Lexit:		tst	len, #1
		strbne	r5, [dst], #1
		andne	r5, r5, #255
		adcsne	sum, sum, r5, put_byte_0

		/*
		 * If the dst pointer was not 16-bit aligned, we
		 * need to rotate the checksum here to get around
		 * the inefficient byte manipulations in the
		 * architecture independent code.
		 *
		 * The 'adc' folds the last pending carry into the result.
		 * NOTE(review): [sp, #0] is read as the original dst, so
		 * save_regs presumably stores r1 at the lowest stack
		 * address -- confirm against the macro definition.
		 */
.Ldone:		adc	r0, sum, #0
		ldr	sum, [sp, #0]		@ dst
		tst	sum, #1
		movne	r0, r0, ror #8
		load_regs

/*
 * Source is not word aligned (the destination already is).
 *
 * The pending carry is folded into sum, src is rounded down to a word
 * boundary and the word containing the first source byte is loaded
 * into r5.  The original offset (src & 3) then selects the variant:
 * 2 -> .Lsrc2_aligned, 3 -> .Lsrc3_aligned, 1 -> the code below.
 *
 * For offset 1 the 'cmp ip, #2' leaves the carry flag clear (1 - 2
 * borrows), which is what the "C = 0" remark below relies on.
 *
 * Throughout, r4 carries the bytes of the last loaded word that have
 * not been stored yet.  Each step merges them with the leading bytes
 * of the next word (lspush) and keeps that word's remaining bytes
 * (lspull) for the following step.
 *
 * NOTE(review): lspull/lspush, get_byte_N and the load macros are
 * defined outside this file; lspull/lspush are presumably
 * endian-dependent shift directions -- confirm.
 */
.Lsrc_not_aligned:
		adc	sum, sum, #0		@ include C from dst alignment
		and	ip, src, #3
		bic	src, src, #3
		load1l	r5
		cmp	ip, #2
		beq	.Lsrc2_aligned
		bhi	.Lsrc3_aligned
		mov	r4, r5, lspull #8		@ C = 0
		bics	ip, len, #15		@ ip = bytes in whole 16-byte chunks
		beq	2f
1:		load4l	r5, r6, r7, r8
		orr	r4, r4, r5, lspush #24
		mov	r5, r5, lspull #8
		orr	r5, r5, r6, lspush #24
		mov	r6, r6, lspull #8
		orr	r6, r6, r7, lspush #24
		mov	r7, r7, lspull #8
		orr	r7, r7, r8, lspush #24
		stmia	dst!, {r4, r5, r6, r7}
		adcs	sum, sum, r4
		adcs	sum, sum, r5
		adcs	sum, sum, r6
		adcs	sum, sum, r7
		mov	r4, r8, lspull #8
		sub	ip, ip, #16		@ sub + teq keep the carry intact
		teq	ip, #0
		bne	1b
2:		ands	ip, len, #12		@ 0, 1, 2 or 3 whole words left
		beq	4f
		tst	ip, #8
		beq	3f
		load2l	r5, r6
		orr	r4, r4, r5, lspush #24
		mov	r5, r5, lspull #8
		orr	r5, r5, r6, lspush #24
		stmia	dst!, {r4, r5}
		adcs	sum, sum, r4
		adcs	sum, sum, r5
		mov	r4, r6, lspull #8
		tst	ip, #4
		beq	4f
3:		load1l	r5
		orr	r4, r4, r5, lspush #24
		str	r4, [dst], #4
		adcs	sum, sum, r4
		mov	r4, r5, lspull #8
4:		ands	len, len, #3		@ 0 to 3 trailing bytes
		beq	.Ldone
		/* The trailing bytes are taken from r4; no further load. */
		mov	r5, r4, get_byte_0
		tst	len, #2
		beq	.Lexit			@ exactly one byte left
		adcs	sum, sum, r4, lspush #16
		strb	r5, [dst], #1
		mov	r5, r4, get_byte_1
		strb	r5, [dst], #1
		mov	r5, r4, get_byte_2
		b	.Lexit

/*
 * Source offset 2 within its word (destination word aligned).
 *
 * Entered from .Lsrc_not_aligned with r5 = the word containing the
 * first source byte.  Same scheme as the offset-1 code, with shifts of
 * 16/16: r4 carries the not-yet-stored bytes of the last loaded word.
 *
 * The 'cmp ip, #2' that selected this path left the carry flag set,
 * so 'adds sum, sum, #0' is used to clear it before the adcs chain.
 *
 * NOTE(review): lspull/lspush, get_byte_N and the load macros are
 * defined outside this file -- confirm their exact semantics there.
 */
.Lsrc2_aligned:	mov	r4, r5, lspull #16
		adds	sum, sum, #0		@ C = 0
		bics	ip, len, #15		@ ip = bytes in whole 16-byte chunks
		beq	2f
1:		load4l	r5, r6, r7, r8
		orr	r4, r4, r5, lspush #16
		mov	r5, r5, lspull #16
		orr	r5, r5, r6, lspush #16
		mov	r6, r6, lspull #16
		orr	r6, r6, r7, lspush #16
		mov	r7, r7, lspull #16
		orr	r7, r7, r8, lspush #16
		stmia	dst!, {r4, r5, r6, r7}
		adcs	sum, sum, r4
		adcs	sum, sum, r5
		adcs	sum, sum, r6
		adcs	sum, sum, r7
		mov	r4, r8, lspull #16
		sub	ip, ip, #16		@ sub + teq keep the carry intact
		teq	ip, #0
		bne	1b
2:		ands	ip, len, #12		@ 0, 1, 2 or 3 whole words left
		beq	4f
		tst	ip, #8
		beq	3f
		load2l	r5, r6
		orr	r4, r4, r5, lspush #16
		mov	r5, r5, lspull #16
		orr	r5, r5, r6, lspush #16
		stmia	dst!, {r4, r5}
		adcs	sum, sum, r4
		adcs	sum, sum, r5
		mov	r4, r6, lspull #16
		tst	ip, #4
		beq	4f
3:		load1l	r5
		orr	r4, r4, r5, lspush #16
		str	r4, [dst], #4
		adcs	sum, sum, r4
		mov	r4, r5, lspull #16
4:		ands	len, len, #3		@ 0 to 3 trailing bytes
		beq	.Ldone
		mov	r5, r4, get_byte_0
		tst	len, #2
		beq	.Lexit			@ exactly one byte left
		adcs	sum, sum, r4
		strb	r5, [dst], #1
		mov	r5, r4, get_byte_1
		strb	r5, [dst], #1
		tst	len, #1
		beq	.Ldone
		/* A third byte is still needed; fetch it with a byte load. */
		load1b	r5
		b	.Lexit

/*
 * Source offset 3 within its word (destination word aligned).
 *
 * Entered from .Lsrc_not_aligned with r5 = the word containing the
 * first source byte.  Same scheme as the other variants, with shifts
 * of 24/8: r4 carries the not-yet-stored bytes of the last loaded word.
 *
 * The 'cmp ip, #2' that selected this path left the carry flag set,
 * so 'adds sum, sum, #0' is used to clear it before the adcs chain.
 *
 * NOTE(review): lspull/lspush, get_byte_N, the load macros and FN_EXIT
 * are defined outside this file -- confirm their exact semantics there.
 */
.Lsrc3_aligned:	mov	r4, r5, lspull #24
		adds	sum, sum, #0		@ C = 0
		bics	ip, len, #15		@ ip = bytes in whole 16-byte chunks
		beq	2f
1:		load4l	r5, r6, r7, r8
		orr	r4, r4, r5, lspush #8
		mov	r5, r5, lspull #24
		orr	r5, r5, r6, lspush #8
		mov	r6, r6, lspull #24
		orr	r6, r6, r7, lspush #8
		mov	r7, r7, lspull #24
		orr	r7, r7, r8, lspush #8
		stmia	dst!, {r4, r5, r6, r7}
		adcs	sum, sum, r4
		adcs	sum, sum, r5
		adcs	sum, sum, r6
		adcs	sum, sum, r7
		mov	r4, r8, lspull #24
		sub	ip, ip, #16		@ sub + teq keep the carry intact
		teq	ip, #0
		bne	1b
2:		ands	ip, len, #12		@ 0, 1, 2 or 3 whole words left
		beq	4f
		tst	ip, #8
		beq	3f
		load2l	r5, r6
		orr	r4, r4, r5, lspush #8
		mov	r5, r5, lspull #24
		orr	r5, r5, r6, lspush #8
		stmia	dst!, {r4, r5}
		adcs	sum, sum, r4
		adcs	sum, sum, r5
		mov	r4, r6, lspull #24
		tst	ip, #4
		beq	4f
3:		load1l	r5
		orr	r4, r4, r5, lspush #8
		str	r4, [dst], #4
		adcs	sum, sum, r4
		mov	r4, r5, lspull #24
4:		ands	len, len, #3		@ 0 to 3 trailing bytes
		beq	.Ldone
		mov	r5, r4, get_byte_0
		tst	len, #2
		beq	.Lexit			@ exactly one byte left
		strb	r5, [dst], #1
		adcs	sum, sum, r4
		/* More bytes are needed than r4 carries; load another word. */
		load1l	r4
		mov	r5, r4, get_byte_0
		strb	r5, [dst], #1
		adcs	sum, sum, r4, lspush #24
		mov	r5, r4, get_byte_1
		b	.Lexit
FN_EXIT