1 /* $Id: checksumcopy.S,v 1.1 2001/12/17 13:59:27 bjornw Exp $
2 * A fast checksum+copy routine using movem
3 * Copyright (c) 1998, 2001 Axis Communications AB
7 * csum_partial_copy_nocheck(const char *src, char *dst,
8 * int len, unsigned int sum)
11 .globl csum_partial_copy_nocheck
12 csum_partial_copy_nocheck:
19 ;; check for breakeven length between movem and normal word looping versions
20 ;; we also do _NOT_ want to compute a checksum over more than the
21 ;; actual length when length < 40
27 ;; need to save the registers we use below in the movem loop
28 ;; this overhead is why we have a check above for breakeven length
29 ;; only r0 - r8 have to be saved, the other ones are clobber-able
30 ;; according to the ABI
35 ;; do a movem copy and checksum
37 subq 10*4, $r12 ; update length for the first loop
39 _mloop: movem [$r10+],$r9 ; read 10 longwords
40 1: ;; A failing userspace access will have this as PC.
41 movem $r9,[$r11+] ; write 10 longwords
43 ;; perform dword checksumming on the 10 longwords
65 ;; fold the carry into the checksum, to avoid having to loop the carry
70 ax ; do it again, since we might have generated a carry
77 addq 10*4,$r12 ; compensate for last loop underflowing length
79 movem [$sp+],$r8 ; restore regs
82 ;; only fold if there is anything to fold.
87 ;; fold 32-bit checksum into a 16-bit checksum, to avoid carries below
88 ;; r9 can be used as temporary.
91 lsrq 16,$r9 ; r0 = checksum >> 16
92 and.d 0xffff,$r13 ; checksum = checksum & 0xffff
93 add.d $r9,$r13 ; checksum += r0
94 move.d $r13,$r9 ; do the same again, maybe we got a carry last add
104 ;; copy and checksum the rest of the words
108 _wloop: move.w [$r10+],$r9
109 2: ;; A failing userspace access will have this as PC.
118 ;; see if we have one odd byte more
126 ;; copy and checksum the last byte
128 3: ;; A failing userspace access will have this as PC.