Lines Matching +full:mod +full:- +full:12 +full:b
8 * of the Xtensa link-time HAL, and those files may differ per
11 * could lose the special functionality for accessing user-space
31 * do 16B chunks with a loop, and then finish up with
32 * 8B, 4B, 2B, and 1B copies conditional on the length.
36 * copying 1B and 2B and then retest.
37 * This code tries to use fall-through branches for the common
68 bbsi.l a2, 0, .Ldst1mod2 # if dst is 1 mod 2
69 bbsi.l a2, 1, .Ldst2mod4 # if dst is 2 mod 4
71 srli a7, a4, 4 # number of loop iterations with 16B
92 addi a4, a4, -1
95 .Ldst2mod4: # dst 16-bit aligned
104 addi a4, a4, -2
111 .byte 0 # 1 mod 4 alignment for LOOPNEZ
112 # (0 mod 4 alignment for LBEG)
133 * Destination and source are word-aligned.
135 # copy 16 bytes per iteration for word-aligned dst and word-aligned src
136 .align 4 # 1 mod 4 alignment for LOOPNEZ
137 .byte 0 # (0 mod 4 alignment for LBEG)
144 add a8, a8, a3 # a8 = end of last 16B source chunk
152 EX(10f) l32i a7, a3, 12
155 EX(10f) s32i a7, a5, 12
197 .byte 0 # 1 mod 4 alignment for LOOPNEZ
198 # (0 mod 4 alignment for LBEG)
200 # copy 16 bytes per iteration for word-aligned dst and unaligned src
209 add a12, a12, a3 # a12 = end of last 16B source chunk
216 EX(10f) l32i a9, a3, 12
224 EX(10f) s32i a9, a5, 12
275 * bytes_copied = a5 - a2
276 * retval = bytes_not_copied = original len - bytes_copied
277 * retval = a11 - (a5 - a2)
282 sub a2, a5, a2 /* a2 <-- bytes copied */
283 sub a2, a11, a2 /* a2 <-- bytes not copied */