Lines Matching +full:8 +full:- +full:n +full:- +full:1
2 * Copyright (C) 2008-2009 Michal Simek <monstr@monstr.eu>
3 * Copyright (C) 2008-2009 PetaLogix
4 * Copyright (C) 2008 Jim Law - Iris LP All rights reserved.
21 * Input : Operand1 in Reg r5 - destination address
22 * Operand2 in Reg r6 - source address
23 * Operand3 in Reg r7 - number of bytes to transfer
24 * Output: Result in Reg r3 - starting destination address
43 addi r4, r0, 4 /* n = 4 */
44 cmpu r4, r4, r7 /* n = c - n (unsigned) */
45 blti r4, a_xfer_end /* if n < 0, less than one word to transfer */
48 andi r4, r5, 3 /* n = d & 3 */
51 /* n = 4 - n (yields 3, 2, 1 transfers for 1, 2, 3 addr offset) */
53 rsub r7, r4, r7 /* c = c - n adjust c */
60 addi r6, r6, 1 /* s++ */
61 addi r5, r5, 1 /* d++ */
63 addi r4, r4, -1 /* n-- (IN DELAY SLOT) */
66 addi r4, r0, 32 /* n = 32 */
67 cmpu r4, r4, r7 /* n = c - n (unsigned) */
68 /* if n < 0, less than one block to transfer */
72 andi r4, r7, 0xffffffe0 /* n = c & ~31 */
73 rsub r7, r4, r7 /* c = c - n */
82 lwi r11, r6, 8 /* t3 = *(s + 8) */
86 swi r11, r5, 8 /* *(d + 8) = t3 */
97 addi r4, r4, -32 /* n = n - 32 */
98 bneid r4, a_block_aligned /* while (n) loop */
104 add r6, r6, r4 /* s = s + n */
107 addi r9, r9, -1
108 beqi r9, a_block_u1 /* t1 was 1 => 1 byte offset */
109 addi r9, r9, -1
116 bsrli r9, r12, 8 /* t1 = v >> 8 */
120 lwi r12, r8, 8 /* v = *(as + 8) */
121 bsrli r9, r12, 8 /* t1 = v >> 8 */
126 bsrli r9, r12, 8 /* t1 = v >> 8 */
128 swi r9, r5, 8 /* *(d + 8) = t1 */
131 bsrli r9, r12, 8 /* t1 = v >> 8 */
136 bsrli r9, r12, 8 /* t1 = v >> 8 */
141 bsrli r9, r12, 8 /* t1 = v >> 8 */
146 bsrli r9, r12, 8 /* t1 = v >> 8 */
151 bsrli r9, r12, 8 /* t1 = v >> 8 */
156 addi r4, r4, -32 /* n = n - 32 */
157 bneid r4, a_bu3_loop /* while (n) loop */
162 bslli r11, r11, 8 /* h = h << 8 */
168 bslli r11, r12, 8 /* h = v << 8 */
169 lwi r12, r8, 8 /* v = *(as + 8) */
173 bslli r11, r12, 8 /* h = v << 8 */
177 swi r9, r5, 8 /* *(d + 8) = t1 */
178 bslli r11, r12, 8 /* h = v << 8 */
183 bslli r11, r12, 8 /* h = v << 8 */
188 bslli r11, r12, 8 /* h = v << 8 */
193 bslli r11, r12, 8 /* h = v << 8 */
198 bslli r11, r12, 8 /* h = v << 8 */
203 bslli r11, r12, 8 /* h = v << 8 */
205 addi r4, r4, -32 /* n = n - 32 */
206 bneid r4, a_bu1_loop /* while (n) loop */
218 lwi r12, r8, 8 /* v = *(as + 8) */
226 swi r9, r5, 8 /* *(d + 8) = t1 */
254 addi r4, r4, -32 /* n = n - 32 */
255 bneid r4, a_bu2_loop /* while (n) loop */
259 addi r4, r0, 4 /* n = 4 */
260 cmpu r4, r4, r7 /* n = c - n (unsigned) */
261 blti r4, a_xfer_end /* if n < 0, less than one word to transfer */
264 andi r4, r7, 0xfffffffc /* n = c & ~3 */
274 addi r4, r4,-4 /* n = n - 4 */
285 addi r9, r9, -1
286 beqi r9, a_word_u1 /* t1 was 1 => 1 byte offset */
287 addi r9, r9, -1
294 bsrli r9, r12, 8 /* t1 = v >> 8 */
298 addi r4, r4,-4 /* n = n - 4 */
299 bneid r4, a_wu3_loop /* while (n) loop */
305 bslli r11, r11, 8 /* h = h << 8 */
311 bslli r11, r12, 8 /* h = v << 8 */
312 addi r4, r4,-4 /* n = n - 4 */
313 bneid r4, a_wu1_loop /* while (n) loop */
326 addi r4, r4,-4 /* n = n - 4 */
327 bneid r4, a_wu2_loop /* while (n) loop */
333 rsub r7, r10, r7 /* c = c - offset */
339 addi r6, r6, 1 /* s++ */
341 addi r7, r7, -1 /* c-- */
343 addi r5, r5, 1 /* d++ (IN DELAY SLOT) */
346 rtsd r15, 8
349 .size memcpy, . - memcpy
351 /*----------------------------------------------------------------------------*/
357 cmpu r4, r5, r6 /* n = s - d */
367 addi r4, r0, 4 /* n = 4 */
368 cmpu r4, r4, r7 /* n = c - n (unsigned) */
369 blti r4,d_xfer_end /* if n < 0, less than one word to transfer */
372 andi r4, r5, 3 /* n = d & 3 */
375 rsub r7, r4, r7 /* c = c - n adjust c */
380 addi r6, r6, -1 /* s-- */
381 addi r5, r5, -1 /* d-- */
385 addi r4, r4, -1 /* n-- (IN DELAY SLOT) */
388 addi r4, r0, 32 /* n = 32 */
389 cmpu r4, r4, r7 /* n = c - n (unsigned) */
390 /* if n < 0, less than one block to transfer */
394 andi r4, r7, 0xffffffe0 /* n = c & ~31 */
395 rsub r7, r4, r7 /* c = c - n */
402 addi r6, r6, -32 /* s = s - 32 */
403 addi r5, r5, -32 /* d = d - 32 */
413 lwi r10, r6, 8 /* t2 = *(s + 8) */
417 swi r10, r5, 8 /* *(d + 8) = t2 */
419 addi r4, r4, -32 /* n = n - 32 */
420 bneid r4, d_block_aligned /* while (n) loop */
426 rsub r6, r4, r6 /* s = s - n */
429 addi r9, r9, -1
430 beqi r9,d_block_u1 /* t1 was 1 => 1 byte offset */
431 addi r9, r9, -1
435 bsrli r11, r11, 8 /* h = h >> 8 */
437 addi r8, r8, -32 /* as = as - 32 */
438 addi r5, r5, -32 /* d = d - 32 */
443 bsrli r11, r12, 8 /* h = v >> 8 */
448 bsrli r11, r12, 8 /* h = v >> 8 */
453 bsrli r11, r12, 8 /* h = v >> 8 */
458 bsrli r11, r12, 8 /* h = v >> 8 */
463 bsrli r11, r12, 8 /* h = v >> 8 */
464 lwi r12, r8, 8 /* v = *(as + 8) */
467 swi r9, r5, 8 /* *(d + 8) = t1 */
468 bsrli r11, r12, 8 /* h = v >> 8 */
473 bsrli r11, r12, 8 /* h = v >> 8 */
478 addi r4, r4, -32 /* n = n - 32 */
479 bneid r4, d_bu3_loop /* while (n) loop */
480 bsrli r11, r12, 8 /* h = v >> 8 (IN DELAY SLOT) */
486 addi r8, r8, -32 /* as = as - 32 */
487 addi r5, r5, -32 /* d = d - 32 */
489 bslli r9, r12, 8 /* t1 = v << 8 */
494 bslli r9, r12, 8 /* t1 = v << 8 */
499 bslli r9, r12, 8 /* t1 = v << 8 */
504 bslli r9, r12, 8 /* t1 = v << 8 */
509 bslli r9, r12, 8 /* t1 = v << 8 */
513 lwi r12, r8, 8 /* v = *(as + 8) */
514 bslli r9, r12, 8 /* t1 = v << 8 */
516 swi r9, r5, 8 /* *(d + 8) = t1 */
519 bslli r9, r12, 8 /* t1 = v << 8 */
524 bslli r9, r12, 8 /* t1 = v << 8 */
527 addi r4, r4, -32 /* n = n - 32 */
528 bneid r4, d_bu1_loop /* while (n) loop */
535 addi r8, r8, -32 /* as = as - 32 */
536 addi r5, r5, -32 /* d = d - 32 */
562 lwi r12, r8, 8 /* v = *(as + 8) */
565 swi r9, r5, 8 /* *(d + 8) = t1 */
576 addi r4, r4, -32 /* n = n - 32 */
577 bneid r4, d_bu2_loop /* while (n) loop */
581 addi r4, r0, 4 /* n = 4 */
582 cmpu r4, r4, r7 /* n = c - n (unsigned) */
583 blti r4,d_xfer_end /* if n < 0, less than one word to transfer */
586 andi r4, r7, 0xfffffffc /* n = c & ~3 */
587 rsub r5, r4, r5 /* d = d - n */
588 rsub r6, r4, r6 /* s = s - n */
589 rsub r7, r4, r7 /* c = c - n */
596 addi r4, r4,-4 /* n = n - 4 */
597 lw r9, r6, r4 /* t1 = *(s+n) */
599 sw r9, r5, r4 /* *(d+n) = t1 (IN DELAY SLOT) */
605 lw r11, r8, r4 /* h = *(as + n) */
607 addi r9, r9, -1
608 beqi r9,d_word_u1 /* t1 was 1 => 1 byte offset */
609 addi r9, r9, -1
613 bsrli r11, r11, 8 /* h = h >> 8 */
615 addi r4, r4,-4 /* n = n - 4 */
616 lw r12, r8, r4 /* v = *(as + n) */
619 sw r9, r5, r4 /* *(d + n) = t1 */
620 bneid r4, d_wu3_loop /* while (n) loop */
621 bsrli r11, r12, 8 /* h = v >> 8 (IN DELAY SLOT) */
628 addi r4, r4,-4 /* n = n - 4 */
629 lw r12, r8, r4 /* v = *(as + n) */
630 bslli r9, r12, 8 /* t1 = v << 8 */
632 sw r9, r5, r4 /* *(d + n) = t1 */
633 bneid r4, d_wu1_loop /* while (n) loop */
641 addi r4, r4,-4 /* n = n - 4 */
642 lw r12, r8, r4 /* v = *(as + n) */
645 sw r9, r5, r4 /* *(d + n) = t1 */
646 bneid r4, d_wu2_loop /* while (n) loop */
654 addi r6, r6, -1 /* s-- */
656 addi r5, r5, -1 /* d-- */
659 addi r7, r7, -1 /* c-- (IN DELAY SLOT) */
662 rtsd r15, 8
665 .size memmove, . - memmove