| /* |
| * internal version of memcpy(), issued by the compiler to copy blocks of |
| * data around. This is really memmove() - it has to be able to deal with |
| * possible overlaps, because that ambiguity is when the compiler gives up |
| * and calls a function. We have our own, internal version so that we get |
| * something we trust, even if the user has redefined the normal symbol. |
| * |
| * Copyright 2004-2009 Analog Devices Inc. |
| * |
| * Licensed under the ADI BSD license or the GPL-2 (or later) |
| */ |
| |
| #include <linux/linkage.h> |
| |
| /* void *memcpy(void *dest, const void *src, size_t n); |
| * R0 = To Address (dest) (leave unchanged to form result) |
| * R1 = From Address (src) |
| * R2 = count |
| * |
| * Note: Favours word alignment |
| */ |
| |
| #ifdef CONFIG_MEMCPY_L1 |
| .section .l1.text |
| #else |
| .text |
| #endif |
| |
| .align 2 |
| |
| ENTRY(_memcpy) |
| CC = R2 <= 0; /* length not positive? */ |
| IF CC JUMP .L_P1L2147483647; /* Nothing to do */ |
| |
| P0 = R0 ; /* dst*/ |
| P1 = R1 ; /* src*/ |
| P2 = R2 ; /* length */ |
| |
| /* check for overlapping data */ |
| CC = R1 < R0; /* src < dst */ |
| IF !CC JUMP .Lno_overlap; |
| R3 = R1 + R2; |
| CC = R0 < R3; /* and dst < src+len */ |
| IF CC JUMP .Lhas_overlap; |
| |
| .Lno_overlap: |
| /* Check for aligned data.*/ |
| |
| R3 = R1 | R0; |
| R1 = 0x3; |
| R3 = R3 & R1; |
| CC = R3; /* low bits set on either address? */ |
| IF CC JUMP .Lnot_aligned; |
| |
| /* Both addresses are word-aligned, so we can copy |
| at least part of the data using word copies.*/ |
| P2 = P2 >> 2; |
| CC = P2 <= 2; |
| IF !CC JUMP .Lmore_than_seven; |
| /* less than eight bytes... */ |
| P2 = R2; |
| LSETUP(.Lthree_start, .Lthree_end) LC0=P2; |
| .Lthree_start: |
| R3 = B[P1++] (X); |
| .Lthree_end: |
| B[P0++] = R3; |
| |
| RTS; |
| |
| .Lmore_than_seven: |
| /* There's at least eight bytes to copy. */ |
| P2 += -1; /* because we unroll one iteration */ |
| LSETUP(.Lword_loops, .Lword_loope) LC0=P2; |
| I1 = P1; |
| R3 = [I1++]; |
| #if ANOMALY_05000202 |
| .Lword_loops: |
| [P0++] = R3; |
| .Lword_loope: |
| R3 = [I1++]; |
| #else |
| .Lword_loops: |
| .Lword_loope: |
| MNOP || [P0++] = R3 || R3 = [I1++]; |
| #endif |
| [P0++] = R3; |
| /* Any remaining bytes to copy? */ |
| R3 = 0x3; |
| R3 = R2 & R3; |
| CC = R3 == 0; |
| P1 = I1; /* in case there's something left, */ |
| IF !CC JUMP .Lbytes_left; |
| RTS; |
| .Lbytes_left: P2 = R3; |
| .Lnot_aligned: |
| /* From here, we're copying byte-by-byte. */ |
| LSETUP (.Lbyte_start, .Lbyte_end) LC0=P2; |
| .Lbyte_start: |
| R1 = B[P1++] (X); |
| .Lbyte_end: |
| B[P0++] = R1; |
| |
| .L_P1L2147483647: |
| RTS; |
| |
| .Lhas_overlap: |
| /* Need to reverse the copying, because the |
| * dst would clobber the src. |
| * Don't bother to work out alignment for |
| * the reverse case. |
| */ |
| P0 = P0 + P2; |
| P0 += -1; |
| P1 = P1 + P2; |
| P1 += -1; |
| LSETUP(.Lover_start, .Lover_end) LC0=P2; |
| .Lover_start: |
| R1 = B[P1--] (X); |
| .Lover_end: |
| B[P0--] = R1; |
| |
| RTS; |
| |
| ENDPROC(_memcpy) |