123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100 |
- /* memmove.S
- * Copyright (C) 2003-2007 Analog Devices Inc., All Rights Reserved.
- *
- * This file is subject to the terms and conditions of the GNU Library General
- * Public License. See the file "COPYING.LIB" in the main directory of this
- * archive for more details.
- *
- * Non-LGPL License also available as part of VisualDSP++
- * http://www.analog.com/processors/resources/crosscore/visualDspDevSoftware.html
- */
- #include <sysdep.h>
- /* void *memmove(void *dest, const void *src, size_t n);
- *
- * Copy n bytes from src to dest. The two regions may overlap.
- *
- * R0 = To Address (dest) (leave unchanged to form result)
- * R1 = From Address (src)
- * R2 = count (n)
- *
- * Paths through the routine:
- * - n == 0: nothing is copied.
- * - src < dest and dest <= src + n (unsigned compares): bytes are copied
- *   one at a time from the highest address down (.Loverlap), so source
- *   bytes are read before the copy overwrites them.
- * - otherwise the copy runs forwards: 32-bit words when n > 11 and both
- *   addresses have their bottom two bits clear, followed by a byte loop
- *   for the n & 3 leftover bytes; a plain byte loop in all other cases.
- *
- * Working registers: P0 = dest cursor, P3 = src cursor, P2 = byte count,
- * P1 = word-loop count, I0 = src cursor in the word loop. I1 holds the
- * entry value of P3, which is put back before every RTS. R1, R2, R3, CC
- * and LC0 are also written; R0 is never written.
- *
- * Note: Data may overlap
- */
- .text
- .align 2
- .weak _memmove
- ENTRY(_memmove)
- I1 = P3; /* Keep the incoming P3; every exit restores it from I1 */
- P0 = R0; /* P0 = To address */
- P3 = R1; /* P3 = From Address */
- P2 = R2; /* P2 = count */
- CC = P2 == 0; /* Check zero count*/
- IF CC JUMP .Lfinished; /* very unlikely */
- CC = R1 < R0 (IU); /* From < To */
- IF !CC JUMP .Lno_overlap; /* From >= To: a forward copy is safe */
- R3 = R1 + R2; /* R3 = From + count */
- CC = R0 <= R3 (IU); /* (From+len) >= To */
- IF CC JUMP .Loverlap; /* To lies within [From, From+len]: copy backwards */
- .Lno_overlap: /* Forward copy */
- R3 = 11;
- CC = R2 <= R3; /* NOTE(review): no (IU) suffix here, unlike the compares above - presumably a signed compare; confirm */
- IF CC JUMP .Lbytes; /* count <= 11: use the byte loop */
- R3 = R1 | R0; /* OR addresses together */
- R3 <<= 30; /* check bottom two bits */
- CC = AZ; /* AZ set if zero.*/
- IF !CC JUMP .Lbytes; /* Jump if addrs not aligned.*/
- I0 = P3; /* I0 = From address for the word loop */
- P1 = P2 >> 2; /* count = n/4 */
- P1 += -1; /* one less: first load is done before the loop, last store after it */
- R3 = 3;
- R2 = R2 & R3; /* remainder */
- P2 = R2; /* set remainder */
- R1 = [I0++]; /* preload the first word */
- #if !defined(__WORKAROUND_AVOID_DAG1)
- LSETUP (.Lquad_loop, .Lquad_loop) LC0=P1;
- .Lquad_loop: MNOP || [P0++] = R1 || R1 = [I0++]; /* store the current word and load the next in one instruction */
- #else /* same store-then-load pair, written as two separate instructions */
- LSETUP (.Lquad_loop_s, .Lquad_loop_e) LC0=P1;
- .Lquad_loop_s: [P0++] = R1;
- .Lquad_loop_e: R1 = [I0++];
- #endif
- [P0++] = R1; /* store the last word loaded */
- CC = P2 == 0; /* any remaining bytes? */
- P3 = I0; /* Amend P3 to updated ptr. */
- IF !CC JUMP .Lbytes;
- P3 = I1; /* restore entry value of P3 */
- RTS;
- .Lbytes: LSETUP (.Lbyte2_s, .Lbyte2_e) LC0=P2; /* P2 = bytes left to copy; non-zero on every path that reaches here */
- .Lbyte2_s: R1 = B[P3++](Z); /* load one byte from From */
- .Lbyte2_e: B[P0++] = R1; /* store it to To */
- .Lfinished: P3 = I1; /* restore entry value of P3 */
- RTS;
- .Loverlap: /* Backward byte copy, highest address first */
- P2 += -1; /* P2 = count - 1 */
- P0 = P0 + P2; /* P0 = address of the last byte of To */
- P3 = P3 + P2; /* P3 = address of the last byte of From */
- R1 = B[P3--] (Z); /* preload the last source byte */
- CC = P2 == 0; /* count was 1: only the final store remains */
- IF CC JUMP .Lno_loop;
- #if defined(__WORKAROUND_SPECULATIVE_LOADS)
- NOP; /* NOTE(review): presumably padding required by the named workaround; the reason is not visible here */
- NOP;
- #endif
- LSETUP (.Lol_s, .Lol_e) LC0 = P2; /* count - 1 iterations */
- .Lol_s: B[P0--] = R1; /* store the byte loaded previously */
- .Lol_e: R1 = B[P3--] (Z); /* load the next lower byte */
- .Lno_loop: B[P0] = R1; /* store the final (lowest-address) byte */
- P3 = I1; /* restore entry value of P3 */
- RTS;
- .size _memmove,.-_memmove
- libc_hidden_def (memmove)
|