| 12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182 | /* * Copyright (C) 2004 Joakim Tjernlund * Copyright (C) 2000-2005 Erik Andersen <andersen@uclibc.org> * * Licensed under the LGPL v2.1, see the file COPYING.LIB in this tarball. *//* These are carefully optimized mem*() functions for PPC written in C. * Don't muck around with these function without checking the generated * assembler code. * It is possible to optimize these significantly more by using specific * data cache instructions(mainly dcbz). However that requires knownledge * about the CPU's cache line size. * * BUG ALERT! * The cache instructions on MPC8xx CPU's are buggy(they don't update * the DAR register when causing a DTLB Miss/Error) and cannot be * used on 8xx CPU's without a kernel patch to work around this * problem. */#include <string.h>/* PPC can do pre increment and load/store, but not post increment and   load/store.  Therefore use *++ptr instead of *ptr++.  */void *memcpy(void *to, const void *from, size_t len){	unsigned long rem, chunks, tmp1, tmp2;	unsigned char *tmp_to;	unsigned char *tmp_from = (unsigned char *)from;	chunks = len / 8;	tmp_from -= 4;	tmp_to = to - 4;	if (!chunks)		goto lessthan8;	rem = (unsigned long )tmp_to % 4;	if (rem)		goto align; copy_chunks:	do {		/* make gcc to load all data, then store it */		tmp1 = *(unsigned long *)(tmp_from+4);		tmp_from += 8;		tmp2 = *(unsigned long *)tmp_from;		*(unsigned long *)(tmp_to+4) = tmp1;		tmp_to += 8;		*(unsigned long *)tmp_to = tmp2;	} while (--chunks); lessthan8:	len = len % 8;	if (len >= 4) {		tmp_from += 4;		tmp_to += 4;		*(unsigned long *)(tmp_to) = *(unsigned long *)(tmp_from);		len -= 4;	}	if (!len)		return to;	tmp_from += 3;	tmp_to += 3;	do {		*++tmp_to = *++tmp_from;	} while (--len);	return to; align:	/* ???: Do we really need to generate the carry flag here? If not, then:	rem -= 4; */	rem = 4 - rem;	len -= rem;	do {		*(tmp_to+4) = *(tmp_from+4);		++tmp_from;		++tmp_to;	} while (--rem);	chunks = len / 8;	if (chunks)		goto copy_chunks;	goto lessthan8;}libc_hidden_def(memcpy)
 |