123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201 |
- /*
- * This program is free software; you can redistribute it and/or modify it under
- * the terms of the GNU Library General Public License as published by the Free
- * Software Foundation; either version 2 of the License, or (at your option) any
- * later version.
- *
- * This program is distributed in the hope that it will be useful, but WITHOUT
- * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
- * FOR A PARTICULAR PURPOSE. See the GNU Library General Public License for more
- * details.
- */
- /* These are carefully optimized mem*() functions for PPC written in C.
- * Don't muck around with these function without checking the generated
- * assmbler code.
- * It is possible to optimize these significantly more by using specific
- * data cache instructions(mainly dcbz). However that requires knownledge
- * about the CPU's cache line size.
- *
- * BUG ALERT!
- * The cache instructions on MPC8xx CPU's are buggy(they don't update
- * the DAR register when causing a DTLB Miss/Error) and cannot be
- * used on 8xx CPU's without a kernel patch to work around this
- * problem.
- *
- * Copyright (C) 2004 Joakim Tjernlund
- */
- #define _STDIO_UTILITY
- #define _GNU_SOURCE
- #include <string.h>
- #include <locale.h> /* for __LOCALE_C_ONLY */
- #ifdef L_memcpy
- void *memcpy(void *to, const void *from, size_t n)
- /* PPC can do pre increment and load/store, but not post increment and load/store.
- Therefore use *++ptr instead of *ptr++. */
- {
- unsigned long rem, chunks, tmp1, tmp2;
- void *tmp_to;
- chunks = n / 8;
- from -= 4;
- tmp_to = to - 4;
- if (!chunks)
- goto lessthan8;
- rem = (unsigned long )tmp_to % 4;
- if (rem)
- goto align;
- copy_chunks:
- do {
- /* make gcc to load all data, then store it */
- tmp1 = *(unsigned long *)(from+4);
- from += 8;
- tmp2 = *(unsigned long *)from;
- *(unsigned long *)(tmp_to+4) = tmp1;
- tmp_to += 8;
- *(unsigned long *)tmp_to = tmp2;
- } while (--chunks);
- lessthan8:
- n = n % 8;
- if (n >= 4) {
- *++(unsigned long *)tmp_to = *++(unsigned long *)from;
- n = n-4;
- }
- if (!n ) return to;
- from += 3;
- tmp_to += 3;
- do {
- *++(unsigned char *)tmp_to = *++(unsigned char *)from;
- } while (--n);
-
- return to;
- align:
- rem = 4 - rem;
- n = n-rem;
- do {
- *(unsigned char *)(tmp_to+4) = *(unsigned char *)(from+4);
- ++from;
- ++tmp_to;
- } while (--rem);
- chunks = n / 8;
- if (chunks)
- goto copy_chunks;
- goto lessthan8;
- }
- #endif
- #ifdef L_memmove
- void *memmove(void *to, const void *from, size_t n)
- {
- unsigned long rem, chunks, tmp1, tmp2;
- void *tmp_to;
- if (from >= to)
- return memcpy(to, from, n);
- chunks = n / 8;
- from += n;
- tmp_to = to + n;
- if (!chunks)
- goto lessthan8;
- rem = (unsigned long )tmp_to % 4;
- if (rem)
- goto align;
- copy_chunks:
- do {
- /* make gcc to load all data, then store it */
- tmp1 = *(unsigned long *)(from-4);
- from -= 8;
- tmp2 = *(unsigned long *)from;
- *(unsigned long *)(tmp_to-4) = tmp1;
- tmp_to -= 8;
- *(unsigned long *)tmp_to = tmp2;
- } while (--chunks);
- lessthan8:
- n = n % 8;
- if (n >= 4) {
- *--(unsigned long *)tmp_to = *--(unsigned long *)from;
- n = n-4;
- }
- if (!n ) return to;
- do {
- *--(unsigned char *)tmp_to = *--(unsigned char *)from;
- } while (--n);
-
- return to;
- align:
- rem = 4 - rem;
- n = n-rem;
- do {
- *--(unsigned char *)tmp_to = *--(unsigned char *)from;
- } while (--rem);
- chunks = n / 8;
- if (chunks)
- goto copy_chunks;
- goto lessthan8;
- }
- #endif
- #ifdef L_memset
- static inline int expand_byte_word(int c){
- /* this does:
- c = c << 8 | c;
- c = c << 16 | c ;
- */
- asm("rlwimi %0,%0,8,16,23\n"
- "\trlwimi %0,%0,16,0,15\n"
- : "=r" (c) : "0" (c));
- return c;
- }
- void *memset(void *to, int c, size_t n)
- {
- unsigned long rem, chunks;
- void *tmp_to;
- chunks = n / 8;
- tmp_to = to - 4;
- c = expand_byte_word(c);
- if (!chunks)
- goto lessthan8;
- rem = (unsigned long )tmp_to % 4;
- if (rem)
- goto align;
- copy_chunks:
- do {
- *++(unsigned long *)tmp_to = c;
- *++(unsigned long *)tmp_to = c;
- } while (--chunks);
- lessthan8:
- n = n % 8;
- if (n >= 4) {
- *++(unsigned long *)tmp_to = c;
- n = n-4;
- }
- if (!n ) return to;
- tmp_to += 3;
- do {
- *++(unsigned char *)tmp_to = c;
- } while (--n);
-
- return to;
- align:
- rem = 4 - rem;
- n = n-rem;
- do {
- *(unsigned char *)(tmp_to+4) = c;
- ++tmp_to;
- } while (--rem);
- chunks = n / 8;
- if (chunks)
- goto copy_chunks;
- goto lessthan8;
- }
- #endif
- #ifdef L_bzero
- void bzero(void *s, size_t n)
- {
- (void)memset(s, 0, n);
- }
- #endif
|