165 lines
		
	
	
		
			3.5 KiB
		
	
	
	
		
			C
		
	
	
	
			
		
		
	
	
			165 lines
		
	
	
		
			3.5 KiB
		
	
	
	
		
			C
		
	
	
	
| /*
 | |
| FUNCTION
 | |
|         <<memcpy>>---copy memory regions, optimized for the mips processors
 | |
| 
 | |
| ANSI_SYNOPSIS
 | |
|         #include <string.h>
 | |
|         void* memcpy(void *<[out]>, const void *<[in]>, size_t <[n]>);
 | |
| 
 | |
| TRAD_SYNOPSIS
 | |
|         void *memcpy(<[out]>, <[in]>, <[n]>)
 | |
|         void *<[out]>;
 | |
|         void *<[in]>;
 | |
|         size_t <[n]>;
 | |
| 
 | |
| DESCRIPTION
 | |
|         This function copies <[n]> bytes from the memory region
 | |
|         pointed to by <[in]> to the memory region pointed to by
 | |
|         <[out]>.
 | |
| 
 | |
|         If the regions overlap, the behavior is undefined.
 | |
| 
 | |
| RETURNS
 | |
|         <<memcpy>> returns a pointer to the first byte of the <[out]>
 | |
|         region.
 | |
| 
 | |
| PORTABILITY
 | |
| <<memcpy>> is ANSI C.
 | |
| 
 | |
| <<memcpy>> requires no supporting OS subroutines.
 | |
| 
 | |
| QUICKREF
 | |
|         memcpy ansi pure
 | |
| 	*/
 | |
| 
 | |
| #include <_ansi.h>
 | |
| #include <stddef.h>
 | |
| #include <limits.h>
 | |
| 
 | |
/* Integer type moved per load/store by the aligned copy loops:
   "long long" when __mips64 is defined, otherwise "long".  */
#ifdef __mips64
#define wordtype long long
#else
#define wordtype long
#endif

/* Nonzero if either X or Y is not aligned on a wordtype boundary.
   X and Y are pointer expressions; each is fully parenthesized so that
   compound arguments (e.g. a conditional expression) are cast as a whole,
   and each is evaluated exactly once.  */
#define UNALIGNED(X, Y) \
  (((long) (X) & (sizeof (wordtype) - 1)) \
   | ((long) (Y) & (sizeof (wordtype) - 1)))

/* How many bytes are copied each iteration of the 4X unrolled loop.  */
#define BIGBLOCKSIZE    (sizeof (wordtype) << 2)

/* How many bytes are copied each iteration of the word copy loop.  */
#define LITTLEBLOCKSIZE (sizeof (wordtype))

/* Threshold for punting to the byte copier.  */
#define TOO_SMALL(LEN)  ((LEN) < BIGBLOCKSIZE)
 | |
| 
 | |
| _PTR
 | |
| _DEFUN (memcpy, (dst0, src0, len0),
 | |
| 	_PTR dst0 _AND
 | |
| 	_CONST _PTR src0 _AND
 | |
| 	size_t len0)
 | |
| {
 | |
| #if defined(PREFER_SIZE_OVER_SPEED) || defined(__OPTIMIZE_SIZE__) || defined(__mips16)
 | |
|   char *dst = (char *) dst0;
 | |
|   char *src = (char *) src0;
 | |
| 
 | |
|   _PTR save = dst0;
 | |
| 
 | |
|   while (len0--)
 | |
|     {
 | |
|       *dst++ = *src++;
 | |
|     }
 | |
| 
 | |
|   return save;
 | |
| #else
 | |
|   char *dst = dst0;
 | |
|   _CONST char *src = src0;
 | |
|   wordtype *aligned_dst;
 | |
|   _CONST wordtype *aligned_src;
 | |
|   int   len =  len0;
 | |
|   size_t iter;
 | |
| 
 | |
|   /* Handle aligned moves here.  */
 | |
|   if (!UNALIGNED (src, dst))
 | |
|     {
 | |
|       iter = len / BIGBLOCKSIZE;
 | |
|       len = len % BIGBLOCKSIZE;
 | |
|       aligned_dst = (wordtype *)dst;
 | |
|       aligned_src = (wordtype *)src;
 | |
| 
 | |
| 	  /* Copy 4X long or long long words at a time if possible.  */
 | |
|       while (iter > 0)
 | |
| 	{
 | |
| 	  wordtype tmp0 = aligned_src[0];
 | |
| 	  wordtype tmp1 = aligned_src[1];
 | |
| 	  wordtype tmp2 = aligned_src[2];
 | |
| 	  wordtype tmp3 = aligned_src[3];
 | |
| 
 | |
| 	  aligned_dst[0] = tmp0;
 | |
| 	  aligned_dst[1] = tmp1;
 | |
| 	  aligned_dst[2] = tmp2;
 | |
| 	  aligned_dst[3] = tmp3;
 | |
| 	  aligned_src += 4;
 | |
| 	  aligned_dst += 4;
 | |
| 	  iter--;
 | |
| 	}
 | |
| 
 | |
|       /* Copy one long or long long word at a time if possible.  */
 | |
|       iter = len / LITTLEBLOCKSIZE;
 | |
|       len = len % LITTLEBLOCKSIZE;
 | |
| 
 | |
|       while (iter > 0)
 | |
| 	{
 | |
| 	  *aligned_dst++ = *aligned_src++;
 | |
| 	  iter--;
 | |
| 	}
 | |
| 
 | |
|       /* Pick up any residual with a byte copier.  */
 | |
|       dst = (char*)aligned_dst;
 | |
|       src = (char*)aligned_src;
 | |
| 
 | |
|       while (len > 0)
 | |
| 	{
 | |
| 	  *dst++ = *src++;
 | |
| 	  len--;
 | |
| 	}
 | |
| 
 | |
|       return dst0;
 | |
|     }
 | |
| 
 | |
|   /* Handle unaligned moves here, using lwr/lwl and swr/swl where possible */
 | |
|   else
 | |
|     {
 | |
| #ifndef NO_UNALIGNED_LOADSTORE
 | |
|       int tmp;
 | |
|       int *int_src = (int *)src;
 | |
|       int *int_dst = (int *)dst;
 | |
|       iter = len / 4;
 | |
|       len = len % 4;
 | |
|       while (iter > 0)
 | |
| 	{
 | |
| 	  __asm__ ("ulw %0,%1" : "=r" (tmp) : "m" (*int_src));
 | |
| 	  iter--;
 | |
| 	  int_src++;
 | |
| 	  __asm__ ("usw %1,%0" : "=m" (*int_dst) : "r" (tmp));
 | |
| 	  int_dst++;
 | |
| 	}
 | |
| 
 | |
|       /* Pick up any residual with a byte copier.  */
 | |
|       dst = (char*)int_dst;
 | |
|       src = (char*)int_src;
 | |
| #endif
 | |
| 
 | |
|       while (len > 0)
 | |
| 	{
 | |
| 	  *dst++ = *src++;
 | |
| 	  len--;
 | |
| 	}
 | |
| 
 | |
|       return dst0;
 | |
|     }
 | |
| #endif /* not PREFER_SIZE_OVER_SPEED */
 | |
| }
 |