OpenCores
URL https://opencores.org/ocsvn/openrisc_2011-10-31/openrisc_2011-10-31/trunk

Subversion Repositories openrisc_2011-10-31

[/] [openrisc/] [tags/] [gnu-src/] [newlib-1.18.0/] [newlib-1.18.0-or32-1.0rc1/] [newlib/] [libc/] [machine/] [mips/] [memcpy.c] - Diff between revs 207 and 345

Only display areas with differences | Details | Blame | View Log

Rev 207 Rev 345
/*
/*
FUNCTION
FUNCTION
        <<memcpy>>---copy memory regions, optimized for the mips processors
        <<memcpy>>---copy memory regions, optimized for the mips processors
 
 
ANSI_SYNOPSIS
ANSI_SYNOPSIS
        #include <string.h>
        #include <string.h>
        void* memcpy(void *<[out]>, const void *<[in]>, size_t <[n]>);
        void* memcpy(void *<[out]>, const void *<[in]>, size_t <[n]>);
 
 
TRAD_SYNOPSIS
TRAD_SYNOPSIS
        void *memcpy(<[out]>, <[in]>, <[n]>)
        void *memcpy(<[out]>, <[in]>, <[n]>)
        void *<[out]>;
        void *<[out]>;
        void *<[in]>;
        void *<[in]>;
        size_t <[n]>;
        size_t <[n]>;
 
 
DESCRIPTION
DESCRIPTION
        This function copies <[n]> bytes from the memory region
        This function copies <[n]> bytes from the memory region
        pointed to by <[in]> to the memory region pointed to by
        pointed to by <[in]> to the memory region pointed to by
        <[out]>.
        <[out]>.
 
 
        If the regions overlap, the behavior is undefined.
        If the regions overlap, the behavior is undefined.
 
 
RETURNS
RETURNS
        <<memcpy>> returns a pointer to the first byte of the <[out]>
        <<memcpy>> returns a pointer to the first byte of the <[out]>
        region.
        region.
 
 
PORTABILITY
PORTABILITY
<<memcpy>> is ANSI C.
<<memcpy>> is ANSI C.
 
 
<<memcpy>> requires no supporting OS subroutines.
<<memcpy>> requires no supporting OS subroutines.
 
 
QUICKREF
QUICKREF
        memcpy ansi pure
        memcpy ansi pure
        */
        */
 
 
#include <_ansi.h>
#include <_ansi.h>
#include <stddef.h>
#include <stddef.h>
#include <limits.h>
#include <limits.h>
 
 
/* wordtype is the unit used by the aligned copy loops: long long when
   __mips64 is defined, long otherwise.  */
#ifdef __mips64
#ifdef __mips64
#define wordtype long long
#define wordtype long long
#else
#else
#define wordtype long
#define wordtype long
#endif
#endif
 
 
/* Nonzero if either X or Y is not aligned on a wordtype boundary.
   X and Y are not parenthesized in the expansion, so pass plain
   identifiers rather than compound expressions.  */
/* Nonzero if either X or Y is not aligned on a wordtype boundary.
   X and Y are not parenthesized in the expansion, so pass plain
   identifiers rather than compound expressions.  */
#define UNALIGNED(X, Y) \
#define UNALIGNED(X, Y) \
  (((long)X & (sizeof (wordtype) - 1)) | ((long)Y & (sizeof (wordtype) - 1)))
  (((long)X & (sizeof (wordtype) - 1)) | ((long)Y & (sizeof (wordtype) - 1)))
 
 
/* How many bytes are copied each iteration of the 4X unrolled loop.  */
/* How many bytes are copied each iteration of the 4X unrolled loop.  */
#define BIGBLOCKSIZE    (sizeof (wordtype) << 2)
#define BIGBLOCKSIZE    (sizeof (wordtype) << 2)
 
 
/* How many bytes are copied each iteration of the word copy loop.  */
/* How many bytes are copied each iteration of the word copy loop.  */
#define LITTLEBLOCKSIZE (sizeof (wordtype))
#define LITTLEBLOCKSIZE (sizeof (wordtype))
 
 
/* Threshold for punting to the byte copier.
   NOTE(review): not referenced by the memcpy body visible here.  */
/* Threshold for punting to the byte copier.
   NOTE(review): not referenced by the memcpy body visible here.  */
#define TOO_SMALL(LEN)  ((LEN) < BIGBLOCKSIZE)
#define TOO_SMALL(LEN)  ((LEN) < BIGBLOCKSIZE)
 
 
/* memcpy: copy len0 bytes from src0 to dst0 and return dst0.

   When PREFER_SIZE_OVER_SPEED, __OPTIMIZE_SIZE__ or __mips16 is defined
   the body is a plain byte loop.  Otherwise the copy runs a wordtype at a
   time when both pointers are wordtype-aligned, and through ulw/usw
   (unless NO_UNALIGNED_LOADSTORE is defined) followed by a byte loop when
   they are not.  */
_PTR
_PTR
_DEFUN (memcpy, (dst0, src0, len0),
_DEFUN (memcpy, (dst0, src0, len0),
        _PTR dst0 _AND
        _PTR dst0 _AND
        _CONST _PTR src0 _AND
        _CONST _PTR src0 _AND
        size_t len0)
        size_t len0)
{
{
#if defined(PREFER_SIZE_OVER_SPEED) || defined(__OPTIMIZE_SIZE__) || defined(__mips16)
#if defined(PREFER_SIZE_OVER_SPEED) || defined(__OPTIMIZE_SIZE__) || defined(__mips16)
  /* Size-optimized variant: one byte per iteration.  */
  char *dst = (char *) dst0;
  char *dst = (char *) dst0;
  char *src = (char *) src0;
  char *src = (char *) src0;
 
 
  /* Remember the start of the destination for the return value.  */
  _PTR save = dst0;
  _PTR save = dst0;
 
 
  while (len0--)
  while (len0--)
    {
    {
      *dst++ = *src++;
      *dst++ = *src++;
    }
    }
 
 
  return save;
  return save;
#else
#else
  char *dst = dst0;
  char *dst = dst0;
  _CONST char *src = src0;
  _CONST char *src = src0;
  wordtype *aligned_dst;
  wordtype *aligned_dst;
  _CONST wordtype *aligned_src;
  _CONST wordtype *aligned_src;
  /* NOTE(review): len0 is a size_t but is held in an int from here on; a
     count that does not fit in int is not preserved by this conversion.
     Confirm that such sizes cannot reach this routine on the targets it
     is built for.  */
  int   len =  len0;
  int   len =  len0;
  size_t iter;
  size_t iter;
 
 
  /* Handle aligned moves here.  */
  /* Handle aligned moves here.  */
  if (!UNALIGNED (src, dst))
  if (!UNALIGNED (src, dst))
    {
    {
      /* iter = number of 4-word blocks; len keeps the remainder.  */
      iter = len / BIGBLOCKSIZE;
      iter = len / BIGBLOCKSIZE;
      len = len % BIGBLOCKSIZE;
      len = len % BIGBLOCKSIZE;
      aligned_dst = (wordtype *)dst;
      aligned_dst = (wordtype *)dst;
      aligned_src = (wordtype *)src;
      aligned_src = (wordtype *)src;
 
 
      /* Copy 4X long or long long words at a time if possible.
         All four words are loaded into temporaries before any is stored.  */
      /* Copy 4X long or long long words at a time if possible.
         All four words are loaded into temporaries before any is stored.  */
      while (iter > 0)
      while (iter > 0)
        {
        {
          wordtype tmp0 = aligned_src[0];
          wordtype tmp0 = aligned_src[0];
          wordtype tmp1 = aligned_src[1];
          wordtype tmp1 = aligned_src[1];
          wordtype tmp2 = aligned_src[2];
          wordtype tmp2 = aligned_src[2];
          wordtype tmp3 = aligned_src[3];
          wordtype tmp3 = aligned_src[3];
 
 
          aligned_dst[0] = tmp0;
          aligned_dst[0] = tmp0;
          aligned_dst[1] = tmp1;
          aligned_dst[1] = tmp1;
          aligned_dst[2] = tmp2;
          aligned_dst[2] = tmp2;
          aligned_dst[3] = tmp3;
          aligned_dst[3] = tmp3;
          aligned_src += 4;
          aligned_src += 4;
          aligned_dst += 4;
          aligned_dst += 4;
          iter--;
          iter--;
        }
        }
 
 
      /* Copy one long or long long word at a time if possible.  */
      /* Copy one long or long long word at a time if possible.  */
      iter = len / LITTLEBLOCKSIZE;
      iter = len / LITTLEBLOCKSIZE;
      len = len % LITTLEBLOCKSIZE;
      len = len % LITTLEBLOCKSIZE;
 
 
      while (iter > 0)
      while (iter > 0)
        {
        {
          *aligned_dst++ = *aligned_src++;
          *aligned_dst++ = *aligned_src++;
          iter--;
          iter--;
        }
        }
 
 
      /* Pick up any residual with a byte copier.  */
      /* Pick up any residual with a byte copier.  */
      dst = (char*)aligned_dst;
      dst = (char*)aligned_dst;
      src = (char*)aligned_src;
      src = (char*)aligned_src;
 
 
      while (len > 0)
      while (len > 0)
        {
        {
          *dst++ = *src++;
          *dst++ = *src++;
          len--;
          len--;
        }
        }
 
 
      return dst0;
      return dst0;
    }
    }
 
 
  /* Handle unaligned moves here, using lwr/lwl and swr/swl where possible */
  /* Handle unaligned moves here, using lwr/lwl and swr/swl where possible */
  else
  else
    {
    {
#ifndef NO_UNALIGNED_LOADSTORE
#ifndef NO_UNALIGNED_LOADSTORE
      /* Each ulw/usw pair moves one int while iter counts 4-byte units;
         this assumes sizeof (int) == 4 -- TODO confirm for the target ABI.  */
      int tmp;
      int tmp;
      int *int_src = (int *)src;
      int *int_src = (int *)src;
      int *int_dst = (int *)dst;
      int *int_dst = (int *)dst;
      iter = len / 4;
      iter = len / 4;
      len = len % 4;
      len = len % 4;
      while (iter > 0)
      while (iter > 0)
        {
        {
          __asm__ ("ulw %0,%1" : "=r" (tmp) : "m" (*int_src));
          __asm__ ("ulw %0,%1" : "=r" (tmp) : "m" (*int_src));
          iter--;
          iter--;
          int_src++;
          int_src++;
          __asm__ ("usw %1,%0" : "=m" (*int_dst) : "r" (tmp));
          __asm__ ("usw %1,%0" : "=m" (*int_dst) : "r" (tmp));
          int_dst++;
          int_dst++;
        }
        }
 
 
      /* Pick up any residual with a byte copier.  */
      /* Pick up any residual with a byte copier.  */
      dst = (char*)int_dst;
      dst = (char*)int_dst;
      src = (char*)int_src;
      src = (char*)int_src;
#endif
#endif
 
 
      /* With NO_UNALIGNED_LOADSTORE defined, len is still the full count
         here and this byte loop performs the entire copy.  */
      while (len > 0)
      while (len > 0)
        {
        {
          *dst++ = *src++;
          *dst++ = *src++;
          len--;
          len--;
        }
        }
 
 
      return dst0;
      return dst0;
    }
    }
#endif /* not PREFER_SIZE_OVER_SPEED */
#endif /* not PREFER_SIZE_OVER_SPEED */
}
}
 
 

powered by: WebSVN 2.1.0

© copyright 1999-2024 OpenCores.org, equivalent to Oliscience, all rights reserved. OpenCores®, registered trademark.