1 /*
2 Copyright (c) 1994 Cygnus Support.
3 All rights reserved.
4 
5 Redistribution and use in source and binary forms are permitted
6 provided that the above copyright notice and this paragraph are
7 duplicated in all such forms and that any documentation,
8 and/or other materials related to such
9 distribution and use acknowledge that the software was developed
10 at Cygnus Support, Inc.  Cygnus Support, Inc. may not be used to
11 endorse or promote products derived from this software without
12 specific prior written permission.
13 THIS SOFTWARE IS PROVIDED ``AS IS'' AND WITHOUT ANY EXPRESS OR
14 IMPLIED WARRANTIES, INCLUDING, WITHOUT LIMITATION, THE IMPLIED
15 WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE.
16  */
17 /*
18 FUNCTION
19         <<memcpy>>---copy memory regions
20 
21 SYNOPSIS
22         #include <string.h>
23         void* memcpy(void *restrict <[out]>, const void *restrict <[in]>,
24                      size_t <[n]>);
25 
26 DESCRIPTION
27         This function copies <[n]> bytes from the memory region
28         pointed to by <[in]> to the memory region pointed to by
29         <[out]>.
30 
31         If the regions overlap, the behavior is undefined.
32 
33 RETURNS
34         <<memcpy>> returns a pointer to the first byte of the <[out]>
35         region.
36 
37 PORTABILITY
38 <<memcpy>> is ANSI C.
39 
40 <<memcpy>> requires no supporting OS subroutines.
41 
42 QUICKREF
43         memcpy ansi pure
44 	*/
45 
46 #include <string.h>
47 #include "local.h"
48 #include <stdint.h>
49 
/* Nonzero if either X or Y is not aligned on a "long" boundary.
   Each argument is parenthesized before the cast so that an expression
   argument (for example `p + 1' or `c ? a : b') is converted as a whole
   rather than having the cast bind to its first operand only.  */
#define UNALIGNED(X, Y) \
  (((uintptr_t)(X) & (sizeof (long) - 1)) \
   | ((uintptr_t)(Y) & (sizeof (long) - 1)))

/* How many bytes are copied each iteration of the 4X unrolled loop.  */
#define BIGBLOCKSIZE    (sizeof (long) << 2)

/* How many bytes are copied each iteration of the word copy loop.  */
#define LITTLEBLOCKSIZE (sizeof (long))

/* Threshold for punting to the byte copier: lengths shorter than one
   big block are considered too small for the word-copy path.  */
#define TOO_SMALL(LEN)  ((LEN) < BIGBLOCKSIZE)

/* Remove any macro definition of memcpy picked up from the headers
   before the function of that name is defined.  */
#undef memcpy
64 
65 void *
66 __inhibit_loop_to_libcall
memcpy(void * __restrict dst0,const void * __restrict src0,size_t len0)67 memcpy (void *__restrict dst0,
68 	const void *__restrict src0,
69 	size_t len0)
70 {
71 #if defined(PREFER_SIZE_OVER_SPEED) || defined(__OPTIMIZE_SIZE__)
72   char *dst = (char *) dst0;
73   char *src = (char *) src0;
74 
75   void *save = dst0;
76 
77   while (len0--)
78     {
79       *dst++ = *src++;
80     }
81 
82   return save;
83 #else
84   char *dst = dst0;
85   const char *src = src0;
86   long *aligned_dst;
87   const long *aligned_src;
88 
89   /* If the size is small, or either SRC or DST is unaligned,
90      then punt into the byte copy loop.  This should be rare.  */
91   if (!TOO_SMALL(len0) && !UNALIGNED (src, dst))
92     {
93       aligned_dst = (long*)dst;
94       aligned_src = (long*)src;
95 
96       /* Copy 4X long words at a time if possible.  */
97       while (len0 >= BIGBLOCKSIZE)
98         {
99           *aligned_dst++ = *aligned_src++;
100           *aligned_dst++ = *aligned_src++;
101           *aligned_dst++ = *aligned_src++;
102           *aligned_dst++ = *aligned_src++;
103           len0 -= BIGBLOCKSIZE;
104         }
105 
106       /* Copy one long word at a time if possible.  */
107       while (len0 >= LITTLEBLOCKSIZE)
108         {
109           *aligned_dst++ = *aligned_src++;
110           len0 -= LITTLEBLOCKSIZE;
111         }
112 
113        /* Pick up any residual with a byte copier.  */
114       dst = (char*)aligned_dst;
115       src = (char*)aligned_src;
116     }
117 
118   while (len0--)
119     *dst++ = *src++;
120 
121   return dst0;
122 #endif /* not PREFER_SIZE_OVER_SPEED */
123 }
124