xref: /freebsd/sys/libkern/bcopy.c (revision fdafd315ad0d0f28a11b9fb4476a9ab059c62b92)
15aa07b05SWarner Losh /*-
25aa07b05SWarner Losh  * SPDX-License-Identifier: BSD-3-Clause
35aa07b05SWarner Losh  * Copyright (c) 1990 The Regents of the University of California.
45aa07b05SWarner Losh  *
55aa07b05SWarner Losh  * All rights reserved.
65aa07b05SWarner Losh  *
75aa07b05SWarner Losh  * This code is derived from software contributed to Berkeley by
85aa07b05SWarner Losh  * Chris Torek.
95aa07b05SWarner Losh  *
105aa07b05SWarner Losh  * Redistribution and use in source and binary forms, with or without
115aa07b05SWarner Losh  * modification, are permitted provided that the following conditions
125aa07b05SWarner Losh  * are met:
135aa07b05SWarner Losh  * 1. Redistributions of source code must retain the above copyright
145aa07b05SWarner Losh  *    notice, this list of conditions and the following disclaimer.
155aa07b05SWarner Losh  * 2. Redistributions in binary form must reproduce the above copyright
165aa07b05SWarner Losh  *    notice, this list of conditions and the following disclaimer in the
175aa07b05SWarner Losh  *    documentation and/or other materials provided with the distribution.
185aa07b05SWarner Losh  * 3. Neither the name of the University nor the names of its contributors
195aa07b05SWarner Losh  *    may be used to endorse or promote products derived from this software
205aa07b05SWarner Losh  *    without specific prior written permission.
215aa07b05SWarner Losh  *
225aa07b05SWarner Losh  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
235aa07b05SWarner Losh  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
245aa07b05SWarner Losh  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
255aa07b05SWarner Losh  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
265aa07b05SWarner Losh  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
275aa07b05SWarner Losh  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
285aa07b05SWarner Losh  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
295aa07b05SWarner Losh  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
305aa07b05SWarner Losh  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
315aa07b05SWarner Losh  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
325aa07b05SWarner Losh  * SUCH DAMAGE.
335aa07b05SWarner Losh  */
345aa07b05SWarner Losh 
355aa07b05SWarner Losh #include <sys/param.h>
365aa07b05SWarner Losh #ifdef _KERNEL
375aa07b05SWarner Losh #include <sys/systm.h>
385aa07b05SWarner Losh #else
395aa07b05SWarner Losh #include <string.h>
405aa07b05SWarner Losh #endif
415aa07b05SWarner Losh 
42*baaa3c4dSWarner Losh #undef memcpy
43*baaa3c4dSWarner Losh #undef memmove
44*baaa3c4dSWarner Losh 
455aa07b05SWarner Losh /*
465aa07b05SWarner Losh  * sizeof(word) MUST BE A POWER OF TWO
475aa07b05SWarner Losh  * SO THAT wmask BELOW IS ALL ONES
485aa07b05SWarner Losh  */
495aa07b05SWarner Losh typedef	long	word;		/* "word" used for optimal copy speed */
505aa07b05SWarner Losh 
515aa07b05SWarner Losh #define	wsize	sizeof(word)
525aa07b05SWarner Losh #define wmask	(wsize - 1)
535aa07b05SWarner Losh 
545aa07b05SWarner Losh /*
555aa07b05SWarner Losh  * Copy a block of memory, handling overlap.
565aa07b05SWarner Losh  * This is the routine that actually implements
575aa07b05SWarner Losh  * (the portable versions of) bcopy, memcpy, and memmove.
585aa07b05SWarner Losh  */
595aa07b05SWarner Losh void *
memcpy(void * dst0,const void * src0,size_t length)605aa07b05SWarner Losh memcpy(void *dst0, const void *src0, size_t length)
615aa07b05SWarner Losh {
625aa07b05SWarner Losh 	char		*dst;
635aa07b05SWarner Losh 	const char	*src;
645aa07b05SWarner Losh 	size_t		t;
655aa07b05SWarner Losh 
665aa07b05SWarner Losh 	dst = dst0;
675aa07b05SWarner Losh 	src = src0;
685aa07b05SWarner Losh 
695aa07b05SWarner Losh 	if (length == 0 || dst == src) {	/* nothing to do */
705aa07b05SWarner Losh 		goto done;
715aa07b05SWarner Losh 	}
725aa07b05SWarner Losh 
735aa07b05SWarner Losh 	/*
745aa07b05SWarner Losh 	 * Macros: loop-t-times; and loop-t-times, t>0
755aa07b05SWarner Losh 	 */
765aa07b05SWarner Losh #define	TLOOP(s) if (t) TLOOP1(s)
775aa07b05SWarner Losh #define	TLOOP1(s) do { s; } while (--t)
785aa07b05SWarner Losh 
795aa07b05SWarner Losh 	if ((unsigned long)dst < (unsigned long)src) {
805aa07b05SWarner Losh 		/*
815aa07b05SWarner Losh 		 * Copy forward.
825aa07b05SWarner Losh 		 */
835aa07b05SWarner Losh 		t = (size_t)src;	/* only need low bits */
845aa07b05SWarner Losh 
855aa07b05SWarner Losh 		if ((t | (uintptr_t)dst) & wmask) {
865aa07b05SWarner Losh 			/*
875aa07b05SWarner Losh 			 * Try to align operands.  This cannot be done
885aa07b05SWarner Losh 			 * unless the low bits match.
895aa07b05SWarner Losh 			 */
905aa07b05SWarner Losh 			if ((t ^ (uintptr_t)dst) & wmask || length < wsize) {
915aa07b05SWarner Losh 				t = length;
925aa07b05SWarner Losh 			} else {
935aa07b05SWarner Losh 				t = wsize - (t & wmask);
945aa07b05SWarner Losh 			}
955aa07b05SWarner Losh 
965aa07b05SWarner Losh 			length -= t;
975aa07b05SWarner Losh 			TLOOP1(*dst++ = *src++);
985aa07b05SWarner Losh 		}
995aa07b05SWarner Losh 		/*
1005aa07b05SWarner Losh 		 * Copy whole words, then mop up any trailing bytes.
1015aa07b05SWarner Losh 		 */
1025aa07b05SWarner Losh 		t = length / wsize;
1035aa07b05SWarner Losh 		TLOOP(*(word *)dst = *(const word *)src; src += wsize;
1045aa07b05SWarner Losh 		    dst += wsize);
1055aa07b05SWarner Losh 		t = length & wmask;
1065aa07b05SWarner Losh 		TLOOP(*dst++ = *src++);
1075aa07b05SWarner Losh 	} else {
1085aa07b05SWarner Losh 		/*
1095aa07b05SWarner Losh 		 * Copy backwards.  Otherwise essentially the same.
1105aa07b05SWarner Losh 		 * Alignment works as before, except that it takes
1115aa07b05SWarner Losh 		 * (t&wmask) bytes to align, not wsize-(t&wmask).
1125aa07b05SWarner Losh 		 */
1135aa07b05SWarner Losh 		src += length;
1145aa07b05SWarner Losh 		dst += length;
1155aa07b05SWarner Losh 		t = (uintptr_t)src;
1165aa07b05SWarner Losh 
1175aa07b05SWarner Losh 		if ((t | (uintptr_t)dst) & wmask) {
1185aa07b05SWarner Losh 			if ((t ^ (uintptr_t)dst) & wmask || length <= wsize) {
1195aa07b05SWarner Losh 				t = length;
1205aa07b05SWarner Losh 			} else {
1215aa07b05SWarner Losh 				t &= wmask;
1225aa07b05SWarner Losh 			}
1235aa07b05SWarner Losh 
1245aa07b05SWarner Losh 			length -= t;
1255aa07b05SWarner Losh 			TLOOP1(*--dst = *--src);
1265aa07b05SWarner Losh 		}
1275aa07b05SWarner Losh 		t = length / wsize;
1285aa07b05SWarner Losh 		TLOOP(src -= wsize; dst -= wsize;
1295aa07b05SWarner Losh 		    *(word *)dst = *(const word *)src);
1305aa07b05SWarner Losh 		t = length & wmask;
1315aa07b05SWarner Losh 		TLOOP(*--dst = *--src);
1325aa07b05SWarner Losh 	}
1335aa07b05SWarner Losh done:
1345aa07b05SWarner Losh 	return (dst0);
1355aa07b05SWarner Losh }
1365aa07b05SWarner Losh 
137*baaa3c4dSWarner Losh __strong_reference(memcpy, memmove);
138