// SPDX-License-Identifier: GPL-2.0-only /* * String functions optimized for hardware which doesn't * handle unaligned memory accesses efficiently. * * Copyright (C) 2021 Matteo Croce */ #include #include /* Minimum size for a word copy to be convenient */ #define BYTES_LONG sizeof(long) #define WORD_MASK (BYTES_LONG - 1) #define MIN_THRESHOLD (BYTES_LONG * 2) /* convenience union to avoid cast between different pointer types */ union types { u8 *as_u8; unsigned long *as_ulong; uintptr_t as_uptr; }; union const_types { const u8 *as_u8; unsigned long *as_ulong; uintptr_t as_uptr; }; void *memcpy(void *dest, const void *src, size_t count) { union const_types s = { .as_u8 = src }; union types d = { .as_u8 = dest }; int distance = 0; if (count < MIN_THRESHOLD) goto copy_remainder; /* Copy a byte at time until destination is aligned. */ for (; d.as_uptr & WORD_MASK; count--) *d.as_u8++ = *s.as_u8++; distance = s.as_uptr & WORD_MASK; if (distance) { unsigned long last, next; /* * s is distance bytes ahead of d, and d just reached * the alignment boundary. Move s backward to word align it * and shift data to compensate for distance, in order to do * word-by-word copy. */ s.as_u8 -= distance; next = s.as_ulong[0]; for (; count >= BYTES_LONG; count -= BYTES_LONG) { last = next; next = s.as_ulong[1]; d.as_ulong[0] = last >> (distance * 8) | next << ((BYTES_LONG - distance) * 8); d.as_ulong++; s.as_ulong++; } /* Restore s with the original offset. */ s.as_u8 += distance; } else { /* * If the source and dest lower bits are the same, do a simple * 32/64 bit wide copy. */ for (; count >= BYTES_LONG; count -= BYTES_LONG) *d.as_ulong++ = *s.as_ulong++; } copy_remainder: while (count--) *d.as_u8++ = *s.as_u8++; return dest; } EXPORT_SYMBOL(memcpy); /* * Simply check if the buffer overlaps an call memcpy() in case, * otherwise do a simple one byte at time backward copy. */ void *memmove(void *dest, const void *src, size_t count) { if (dest < src || src + count <= dest) return memcpy(dest, src, count); if (dest > src) { const char *s = src + count; char *tmp = dest + count; while (count--) *--tmp = *--s; } return dest; } EXPORT_SYMBOL(memmove); void *memset(void *s, int c, size_t count) { union types dest = { .as_u8 = s }; if (count >= MIN_THRESHOLD) { unsigned long cu = (unsigned long)c; /* Compose an ulong with 'c' repeated 4/8 times */ cu |= cu << 8; cu |= cu << 16; /* Suppress warning on 32 bit machines */ cu |= (cu << 16) << 16; for (; count && dest.as_uptr & WORD_MASK; count--) *dest.as_u8++ = c; /* Copy using the largest size allowed */ for (; count >= BYTES_LONG; count -= BYTES_LONG) *dest.as_ulong++ = cu; } /* copy the remainder */ while (count--) *dest.as_u8++ = c; return s; } EXPORT_SYMBOL(memset);