mirror of
git://sourceware.org/git/glibc.git
synced 2025-02-05 12:40:55 +08:00
Add a new memcpy using 128-bit Q registers - this is faster on modern cores and reduces code size. Similar to the generic memcpy, small cases include copies up to 32 bytes. 64-128 byte copies are split into two cases to improve performance of 64-96 byte copies. Large copies align the source rather than the destination. On bench-memcpy-random the new memcpy is ~9% faster than memcpy_falkor on Neoverse N1, so make this memcpy the default on N1 (on Centriq it is 15% faster than memcpy_falkor). Passes GLIBC regression tests. Reviewed-by: Szabolcs Nagy <szabolcs.nagy@arm.com> |
||
---|---|---|
.. | ||
bits | ||
fpu | ||
multiarch | ||
nptl | ||
sys | ||
__longjmp.S | ||
abort-instr.h | ||
atomic-machine.h | ||
bsd-_setjmp.c | ||
bsd-setjmp.c | ||
configure | ||
configure.ac | ||
crti.S | ||
crtn.S | ||
dl-bti.c | ||
dl-dtprocnum.h | ||
dl-irel.h | ||
dl-link.sym | ||
dl-machine.h | ||
dl-prop.h | ||
dl-sysdep.h | ||
dl-tls.h | ||
dl-tlsdesc.h | ||
dl-tlsdesc.S | ||
dl-trampoline.S | ||
dl-tunables.list | ||
e_sqrtl.c | ||
elf-initfini.h | ||
Implies | ||
jmpbuf-offsets.h | ||
jmpbuf-unwind.h | ||
ldsodefs.h | ||
libc-tls.c | ||
libm-test-ulps | ||
libm-test-ulps-name | ||
linkmap.h | ||
machine-gmon.h | ||
Makefile | ||
math-tests-trap.h | ||
mcount.c | ||
memchr.S | ||
memcmp.S | ||
memcpy.S | ||
memmove.c | ||
memrchr.S | ||
memset-reg.h | ||
memset.S | ||
memusage.h | ||
preconfigure | ||
rawmemchr.S | ||
setjmp.S | ||
sfp-machine.h | ||
sotruss-lib.c | ||
stackinfo.h | ||
start.S | ||
stpcpy.S | ||
strchr.S | ||
strchrnul.S | ||
strcmp.S | ||
strcpy.S | ||
string_private.h | ||
strlen.S | ||
strncmp.S | ||
strnlen.S | ||
strrchr.S | ||
sysdep.h | ||
tls-macros.h | ||
tlsdesc.c | ||
tlsdesc.sym | ||
tst-audit.h | ||
tst-ifunc-arg-1.c | ||
tst-ifunc-arg-2.c | ||
Versions |