mirror of
git://sourceware.org/git/glibc.git
synced 2025-01-06 12:00:24 +08:00
4e2d8f3527
Update ifunc-memset.h/ifunc-wmemset.h to select the function optimized with AVX512 instructions using ZMM16-ZMM31 registers when AVX512VL and AVX512BW are usable. This avoids RTM aborts, since VZEROUPPER isn't needed at function exit.
25 lines
557 B
ArmAsm
25 lines
557 B
ArmAsm
/* AVX512 (512-bit, EVEX-encoded) parameter set for the memset/wmemset
   template "memset-vec-unaligned-erms.S", which is included at the end
   of this block.  This file contains only preprocessor definitions;
   nothing is emitted unless IS_IN (libc) holds.
   Syntax: GNU as, AT&T operand order (source, destination).  */
#if IS_IN (libc)

/* Vector width in bytes: one zmm register is 512 bits = 64 bytes.  */
# define VEC_SIZE       64

/* The 128-, 256- and 512-bit views of vector register 16.  Working in
   the 16-31 register range means VZEROUPPER is not needed at function
   exit, which is why VZEROUPPER below expands to nothing.  */
# define XMM0           xmm16
# define YMM0           ymm16
# define VEC0           zmm16

/* VEC(i) pastes to the name VECi; only VEC0 is defined in this block.  */
# define VEC(i)         VEC##i

/* Unaligned and aligned full-vector moves.  The "64" mnemonics are the
   EVEX-encoded forms, which are required to address registers 16-31.  */
# define VMOVU          vmovdqu64
# define VMOVA          vmovdqa64

/* Intentionally empty: see the note on register 16 above.  */
# define VZEROUPPER

/* Copy R into %rax, then replicate the byte in D across every byte
   lane of VEC0.
   NOTE(review): D and R are whatever operands the included template
   passes -- presumably the fill value and the destination pointer that
   memset returns; confirm against the template.
   Each backslash must be the last character on its line and the
   continuation must follow on the very next line, otherwise the macro
   body is silently truncated.  */
# define MEMSET_VDUP_TO_VEC0_AND_SET_RETURN(d, r) \
  movq r, %rax; \
  vpbroadcastb d, %VEC0

/* Same as above for wmemset: copy R into %rax, then replicate the
   32-bit value in D across every doubleword lane of VEC0.  */
# define WMEMSET_VDUP_TO_VEC0_AND_SET_RETURN(d, r) \
  movq r, %rax; \
  vpbroadcastd d, %VEC0

/* Append ".evex512" to the section name P.  */
# define SECTION(p)             p##.evex512

/* Build the symbol name P_avx512_S for the memset and wmemset
   families respectively.  */
# define MEMSET_SYMBOL(p,s)     p##_avx512_##s
# define WMEMSET_SYMBOL(p,s)    p##_avx512_##s

/* Pull in the shared implementation; it is expected to consume the
   definitions above (NOTE(review): template not visible here).  */
# include "memset-vec-unaligned-erms.S"
#endif