mirror of
git://sourceware.org/git/glibc.git
synced 2025-01-18 12:16:13 +08:00
5cb6329652
Calling memset with zero as the value to set is by far the most common case
(99%+ for Python3 and GCC).
bzero can be optimized slightly further for this case by using a zero-idiom
xor to broadcast the set value to a register (vector or GPR).
Co-developed-by: Noah Goldstein <goldstein.w.n@gmail.com>
(cherry picked from commit 3d9f171bfb)
78 lines
2.0 KiB
ArmAsm
78 lines
2.0 KiB
ArmAsm
/* memset/bzero -- set memory area to CH/0
   Optimized version for x86-64.
   Copyright (C) 2002-2021 Free Software Foundation, Inc.
   This file is part of the GNU C Library.

   The GNU C Library is free software; you can redistribute it and/or
   modify it under the terms of the GNU Lesser General Public
   License as published by the Free Software Foundation; either
   version 2.1 of the License, or (at your option) any later version.

   The GNU C Library is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
   Lesser General Public License for more details.

   You should have received a copy of the GNU Lesser General Public
   License along with the GNU C Library; if not, see
   <https://www.gnu.org/licenses/>.  */
|
|
|
|
#include <sysdep.h>
|
|
/* Vector configuration for the SSE2 (%xmm) build of this file.
   NOTE(review): USE_WITH_SSE2 is presumably tested by the implementation
   included further down -- confirm there.  */
#define USE_WITH_SSE2 1

/* Width in bytes of one vector register; an %xmm register holds 16.  */
#define VEC_SIZE 16
/* NOTE(review): presumably the encoded length in bytes of one VMOVU/VMOVA
   instruction and of the return sequence -- confirm against their use in
   the included implementation.  */
#define MOV_SIZE 3
#define RET_SIZE 1

/* VEC (i) pastes the register number onto "xmm", e.g. VEC (0) -> xmm0.  */
#define VEC(i) xmm##i
/* Whole-vector move mnemonics: VMOVU tolerates unaligned addresses,
   VMOVA requires 16-byte alignment.  */
#define VMOVU movups
#define VMOVA movaps
|
|
|
|
/* MEMSET_SET_VEC0_AND_SET_RETURN (d, r)
   Broadcast the low byte of D to all 16 bytes of %xmm0 and move R
   into %rax.
     d: 32-bit register or memory operand (the movd source); only its
        low byte survives into the result.
     r: operand moved to %rax with movq (presumably the value the
        function returns, going by the macro name -- confirm at the
        use site).
   Writes %xmm0 and %rax only.
   The byte is widened by interleaving the register with itself:
   punpcklbw makes the low word {c,c}, punpcklwd makes the low dword
   {c,c,c,c}, and pshufd $0 copies that dword into all four dword
   lanes.  */
# define MEMSET_SET_VEC0_AND_SET_RETURN(d, r) \
  movd d, %xmm0; \
  movq r, %rax; \
  punpcklbw %xmm0, %xmm0; \
  punpcklwd %xmm0, %xmm0; \
  pshufd $0, %xmm0, %xmm0
|
|
|
|
/* BZERO_ZERO_VEC0 ()
   Clear all 16 bytes of %xmm0 with the xor-with-self zeroing idiom.
   Takes no operands and writes no register other than %xmm0.  */
# define BZERO_ZERO_VEC0() \
  pxor %xmm0, %xmm0
|
|
|
|
/* WMEMSET_SET_VEC0_AND_SET_RETURN (d, r)
   Broadcast the 32-bit value D to all four dword lanes of %xmm0 and
   move R into %rax.
     d: 32-bit register or memory operand (the movd source).
     r: operand moved to %rax with movq (presumably the value the
        function returns, going by the macro name -- confirm at the
        use site).
   Writes %xmm0 and %rax only.  movd places D in dword lane 0 and
   pshufd $0 replicates lane 0 into every lane.  */
# define WMEMSET_SET_VEC0_AND_SET_RETURN(d, r) \
  movd d, %xmm0; \
  pshufd $0, %xmm0, %xmm0; \
  movq r, %rax
|
|
|
|
/* Vector-duplication hooks.  All four expand to nothing in this file.
   NOTE(review): presumably no extra work is needed because the
   *_SET_VEC0_AND_SET_RETURN macros in this file already fill the whole
   16-byte %xmm0 -- confirm against the use sites in the included
   implementation.  */
# define MEMSET_VDUP_TO_VEC0_HIGH()
# define MEMSET_VDUP_TO_VEC0_LOW()

# define WMEMSET_VDUP_TO_VEC0_HIGH()
# define WMEMSET_VDUP_TO_VEC0_LOW()
|
|
|
|
/* SECTION (p) expands to its argument unchanged.
   NOTE(review): presumably the included implementation uses it to form
   section names -- confirm there.  */
#define SECTION(p) p
|
|
|
|
/* Default symbol naming for memset, used only when MEMSET_SYMBOL has
   not already been defined before this point.
     MEMSET_SYMBOL (p, s)      ignores both arguments and yields the
                               plain name memset.
     MEMSET_CHK_SYMBOL (p, s)  yields its first argument P and
                               ignores S.  */
#ifndef MEMSET_SYMBOL
# define MEMSET_CHK_SYMBOL(p,s) p
# define MEMSET_SYMBOL(p,s) memset
#endif
|
|
|
|
/* Default symbol naming for bzero, used only when BZERO_SYMBOL has not
   already been defined before this point.  BZERO_SYMBOL (p, s) ignores
   both arguments and yields the name __bzero.  */
#ifndef BZERO_SYMBOL
# define BZERO_SYMBOL(p,s) __bzero
#endif
|
|
|
|
/* Default symbol naming for wmemset, used only when WMEMSET_SYMBOL has
   not already been defined before this point.
     WMEMSET_SYMBOL (p, s)      ignores both arguments and yields the
                                name __wmemset.
     WMEMSET_CHK_SYMBOL (p, s)  yields its first argument P and
                                ignores S.  */
#ifndef WMEMSET_SYMBOL
# define WMEMSET_CHK_SYMBOL(p,s) p
# define WMEMSET_SYMBOL(p,s) __wmemset
#endif
|
|
|
|
#include "multiarch/memset-vec-unaligned-erms.S"
|
|
|
|
/* NOTE(review): libc_hidden_builtin_def is defined outside this file;
   presumably it emits the hidden, library-internal definition for
   memset -- confirm against its definition.  */
libc_hidden_builtin_def (memset)
|
|
|
|
/* Public aliases, emitted only when IS_IN (libc) is true: bzero is
   aliased to __bzero and wmemset to __wmemset.
   NOTE(review): weak_alias and the libc_hidden_* macros are defined
   outside this file; presumably they create weak public names and
   hidden library-internal references respectively -- confirm against
   their definitions.  */
#if IS_IN (libc)
weak_alias (__bzero, bzero)
libc_hidden_def (__wmemset)
weak_alias (__wmemset, wmemset)
libc_hidden_weak (wmemset)
#endif
|