/* Multiple versions of mempcpy
   Copyright (C) 2010 Free Software Foundation, Inc.
   Contributed by Intel Corporation.
   This file is part of the GNU C Library.

   The GNU C Library is free software; you can redistribute it and/or
   modify it under the terms of the GNU Lesser General Public
   License as published by the Free Software Foundation; either
   version 2.1 of the License, or (at your option) any later version.

   The GNU C Library is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
   Lesser General Public License for more details.

   You should have received a copy of the GNU Lesser General Public
   License along with the GNU C Library; if not, write to the Free
   Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
   02111-1307 USA.  */
#include <sysdep.h>
#include <init-arch.h>
/* Define multiple versions only for the definition in lib and for
   DSO.  In static binaries we need mempcpy before the initialization
   happened.  */
#if defined SHARED && !defined NOT_IN_libc
/* IFUNC resolver for __mempcpy (x86-64, AT&T syntax).

   In:   nothing.
   Out:  %rax = address of the implementation to bind __mempcpy to:
	   __mempcpy_sse2	 SSSE3 bit clear
	   __mempcpy_ssse3	 SSSE3 set, Fast_Copy_Backward clear
	   __mempcpy_ssse3_back	 SSSE3 and Fast_Copy_Backward both set

   __init_cpu_features is called first when the field at KIND_OFFSET in
   __cpu_features is still zero (presumably meaning "not yet probed" --
   confirm against init-arch.h).  */
ENTRY(__mempcpy)
	.type	__mempcpy, @gnu_indirect_function
	cmpl	$0, KIND_OFFSET+__cpu_features(%rip)
	jne	1f			/* Non-zero: skip the init call.  */
	call	__init_cpu_features
1:	leaq	__mempcpy_sse2(%rip), %rax	/* Default choice.  */
	testl	$bit_SSSE3, __cpu_features+CPUID_OFFSET+index_SSSE3(%rip)
	jz	2f			/* No SSSE3: keep the SSE2 version.  */
	leaq	__mempcpy_ssse3(%rip), %rax
	testl	$bit_Fast_Copy_Backward, __cpu_features+FEATURE_OFFSET+index_Fast_Copy_Backward(%rip)
	jz	2f			/* Bit clear: keep plain SSSE3.  */
	leaq	__mempcpy_ssse3_back(%rip), %rax
2:	ret
END(__mempcpy)
/* Redirect ENTRY/END so that whatever function they wrap from here on
   is emitted under the fixed name __mempcpy_sse2; the `name' argument
   is deliberately ignored.  Each macro is #undef'd first so that a
   previous definition is replaced cleanly, and END is a separate macro:
   the last line of ENTRY must not end in a backslash, otherwise
   cfi_endproc and .size would be emitted at function entry.  */
# undef ENTRY
# define ENTRY(name) \
	.type __mempcpy_sse2, @function; \
	.p2align 4; \
	__mempcpy_sse2: cfi_startproc; \
	CALL_MCOUNT
# undef END
# define END(name) \
	cfi_endproc; .size __mempcpy_sse2, .-__mempcpy_sse2
/* Same redirection for the ENTRY_CHK/END_CHK pair: the wrapped function
   is emitted as the global symbol __mempcpy_chk_sse2, ignoring `name'.
   ENTRY_CHK must end without a continuation backslash so that the
   END_CHK definition below is a directive of its own rather than part
   of the ENTRY_CHK body.  */
# undef ENTRY_CHK
# define ENTRY_CHK(name) \
	.type __mempcpy_chk_sse2, @function; \
	.globl __mempcpy_chk_sse2; \
	.p2align 4; \
	__mempcpy_chk_sse2: cfi_startproc; \
	CALL_MCOUNT
# undef END_CHK
# define END_CHK(name) \
	cfi_endproc; .size __mempcpy_chk_sse2, .-__mempcpy_chk_sse2
# undef libc_hidden_def
# undef libc_hidden_builtin_def
/* It doesn't make sense to send libc-internal mempcpy calls through a PLT.
   The speedup we get from using SSSE3 instruction is likely eaten away
   by the indirect call in the PLT.  */
/* Both overrides ignore `name' and export a fixed __GI_* symbol that is
   a direct alias of __mempcpy_sse2.  */
# define libc_hidden_def(name) \
	.globl __GI_mempcpy; __GI_mempcpy = __mempcpy_sse2
# define libc_hidden_builtin_def(name) \
	.globl __GI___mempcpy; __GI___mempcpy = __mempcpy_sse2
#endif	/* SHARED && !NOT_IN_libc */

/* Generic implementation.  It is included outside the conditional, so it
   is assembled in every configuration; the macro overrides above only
   apply to it in the SHARED libc build (presumably it wraps its code in
   ENTRY/END and ENTRY_CHK/END_CHK -- confirm against ../mempcpy.S).  */
#include "../mempcpy.S"