Work around old buggy program which cannot cope with memcpy semantics.
[glibc.git] / sysdeps / x86_64 / multiarch / memcpy.S
Commit [+]AuthorDateLineData
6fb8cbcb H.J. Lu2010-06-30 08:26:11 -07001/* Multiple versions of memcpy
0354e355
L
H.J. Lu2011-04-01 19:38:21 -04002 Copyright (C) 2010, 2011
3 Free Software Foundation, Inc.
6fb8cbcb
L
H.J. Lu2010-06-30 08:26:11 -07004 Contributed by Intel Corporation.
5 This file is part of the GNU C Library.
6
7 The GNU C Library is free software; you can redistribute it and/or
8 modify it under the terms of the GNU Lesser General Public
9 License as published by the Free Software Foundation; either
10 version 2.1 of the License, or (at your option) any later version.
11
12 The GNU C Library is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 Lesser General Public License for more details.
16
17 You should have received a copy of the GNU Lesser General Public
18 License along with the GNU C Library; if not, write to the Free
19 Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
20 02111-1307 USA. */
21
22#include <sysdep.h>
0354e355 H.J. Lu2011-04-01 19:38:21 -040023#include <shlib-compat.h>
6fb8cbcb
L
H.J. Lu2010-06-30 08:26:11 -070024#include <init-arch.h>
25
26/* Define multiple versions only for the definition in lib and for
27 DSO. In static binaries we need memcpy before the initialization
28 happened. */
29#if defined SHARED && !defined NOT_IN_libc
30 .text
0354e355
L
H.J. Lu2011-04-01 19:38:21 -040031ENTRY(__new_memcpy)
32 .type __new_memcpy, @gnu_indirect_function
6fb8cbcb
L
H.J. Lu2010-06-30 08:26:11 -070033 cmpl $0, KIND_OFFSET+__cpu_features(%rip)
34 jne 1f
35 call __init_cpu_features
361: leaq __memcpy_sse2(%rip), %rax
37 testl $bit_SSSE3, __cpu_features+CPUID_OFFSET+index_SSSE3(%rip)
38 jz 2f
39 leaq __memcpy_ssse3(%rip), %rax
40 testl $bit_Fast_Copy_Backward, __cpu_features+FEATURE_OFFSET+index_Fast_Copy_Backward(%rip)
41 jz 2f
42 leaq __memcpy_ssse3_back(%rip), %rax
432: ret
0354e355 H.J. Lu2011-04-01 19:38:21 -040044END(__new_memcpy)
6fb8cbcb
L
H.J. Lu2010-06-30 08:26:11 -070045
46# undef ENTRY
47# define ENTRY(name) \
48 .type __memcpy_sse2, @function; \
49 .p2align 4; \
50 __memcpy_sse2: cfi_startproc; \
51 CALL_MCOUNT
52# undef END
53# define END(name) \
54 cfi_endproc; .size __memcpy_sse2, .-__memcpy_sse2
55
56# undef ENTRY_CHK
57# define ENTRY_CHK(name) \
58 .type __memcpy_chk_sse2, @function; \
59 .globl __memcpy_chk_sse2; \
60 .p2align 4; \
61 __memcpy_chk_sse2: cfi_startproc; \
62 CALL_MCOUNT
63# undef END_CHK
64# define END_CHK(name) \
65 cfi_endproc; .size __memcpy_chk_sse2, .-__memcpy_chk_sse2
66
67# undef libc_hidden_builtin_def
68/* It doesn't make sense to send libc-internal memcpy calls through a PLT.
69 The speedup we get from using SSSE3 instruction is likely eaten away
70 by the indirect call in the PLT. */
71# define libc_hidden_builtin_def(name) \
72 .globl __GI_memcpy; __GI_memcpy = __memcpy_sse2
0354e355
L
H.J. Lu2011-04-01 19:38:21 -040073
74versioned_symbol (libc, __new_memcpy, memcpy, GLIBC_2_14);
6fb8cbcb
L
H.J. Lu2010-06-30 08:26:11 -070075#endif
76
77#include "../memcpy.S"