]>
Commit | Line | Data |
---|---|---|
6fb8cbcb | 1 | /* Multiple versions of mempcpy |
ac49ecaf L |
2 | All versions must be listed in ifunc-impl-list.c. |
3 | Copyright (C) 2010-2012 Free Software Foundation, Inc. | |
6fb8cbcb L |
4 | Contributed by Intel Corporation. |
5 | This file is part of the GNU C Library. | |
6 | ||
7 | The GNU C Library is free software; you can redistribute it and/or | |
8 | modify it under the terms of the GNU Lesser General Public | |
9 | License as published by the Free Software Foundation; either | |
10 | version 2.1 of the License, or (at your option) any later version. | |
11 | ||
12 | The GNU C Library is distributed in the hope that it will be useful, | |
13 | but WITHOUT ANY WARRANTY; without even the implied warranty of | |
14 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | |
15 | Lesser General Public License for more details. | |
16 | ||
17 | You should have received a copy of the GNU Lesser General Public | |
59ba27a6 PE |
18 | License along with the GNU C Library; if not, see |
19 | <http://www.gnu.org/licenses/>. */ | |
6fb8cbcb L |
20 | |
21 | #include <sysdep.h> | |
22 | #include <init-arch.h> | |
23 | ||
24 | /* Define multiple versions only for the definition in lib and for | |
25 | DSO. In static binaries we need mempcpy before the initialization | |
26 | happened. */ | |
27 | #if defined SHARED && !defined NOT_IN_libc | |
28 | ENTRY(__mempcpy) | |
29 | .type __mempcpy, @gnu_indirect_function | |
30 | cmpl $0, KIND_OFFSET+__cpu_features(%rip) | |
31 | jne 1f | |
32 | call __init_cpu_features | |
33 | 1: leaq __mempcpy_sse2(%rip), %rax | |
34 | testl $bit_SSSE3, __cpu_features+CPUID_OFFSET+index_SSSE3(%rip) | |
35 | jz 2f | |
36 | leaq __mempcpy_ssse3(%rip), %rax | |
37 | testl $bit_Fast_Copy_Backward, __cpu_features+FEATURE_OFFSET+index_Fast_Copy_Backward(%rip) | |
38 | jz 2f | |
39 | leaq __mempcpy_ssse3_back(%rip), %rax | |
40 | 2: ret | |
41 | END(__mempcpy) | |
42 | ||
43 | # undef ENTRY | |
44 | # define ENTRY(name) \ | |
45 | .type __mempcpy_sse2, @function; \ | |
46 | .p2align 4; \ | |
ac49ecaf L |
47 | .globl __mempcpy_sse2; \ |
48 | .hidden __mempcpy_sse2; \ | |
6fb8cbcb L |
49 | __mempcpy_sse2: cfi_startproc; \ |
50 | CALL_MCOUNT | |
51 | # undef END | |
52 | # define END(name) \ | |
53 | cfi_endproc; .size __mempcpy_sse2, .-__mempcpy_sse2 | |
54 | ||
55 | # undef ENTRY_CHK | |
56 | # define ENTRY_CHK(name) \ | |
57 | .type __mempcpy_chk_sse2, @function; \ | |
58 | .globl __mempcpy_chk_sse2; \ | |
59 | .p2align 4; \ | |
60 | __mempcpy_chk_sse2: cfi_startproc; \ | |
61 | CALL_MCOUNT | |
62 | # undef END_CHK | |
63 | # define END_CHK(name) \ | |
64 | cfi_endproc; .size __mempcpy_chk_sse2, .-__mempcpy_chk_sse2 | |
65 | ||
66 | # undef libc_hidden_def | |
67 | # undef libc_hidden_builtin_def | |
68 | /* It doesn't make sense to send libc-internal mempcpy calls through a PLT. | |
69 | The speedup we get from using SSSE3 instruction is likely eaten away | |
70 | by the indirect call in the PLT. */ | |
71 | # define libc_hidden_def(name) \ | |
72 | .globl __GI_mempcpy; __GI_mempcpy = __mempcpy_sse2 | |
73 | # define libc_hidden_builtin_def(name) \ | |
74 | .globl __GI___mempcpy; __GI___mempcpy = __mempcpy_sse2 | |
75 | #endif | |
76 | ||
77 | #include "../mempcpy.S" |