1 | /* Common definition for memcpy, mempcpy and memmove implementation. |
2 | All versions must be listed in ifunc-impl-list.c. |
3 | Copyright (C) 2017 Free Software Foundation, Inc. |
4 | This file is part of the GNU C Library. |
5 | |
6 | The GNU C Library is free software; you can redistribute it and/or |
7 | modify it under the terms of the GNU Lesser General Public |
8 | License as published by the Free Software Foundation; either |
9 | version 2.1 of the License, or (at your option) any later version. |
10 | |
11 | The GNU C Library is distributed in the hope that it will be useful, |
12 | but WITHOUT ANY WARRANTY; without even the implied warranty of |
13 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
14 | Lesser General Public License for more details. |
15 | |
16 | You should have received a copy of the GNU Lesser General Public |
17 | License along with the GNU C Library; if not, see |
18 | <http://www.gnu.org/licenses/>. */ |
19 | |
20 | #include <init-arch.h> |
21 | |
22 | extern __typeof (REDIRECT_NAME) OPTIMIZE (erms) attribute_hidden; |
23 | extern __typeof (REDIRECT_NAME) OPTIMIZE (sse2_unaligned) |
24 | attribute_hidden; |
25 | extern __typeof (REDIRECT_NAME) OPTIMIZE (sse2_unaligned_erms) |
26 | attribute_hidden; |
27 | extern __typeof (REDIRECT_NAME) OPTIMIZE (ssse3) attribute_hidden; |
28 | extern __typeof (REDIRECT_NAME) OPTIMIZE (ssse3_back) attribute_hidden; |
29 | extern __typeof (REDIRECT_NAME) OPTIMIZE (avx_unaligned) attribute_hidden; |
30 | extern __typeof (REDIRECT_NAME) OPTIMIZE (avx_unaligned_erms) |
31 | attribute_hidden; |
32 | extern __typeof (REDIRECT_NAME) OPTIMIZE (avx512_unaligned) |
33 | attribute_hidden; |
34 | extern __typeof (REDIRECT_NAME) OPTIMIZE (avx512_unaligned_erms) |
35 | attribute_hidden; |
36 | extern __typeof (REDIRECT_NAME) OPTIMIZE (avx512_no_vzeroupper) |
37 | attribute_hidden; |
38 | |
39 | static inline void * |
40 | IFUNC_SELECTOR (void) |
41 | { |
42 | const struct cpu_features* cpu_features = __get_cpu_features (); |
43 | |
44 | if (CPU_FEATURES_ARCH_P (cpu_features, Prefer_ERMS)) |
45 | return OPTIMIZE (erms); |
46 | |
47 | if (CPU_FEATURES_ARCH_P (cpu_features, AVX512F_Usable) |
48 | && !CPU_FEATURES_ARCH_P (cpu_features, Prefer_No_AVX512)) |
49 | { |
50 | if (CPU_FEATURES_ARCH_P (cpu_features, Prefer_No_VZEROUPPER)) |
51 | return OPTIMIZE (avx512_no_vzeroupper); |
52 | |
53 | if (CPU_FEATURES_CPU_P (cpu_features, ERMS)) |
54 | return OPTIMIZE (avx512_unaligned_erms); |
55 | |
56 | return OPTIMIZE (avx512_unaligned); |
57 | } |
58 | |
59 | if (CPU_FEATURES_ARCH_P (cpu_features, AVX_Fast_Unaligned_Load)) |
60 | { |
61 | if (CPU_FEATURES_CPU_P (cpu_features, ERMS)) |
62 | return OPTIMIZE (avx_unaligned_erms); |
63 | |
64 | return OPTIMIZE (avx_unaligned); |
65 | } |
66 | |
67 | if (!CPU_FEATURES_CPU_P (cpu_features, SSSE3) |
68 | || CPU_FEATURES_ARCH_P (cpu_features, Fast_Unaligned_Copy)) |
69 | { |
70 | if (CPU_FEATURES_CPU_P (cpu_features, ERMS)) |
71 | return OPTIMIZE (sse2_unaligned_erms); |
72 | |
73 | return OPTIMIZE (sse2_unaligned); |
74 | } |
75 | |
76 | if (CPU_FEATURES_ARCH_P (cpu_features, Fast_Copy_Backward)) |
77 | return OPTIMIZE (ssse3_back); |
78 | |
79 | return OPTIMIZE (ssse3); |
80 | } |
81 | |