| /* This file is part of the GNU C Library. |
| Copyright (C) 2008-2016 Free Software Foundation, Inc. |
| |
| The GNU C Library is free software; you can redistribute it and/or |
| modify it under the terms of the GNU Lesser General Public |
| License as published by the Free Software Foundation; either |
| version 2.1 of the License, or (at your option) any later version. |
| |
| The GNU C Library is distributed in the hope that it will be useful, |
| but WITHOUT ANY WARRANTY; without even the implied warranty of |
| MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
| Lesser General Public License for more details. |
| |
| You should have received a copy of the GNU Lesser General Public |
| License along with the GNU C Library; if not, see |
| <http://www.gnu.org/licenses/>. */ |
| |
| #ifndef cpu_features_h |
| #define cpu_features_h |
| |
/* Masks for glibc's internal feature bits.  Each bit_NAME is tested
   against the feature[] word selected by index_NAME; HAS_ARCH_FEATURE
   (NAME) performs that test.  Bit 3 is not assigned in this list.  */

/* Names beginning with Fast_, Slow_ or Prefer_.  */
#define bit_Fast_Rep_String             (1 << 0)
#define bit_Fast_Copy_Backward          (1 << 1)
#define bit_Slow_BSF                    (1 << 2)
#define bit_Fast_Unaligned_Load         (1 << 4)
#define bit_Prefer_PMINUB_for_stringop  (1 << 5)
#define bit_Slow_SSE4_2                 (1 << 9)
#define bit_AVX_Fast_Unaligned_Load     (1 << 11)
#define bit_Prefer_MAP_32BIT_EXEC       (1 << 16)
#define bit_Prefer_No_VZEROUPPER        (1 << 17)

/* Names ending in _Usable.  */
#define bit_AVX_Usable                  (1 << 6)
#define bit_FMA_Usable                  (1 << 7)
#define bit_FMA4_Usable                 (1 << 8)
#define bit_AVX2_Usable                 (1 << 10)
#define bit_AVX512F_Usable              (1 << 12)
#define bit_AVX512DQ_Usable             (1 << 13)

/* I586 and I686; these back HAS_I586 and HAS_I686 when the answer is
   not known at compile time.  */
#define bit_I586                        (1 << 14)
#define bit_I686                        (1 << 15)
| |
/* CPUID feature flags.  Each bit_NAME is a mask within one CPUID output
   register.  The groups below follow the C-side index_NAME (which
   cached CPUID entry) and reg_NAME (which register) definitions later
   in this file.  */

/* COMMON_CPUID_INDEX_1, register EDX.  */
#define bit_CX8         (1 << 8)
#define bit_CMOV        (1 << 15)
#define bit_SSE2        (1 << 26)

/* COMMON_CPUID_INDEX_1, register ECX.  */
#define bit_SSSE3       (1 << 9)
#define bit_FMA         (1 << 12)
#define bit_SSE4_1      (1 << 19)
#define bit_SSE4_2      (1 << 20)
#define bit_POPCOUNT    (1 << 23)
#define bit_OSXSAVE     (1 << 27)
#define bit_AVX         (1 << 28)

/* COMMON_CPUID_INDEX_80000001, register ECX.  This mask was previously
   listed under COMMON_CPUID_INDEX_1, but index_FMA4 selects
   COMMON_CPUID_INDEX_80000001.  */
#define bit_FMA4        (1 << 16)
| |
/* COMMON_CPUID_INDEX_7, register EBX (see the reg_NAME definitions for
   these four names), listed by ascending bit position.  */
#define bit_AVX2        (1 << 5)
#define bit_RTM         (1 << 11)
#define bit_AVX512F     (1 << 16)
#define bit_AVX512DQ    (1 << 17)
| |
/* XCR0 feature flags.  Every mask is written as a single-bit shift;
   bit_YMM_state is bit 2 (value 4).  */
#define bit_XMM_state           (1 << 1)
#define bit_YMM_state           (1 << 2)
#define bit_Opmask_state        (1 << 5)
#define bit_ZMM0_15_state       (1 << 6)
#define bit_ZMM16_31_state      (1 << 7)
| |
/* The internal feature bits live in an array of integer words.
   FEATURE_INDEX_1 is the index of the first word.  */
#define FEATURE_INDEX_1         0

/* Current number of words in that array; it sizes the feature[]
   member of struct cpu_features.  */
#define FEATURE_INDEX_MAX       1
| |
| #ifdef __ASSEMBLER__ |
| |
| # include <ifunc-defines.h> |
| # include <rtld-global-offsets.h> |
| |
/* Assembler view of the CPUID bits: index_NAME is the byte offset,
   relative to the start of the cached CPUID array, of the 32-bit
   register word that holds bit_NAME.  It is formed from the entry
   number, the entry size and the offset of the register within an
   entry.  HAS_CPU_FEATURE (NAME) needs both bit_NAME and index_NAME,
   so every CPUID bit whose entry number is used in this block gets an
   index here.  */

/* COMMON_CPUID_INDEX_1, register EDX.  */
# define index_CX8	COMMON_CPUID_INDEX_1*CPUID_SIZE+CPUID_EDX_OFFSET
# define index_CMOV	COMMON_CPUID_INDEX_1*CPUID_SIZE+CPUID_EDX_OFFSET
# define index_SSE2	COMMON_CPUID_INDEX_1*CPUID_SIZE+CPUID_EDX_OFFSET

/* COMMON_CPUID_INDEX_1, register ECX.  */
# define index_SSSE3	COMMON_CPUID_INDEX_1*CPUID_SIZE+CPUID_ECX_OFFSET
# define index_SSE4_1	COMMON_CPUID_INDEX_1*CPUID_SIZE+CPUID_ECX_OFFSET
# define index_SSE4_2	COMMON_CPUID_INDEX_1*CPUID_SIZE+CPUID_ECX_OFFSET
# define index_AVX	COMMON_CPUID_INDEX_1*CPUID_SIZE+CPUID_ECX_OFFSET
# define index_FMA	COMMON_CPUID_INDEX_1*CPUID_SIZE+CPUID_ECX_OFFSET
# define index_POPCOUNT	COMMON_CPUID_INDEX_1*CPUID_SIZE+CPUID_ECX_OFFSET
# define index_OSXSAVE	COMMON_CPUID_INDEX_1*CPUID_SIZE+CPUID_ECX_OFFSET

/* COMMON_CPUID_INDEX_7, register EBX.  */
# define index_AVX2	COMMON_CPUID_INDEX_7*CPUID_SIZE+CPUID_EBX_OFFSET
# define index_AVX512F	COMMON_CPUID_INDEX_7*CPUID_SIZE+CPUID_EBX_OFFSET
# define index_AVX512DQ	COMMON_CPUID_INDEX_7*CPUID_SIZE+CPUID_EBX_OFFSET
# define index_RTM	COMMON_CPUID_INDEX_7*CPUID_SIZE+CPUID_EBX_OFFSET

/* NOTE(review): index_FMA4 is deliberately not defined here.  FMA4
   belongs to COMMON_CPUID_INDEX_80000001, and no assembler-visible
   constant for that entry is used anywhere in this file -- confirm
   against <ifunc-defines.h> before adding it.  */
| |
/* Assembler view of the internal feature bits: index_NAME is the byte
   offset of the feature word holding bit_NAME, relative to the start of
   the feature array.  Every bit currently lives in the first word.  */

/* Names beginning with Fast_, Slow_ or Prefer_.  */
# define index_Fast_Rep_String			FEATURE_INDEX_1*FEATURE_SIZE
# define index_Fast_Copy_Backward		FEATURE_INDEX_1*FEATURE_SIZE
# define index_Slow_BSF				FEATURE_INDEX_1*FEATURE_SIZE
# define index_Fast_Unaligned_Load		FEATURE_INDEX_1*FEATURE_SIZE
# define index_Prefer_PMINUB_for_stringop	FEATURE_INDEX_1*FEATURE_SIZE
# define index_Slow_SSE4_2			FEATURE_INDEX_1*FEATURE_SIZE
# define index_AVX_Fast_Unaligned_Load		FEATURE_INDEX_1*FEATURE_SIZE
# define index_Prefer_MAP_32BIT_EXEC		FEATURE_INDEX_1*FEATURE_SIZE
# define index_Prefer_No_VZEROUPPER		FEATURE_INDEX_1*FEATURE_SIZE

/* Names ending in _Usable.  */
# define index_AVX_Usable			FEATURE_INDEX_1*FEATURE_SIZE
# define index_FMA_Usable			FEATURE_INDEX_1*FEATURE_SIZE
# define index_FMA4_Usable			FEATURE_INDEX_1*FEATURE_SIZE
# define index_AVX2_Usable			FEATURE_INDEX_1*FEATURE_SIZE
# define index_AVX512F_Usable			FEATURE_INDEX_1*FEATURE_SIZE
# define index_AVX512DQ_Usable			FEATURE_INDEX_1*FEATURE_SIZE

/* I586 and I686.  */
# define index_I586				FEATURE_INDEX_1*FEATURE_SIZE
# define index_I686				FEATURE_INDEX_1*FEATURE_SIZE
| |
| |
| # if defined (_LIBC) && !IS_IN (nonlib) |
| # ifdef __x86_64__ |
| # ifdef SHARED |
| # if IS_IN (rtld) |
| # define LOAD_RTLD_GLOBAL_RO_RDX |
| # define HAS_FEATURE(offset, name) \ |
| testl $(bit_##name), _rtld_local_ro+offset+(index_##name)(%rip) |
| # else |
| # define LOAD_RTLD_GLOBAL_RO_RDX \ |
| mov _rtld_global_ro@GOTPCREL(%rip), %RDX_LP |
| # define HAS_FEATURE(offset, name) \ |
| testl $(bit_##name), \ |
| RTLD_GLOBAL_RO_DL_X86_CPU_FEATURES_OFFSET+offset+(index_##name)(%rdx) |
| # endif |
| # else /* SHARED */ |
| # define LOAD_RTLD_GLOBAL_RO_RDX |
| # define HAS_FEATURE(offset, name) \ |
| testl $(bit_##name), _dl_x86_cpu_features+offset+(index_##name)(%rip) |
| # endif /* !SHARED */ |
| # else /* __x86_64__ */ |
| # ifdef SHARED |
| # define LOAD_FUNC_GOT_EAX(func) \ |
| leal func@GOTOFF(%edx), %eax |
| # if IS_IN (rtld) |
| # define LOAD_GOT_AND_RTLD_GLOBAL_RO \ |
| LOAD_PIC_REG(dx) |
| # define HAS_FEATURE(offset, name) \ |
| testl $(bit_##name), offset+(index_##name)+_rtld_local_ro@GOTOFF(%edx) |
| # else |
| # define LOAD_GOT_AND_RTLD_GLOBAL_RO \ |
| LOAD_PIC_REG(dx); \ |
| mov _rtld_global_ro@GOT(%edx), %ecx |
| # define HAS_FEATURE(offset, name) \ |
| testl $(bit_##name), \ |
| RTLD_GLOBAL_RO_DL_X86_CPU_FEATURES_OFFSET+offset+(index_##name)(%ecx) |
| # endif |
| # else /* SHARED */ |
| # define LOAD_FUNC_GOT_EAX(func) \ |
| leal func, %eax |
| # define LOAD_GOT_AND_RTLD_GLOBAL_RO |
| # define HAS_FEATURE(offset, name) \ |
| testl $(bit_##name), _dl_x86_cpu_features+offset+(index_##name) |
| # endif /* !SHARED */ |
| # endif /* !__x86_64__ */ |
| # else /* _LIBC && !nonlib */ |
| # error "Sorry, <cpu-features.h> is unimplemented for assembler" |
| # endif /* !_LIBC || nonlib */ |
| |
/* Assembler front ends for HAS_FEATURE.  Both expand to a single test
   instruction on bit_NAME; the first uses the CPUID area (CPUID_OFFSET)
   and the second the internal feature words (FEATURE_OFFSET).  */
# define HAS_CPU_FEATURE(name)	HAS_FEATURE (CPUID_OFFSET, name)
# define HAS_ARCH_FEATURE(name)	HAS_FEATURE (FEATURE_OFFSET, name)
| |
| #else /* __ASSEMBLER__ */ |
| |
/* Slots of the cpuid[] array in struct cpu_features.  The values are
   consecutive starting at zero, so the final enumerator is the number
   of slots.  */
enum
  {
    COMMON_CPUID_INDEX_1 = 0,
    COMMON_CPUID_INDEX_7,
    /* For AMD.  */
    COMMON_CPUID_INDEX_80000001,
    /* New slots go above this line; this one must stay last.  */
    COMMON_CPUID_INDEX_MAX
  };
| |
| struct cpu_features |
| { |
| enum cpu_features_kind |
| { |
| arch_kind_unknown = 0, |
| arch_kind_intel, |
| arch_kind_amd, |
| arch_kind_other |
| } kind; |
| int max_cpuid; |
| struct cpuid_registers |
| { |
| unsigned int eax; |
| unsigned int ebx; |
| unsigned int ecx; |
| unsigned int edx; |
| } cpuid[COMMON_CPUID_INDEX_MAX]; |
| unsigned int family; |
| unsigned int model; |
| unsigned int feature[FEATURE_INDEX_MAX]; |
| }; |
| |
| /* Used from outside of glibc to get access to the CPU features |
| structure. */ |
| extern const struct cpu_features *__get_cpu_features (void) |
| __attribute__ ((const)); |
| |
| # if defined (_LIBC) && !IS_IN (nonlib) |
| /* Unused for x86. */ |
| # define INIT_ARCH() |
| # define __get_cpu_features() (&GLRO(dl_x86_cpu_features)) |
| # endif |
| |
| |
/* Runtime feature tests; each one is non-zero when the feature may be
   used.  HAS_CPU_FEATURE (NAME) checks bit_NAME in register reg_NAME of
   CPUID slot index_NAME.  HAS_ARCH_FEATURE (NAME) checks bit_NAME in
   internal feature word index_NAME.  */
# define HAS_CPU_FEATURE(name)						\
  (((__get_cpu_features ()->cpuid[index_##name].reg_##name)		\
    & (bit_##name)) != 0)
# define HAS_ARCH_FEATURE(name)						\
  (((__get_cpu_features ()->feature[index_##name])			\
    & (bit_##name)) != 0)
| |
/* C view of the CPUID bits: index_NAME is the cpuid[] slot that holds
   bit_NAME.  Grouped by slot.  */

/* Slot COMMON_CPUID_INDEX_1.  */
# define index_CX8		COMMON_CPUID_INDEX_1
# define index_CMOV		COMMON_CPUID_INDEX_1
# define index_SSE2		COMMON_CPUID_INDEX_1
# define index_SSSE3		COMMON_CPUID_INDEX_1
# define index_SSE4_1		COMMON_CPUID_INDEX_1
# define index_SSE4_2		COMMON_CPUID_INDEX_1
# define index_AVX		COMMON_CPUID_INDEX_1
# define index_FMA		COMMON_CPUID_INDEX_1
# define index_POPCOUNT		COMMON_CPUID_INDEX_1
# define index_OSXSAVE		COMMON_CPUID_INDEX_1

/* Slot COMMON_CPUID_INDEX_7.  */
# define index_AVX2		COMMON_CPUID_INDEX_7
# define index_AVX512F		COMMON_CPUID_INDEX_7
# define index_AVX512DQ		COMMON_CPUID_INDEX_7
# define index_RTM		COMMON_CPUID_INDEX_7

/* Slot COMMON_CPUID_INDEX_80000001.  */
# define index_FMA4		COMMON_CPUID_INDEX_80000001
| |
/* reg_NAME is the member of struct cpuid_registers that holds bit_NAME;
   HAS_CPU_FEATURE pastes it after the `.' operator.  Grouped by
   register.  */

/* Register EDX.  */
# define reg_CX8		edx
# define reg_CMOV		edx
# define reg_SSE2		edx

/* Register ECX.  */
# define reg_SSSE3		ecx
# define reg_SSE4_1		ecx
# define reg_SSE4_2		ecx
# define reg_AVX		ecx
# define reg_FMA		ecx
# define reg_FMA4		ecx
# define reg_POPCOUNT		ecx
# define reg_OSXSAVE		ecx

/* Register EBX.  */
# define reg_AVX2		ebx
# define reg_AVX512F		ebx
# define reg_AVX512DQ		ebx
# define reg_RTM		ebx
| |
/* C view of the internal feature bits: index_NAME is the feature[]
   word that holds bit_NAME.  All of them are in the first word.  */

/* Names beginning with Fast_, Slow_ or Prefer_.  */
# define index_Fast_Rep_String			FEATURE_INDEX_1
# define index_Fast_Copy_Backward		FEATURE_INDEX_1
# define index_Slow_BSF				FEATURE_INDEX_1
# define index_Fast_Unaligned_Load		FEATURE_INDEX_1
# define index_Prefer_PMINUB_for_stringop	FEATURE_INDEX_1
# define index_Slow_SSE4_2			FEATURE_INDEX_1
# define index_AVX_Fast_Unaligned_Load		FEATURE_INDEX_1
# define index_Prefer_MAP_32BIT_EXEC		FEATURE_INDEX_1
# define index_Prefer_No_VZEROUPPER		FEATURE_INDEX_1

/* Names ending in _Usable.  */
# define index_AVX_Usable			FEATURE_INDEX_1
# define index_FMA_Usable			FEATURE_INDEX_1
# define index_FMA4_Usable			FEATURE_INDEX_1
# define index_AVX2_Usable			FEATURE_INDEX_1
# define index_AVX512F_Usable			FEATURE_INDEX_1
# define index_AVX512DQ_Usable			FEATURE_INDEX_1

/* I586 and I686.  */
# define index_I586				FEATURE_INDEX_1
# define index_I686				FEATURE_INDEX_1
| |
| #endif /* !__ASSEMBLER__ */ |
| |
/* Compile-time knowledge about the target CPU, derived from the
   compiler's predefined target macros.
     HAS_CPUID  constant 1, or 0 when nothing below matches;
     HAS_I586   constant 1, or a runtime HAS_ARCH_FEATURE test;
     HAS_I686   constant 1, or a runtime HAS_ARCH_FEATURE test.
   The __x86_64__ branch defines HAS_CPUID only.  */
#ifdef __x86_64__
# define HAS_CPUID 1
#elif defined __i586__ || defined __pentium__
/* i586 is guaranteed by the target; i686 is checked at run time.  */
# define HAS_CPUID 1
# define HAS_I586 1
# define HAS_I686 HAS_ARCH_FEATURE (I686)
#elif (defined __i686__ \
       || defined __pentiumpro__ \
       || defined __pentium4__ \
       || defined __nocona__ \
       || defined __atom__ \
       || defined __core2__ \
       || defined __corei7__ \
       || defined __corei7_avx__ \
       || defined __core_avx2__ \
       || defined __nehalem__ \
       || defined __sandybridge__ \
       || defined __haswell__ \
       || defined __knl__ \
       || defined __bonnell__ \
       || defined __silvermont__ \
       || defined __k6__ \
       || defined __k8__ \
       || defined __athlon__ \
       || defined __amdfam10__ \
       || defined __bdver1__ \
       || defined __bdver2__ \
       || defined __bdver3__ \
       || defined __bdver4__ \
       || defined __btver1__ \
       || defined __btver2__)
/* Any of these targets guarantees both i586 and i686.  */
# define HAS_CPUID 1
# define HAS_I586 1
# define HAS_I686 1
#else
/* Nothing is known at compile time; both levels are checked at run
   time.  */
# define HAS_CPUID 0
# define HAS_I586 HAS_ARCH_FEATURE (I586)
# define HAS_I686 HAS_ARCH_FEATURE (I686)
#endif
| |
| #endif /* cpu_features_h */ |