| 1 | 
 /* | 
 
 
 
 
 
 | 2 | 
  * Copyright (C) 2007-2015 Free Software Foundation, Inc. | 
 
 
 
 
 
 | 3 | 
  * | 
 
 
 
 
 
 | 4 | 
  * This file is free software; you can redistribute it and/or modify it | 
 
 
 
 
 
 | 5 | 
  * under the terms of the GNU General Public License as published by the | 
 
 
 
 
 
 | 6 | 
  * Free Software Foundation; either version 3, or (at your option) any | 
 
 
 
 
 
 | 7 | 
  * later version. | 
 
 
 
 
 
 | 8 | 
  *  | 
 
 
 
 
 
 | 9 | 
  * This file is distributed in the hope that it will be useful, but | 
 
 
 
 
 
 | 10 | 
  * WITHOUT ANY WARRANTY; without even the implied warranty of | 
 
 
 
 
 
 | 11 | 
  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU | 
 
 
 
 
 
 | 12 | 
  * General Public License for more details. | 
 
 
 
 
 
 | 13 | 
  *  | 
 
 
 
 
 
 | 14 | 
  * Under Section 7 of GPL version 3, you are granted additional | 
 
 
 
 
 
 | 15 | 
  * permissions described in the GCC Runtime Library Exception, version | 
 
 
 
 
 
 | 16 | 
  * 3.1, as published by the Free Software Foundation. | 
 
 
 
 
 
 | 17 | 
  *  | 
 
 
 
 
 
 | 18 | 
  * You should have received a copy of the GNU General Public License and | 
 
 
 
 
 
 | 19 | 
  * a copy of the GCC Runtime Library Exception along with this program; | 
 
 
 
 
 
 | 20 | 
  * see the files COPYING3 and COPYING.RUNTIME respectively.  If not, see | 
 
 
 
 
 
 | 21 | 
  * <http://www.gnu.org/licenses/>. | 
 
 
 
 
 
 | 22 | 
  */ | 
 
 
 
 
 
 | 23 | 
  | 
 
 
 
 
 
 | 24 | 
 /* Feature flags returned by cpuid in %ecx.
    NOTE(review): this list and the %edx list below look like the
    standard feature leaf (%eax == 1) -- confirm against the CPUID
    reference.  */
 #define bit_SSE3          (1 << 0)
 #define bit_PCLMUL        (1 << 1)
 /* NOTE(review): same value as bit_ABM in the extended-features %ecx
    list; LZCNT appears to belong to that list rather than this one --
    confirm before testing this bit against the word described here.  */
 #define bit_LZCNT         (1 << 5)
 #define bit_SSSE3         (1 << 9)
 #define bit_FMA           (1 << 12)
 #define bit_CMPXCHG16B    (1 << 13)
 #define bit_SSE4_1        (1 << 19)
 #define bit_SSE4_2        (1 << 20)
 #define bit_MOVBE         (1 << 22)
 #define bit_POPCNT        (1 << 23)
 #define bit_AES           (1 << 25)
 #define bit_XSAVE         (1 << 26)
 #define bit_OSXSAVE       (1 << 27)
 #define bit_AVX           (1 << 28)
 #define bit_F16C          (1 << 29)
 #define bit_RDRND         (1 << 30)

 /* Feature flags returned by cpuid in %edx (same query as above).  */
 #define bit_CMPXCHG8B     (1 << 8)
 #define bit_CMOV          (1 << 15)
 #define bit_MMX           (1 << 23)
 #define bit_FXSAVE        (1 << 24)
 #define bit_SSE           (1 << 25)
 #define bit_SSE2          (1 << 26)
 
 
 
 
 
 | 49 | 
  | 
 
 
 
 
 
 | 50 | 
 /* Extended Features */
 /* Flags returned in %ecx.  */
 #define bit_LAHF_LM       (1 << 0)
 #define bit_ABM           (1 << 5)
 #define bit_SSE4a         (1 << 6)
 #define bit_PRFCHW        (1 << 8)
 #define bit_XOP           (1 << 11)
 #define bit_LWP           (1 << 15)
 #define bit_FMA4          (1 << 16)
 #define bit_TBM           (1 << 21)
 #define bit_MWAITX        (1 << 29)

 /* Flags returned in %edx.  */
 #define bit_MMXEXT        (1 << 22)
 #define bit_LM            (1 << 29)
 #define bit_3DNOWP        (1 << 30)
 /* Bit 31 must be built from an unsigned constant: shifting a signed 1
    into the sign bit of a 32-bit int is undefined behavior and yields a
    negative mask that sign-extends when widened.  */
 #define bit_3DNOW         (1u << 31)
 
 
 
 
 
 | 67 | 
  | 
 
 
 
 
 
 | 68 | 
 /* Extended Features (%eax == 7) */
 /* Flags returned in %ebx.  */
 #define bit_FSGSBASE      (1 << 0)
 #define bit_BMI           (1 << 3)
 #define bit_HLE           (1 << 4)
 #define bit_AVX2          (1 << 5)
 #define bit_BMI2          (1 << 8)
 #define bit_RTM           (1 << 11)
 #define bit_MPX           (1 << 14)
 #define bit_AVX512F       (1 << 16)
 #define bit_AVX512DQ      (1 << 17)
 #define bit_RDSEED        (1 << 18)
 #define bit_ADX           (1 << 19)
 #define bit_AVX512IFMA    (1 << 21)
 #define bit_PCOMMIT       (1 << 22)
 #define bit_CLFLUSHOPT    (1 << 23)
 #define bit_CLWB          (1 << 24)
 #define bit_AVX512PF      (1 << 26)
 #define bit_AVX512ER      (1 << 27)
 #define bit_AVX512CD      (1 << 28)
 #define bit_SHA           (1 << 29)
 #define bit_AVX512BW      (1 << 30)
 /* Bit 31 must be built from an unsigned constant: shifting a signed 1
    into the sign bit of a 32-bit int is undefined behavior and yields a
    negative mask that sign-extends when widened.  */
 #define bit_AVX512VL      (1u << 31)

 /* Flags returned in %ecx.  */
 #define bit_PREFETCHWT1   (1 << 0)
 #define bit_AVX512VBMI    (1 << 1)
 
 
 
 
 
 | 95 | 
  | 
 
 
 
 
 
 | 96 | 
 /* Bits of the XFEATURE_ENABLED_MASK register, as reported by cpuid
    with %eax == 13 and %ecx == 0.  */
 #define bit_BNDREGS       (1 << 3)
 #define bit_BNDCSR        (1 << 4)

 /* Extended state enumeration sub-leaf: cpuid with %eax == 13 and
    %ecx == 1.  */
 #define bit_XSAVEOPT      (1 << 0)
 #define bit_XSAVEC        (1 << 1)
 #define bit_XSAVES        (1 << 3)
 
 
 
 
 
 | 104 | 
  | 
 
 
 
 
 
 | 105 | 
 /* Vendor signatures of the different CPU implementations, as returned
    by cpuid with level 0.  Each constant packs four ASCII characters of
    the vendor string, least significant byte first; the full string
    reads in the order ebx, edx, ecx.  */

 /* "AuthenticAMD" */
 #define signature_AMD_ebx         0x68747541
 #define signature_AMD_ecx         0x444d4163
 #define signature_AMD_edx         0x69746e65

 /* "CentaurHauls" */
 #define signature_CENTAUR_ebx     0x746e6543
 #define signature_CENTAUR_ecx     0x736c7561
 #define signature_CENTAUR_edx     0x48727561

 /* "CyrixInstead" */
 #define signature_CYRIX_ebx       0x69727943
 #define signature_CYRIX_ecx       0x64616574
 #define signature_CYRIX_edx       0x736e4978

 /* "GenuineIntel" */
 #define signature_INTEL_ebx       0x756e6547
 #define signature_INTEL_ecx       0x6c65746e
 #define signature_INTEL_edx       0x49656e69

 /* "TransmetaCPU" */
 #define signature_TM1_ebx         0x6e617254
 #define signature_TM1_ecx         0x55504361
 #define signature_TM1_edx         0x74656d73

 /* "GenuineTMx86" */
 #define signature_TM2_ebx         0x756e6547
 #define signature_TM2_ecx         0x3638784d
 #define signature_TM2_edx         0x54656e69

 /* "Geode by NSC" */
 #define signature_NSC_ebx         0x646f6547
 #define signature_NSC_ecx         0x43534e20
 #define signature_NSC_edx         0x79622065

 /* "NexGenDriven" */
 #define signature_NEXGEN_ebx      0x4778654e
 #define signature_NEXGEN_ecx      0x6e657669
 #define signature_NEXGEN_edx      0x72446e65

 /* "RiseRiseRise" */
 #define signature_RISE_ebx        0x65736952
 #define signature_RISE_ecx        0x65736952
 #define signature_RISE_edx        0x65736952

 /* "SiS SiS SiS " */
 #define signature_SIS_ebx         0x20536953
 #define signature_SIS_ecx         0x20536953
 #define signature_SIS_edx         0x20536953

 /* "UMC UMC UMC " */
 #define signature_UMC_ebx         0x20434d55
 #define signature_UMC_ecx         0x20434d55
 #define signature_UMC_edx         0x20434d55

 /* "VIA VIA VIA " */
 #define signature_VIA_ebx         0x20414956
 #define signature_VIA_ecx         0x20414956
 #define signature_VIA_edx         0x20414956

 /* "Vortex86 SoC" */
 #define signature_VORTEX_ebx      0x74726f56
 #define signature_VORTEX_ecx      0x436f5320
 #define signature_VORTEX_edx      0x36387865
 
 
 
 
 
 | 158 | 
  | 
 
 
 
 
 
 | 159 | 
 /* Execute cpuid with %eax = level and store the resulting %eax, %ebx,
    %ecx and %edx values in the lvalues a, b, c and d.  %ecx is not
    loaded before the instruction; use __cpuid_count when it matters.

    The asm is volatile because its result is not a pure function of the
    listed inputs (the instruction also reads %ecx, which is not an
    operand here).  Without the qualifier the compiler may merge repeated
    invocations or drop one whose outputs are unused.  */
 #define __cpuid(level, a, b, c, d)                              \
   __asm__ __volatile__ ("cpuid\n\t"                             \
                         : "=a" (a), "=b" (b), "=c" (c), "=d" (d) \
                         : "0" (level))
 
 
 
 
 
 | 163 | 
  | 
 
 
 
 
 
 | 164 | 
 /* Execute cpuid with %eax = level and %ecx = count, and store the
    resulting %eax, %ebx, %ecx and %edx values in the lvalues a, b, c
    and d.

    The asm is volatile so that the compiler neither merges repeated
    invocations nor drops one whose outputs are unused.  */
 #define __cpuid_count(level, count, a, b, c, d)                 \
   __asm__ __volatile__ ("cpuid\n\t"                             \
                         : "=a" (a), "=b" (b), "=c" (c), "=d" (d) \
                         : "0" (level), "2" (count))
 
 
 
 
 
 | 168 | 
  | 
 
 
 
 
 
 | 169 | 
  | 
 
 
 
 
 
 | 170 | 
 /* Query the highest input value the cpuid instruction accepts.

    __ext selects the range to query: 0x0 for the basic cpuid
    information or 0x80000000 for the extended information.  The result
    is whatever cpuid leaves in %eax for that input, or 0 when the cpuid
    instruction is not supported.  When __sig is non-null, the %ebx value
    of the same query (the first four bytes of the signature) is stored
    in the location it points to.  */

 static __inline unsigned int
 __get_cpuid_max (unsigned int __ext, unsigned int *__sig)
 {
   unsigned int __max, __vendor, __unused_c, __unused_d;

 #ifndef __x86_64__
   /* cpuid may be missing here (on AMD64 it is always present).  Probe
      for it by flipping bit 0x00200000 of the flags register and reading
      the flags back: __before holds the original flags, __after the
      flags observed after the attempted flip.  The original flags are
      restored before the asm ends.  */
   {
     unsigned int __after, __before;

 #if __GNUC__ >= 3
     __asm__ ("pushf{l|d}\n\t"
              "pushf{l|d}\n\t"
              "pop{l}\t%0\n\t"
              "mov{l}\t{%0, %1|%1, %0}\n\t"
              "xor{l}\t{%2, %0|%0, %2}\n\t"
              "push{l}\t%0\n\t"
              "popf{l|d}\n\t"
              "pushf{l|d}\n\t"
              "pop{l}\t%0\n\t"
              "popf{l|d}\n\t"
              : "=&r" (__after), "=&r" (__before)
              : "i" (0x00200000));
 #else
     /* Host GCCs older than 3.0 support neither Intel asm syntax nor
        dialect alternatives in i386 code, so spell out AT&T syntax.  */
     __asm__ ("pushfl\n\t"
              "pushfl\n\t"
              "popl\t%0\n\t"
              "movl\t%0, %1\n\t"
              "xorl\t%2, %0\n\t"
              "pushl\t%0\n\t"
              "popfl\n\t"
              "pushfl\n\t"
              "popl\t%0\n\t"
              "popfl\n\t"
              : "=&r" (__after), "=&r" (__before)
              : "i" (0x00200000));
 #endif

     /* The bit did not change: no cpuid on this processor.  */
     if (((__after ^ __before) & 0x00200000) == 0)
       return 0;
   }
 #endif

   /* cpuid is usable; ask it for the highest supported input value.  */
   __cpuid (__ext, __max, __vendor, __unused_c, __unused_d);

   if (__sig != 0)
     *__sig = __vendor;

   return __max;
 }
 
 
 
 
 
 | 226 | 
  | 
 
 
 
 
 
 | 227 | 
 /* Fetch cpuid data for the requested __level into *__eax, *__ebx,
    *__ecx and *__edx.

    Returns 1 when the data is valid.  Returns 0, leaving the outputs
    untouched, when cpuid is not supported or when __level exceeds the
    highest supported level of its range (basic or extended, selected by
    bit 31 of __level).  All pointers are required to be non-null.

    Only %eax is loaded before cpuid executes, so %ecx holds whatever the
    register contained; use __cpuid_count directly when %ecx must be
    set.  */

 static __inline int
 __get_cpuid (unsigned int __level,
              unsigned int *__eax, unsigned int *__ebx,
              unsigned int *__ecx, unsigned int *__edx)
 {
   unsigned int __ext = __level & 0x80000000;
   unsigned int __maxlevel = __get_cpuid_max (__ext, 0);

   /* __get_cpuid_max returns 0 when cpuid is unavailable.  Check for
      that explicitly: a plain "__maxlevel < __level" test lets
      __level == 0 through and would execute cpuid anyway.  */
   if (__maxlevel == 0 || __maxlevel < __level)
     return 0;

   __cpuid (__level, *__eax, *__ebx, *__ecx, *__edx);
   return 1;
 }