1 /*
2 * Copyright (C) 2007-2019 Free Software Foundation, Inc.
3 *
4 * This file is free software; you can redistribute it and/or modify it
5 * under the terms of the GNU General Public License as published by the
6 * Free Software Foundation; either version 3, or (at your option) any
7 * later version.
8 *
9 * This file is distributed in the hope that it will be useful, but
10 * WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
12 * General Public License for more details.
13 *
14 * Under Section 7 of GPL version 3, you are granted additional
15 * permissions described in the GCC Runtime Library Exception, version
16 * 3.1, as published by the Free Software Foundation.
17 *
18 * You should have received a copy of the GNU General Public License and
19 * a copy of the GCC Runtime Library Exception along with this program;
20 * see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
21 * <http://www.gnu.org/licenses/>.
22 */
23
24 /* %ecx */
25 #define bit_SSE3 (1 << 0)
26 #define bit_PCLMUL (1 << 1)
27 #define bit_LZCNT (1 << 5)
28 #define bit_SSSE3 (1 << 9)
29 #define bit_FMA (1 << 12)
30 #define bit_CMPXCHG16B (1 << 13)
31 #define bit_SSE4_1 (1 << 19)
32 #define bit_SSE4_2 (1 << 20)
33 #define bit_MOVBE (1 << 22)
34 #define bit_POPCNT (1 << 23)
35 #define bit_AES (1 << 25)
36 #define bit_XSAVE (1 << 26)
37 #define bit_OSXSAVE (1 << 27)
38 #define bit_AVX (1 << 28)
39 #define bit_F16C (1 << 29)
40 #define bit_RDRND (1 << 30)
41
42 /* %edx */
43 #define bit_CMPXCHG8B (1 << 8)
44 #define bit_CMOV (1 << 15)
45 #define bit_MMX (1 << 23)
46 #define bit_FXSAVE (1 << 24)
47 #define bit_SSE (1 << 25)
48 #define bit_SSE2 (1 << 26)
49
50 /* Extended Features (%eax == 0x80000001) */
51 /* %ecx */
52 #define bit_LAHF_LM (1 << 0)
53 #define bit_ABM (1 << 5)
54 #define bit_SSE4a (1 << 6)
55 #define bit_PRFCHW (1 << 8)
56 #define bit_XOP (1 << 11)
57 #define bit_LWP (1 << 15)
58 #define bit_FMA4 (1 << 16)
59 #define bit_TBM (1 << 21)
60 #define bit_MWAITX (1 << 29)
61
62 /* %edx */
63 #define bit_MMXEXT (1 << 22)
64 #define bit_LM (1 << 29)
65 #define bit_3DNOWP (1 << 30)
66 #define bit_3DNOW (1u << 31)
67
68 /* %ebx */
69 #define bit_CLZERO (1 << 0)
70 #define bit_WBNOINVD (1 << 9)
71
72 /* Extended Features (%eax == 7) */
73 /* %ebx */
74 #define bit_FSGSBASE (1 << 0)
75 #define bit_SGX (1 << 2)
76 #define bit_BMI (1 << 3)
77 #define bit_HLE (1 << 4)
78 #define bit_AVX2 (1 << 5)
79 #define bit_BMI2 (1 << 8)
80 #define bit_RTM (1 << 11)
81 #define bit_MPX (1 << 14)
82 #define bit_AVX512F (1 << 16)
83 #define bit_AVX512DQ (1 << 17)
84 #define bit_RDSEED (1 << 18)
85 #define bit_ADX (1 << 19)
86 #define bit_AVX512IFMA (1 << 21)
87 #define bit_CLFLUSHOPT (1 << 23)
88 #define bit_CLWB (1 << 24)
89 #define bit_AVX512PF (1 << 26)
90 #define bit_AVX512ER (1 << 27)
91 #define bit_AVX512CD (1 << 28)
92 #define bit_SHA (1 << 29)
93 #define bit_AVX512BW (1 << 30)
94 #define bit_AVX512VL (1u << 31)
95
96 /* %ecx */
97 #define bit_PREFETCHWT1 (1 << 0)
98 #define bit_AVX512VBMI (1 << 1)
99 #define bit_PKU (1 << 3)
100 #define bit_OSPKE (1 << 4)
101 #define bit_WAITPKG (1 << 5)
102 #define bit_AVX512VBMI2 (1 << 6)
103 #define bit_SHSTK (1 << 7)
104 #define bit_GFNI (1 << 8)
105 #define bit_VAES (1 << 9)
106 #define bit_AVX512VNNI (1 << 11)
107 #define bit_VPCLMULQDQ (1 << 10)
108 #define bit_AVX512BITALG (1 << 12)
109 #define bit_AVX512VPOPCNTDQ (1 << 14)
110 #define bit_RDPID (1 << 22)
111 #define bit_MOVDIRI (1 << 27)
112 #define bit_MOVDIR64B (1 << 28)
113 #define bit_CLDEMOTE (1 << 25)
114
115 /* %edx */
116 #define bit_AVX5124VNNIW (1 << 2)
117 #define bit_AVX5124FMAPS (1 << 3)
118 #define bit_IBT (1 << 20)
119 #define bit_PCONFIG (1 << 18)
120 /* XFEATURE_ENABLED_MASK register bits (%eax == 13, %ecx == 0) */
121 #define bit_BNDREGS (1 << 3)
122 #define bit_BNDCSR (1 << 4)
123
124 /* Extended State Enumeration Sub-leaf (%eax == 13, %ecx == 1) */
125 #define bit_XSAVEOPT (1 << 0)
126 #define bit_XSAVEC (1 << 1)
127 #define bit_XSAVES (1 << 3)
128
129 /* PT sub leaf (%eax == 14, %ecx == 0) */
130 /* %ebx */
131 #define bit_PTWRITE (1 << 4)
132
133 /* Signatures for different CPU implementations as returned in uses
134 of cpuid with level 0. */
135 #define signature_AMD_ebx 0x68747541
136 #define signature_AMD_ecx 0x444d4163
137 #define signature_AMD_edx 0x69746e65
138
139 #define signature_CENTAUR_ebx 0x746e6543
140 #define signature_CENTAUR_ecx 0x736c7561
141 #define signature_CENTAUR_edx 0x48727561
142
143 #define signature_CYRIX_ebx 0x69727943
144 #define signature_CYRIX_ecx 0x64616574
145 #define signature_CYRIX_edx 0x736e4978
146
147 #define signature_INTEL_ebx 0x756e6547
148 #define signature_INTEL_ecx 0x6c65746e
149 #define signature_INTEL_edx 0x49656e69
150
151 #define signature_TM1_ebx 0x6e617254
152 #define signature_TM1_ecx 0x55504361
153 #define signature_TM1_edx 0x74656d73
154
155 #define signature_TM2_ebx 0x756e6547
156 #define signature_TM2_ecx 0x3638784d
157 #define signature_TM2_edx 0x54656e69
158
159 #define signature_NSC_ebx 0x646f6547
160 #define signature_NSC_ecx 0x43534e20
161 #define signature_NSC_edx 0x79622065
162
163 #define signature_NEXGEN_ebx 0x4778654e
164 #define signature_NEXGEN_ecx 0x6e657669
165 #define signature_NEXGEN_edx 0x72446e65
166
167 #define signature_RISE_ebx 0x65736952
168 #define signature_RISE_ecx 0x65736952
169 #define signature_RISE_edx 0x65736952
170
171 #define signature_SIS_ebx 0x20536953
172 #define signature_SIS_ecx 0x20536953
173 #define signature_SIS_edx 0x20536953
174
175 #define signature_UMC_ebx 0x20434d55
176 #define signature_UMC_ecx 0x20434d55
177 #define signature_UMC_edx 0x20434d55
178
179 #define signature_VIA_ebx 0x20414956
180 #define signature_VIA_ecx 0x20414956
181 #define signature_VIA_edx 0x20414956
182
183 #define signature_VORTEX_ebx 0x74726f56
184 #define signature_VORTEX_ecx 0x436f5320
185 #define signature_VORTEX_edx 0x36387865
186
187 #ifndef __x86_64__
188 /* At least one cpu (Winchip 2) does not set %ebx and %ecx
189 for cpuid leaf 1. Forcibly zero the two registers before
190 calling cpuid as a precaution. */
191 #define __cpuid(level, a, b, c, d) \
192 do { \
193 if (__builtin_constant_p (level) && (level) != 1) \
194 __asm__ __volatile__ ("cpuid\n\t" \
195 : "=a" (a), "=b" (b), "=c" (c), "=d" (d) \
196 : "0" (level)); \
197 else \
198 __asm__ __volatile__ ("cpuid\n\t" \
199 : "=a" (a), "=b" (b), "=c" (c), "=d" (d) \
200 : "0" (level), "1" (0), "2" (0)); \
201 } while (0)
202 #else
203 #define __cpuid(level, a, b, c, d) \
204 __asm__ __volatile__ ("cpuid\n\t" \
205 : "=a" (a), "=b" (b), "=c" (c), "=d" (d) \
206 : "0" (level))
207 #endif
208
209 #define __cpuid_count(level, count, a, b, c, d) \
210 __asm__ __volatile__ ("cpuid\n\t" \
211 : "=a" (a), "=b" (b), "=c" (c), "=d" (d) \
212 : "0" (level), "2" (count))
213
214
215 /* Return highest supported input value for cpuid instruction. ext can
216 be either 0x0 or 0x80000000 to return highest supported value for
217 basic or extended cpuid information. Function returns 0 if cpuid
218 is not supported or whatever cpuid returns in eax register. If sig
219 pointer is non-null, then first four bytes of the signature
220 (as found in ebx register) are returned in location pointed by sig. */
221
222 static __inline unsigned int
__get_cpuid_max(unsigned int __ext,unsigned int * __sig)223 __get_cpuid_max (unsigned int __ext, unsigned int *__sig)
224 {
225 unsigned int __eax, __ebx, __ecx, __edx;
226
227 #ifndef __x86_64__
228 /* See if we can use cpuid. On AMD64 we always can. */
229 #if __GNUC__ >= 3
230 __asm__ ("pushf{l|d}\n\t"
231 "pushf{l|d}\n\t"
232 "pop{l}\t%0\n\t"
233 "mov{l}\t{%0, %1|%1, %0}\n\t"
234 "xor{l}\t{%2, %0|%0, %2}\n\t"
235 "push{l}\t%0\n\t"
236 "popf{l|d}\n\t"
237 "pushf{l|d}\n\t"
238 "pop{l}\t%0\n\t"
239 "popf{l|d}\n\t"
240 : "=&r" (__eax), "=&r" (__ebx)
241 : "i" (0x00200000));
242 #else
243 /* Host GCCs older than 3.0 weren't supporting Intel asm syntax
244 nor alternatives in i386 code. */
245 __asm__ ("pushfl\n\t"
246 "pushfl\n\t"
247 "popl\t%0\n\t"
248 "movl\t%0, %1\n\t"
249 "xorl\t%2, %0\n\t"
250 "pushl\t%0\n\t"
251 "popfl\n\t"
252 "pushfl\n\t"
253 "popl\t%0\n\t"
254 "popfl\n\t"
255 : "=&r" (__eax), "=&r" (__ebx)
256 : "i" (0x00200000));
257 #endif
258
259 if (!((__eax ^ __ebx) & 0x00200000))
260 return 0;
261 #endif
262
263 /* Host supports cpuid. Return highest supported cpuid input value. */
264 __cpuid (__ext, __eax, __ebx, __ecx, __edx);
265
266 if (__sig)
267 *__sig = __ebx;
268
269 return __eax;
270 }
271
272 /* Return cpuid data for requested cpuid leaf, as found in returned
273 eax, ebx, ecx and edx registers. The function checks if cpuid is
274 supported and returns 1 for valid cpuid information or 0 for
275 unsupported cpuid leaf. All pointers are required to be non-null. */
276
277 static __inline int
__get_cpuid(unsigned int __leaf,unsigned int * __eax,unsigned int * __ebx,unsigned int * __ecx,unsigned int * __edx)278 __get_cpuid (unsigned int __leaf,
279 unsigned int *__eax, unsigned int *__ebx,
280 unsigned int *__ecx, unsigned int *__edx)
281 {
282 unsigned int __ext = __leaf & 0x80000000;
283 unsigned int __maxlevel = __get_cpuid_max (__ext, 0);
284
285 if (__maxlevel == 0 || __maxlevel < __leaf)
286 return 0;
287
288 __cpuid (__leaf, *__eax, *__ebx, *__ecx, *__edx);
289 return 1;
290 }
291
292 /* Same as above, but sub-leaf can be specified. */
293
294 static __inline int
__get_cpuid_count(unsigned int __leaf,unsigned int __subleaf,unsigned int * __eax,unsigned int * __ebx,unsigned int * __ecx,unsigned int * __edx)295 __get_cpuid_count (unsigned int __leaf, unsigned int __subleaf,
296 unsigned int *__eax, unsigned int *__ebx,
297 unsigned int *__ecx, unsigned int *__edx)
298 {
299 unsigned int __ext = __leaf & 0x80000000;
300 unsigned int __maxlevel = __get_cpuid_max (__ext, 0);
301
302 if (__maxlevel == 0 || __maxlevel < __leaf)
303 return 0;
304
305 __cpuid_count (__leaf, __subleaf, *__eax, *__ebx, *__ecx, *__edx);
306 return 1;
307 }
308