1 /* Get CPU type and Features for x86 processors.
2 Copyright (C) 2012-2017 Free Software Foundation, Inc.
3 Contributed by Sriraman Tallam (tmsriram@google.com)
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 3, or (at your option) any later
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
17 Under Section 7 of GPL version 3, you are granted additional
18 permissions described in the GCC Runtime Library Exception, version
19 3.1, as published by the Free Software Foundation.
21 You should have received a copy of the GNU General Public License and
22 a copy of the GCC Runtime Library Exception along with this program;
23 see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
24 <http://www.gnu.org/licenses/>. */
28 #include "auto-target.h"
31 #ifdef HAVE_INIT_PRIORITY
32 #define CONSTRUCTOR_PRIORITY (101)
34 #define CONSTRUCTOR_PRIORITY
37 int __cpu_indicator_init (void)
38 __attribute__ ((constructor CONSTRUCTOR_PRIORITY));
41 struct __processor_model __cpu_model = { };
44 /* Get the specific type of AMD CPU. */
47 get_amd_cpu (unsigned int family, unsigned int model)
53 __cpu_model.__cpu_type = AMDFAM10H;
58 __cpu_model.__cpu_subtype = AMDFAM10H_BARCELONA;
62 __cpu_model.__cpu_subtype = AMDFAM10H_SHANGHAI;
66 __cpu_model.__cpu_subtype = AMDFAM10H_ISTANBUL;
72 /* AMD Family 14h "btver1". */
74 __cpu_model.__cpu_type = AMD_BTVER1;
76 /* AMD Family 15h "Bulldozer". */
78 __cpu_model.__cpu_type = AMDFAM15H;
79 /* Bulldozer version 1. */
81 __cpu_model.__cpu_subtype = AMDFAM15H_BDVER1;
82 /* Bulldozer version 2 "Piledriver" */
83 if (model >= 0x10 && model <= 0x2f)
84 __cpu_model.__cpu_subtype = AMDFAM15H_BDVER2;
85 /* Bulldozer version 3 "Steamroller" */
86 if (model >= 0x30 && model <= 0x4f)
87 __cpu_model.__cpu_subtype = AMDFAM15H_BDVER3;
88 /* Bulldozer version 4 "Excavator" */
89 if (model >= 0x60 && model <= 0x7f)
90 __cpu_model.__cpu_subtype = AMDFAM15H_BDVER4;
92 /* AMD Family 16h "btver2" */
94 __cpu_model.__cpu_type = AMD_BTVER2;
97 __cpu_model.__cpu_type = AMDFAM17H;
98 /* AMD family 17h version 1. */
100 __cpu_model.__cpu_subtype = AMDFAM17H_ZNVER1;
107 /* Get the specific type of Intel CPU. */
110 get_intel_cpu (unsigned int family, unsigned int model, unsigned int brand_id)
112 /* Parse family and model only if brand ID is 0. */
126 __cpu_model.__cpu_type = INTEL_BONNELL;
134 __cpu_model.__cpu_type = INTEL_SILVERMONT;
137 /* Knights Landing. */
138 __cpu_model.__cpu_type = INTEL_KNL;
145 __cpu_model.__cpu_type = INTEL_COREI7;
146 __cpu_model.__cpu_subtype = INTEL_COREI7_NEHALEM;
152 __cpu_model.__cpu_type = INTEL_COREI7;
153 __cpu_model.__cpu_subtype = INTEL_COREI7_WESTMERE;
158 __cpu_model.__cpu_type = INTEL_COREI7;
159 __cpu_model.__cpu_subtype = INTEL_COREI7_SANDYBRIDGE;
164 __cpu_model.__cpu_type = INTEL_COREI7;
165 __cpu_model.__cpu_subtype = INTEL_COREI7_IVYBRIDGE;
172 __cpu_model.__cpu_type = INTEL_COREI7;
173 __cpu_model.__cpu_subtype = INTEL_COREI7_HASWELL;
180 __cpu_model.__cpu_type = INTEL_COREI7;
181 __cpu_model.__cpu_subtype = INTEL_COREI7_BROADWELL;
186 __cpu_model.__cpu_type = INTEL_COREI7;
187 __cpu_model.__cpu_subtype = INTEL_COREI7_SKYLAKE;
190 /* Skylake with AVX-512 support. */
191 __cpu_model.__cpu_type = INTEL_COREI7;
192 __cpu_model.__cpu_subtype = INTEL_COREI7_SKYLAKE_AVX512;
199 __cpu_model.__cpu_type = INTEL_CORE2;
206 /* We have no idea. */
212 /* ECX and EDX are output of CPUID at level one. MAX_CPUID_LEVEL is
213 the max possible level of CPUID insn. */
215 get_available_features (unsigned int ecx, unsigned int edx,
218 unsigned int features = 0;
221 features |= (1 << FEATURE_CMOV);
223 features |= (1 << FEATURE_MMX);
225 features |= (1 << FEATURE_SSE);
227 features |= (1 << FEATURE_SSE2);
228 if (ecx & bit_POPCNT)
229 features |= (1 << FEATURE_POPCNT);
231 features |= (1 << FEATURE_AES);
232 if (ecx & bit_PCLMUL)
233 features |= (1 << FEATURE_PCLMUL);
235 features |= (1 << FEATURE_SSE3);
237 features |= (1 << FEATURE_SSSE3);
238 if (ecx & bit_SSE4_1)
239 features |= (1 << FEATURE_SSE4_1);
240 if (ecx & bit_SSE4_2)
241 features |= (1 << FEATURE_SSE4_2);
243 features |= (1 << FEATURE_AVX);
245 features |= (1 << FEATURE_FMA);
247 /* Get Advanced Features at level 7 (eax = 7, ecx = 0). */
248 if (max_cpuid_level >= 7)
250 unsigned int eax, ebx, ecx, edx;
251 __cpuid_count (7, 0, eax, ebx, ecx, edx);
253 features |= (1 << FEATURE_BMI);
255 features |= (1 << FEATURE_AVX2);
257 features |= (1 << FEATURE_BMI2);
258 if (ebx & bit_AVX512F)
259 features |= (1 << FEATURE_AVX512F);
260 if (ebx & bit_AVX512VL)
261 features |= (1 << FEATURE_AVX512VL);
262 if (ebx & bit_AVX512BW)
263 features |= (1 << FEATURE_AVX512BW);
264 if (ebx & bit_AVX512DQ)
265 features |= (1 << FEATURE_AVX512DQ);
266 if (ebx & bit_AVX512CD)
267 features |= (1 << FEATURE_AVX512CD);
268 if (ebx & bit_AVX512PF)
269 features |= (1 << FEATURE_AVX512PF);
270 if (ebx & bit_AVX512ER)
271 features |= (1 << FEATURE_AVX512ER);
272 if (ebx & bit_AVX512IFMA)
273 features |= (1 << FEATURE_AVX512IFMA);
274 if (ecx & bit_AVX512VBMI)
275 features |= (1 << FEATURE_AVX512VBMI);
276 if (edx & bit_AVX5124VNNIW)
277 features |= (1 << FEATURE_AVX5124VNNIW);
278 if (edx & bit_AVX5124FMAPS)
279 features |= (1 << FEATURE_AVX5124FMAPS);
282 unsigned int ext_level;
283 unsigned int eax, ebx;
284 /* Check cpuid level of extended features. */
285 __cpuid (0x80000000, ext_level, ebx, ecx, edx);
287 if (ext_level > 0x80000000)
289 __cpuid (0x80000001, eax, ebx, ecx, edx);
292 features |= (1 << FEATURE_SSE4_A);
294 features |= (1 << FEATURE_FMA4);
296 features |= (1 << FEATURE_XOP);
299 __cpu_model.__cpu_features[0] = features;
302 /* A constructor function that is sets __cpu_model and __cpu_features with
303 the right values. This needs to run only once. This constructor is
304 given the highest priority and it should run before constructors without
305 the priority set. However, it still runs after ifunc initializers and
306 needs to be called explicitly there. */
308 int __attribute__ ((constructor CONSTRUCTOR_PRIORITY))
309 __cpu_indicator_init (void)
311 unsigned int eax, ebx, ecx, edx;
315 unsigned int model, family, brand_id;
316 unsigned int extended_model, extended_family;
318 /* This function needs to run just once. */
319 if (__cpu_model.__cpu_vendor)
322 /* Assume cpuid insn present. Run in level 0 to get vendor id. */
323 if (!__get_cpuid (0, &eax, &ebx, &ecx, &edx))
325 __cpu_model.__cpu_vendor = VENDOR_OTHER;
334 __cpu_model.__cpu_vendor = VENDOR_OTHER;
338 if (!__get_cpuid (1, &eax, &ebx, &ecx, &edx))
340 __cpu_model.__cpu_vendor = VENDOR_OTHER;
344 model = (eax >> 4) & 0x0f;
345 family = (eax >> 8) & 0x0f;
346 brand_id = ebx & 0xff;
347 extended_model = (eax >> 12) & 0xf0;
348 extended_family = (eax >> 20) & 0xff;
350 if (vendor == signature_INTEL_ebx)
352 /* Adjust model and family for Intel CPUS. */
355 family += extended_family;
356 model += extended_model;
358 else if (family == 0x06)
359 model += extended_model;
362 get_intel_cpu (family, model, brand_id);
363 /* Find available features. */
364 get_available_features (ecx, edx, max_level);
365 __cpu_model.__cpu_vendor = VENDOR_INTEL;
367 else if (vendor == signature_AMD_ebx)
369 /* Adjust model and family for AMD CPUS. */
372 family += extended_family;
373 model += extended_model;
377 get_amd_cpu (family, model);
378 /* Find available features. */
379 get_available_features (ecx, edx, max_level);
380 __cpu_model.__cpu_vendor = VENDOR_AMD;
383 __cpu_model.__cpu_vendor = VENDOR_OTHER;
385 gcc_assert (__cpu_model.__cpu_vendor < VENDOR_MAX);
386 gcc_assert (__cpu_model.__cpu_type < CPU_TYPE_MAX);
387 gcc_assert (__cpu_model.__cpu_subtype < CPU_SUBTYPE_MAX);
392 #if defined SHARED && defined USE_ELF_SYMVER
393 __asm__ (".symver __cpu_indicator_init, __cpu_indicator_init@GCC_4.8.0");
394 __asm__ (".symver __cpu_model, __cpu_model@GCC_4.8.0");