18#include "llvm/Config/llvm-config.h"
40#include <mach/host_info.h>
42#include <mach/mach_host.h>
43#include <mach/machine.h>
45#include <sys/sysctl.h>
48#include <sys/systemcfg.h>
50#if defined(__sun__) && defined(__svr4__)
53#if defined(__GNUC__) || defined(__clang__)
54#if (defined(__i386__) || defined(__x86_64__)) && !defined(_MSC_VER)
59#define DEBUG_TYPE "host-detection"
69static std::unique_ptr<llvm::MemoryBuffer>
71 const char *CPUInfoFile =
"/proc/cpuinfo";
72 if (
const char *CpuinfoIntercept = std::getenv(
"LLVM_CPUINFO"))
73 CPUInfoFile = CpuinfoIntercept;
77 if (std::error_code EC = Text.getError()) {
78 llvm::errs() <<
"Can't read " << CPUInfoFile <<
": " << EC.message()
82 return std::move(*Text);
89 const char *
generic =
"generic";
103 while (CIP < CPUInfoEnd && CPUStart ==
nullptr) {
104 if (CIP < CPUInfoEnd && *CIP ==
'\n')
107 if (CIP < CPUInfoEnd && *CIP ==
'c') {
109 if (CIP < CPUInfoEnd && *CIP ==
'p') {
111 if (CIP < CPUInfoEnd && *CIP ==
'u') {
113 while (CIP < CPUInfoEnd && (*CIP ==
' ' || *CIP ==
'\t'))
116 if (CIP < CPUInfoEnd && *CIP ==
':') {
118 while (CIP < CPUInfoEnd && (*CIP ==
' ' || *CIP ==
'\t'))
121 if (CIP < CPUInfoEnd) {
123 while (CIP < CPUInfoEnd && (*CIP !=
' ' && *CIP !=
'\t' &&
124 *CIP !=
',' && *CIP !=
'\n'))
126 CPULen = CIP - CPUStart;
133 if (CPUStart ==
nullptr)
134 while (CIP < CPUInfoEnd && *CIP !=
'\n')
138 if (CPUStart ==
nullptr)
142 .
Case(
"604e",
"604e")
144 .
Case(
"7400",
"7400")
145 .
Case(
"7410",
"7400")
146 .
Case(
"7447",
"7400")
147 .
Case(
"7455",
"7450")
149 .
Case(
"POWER4",
"970")
150 .
Case(
"PPC970FX",
"970")
151 .
Case(
"PPC970MP",
"970")
153 .
Case(
"POWER5",
"g5")
155 .
Case(
"POWER6",
"pwr6")
156 .
Case(
"POWER7",
"pwr7")
157 .
Case(
"POWER8",
"pwr8")
158 .
Case(
"POWER8E",
"pwr8")
159 .
Case(
"POWER8NVL",
"pwr8")
160 .
Case(
"POWER9",
"pwr9")
161 .
Case(
"POWER10",
"pwr10")
162 .
Case(
"POWER11",
"pwr11")
176 ProcCpuinfoContent.
split(Lines,
'\n');
182 for (
unsigned I = 0, E = Lines.size();
I != E; ++
I) {
184 Implementer = Lines[
I].substr(15).ltrim(
"\t :");
186 Hardware = Lines[
I].substr(8).ltrim(
"\t :");
188 Part = Lines[
I].substr(8).ltrim(
"\t :");
191 if (Implementer ==
"0x41") {
204 .
Case(
"0x926",
"arm926ej-s")
205 .
Case(
"0xb02",
"mpcore")
206 .
Case(
"0xb36",
"arm1136j-s")
207 .
Case(
"0xb56",
"arm1156t2-s")
208 .
Case(
"0xb76",
"arm1176jz-s")
209 .
Case(
"0xc05",
"cortex-a5")
210 .
Case(
"0xc07",
"cortex-a7")
211 .
Case(
"0xc08",
"cortex-a8")
212 .
Case(
"0xc09",
"cortex-a9")
213 .
Case(
"0xc0f",
"cortex-a15")
214 .
Case(
"0xc0e",
"cortex-a17")
215 .
Case(
"0xc20",
"cortex-m0")
216 .
Case(
"0xc23",
"cortex-m3")
217 .
Case(
"0xc24",
"cortex-m4")
218 .
Case(
"0xc27",
"cortex-m7")
219 .
Case(
"0xd20",
"cortex-m23")
220 .
Case(
"0xd21",
"cortex-m33")
221 .
Case(
"0xd24",
"cortex-m52")
222 .
Case(
"0xd22",
"cortex-m55")
223 .
Case(
"0xd23",
"cortex-m85")
224 .
Case(
"0xc18",
"cortex-r8")
225 .
Case(
"0xd13",
"cortex-r52")
226 .
Case(
"0xd16",
"cortex-r52plus")
227 .
Case(
"0xd15",
"cortex-r82")
228 .
Case(
"0xd14",
"cortex-r82ae")
229 .
Case(
"0xd02",
"cortex-a34")
230 .
Case(
"0xd04",
"cortex-a35")
231 .
Case(
"0xd03",
"cortex-a53")
232 .
Case(
"0xd05",
"cortex-a55")
233 .
Case(
"0xd46",
"cortex-a510")
234 .
Case(
"0xd80",
"cortex-a520")
235 .
Case(
"0xd88",
"cortex-a520ae")
236 .
Case(
"0xd07",
"cortex-a57")
237 .
Case(
"0xd06",
"cortex-a65")
238 .
Case(
"0xd43",
"cortex-a65ae")
239 .
Case(
"0xd08",
"cortex-a72")
240 .
Case(
"0xd09",
"cortex-a73")
241 .
Case(
"0xd0a",
"cortex-a75")
242 .
Case(
"0xd0b",
"cortex-a76")
243 .
Case(
"0xd0e",
"cortex-a76ae")
244 .
Case(
"0xd0d",
"cortex-a77")
245 .
Case(
"0xd41",
"cortex-a78")
246 .
Case(
"0xd42",
"cortex-a78ae")
247 .
Case(
"0xd4b",
"cortex-a78c")
248 .
Case(
"0xd47",
"cortex-a710")
249 .
Case(
"0xd4d",
"cortex-a715")
250 .
Case(
"0xd81",
"cortex-a720")
251 .
Case(
"0xd89",
"cortex-a720ae")
252 .
Case(
"0xd87",
"cortex-a725")
253 .
Case(
"0xd44",
"cortex-x1")
254 .
Case(
"0xd4c",
"cortex-x1c")
255 .
Case(
"0xd48",
"cortex-x2")
256 .
Case(
"0xd4e",
"cortex-x3")
257 .
Case(
"0xd82",
"cortex-x4")
258 .
Case(
"0xd85",
"cortex-x925")
259 .
Case(
"0xd4a",
"neoverse-e1")
260 .
Case(
"0xd0c",
"neoverse-n1")
261 .
Case(
"0xd49",
"neoverse-n2")
262 .
Case(
"0xd8e",
"neoverse-n3")
263 .
Case(
"0xd40",
"neoverse-v1")
264 .
Case(
"0xd4f",
"neoverse-v2")
265 .
Case(
"0xd84",
"neoverse-v3")
266 .
Case(
"0xd83",
"neoverse-v3ae")
270 if (Implementer ==
"0x42" || Implementer ==
"0x43") {
272 .
Case(
"0x516",
"thunderx2t99")
273 .
Case(
"0x0516",
"thunderx2t99")
274 .
Case(
"0xaf",
"thunderx2t99")
275 .
Case(
"0x0af",
"thunderx2t99")
276 .
Case(
"0xa1",
"thunderxt88")
277 .
Case(
"0x0a1",
"thunderxt88")
281 if (Implementer ==
"0x46") {
283 .
Case(
"0x001",
"a64fx")
284 .
Case(
"0x003",
"fujitsu-monaka")
288 if (Implementer ==
"0x4e") {
290 .
Case(
"0x004",
"carmel")
294 if (Implementer ==
"0x48")
299 .
Case(
"0xd01",
"tsv110")
302 if (Implementer ==
"0x51")
307 .
Case(
"0x06f",
"krait")
308 .
Case(
"0x201",
"kryo")
309 .
Case(
"0x205",
"kryo")
310 .
Case(
"0x211",
"kryo")
311 .
Case(
"0x800",
"cortex-a73")
312 .
Case(
"0x801",
"cortex-a73")
313 .
Case(
"0x802",
"cortex-a75")
314 .
Case(
"0x803",
"cortex-a75")
315 .
Case(
"0x804",
"cortex-a76")
316 .
Case(
"0x805",
"cortex-a76")
317 .
Case(
"0xc00",
"falkor")
318 .
Case(
"0xc01",
"saphira")
319 .
Case(
"0x001",
"oryon-1")
321 if (Implementer ==
"0x53") {
324 unsigned Variant = 0, Part = 0;
329 if (
I.consume_front(
"CPU variant"))
330 I.ltrim(
"\t :").getAsInteger(0, Variant);
335 if (
I.consume_front(
"CPU part"))
336 I.ltrim(
"\t :").getAsInteger(0, Part);
338 unsigned Exynos = (Variant << 12) | Part;
350 if (Implementer ==
"0x61") {
352 .
Case(
"0x020",
"apple-m1")
353 .
Case(
"0x021",
"apple-m1")
354 .
Case(
"0x022",
"apple-m1")
355 .
Case(
"0x023",
"apple-m1")
356 .
Case(
"0x024",
"apple-m1")
357 .
Case(
"0x025",
"apple-m1")
358 .
Case(
"0x028",
"apple-m1")
359 .
Case(
"0x029",
"apple-m1")
360 .
Case(
"0x030",
"apple-m2")
361 .
Case(
"0x031",
"apple-m2")
362 .
Case(
"0x032",
"apple-m2")
363 .
Case(
"0x033",
"apple-m2")
364 .
Case(
"0x034",
"apple-m2")
365 .
Case(
"0x035",
"apple-m2")
366 .
Case(
"0x038",
"apple-m2")
367 .
Case(
"0x039",
"apple-m2")
368 .
Case(
"0x049",
"apple-m3")
369 .
Case(
"0x048",
"apple-m3")
373 if (Implementer ==
"0x63") {
375 .
Case(
"0x132",
"star-mc1")
379 if (Implementer ==
"0x6d") {
382 .
Case(
"0xd49",
"neoverse-n2")
386 if (Implementer ==
"0xc0") {
388 .
Case(
"0xac3",
"ampere1")
389 .
Case(
"0xac4",
"ampere1a")
390 .
Case(
"0xac5",
"ampere1b")
398StringRef getCPUNameFromS390Model(
unsigned int Id,
bool HaveVectorSupport) {
418 return HaveVectorSupport?
"z13" :
"zEC12";
421 return HaveVectorSupport?
"z14" :
"zEC12";
424 return HaveVectorSupport?
"z15" :
"zEC12";
427 return HaveVectorSupport?
"z16" :
"zEC12";
431 return HaveVectorSupport?
"arch15" :
"zEC12";
442 ProcCpuinfoContent.
split(Lines,
'\n');
446 for (
unsigned I = 0, E = Lines.size();
I != E; ++
I)
448 size_t Pos = Lines[
I].find(
':');
450 Lines[
I].drop_front(Pos + 1).split(CPUFeatures,
' ');
458 bool HaveVectorSupport =
false;
459 for (
unsigned I = 0, E = CPUFeatures.
size();
I != E; ++
I) {
460 if (CPUFeatures[
I] ==
"vx")
461 HaveVectorSupport =
true;
465 for (
unsigned I = 0, E = Lines.size();
I != E; ++
I) {
467 size_t Pos = Lines[
I].find(
"machine = ");
469 Pos +=
sizeof(
"machine = ") - 1;
471 if (!Lines[
I].drop_front(Pos).getAsInteger(10, Id))
472 return getCPUNameFromS390Model(Id, HaveVectorSupport);
484 ProcCpuinfoContent.
split(Lines,
'\n');
488 for (
unsigned I = 0, E = Lines.size();
I != E; ++
I) {
490 UArch = Lines[
I].substr(5).ltrim(
"\t :");
496 .
Case(
"sifive,u74-mc",
"sifive-u74")
497 .
Case(
"sifive,bullet0",
"sifive-u74")
502#if !defined(__linux__) || !defined(__x86_64__)
505 uint8_t v3_insns[40] __attribute__ ((aligned (8))) =
507 { 0xb7, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0,
509 0xb7, 0x2, 0x0, 0x0, 0x1, 0x0, 0x0, 0x0,
511 0xae, 0x20, 0x1, 0x0, 0x0, 0x0, 0x0, 0x0,
513 0xb7, 0x0, 0x0, 0x0, 0x1, 0x0, 0x0, 0x0,
515 0x95, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0 };
517 uint8_t v2_insns[40] __attribute__ ((aligned (8))) =
519 { 0xb7, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0,
521 0xb7, 0x2, 0x0, 0x0, 0x1, 0x0, 0x0, 0x0,
523 0xad, 0x20, 0x1, 0x0, 0x0, 0x0, 0x0, 0x0,
525 0xb7, 0x0, 0x0, 0x0, 0x1, 0x0, 0x0, 0x0,
527 0x95, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0 };
529 struct bpf_prog_load_attr {
545 int fd = syscall(321 , 5 , &attr,
553 memset(&attr, 0,
sizeof(attr));
558 fd = syscall(321 , 5 , &attr,
sizeof(attr));
567#if defined(__i386__) || defined(_M_IX86) || defined(__x86_64__) || \
572static bool getX86CpuIDAndInfo(
unsigned value,
unsigned *rEAX,
unsigned *rEBX,
573 unsigned *rECX,
unsigned *rEDX) {
574#if (defined(__i386__) || defined(__x86_64__)) && !defined(_MSC_VER)
575 return !__get_cpuid(
value, rEAX, rEBX, rECX, rEDX);
576#elif defined(_MSC_VER)
579 __cpuid(registers,
value);
580 *rEAX = registers[0];
581 *rEBX = registers[1];
582 *rECX = registers[2];
583 *rEDX = registers[3];
595VendorSignatures getVendorSignature(
unsigned *MaxLeaf) {
596 unsigned EAX = 0, EBX = 0, ECX = 0, EDX = 0;
597 if (MaxLeaf ==
nullptr)
602 if (getX86CpuIDAndInfo(0, MaxLeaf, &EBX, &ECX, &EDX) || *MaxLeaf < 1)
603 return VendorSignatures::UNKNOWN;
606 if (EBX == 0x756e6547 && EDX == 0x49656e69 && ECX == 0x6c65746e)
607 return VendorSignatures::GENUINE_INTEL;
610 if (EBX == 0x68747541 && EDX == 0x69746e65 && ECX == 0x444d4163)
611 return VendorSignatures::AUTHENTIC_AMD;
613 return VendorSignatures::UNKNOWN;
626static bool getX86CpuIDAndInfoEx(
unsigned value,
unsigned subleaf,
627 unsigned *rEAX,
unsigned *rEBX,
unsigned *rECX,
633#if (defined(__i386__) || defined(__x86_64__)) && !defined(_MSC_VER)
634 return !__get_cpuid_count(
value, subleaf, rEAX, rEBX, rECX, rEDX);
635#elif defined(_MSC_VER)
637 __cpuidex(registers,
value, subleaf);
638 *rEAX = registers[0];
639 *rEBX = registers[1];
640 *rECX = registers[2];
641 *rEDX = registers[3];
649static bool getX86XCR0(
unsigned *rEAX,
unsigned *rEDX) {
653#if defined(__GNUC__) || defined(__clang__)
657 __asm__(
".byte 0x0f, 0x01, 0xd0" :
"=a"(*rEAX),
"=d"(*rEDX) :
"c"(0));
659#elif defined(_MSC_FULL_VER) && defined(_XCR_XFEATURE_ENABLED_MASK)
660 unsigned long long Result = _xgetbv(_XCR_XFEATURE_ENABLED_MASK);
669static void detectX86FamilyModel(
unsigned EAX,
unsigned *Family,
671 *Family = (
EAX >> 8) & 0xf;
673 if (*Family == 6 || *Family == 0xf) {
676 *Family += (
EAX >> 20) & 0xff;
682#define testFeature(F) (Features[F / 32] & (1 << (F % 32))) != 0
684static StringRef getIntelProcessorTypeAndSubtype(
unsigned Family,
686 const unsigned *Features,
699 if (testFeature(X86::FEATURE_MMX)) {
715 *
Type = X86::INTEL_CORE2;
724 *
Type = X86::INTEL_CORE2;
733 *
Type = X86::INTEL_COREI7;
734 *Subtype = X86::INTEL_COREI7_NEHALEM;
741 *
Type = X86::INTEL_COREI7;
742 *Subtype = X86::INTEL_COREI7_WESTMERE;
748 *
Type = X86::INTEL_COREI7;
749 *Subtype = X86::INTEL_COREI7_SANDYBRIDGE;
754 *
Type = X86::INTEL_COREI7;
755 *Subtype = X86::INTEL_COREI7_IVYBRIDGE;
764 *
Type = X86::INTEL_COREI7;
765 *Subtype = X86::INTEL_COREI7_HASWELL;
774 *
Type = X86::INTEL_COREI7;
775 *Subtype = X86::INTEL_COREI7_BROADWELL;
786 *
Type = X86::INTEL_COREI7;
787 *Subtype = X86::INTEL_COREI7_SKYLAKE;
793 *
Type = X86::INTEL_COREI7;
794 *Subtype = X86::INTEL_COREI7_ROCKETLAKE;
799 *
Type = X86::INTEL_COREI7;
800 if (testFeature(X86::FEATURE_AVX512BF16)) {
802 *Subtype = X86::INTEL_COREI7_COOPERLAKE;
803 }
else if (testFeature(X86::FEATURE_AVX512VNNI)) {
805 *Subtype = X86::INTEL_COREI7_CASCADELAKE;
807 CPU =
"skylake-avx512";
808 *Subtype = X86::INTEL_COREI7_SKYLAKE_AVX512;
815 *
Type = X86::INTEL_COREI7;
816 *Subtype = X86::INTEL_COREI7_CANNONLAKE;
822 CPU =
"icelake-client";
823 *
Type = X86::INTEL_COREI7;
824 *Subtype = X86::INTEL_COREI7_ICELAKE_CLIENT;
831 *
Type = X86::INTEL_COREI7;
832 *Subtype = X86::INTEL_COREI7_TIGERLAKE;
839 *
Type = X86::INTEL_COREI7;
840 *Subtype = X86::INTEL_COREI7_ALDERLAKE;
846 *
Type = X86::INTEL_COREI7;
847 *Subtype = X86::INTEL_COREI7_ALDERLAKE;
855 *
Type = X86::INTEL_COREI7;
856 *Subtype = X86::INTEL_COREI7_ALDERLAKE;
863 *
Type = X86::INTEL_COREI7;
864 *Subtype = X86::INTEL_COREI7_ALDERLAKE;
872 *
Type = X86::INTEL_COREI7;
873 *Subtype = X86::INTEL_COREI7_ARROWLAKE;
879 *
Type = X86::INTEL_COREI7;
880 *Subtype = X86::INTEL_COREI7_ARROWLAKE_S;
886 *
Type = X86::INTEL_COREI7;
887 *Subtype = X86::INTEL_COREI7_ARROWLAKE_S;
893 *
Type = X86::INTEL_COREI7;
894 *Subtype = X86::INTEL_COREI7_PANTHERLAKE;
899 CPU =
"graniterapids";
900 *
Type = X86::INTEL_COREI7;
901 *Subtype = X86::INTEL_COREI7_GRANITERAPIDS;
906 CPU =
"graniterapids-d";
907 *
Type = X86::INTEL_COREI7;
908 *Subtype = X86::INTEL_COREI7_GRANITERAPIDS_D;
914 CPU =
"icelake-server";
915 *
Type = X86::INTEL_COREI7;
916 *Subtype = X86::INTEL_COREI7_ICELAKE_SERVER;
921 CPU =
"emeraldrapids";
922 *
Type = X86::INTEL_COREI7;
923 *Subtype = X86::INTEL_COREI7_SAPPHIRERAPIDS;
928 CPU =
"sapphirerapids";
929 *
Type = X86::INTEL_COREI7;
930 *Subtype = X86::INTEL_COREI7_SAPPHIRERAPIDS;
939 *
Type = X86::INTEL_BONNELL;
950 *
Type = X86::INTEL_SILVERMONT;
956 *
Type = X86::INTEL_GOLDMONT;
959 CPU =
"goldmont-plus";
960 *
Type = X86::INTEL_GOLDMONT_PLUS;
967 *
Type = X86::INTEL_TREMONT;
972 CPU =
"sierraforest";
973 *
Type = X86::INTEL_SIERRAFOREST;
979 *
Type = X86::INTEL_GRANDRIDGE;
984 CPU =
"clearwaterforest";
985 *
Type = X86::INTEL_CLEARWATERFOREST;
991 *
Type = X86::INTEL_KNL;
995 *
Type = X86::INTEL_KNM;
1002 if (testFeature(X86::FEATURE_AVX512VP2INTERSECT)) {
1004 }
else if (testFeature(X86::FEATURE_AVX512VBMI2)) {
1005 CPU =
"icelake-client";
1006 }
else if (testFeature(X86::FEATURE_AVX512VBMI)) {
1008 }
else if (testFeature(X86::FEATURE_AVX512BF16)) {
1010 }
else if (testFeature(X86::FEATURE_AVX512VNNI)) {
1011 CPU =
"cascadelake";
1012 }
else if (testFeature(X86::FEATURE_AVX512VL)) {
1013 CPU =
"skylake-avx512";
1014 }
else if (testFeature(X86::FEATURE_CLFLUSHOPT)) {
1015 if (testFeature(X86::FEATURE_SHA))
1019 }
else if (testFeature(X86::FEATURE_ADX)) {
1021 }
else if (testFeature(X86::FEATURE_AVX2)) {
1023 }
else if (testFeature(X86::FEATURE_AVX)) {
1024 CPU =
"sandybridge";
1025 }
else if (testFeature(X86::FEATURE_SSE4_2)) {
1026 if (testFeature(X86::FEATURE_MOVBE))
1030 }
else if (testFeature(X86::FEATURE_SSE4_1)) {
1032 }
else if (testFeature(X86::FEATURE_SSSE3)) {
1033 if (testFeature(X86::FEATURE_MOVBE))
1037 }
else if (testFeature(X86::FEATURE_64BIT)) {
1039 }
else if (testFeature(X86::FEATURE_SSE3)) {
1041 }
else if (testFeature(X86::FEATURE_SSE2)) {
1043 }
else if (testFeature(X86::FEATURE_SSE)) {
1045 }
else if (testFeature(X86::FEATURE_MMX)) {
1054 if (testFeature(X86::FEATURE_64BIT)) {
1058 if (testFeature(X86::FEATURE_SSE3)) {
1069 CPU =
"diamondrapids";
1070 *
Type = X86::INTEL_COREI7;
1071 *Subtype = X86::INTEL_COREI7_DIAMONDRAPIDS;
1085static const char *getAMDProcessorTypeAndSubtype(
unsigned Family,
1087 const unsigned *Features,
1089 unsigned *Subtype) {
1090 const char *CPU = 0;
1116 if (testFeature(X86::FEATURE_SSE)) {
1123 if (testFeature(X86::FEATURE_SSE3)) {
1132 *
Type = X86::AMDFAM10H;
1135 *Subtype = X86::AMDFAM10H_BARCELONA;
1138 *Subtype = X86::AMDFAM10H_SHANGHAI;
1141 *Subtype = X86::AMDFAM10H_ISTANBUL;
1147 *
Type = X86::AMD_BTVER1;
1151 *
Type = X86::AMDFAM15H;
1152 if (Model >= 0x60 && Model <= 0x7f) {
1154 *Subtype = X86::AMDFAM15H_BDVER4;
1157 if (Model >= 0x30 && Model <= 0x3f) {
1159 *Subtype = X86::AMDFAM15H_BDVER3;
1162 if ((Model >= 0x10 && Model <= 0x1f) || Model == 0x02) {
1164 *Subtype = X86::AMDFAM15H_BDVER2;
1167 if (Model <= 0x0f) {
1168 *Subtype = X86::AMDFAM15H_BDVER1;
1174 *
Type = X86::AMD_BTVER2;
1178 *
Type = X86::AMDFAM17H;
1179 if ((Model >= 0x30 && Model <= 0x3f) || (Model == 0x47) ||
1180 (Model >= 0x60 && Model <= 0x67) || (Model >= 0x68 && Model <= 0x6f) ||
1181 (Model >= 0x70 && Model <= 0x7f) || (Model >= 0x84 && Model <= 0x87) ||
1182 (Model >= 0x90 && Model <= 0x97) || (Model >= 0x98 && Model <= 0x9f) ||
1183 (Model >= 0xa0 && Model <= 0xaf)) {
1194 *Subtype = X86::AMDFAM17H_ZNVER2;
1197 if ((Model >= 0x10 && Model <= 0x1f) || (Model >= 0x20 && Model <= 0x2f)) {
1201 *Subtype = X86::AMDFAM17H_ZNVER1;
1207 *
Type = X86::AMDFAM19H;
1208 if (Model <= 0x0f || (Model >= 0x20 && Model <= 0x2f) ||
1209 (Model >= 0x30 && Model <= 0x3f) || (Model >= 0x40 && Model <= 0x4f) ||
1210 (Model >= 0x50 && Model <= 0x5f)) {
1216 *Subtype = X86::AMDFAM19H_ZNVER3;
1219 if ((Model >= 0x10 && Model <= 0x1f) || (Model >= 0x60 && Model <= 0x6f) ||
1220 (Model >= 0x70 && Model <= 0x77) || (Model >= 0x78 && Model <= 0x7f) ||
1221 (Model >= 0xa0 && Model <= 0xaf)) {
1228 *Subtype = X86::AMDFAM19H_ZNVER4;
1234 *
Type = X86::AMDFAM1AH;
1235 if (Model <= 0x77) {
1246 *Subtype = X86::AMDFAM1AH_ZNVER5;
1260static void getAvailableFeatures(
unsigned ECX,
unsigned EDX,
unsigned MaxLeaf,
1261 unsigned *Features) {
1264 auto setFeature = [&](
unsigned F) {
1265 Features[
F / 32] |= 1U << (
F % 32);
1268 if ((EDX >> 15) & 1)
1269 setFeature(X86::FEATURE_CMOV);
1270 if ((EDX >> 23) & 1)
1271 setFeature(X86::FEATURE_MMX);
1272 if ((EDX >> 25) & 1)
1273 setFeature(X86::FEATURE_SSE);
1274 if ((EDX >> 26) & 1)
1275 setFeature(X86::FEATURE_SSE2);
1278 setFeature(X86::FEATURE_SSE3);
1280 setFeature(X86::FEATURE_PCLMUL);
1282 setFeature(X86::FEATURE_SSSE3);
1283 if ((ECX >> 12) & 1)
1284 setFeature(X86::FEATURE_FMA);
1285 if ((ECX >> 19) & 1)
1286 setFeature(X86::FEATURE_SSE4_1);
1287 if ((ECX >> 20) & 1) {
1288 setFeature(X86::FEATURE_SSE4_2);
1289 setFeature(X86::FEATURE_CRC32);
1291 if ((ECX >> 23) & 1)
1292 setFeature(X86::FEATURE_POPCNT);
1293 if ((ECX >> 25) & 1)
1294 setFeature(X86::FEATURE_AES);
1296 if ((ECX >> 22) & 1)
1297 setFeature(X86::FEATURE_MOVBE);
1302 const unsigned AVXBits = (1 << 27) | (1 << 28);
1303 bool HasAVX = ((
ECX & AVXBits) == AVXBits) && !getX86XCR0(&EAX, &EDX) &&
1304 ((
EAX & 0x6) == 0x6);
1305#if defined(__APPLE__)
1309 bool HasAVX512Save =
true;
1312 bool HasAVX512Save = HasAVX && ((
EAX & 0xe0) == 0xe0);
1316 setFeature(X86::FEATURE_AVX);
1319 MaxLeaf >= 0x7 && !getX86CpuIDAndInfoEx(0x7, 0x0, &EAX, &EBX, &ECX, &EDX);
1321 if (HasLeaf7 && ((EBX >> 3) & 1))
1322 setFeature(X86::FEATURE_BMI);
1323 if (HasLeaf7 && ((EBX >> 5) & 1) && HasAVX)
1324 setFeature(X86::FEATURE_AVX2);
1325 if (HasLeaf7 && ((EBX >> 8) & 1))
1326 setFeature(X86::FEATURE_BMI2);
1327 if (HasLeaf7 && ((EBX >> 16) & 1) && HasAVX512Save) {
1328 setFeature(X86::FEATURE_AVX512F);
1329 setFeature(X86::FEATURE_EVEX512);
1331 if (HasLeaf7 && ((EBX >> 17) & 1) && HasAVX512Save)
1332 setFeature(X86::FEATURE_AVX512DQ);
1333 if (HasLeaf7 && ((EBX >> 19) & 1))
1334 setFeature(X86::FEATURE_ADX);
1335 if (HasLeaf7 && ((EBX >> 21) & 1) && HasAVX512Save)
1336 setFeature(X86::FEATURE_AVX512IFMA);
1337 if (HasLeaf7 && ((EBX >> 23) & 1))
1338 setFeature(X86::FEATURE_CLFLUSHOPT);
1339 if (HasLeaf7 && ((EBX >> 28) & 1) && HasAVX512Save)
1340 setFeature(X86::FEATURE_AVX512CD);
1341 if (HasLeaf7 && ((EBX >> 29) & 1))
1342 setFeature(X86::FEATURE_SHA);
1343 if (HasLeaf7 && ((EBX >> 30) & 1) && HasAVX512Save)
1344 setFeature(X86::FEATURE_AVX512BW);
1345 if (HasLeaf7 && ((EBX >> 31) & 1) && HasAVX512Save)
1346 setFeature(X86::FEATURE_AVX512VL);
1348 if (HasLeaf7 && ((ECX >> 1) & 1) && HasAVX512Save)
1349 setFeature(X86::FEATURE_AVX512VBMI);
1350 if (HasLeaf7 && ((ECX >> 6) & 1) && HasAVX512Save)
1351 setFeature(X86::FEATURE_AVX512VBMI2);
1352 if (HasLeaf7 && ((ECX >> 8) & 1))
1353 setFeature(X86::FEATURE_GFNI);
1354 if (HasLeaf7 && ((ECX >> 10) & 1) && HasAVX)
1355 setFeature(X86::FEATURE_VPCLMULQDQ);
1356 if (HasLeaf7 && ((ECX >> 11) & 1) && HasAVX512Save)
1357 setFeature(X86::FEATURE_AVX512VNNI);
1358 if (HasLeaf7 && ((ECX >> 12) & 1) && HasAVX512Save)
1359 setFeature(X86::FEATURE_AVX512BITALG);
1360 if (HasLeaf7 && ((ECX >> 14) & 1) && HasAVX512Save)
1361 setFeature(X86::FEATURE_AVX512VPOPCNTDQ);
1363 if (HasLeaf7 && ((EDX >> 2) & 1) && HasAVX512Save)
1364 setFeature(X86::FEATURE_AVX5124VNNIW);
1365 if (HasLeaf7 && ((EDX >> 3) & 1) && HasAVX512Save)
1366 setFeature(X86::FEATURE_AVX5124FMAPS);
1367 if (HasLeaf7 && ((EDX >> 8) & 1) && HasAVX512Save)
1368 setFeature(X86::FEATURE_AVX512VP2INTERSECT);
1372 bool HasLeaf7Subleaf1 =
1373 HasLeaf7 &&
EAX >= 1 &&
1374 !getX86CpuIDAndInfoEx(0x7, 0x1, &EAX, &EBX, &ECX, &EDX);
1375 if (HasLeaf7Subleaf1 && ((EAX >> 5) & 1) && HasAVX512Save)
1376 setFeature(X86::FEATURE_AVX512BF16);
1378 unsigned MaxExtLevel;
1379 getX86CpuIDAndInfo(0x80000000, &MaxExtLevel, &EBX, &ECX, &EDX);
1381 bool HasExtLeaf1 = MaxExtLevel >= 0x80000001 &&
1382 !getX86CpuIDAndInfo(0x80000001, &EAX, &EBX, &ECX, &EDX);
1383 if (HasExtLeaf1 && ((ECX >> 6) & 1))
1384 setFeature(X86::FEATURE_SSE4_A);
1385 if (HasExtLeaf1 && ((ECX >> 11) & 1))
1386 setFeature(X86::FEATURE_XOP);
1387 if (HasExtLeaf1 && ((ECX >> 16) & 1))
1388 setFeature(X86::FEATURE_FMA4);
1390 if (HasExtLeaf1 && ((EDX >> 29) & 1))
1391 setFeature(X86::FEATURE_64BIT);
1395 unsigned MaxLeaf = 0;
1397 if (Vendor == VendorSignatures::UNKNOWN)
1401 getX86CpuIDAndInfo(0x1, &EAX, &EBX, &ECX, &EDX);
1403 unsigned Family = 0,
Model = 0;
1405 detectX86FamilyModel(EAX, &Family, &Model);
1406 getAvailableFeatures(ECX, EDX, MaxLeaf, Features);
1411 unsigned Subtype = 0;
1415 if (Vendor == VendorSignatures::GENUINE_INTEL) {
1416 CPU = getIntelProcessorTypeAndSubtype(Family, Model, Features, &
Type,
1418 }
else if (Vendor == VendorSignatures::AUTHENTIC_AMD) {
1419 CPU = getAMDProcessorTypeAndSubtype(Family, Model, Features, &
Type,
1429#elif defined(__APPLE__) && defined(__powerpc__)
1431 host_basic_info_data_t hostInfo;
1432 mach_msg_type_number_t infoCount;
1434 infoCount = HOST_BASIC_INFO_COUNT;
1435 mach_port_t hostPort = mach_host_self();
1436 host_info(hostPort, HOST_BASIC_INFO, (host_info_t)&hostInfo,
1438 mach_port_deallocate(mach_task_self(), hostPort);
1440 if (hostInfo.cpu_type != CPU_TYPE_POWERPC)
1443 switch (hostInfo.cpu_subtype) {
1473#elif defined(__linux__) && defined(__powerpc__)
1477 return detail::getHostCPUNameForPowerPC(
Content);
1479#elif defined(__linux__) && (defined(__arm__) || defined(__aarch64__))
1483 return detail::getHostCPUNameForARM(
Content);
1485#elif defined(__linux__) && defined(__s390x__)
1489 return detail::getHostCPUNameForS390x(
Content);
1491#elif defined(__MVS__)
1496 int *StartToCVTOffset =
reinterpret_cast<int *
>(0x10);
1499 int ReadValue = *StartToCVTOffset;
1501 ReadValue = (ReadValue & 0x7FFFFFFF);
1502 char *CVT =
reinterpret_cast<char *
>(ReadValue);
1507 Id = decodePackedBCD<uint16_t>(Id,
false);
1511 bool HaveVectorSupport = CVT[244] & 0x80;
1512 return getCPUNameFromS390Model(Id, HaveVectorSupport);
1514#elif defined(__APPLE__) && (defined(__arm__) || defined(__aarch64__))
1519#define CPUFAMILY_UNKNOWN 0
1520#define CPUFAMILY_ARM_9 0xe73283ae
1521#define CPUFAMILY_ARM_11 0x8ff620d8
1522#define CPUFAMILY_ARM_XSCALE 0x53b005f5
1523#define CPUFAMILY_ARM_12 0xbd1b0ae9
1524#define CPUFAMILY_ARM_13 0x0cc90e64
1525#define CPUFAMILY_ARM_14 0x96077ef1
1526#define CPUFAMILY_ARM_15 0xa8511bca
1527#define CPUFAMILY_ARM_SWIFT 0x1e2d6381
1528#define CPUFAMILY_ARM_CYCLONE 0x37a09642
1529#define CPUFAMILY_ARM_TYPHOON 0x2c91a47e
1530#define CPUFAMILY_ARM_TWISTER 0x92fb37c8
1531#define CPUFAMILY_ARM_HURRICANE 0x67ceee93
1532#define CPUFAMILY_ARM_MONSOON_MISTRAL 0xe81e7ef6
1533#define CPUFAMILY_ARM_VORTEX_TEMPEST 0x07d34b9f
1534#define CPUFAMILY_ARM_LIGHTNING_THUNDER 0x462504d2
1535#define CPUFAMILY_ARM_FIRESTORM_ICESTORM 0x1b588bb3
1536#define CPUFAMILY_ARM_BLIZZARD_AVALANCHE 0xda33d83d
1537#define CPUFAMILY_ARM_EVEREST_SAWTOOTH 0x8765edea
1538#define CPUFAMILY_ARM_IBIZA 0xfa33415e
1539#define CPUFAMILY_ARM_PALMA 0x72015832
1540#define CPUFAMILY_ARM_COLL 0x2876f5b5
1541#define CPUFAMILY_ARM_LOBOS 0x5f4dea93
1542#define CPUFAMILY_ARM_DONAN 0x6f5129ac
1543#define CPUFAMILY_ARM_BRAVA 0x17d5b93a
1544#define CPUFAMILY_ARM_TAHITI 0x75d4acb9
1545#define CPUFAMILY_ARM_TUPAI 0x204526d0
1549 size_t Length =
sizeof(Family);
1550 sysctlbyname(
"hw.cpufamily", &Family, &
Length, NULL, 0);
1562 case CPUFAMILY_UNKNOWN:
1564 case CPUFAMILY_ARM_9:
1566 case CPUFAMILY_ARM_11:
1567 return "arm1136jf-s";
1568 case CPUFAMILY_ARM_XSCALE:
1570 case CPUFAMILY_ARM_12:
1572 case CPUFAMILY_ARM_13:
1574 case CPUFAMILY_ARM_14:
1576 case CPUFAMILY_ARM_15:
1578 case CPUFAMILY_ARM_SWIFT:
1580 case CPUFAMILY_ARM_CYCLONE:
1582 case CPUFAMILY_ARM_TYPHOON:
1584 case CPUFAMILY_ARM_TWISTER:
1586 case CPUFAMILY_ARM_HURRICANE:
1588 case CPUFAMILY_ARM_MONSOON_MISTRAL:
1590 case CPUFAMILY_ARM_VORTEX_TEMPEST:
1592 case CPUFAMILY_ARM_LIGHTNING_THUNDER:
1594 case CPUFAMILY_ARM_FIRESTORM_ICESTORM:
1596 case CPUFAMILY_ARM_BLIZZARD_AVALANCHE:
1598 case CPUFAMILY_ARM_EVEREST_SAWTOOTH:
1599 case CPUFAMILY_ARM_IBIZA:
1600 case CPUFAMILY_ARM_PALMA:
1601 case CPUFAMILY_ARM_LOBOS:
1603 case CPUFAMILY_ARM_COLL:
1605 case CPUFAMILY_ARM_DONAN:
1606 case CPUFAMILY_ARM_BRAVA:
1607 case CPUFAMILY_ARM_TAHITI:
1608 case CPUFAMILY_ARM_TUPAI:
1617 switch (_system_configuration.implementation) {
1619 if (_system_configuration.version == PV_4_3)
1623 if (_system_configuration.version == PV_5)
1627 if (_system_configuration.version == PV_6_Compat)
1653#elif defined(__loongarch__)
1657 __asm__(
"cpucfg %[prid], $zero\n\t" : [prid]
"=r"(processor_id));
1659 switch (processor_id & 0xf000) {
1670#elif defined(__riscv)
1672#if defined(__linux__)
1679#if __riscv_xlen == 64
1680 return "generic-rv64";
1681#elif __riscv_xlen == 32
1682 return "generic-rv32";
1684#error "Unhandled value of __riscv_xlen"
1687#elif defined(__sparc__)
1688#if defined(__linux__)
1691 ProcCpuinfoContent.
split(Lines,
'\n');
1695 for (
unsigned I = 0, E =
Lines.size();
I != E; ++
I) {
1697 Cpu =
Lines[
I].substr(5).ltrim(
"\t :");
1729#if defined(__linux__)
1732 return detail::getHostCPUNameForSPARC(
Content);
1733#elif defined(__sun__) && defined(__svr4__)
1737 kstat_named_t *brand = NULL;
1741 ksp = kstat_lookup(kc,
const_cast<char *
>(
"cpu_info"), -1, NULL);
1742 if (ksp != NULL && kstat_read(kc, ksp, NULL) != -1 &&
1743 ksp->ks_type == KSTAT_TYPE_NAMED)
1745 (kstat_named_t *)kstat_data_lookup(ksp,
const_cast<char *
>(
"brand"));
1746 if (brand != NULL && brand->data_type == KSTAT_DATA_STRING)
1747 buf = KSTAT_NAMED_STR_PTR(brand);
1752 .
Case(
"TMS390S10",
"supersparc")
1753 .
Case(
"TMS390Z50",
"supersparc")
1756 .
Case(
"MB86904",
"supersparc")
1757 .
Case(
"MB86907",
"supersparc")
1758 .
Case(
"RT623",
"hypersparc")
1759 .
Case(
"RT625",
"hypersparc")
1760 .
Case(
"RT626",
"hypersparc")
1761 .
Case(
"UltraSPARC-I",
"ultrasparc")
1762 .
Case(
"UltraSPARC-II",
"ultrasparc")
1763 .
Case(
"UltraSPARC-IIe",
"ultrasparc")
1764 .
Case(
"UltraSPARC-IIi",
"ultrasparc")
1765 .
Case(
"SPARC64-III",
"ultrasparc")
1766 .
Case(
"SPARC64-IV",
"ultrasparc")
1767 .
Case(
"UltraSPARC-III",
"ultrasparc3")
1768 .
Case(
"UltraSPARC-III+",
"ultrasparc3")
1769 .
Case(
"UltraSPARC-IIIi",
"ultrasparc3")
1770 .
Case(
"UltraSPARC-IIIi+",
"ultrasparc3")
1771 .
Case(
"UltraSPARC-IV",
"ultrasparc3")
1772 .
Case(
"UltraSPARC-IV+",
"ultrasparc3")
1773 .
Case(
"SPARC64-V",
"ultrasparc3")
1774 .
Case(
"SPARC64-VI",
"ultrasparc3")
1775 .
Case(
"SPARC64-VII",
"ultrasparc3")
1776 .
Case(
"UltraSPARC-T1",
"niagara")
1777 .
Case(
"UltraSPARC-T2",
"niagara2")
1778 .
Case(
"UltraSPARC-T2",
"niagara2")
1779 .
Case(
"UltraSPARC-T2+",
"niagara2")
1780 .
Case(
"SPARC-T3",
"niagara3")
1781 .
Case(
"SPARC-T4",
"niagara4")
1782 .
Case(
"SPARC-T5",
"niagara4")
1784 .
Case(
"SPARC-M7",
"niagara4" )
1785 .
Case(
"SPARC-S7",
"niagara4" )
1786 .
Case(
"SPARC-M8",
"niagara4" )
1809#if defined(__i386__) || defined(_M_IX86) || \
1810 defined(__x86_64__) || defined(_M_X64)
1816 if (getX86CpuIDAndInfo(0, &MaxLevel, &EBX, &ECX, &EDX) || MaxLevel < 1)
1819 getX86CpuIDAndInfo(1, &EAX, &EBX, &ECX, &EDX);
1821 Features[
"cx8"] = (
EDX >> 8) & 1;
1822 Features[
"cmov"] = (
EDX >> 15) & 1;
1823 Features[
"mmx"] = (
EDX >> 23) & 1;
1824 Features[
"fxsr"] = (
EDX >> 24) & 1;
1825 Features[
"sse"] = (
EDX >> 25) & 1;
1826 Features[
"sse2"] = (
EDX >> 26) & 1;
1828 Features[
"sse3"] = (
ECX >> 0) & 1;
1829 Features[
"pclmul"] = (
ECX >> 1) & 1;
1830 Features[
"ssse3"] = (
ECX >> 9) & 1;
1831 Features[
"cx16"] = (
ECX >> 13) & 1;
1832 Features[
"sse4.1"] = (
ECX >> 19) & 1;
1833 Features[
"sse4.2"] = (
ECX >> 20) & 1;
1834 Features[
"crc32"] = Features[
"sse4.2"];
1835 Features[
"movbe"] = (
ECX >> 22) & 1;
1836 Features[
"popcnt"] = (
ECX >> 23) & 1;
1837 Features[
"aes"] = (
ECX >> 25) & 1;
1838 Features[
"rdrnd"] = (
ECX >> 30) & 1;
1843 bool HasXSave = ((
ECX >> 27) & 1) && !getX86XCR0(&EAX, &EDX);
1844 bool HasAVXSave = HasXSave && ((
ECX >> 28) & 1) && ((
EAX & 0x6) == 0x6);
1845#if defined(__APPLE__)
1849 bool HasAVX512Save =
true;
1852 bool HasAVX512Save = HasAVXSave && ((
EAX & 0xe0) == 0xe0);
1855 const unsigned AMXBits = (1 << 17) | (1 << 18);
1856 bool HasAMXSave = HasXSave && ((
EAX & AMXBits) == AMXBits);
1858 Features[
"avx"] = HasAVXSave;
1859 Features[
"fma"] = ((
ECX >> 12) & 1) && HasAVXSave;
1861 Features[
"xsave"] = ((
ECX >> 26) & 1) && HasAVXSave;
1862 Features[
"f16c"] = ((
ECX >> 29) & 1) && HasAVXSave;
1864 unsigned MaxExtLevel;
1865 getX86CpuIDAndInfo(0x80000000, &MaxExtLevel, &EBX, &ECX, &EDX);
1867 bool HasExtLeaf1 = MaxExtLevel >= 0x80000001 &&
1868 !getX86CpuIDAndInfo(0x80000001, &EAX, &EBX, &ECX, &EDX);
1869 Features[
"sahf"] = HasExtLeaf1 && ((
ECX >> 0) & 1);
1870 Features[
"lzcnt"] = HasExtLeaf1 && ((
ECX >> 5) & 1);
1871 Features[
"sse4a"] = HasExtLeaf1 && ((
ECX >> 6) & 1);
1872 Features[
"prfchw"] = HasExtLeaf1 && ((
ECX >> 8) & 1);
1873 Features[
"xop"] = HasExtLeaf1 && ((
ECX >> 11) & 1) && HasAVXSave;
1874 Features[
"lwp"] = HasExtLeaf1 && ((
ECX >> 15) & 1);
1875 Features[
"fma4"] = HasExtLeaf1 && ((
ECX >> 16) & 1) && HasAVXSave;
1876 Features[
"tbm"] = HasExtLeaf1 && ((
ECX >> 21) & 1);
1877 Features[
"mwaitx"] = HasExtLeaf1 && ((
ECX >> 29) & 1);
1879 Features[
"64bit"] = HasExtLeaf1 && ((
EDX >> 29) & 1);
1883 bool HasExtLeaf8 = MaxExtLevel >= 0x80000008 &&
1884 !getX86CpuIDAndInfo(0x80000008, &EAX, &EBX, &ECX, &EDX);
1885 Features[
"clzero"] = HasExtLeaf8 && ((
EBX >> 0) & 1);
1886 Features[
"rdpru"] = HasExtLeaf8 && ((
EBX >> 4) & 1);
1887 Features[
"wbnoinvd"] = HasExtLeaf8 && ((
EBX >> 9) & 1);
1890 MaxLevel >= 7 && !getX86CpuIDAndInfoEx(0x7, 0x0, &EAX, &EBX, &ECX, &EDX);
1892 Features[
"fsgsbase"] = HasLeaf7 && ((
EBX >> 0) & 1);
1893 Features[
"sgx"] = HasLeaf7 && ((
EBX >> 2) & 1);
1894 Features[
"bmi"] = HasLeaf7 && ((
EBX >> 3) & 1);
1896 Features[
"avx2"] = HasLeaf7 && ((
EBX >> 5) & 1) && HasAVXSave;
1897 Features[
"bmi2"] = HasLeaf7 && ((
EBX >> 8) & 1);
1898 Features[
"invpcid"] = HasLeaf7 && ((
EBX >> 10) & 1);
1899 Features[
"rtm"] = HasLeaf7 && ((
EBX >> 11) & 1);
1901 Features[
"avx512f"] = HasLeaf7 && ((
EBX >> 16) & 1) && HasAVX512Save;
1902 if (Features[
"avx512f"])
1903 Features[
"evex512"] =
true;
1904 Features[
"avx512dq"] = HasLeaf7 && ((
EBX >> 17) & 1) && HasAVX512Save;
1905 Features[
"rdseed"] = HasLeaf7 && ((
EBX >> 18) & 1);
1906 Features[
"adx"] = HasLeaf7 && ((
EBX >> 19) & 1);
1907 Features[
"avx512ifma"] = HasLeaf7 && ((
EBX >> 21) & 1) && HasAVX512Save;
1908 Features[
"clflushopt"] = HasLeaf7 && ((
EBX >> 23) & 1);
1909 Features[
"clwb"] = HasLeaf7 && ((
EBX >> 24) & 1);
1910 Features[
"avx512cd"] = HasLeaf7 && ((
EBX >> 28) & 1) && HasAVX512Save;
1911 Features[
"sha"] = HasLeaf7 && ((
EBX >> 29) & 1);
1912 Features[
"avx512bw"] = HasLeaf7 && ((
EBX >> 30) & 1) && HasAVX512Save;
1913 Features[
"avx512vl"] = HasLeaf7 && ((
EBX >> 31) & 1) && HasAVX512Save;
1915 Features[
"avx512vbmi"] = HasLeaf7 && ((
ECX >> 1) & 1) && HasAVX512Save;
1916 Features[
"pku"] = HasLeaf7 && ((
ECX >> 4) & 1);
1917 Features[
"waitpkg"] = HasLeaf7 && ((
ECX >> 5) & 1);
1918 Features[
"avx512vbmi2"] = HasLeaf7 && ((
ECX >> 6) & 1) && HasAVX512Save;
1919 Features[
"shstk"] = HasLeaf7 && ((
ECX >> 7) & 1);
1920 Features[
"gfni"] = HasLeaf7 && ((
ECX >> 8) & 1);
1921 Features[
"vaes"] = HasLeaf7 && ((
ECX >> 9) & 1) && HasAVXSave;
1922 Features[
"vpclmulqdq"] = HasLeaf7 && ((
ECX >> 10) & 1) && HasAVXSave;
1923 Features[
"avx512vnni"] = HasLeaf7 && ((
ECX >> 11) & 1) && HasAVX512Save;
1924 Features[
"avx512bitalg"] = HasLeaf7 && ((
ECX >> 12) & 1) && HasAVX512Save;
1925 Features[
"avx512vpopcntdq"] = HasLeaf7 && ((
ECX >> 14) & 1) && HasAVX512Save;
1926 Features[
"rdpid"] = HasLeaf7 && ((
ECX >> 22) & 1);
1927 Features[
"kl"] = HasLeaf7 && ((
ECX >> 23) & 1);
1928 Features[
"cldemote"] = HasLeaf7 && ((
ECX >> 25) & 1);
1929 Features[
"movdiri"] = HasLeaf7 && ((
ECX >> 27) & 1);
1930 Features[
"movdir64b"] = HasLeaf7 && ((
ECX >> 28) & 1);
1931 Features[
"enqcmd"] = HasLeaf7 && ((
ECX >> 29) & 1);
1933 Features[
"uintr"] = HasLeaf7 && ((
EDX >> 5) & 1);
1934 Features[
"avx512vp2intersect"] =
1935 HasLeaf7 && ((
EDX >> 8) & 1) && HasAVX512Save;
1936 Features[
"serialize"] = HasLeaf7 && ((
EDX >> 14) & 1);
1937 Features[
"tsxldtrk"] = HasLeaf7 && ((
EDX >> 16) & 1);
1948 Features[
"pconfig"] = HasLeaf7 && ((
EDX >> 18) & 1);
1949 Features[
"amx-bf16"] = HasLeaf7 && ((
EDX >> 22) & 1) && HasAMXSave;
1950 Features[
"avx512fp16"] = HasLeaf7 && ((
EDX >> 23) & 1) && HasAVX512Save;
1951 Features[
"amx-tile"] = HasLeaf7 && ((
EDX >> 24) & 1) && HasAMXSave;
1952 Features[
"amx-int8"] = HasLeaf7 && ((
EDX >> 25) & 1) && HasAMXSave;
1955 bool HasLeaf7Subleaf1 =
1956 HasLeaf7 &&
EAX >= 1 &&
1957 !getX86CpuIDAndInfoEx(0x7, 0x1, &EAX, &EBX, &ECX, &EDX);
1958 Features[
"sha512"] = HasLeaf7Subleaf1 && ((
EAX >> 0) & 1);
1959 Features[
"sm3"] = HasLeaf7Subleaf1 && ((
EAX >> 1) & 1);
1960 Features[
"sm4"] = HasLeaf7Subleaf1 && ((
EAX >> 2) & 1);
1961 Features[
"raoint"] = HasLeaf7Subleaf1 && ((
EAX >> 3) & 1);
1962 Features[
"avxvnni"] = HasLeaf7Subleaf1 && ((
EAX >> 4) & 1) && HasAVXSave;
1963 Features[
"avx512bf16"] = HasLeaf7Subleaf1 && ((
EAX >> 5) & 1) && HasAVX512Save;
1964 Features[
"amx-fp16"] = HasLeaf7Subleaf1 && ((
EAX >> 21) & 1) && HasAMXSave;
1965 Features[
"cmpccxadd"] = HasLeaf7Subleaf1 && ((
EAX >> 7) & 1);
1966 Features[
"hreset"] = HasLeaf7Subleaf1 && ((
EAX >> 22) & 1);
1967 Features[
"avxifma"] = HasLeaf7Subleaf1 && ((
EAX >> 23) & 1) && HasAVXSave;
1968 Features[
"movrs"] = HasLeaf7Subleaf1 && ((
EAX >> 31) & 1);
1969 Features[
"avxvnniint8"] = HasLeaf7Subleaf1 && ((
EDX >> 4) & 1) && HasAVXSave;
1970 Features[
"avxneconvert"] = HasLeaf7Subleaf1 && ((
EDX >> 5) & 1) && HasAVXSave;
1971 Features[
"amx-complex"] = HasLeaf7Subleaf1 && ((
EDX >> 8) & 1) && HasAMXSave;
1972 Features[
"avxvnniint16"] = HasLeaf7Subleaf1 && ((
EDX >> 10) & 1) && HasAVXSave;
1973 Features[
"prefetchi"] = HasLeaf7Subleaf1 && ((
EDX >> 14) & 1);
1974 Features[
"usermsr"] = HasLeaf7Subleaf1 && ((
EDX >> 15) & 1);
1975 bool HasAVX10 = HasLeaf7Subleaf1 && ((
EDX >> 19) & 1);
1976 bool HasAPXF = HasLeaf7Subleaf1 && ((
EDX >> 21) & 1);
1977 Features[
"egpr"] = HasAPXF;
1978 Features[
"push2pop2"] = HasAPXF;
1979 Features[
"ppx"] = HasAPXF;
1980 Features[
"ndd"] = HasAPXF;
1981 Features[
"ccmp"] = HasAPXF;
1982 Features[
"nf"] = HasAPXF;
1983 Features[
"cf"] = HasAPXF;
1984 Features[
"zu"] = HasAPXF;
1986 bool HasLeafD = MaxLevel >= 0xd &&
1987 !getX86CpuIDAndInfoEx(0xd, 0x1, &EAX, &EBX, &ECX, &EDX);
1990 Features[
"xsaveopt"] = HasLeafD && ((
EAX >> 0) & 1) && HasAVXSave;
1991 Features[
"xsavec"] = HasLeafD && ((
EAX >> 1) & 1) && HasAVXSave;
1992 Features[
"xsaves"] = HasLeafD && ((
EAX >> 3) & 1) && HasAVXSave;
1994 bool HasLeaf14 = MaxLevel >= 0x14 &&
1995 !getX86CpuIDAndInfoEx(0x14, 0x0, &EAX, &EBX, &ECX, &EDX);
1997 Features[
"ptwrite"] = HasLeaf14 && ((
EBX >> 4) & 1);
2000 MaxLevel >= 0x19 && !getX86CpuIDAndInfo(0x19, &EAX, &EBX, &ECX, &EDX);
2001 Features[
"widekl"] = HasLeaf7 && HasLeaf19 && ((
EBX >> 2) & 1);
2003 bool HasLeaf1E = MaxLevel >= 0x1e &&
2004 !getX86CpuIDAndInfoEx(0x1e, 0x1, &EAX, &EBX, &ECX, &EDX);
2005 Features[
"amx-fp8"] = HasLeaf1E && ((
EAX >> 4) & 1) && HasAMXSave;
2006 Features[
"amx-transpose"] = HasLeaf1E && ((
EAX >> 5) & 1) && HasAMXSave;
2007 Features[
"amx-tf32"] = HasLeaf1E && ((
EAX >> 6) & 1) && HasAMXSave;
2008 Features[
"amx-avx512"] = HasLeaf1E && ((
EAX >> 7) & 1) && HasAMXSave;
2009 Features[
"amx-movrs"] = HasLeaf1E && ((
EAX >> 8) & 1) && HasAMXSave;
2012 MaxLevel >= 0x24 && !getX86CpuIDAndInfo(0x24, &EAX, &EBX, &ECX, &EDX);
2014 int AVX10Ver = HasLeaf24 && (
EBX & 0xff);
2015 int Has512Len = HasLeaf24 && ((
EBX >> 18) & 1);
2016 Features[
"avx10.1-256"] = HasAVX10 && AVX10Ver >= 1;
2017 Features[
"avx10.1-512"] = HasAVX10 && AVX10Ver >= 1 && Has512Len;
2018 Features[
"avx10.2-256"] = HasAVX10 && AVX10Ver >= 2;
2019 Features[
"avx10.2-512"] = HasAVX10 && AVX10Ver >= 2 && Has512Len;
2023#elif defined(__linux__) && (defined(__arm__) || defined(__aarch64__))
2031 P->getBuffer().split(Lines,
'\n');
2036 for (
unsigned I = 0, E =
Lines.size();
I != E; ++
I)
2038 Lines[
I].split(CPUFeatures,
' ');
2042#if defined(__aarch64__)
2045 enum { CAP_AES = 0x1, CAP_PMULL = 0x2, CAP_SHA1 = 0x4, CAP_SHA2 = 0x8 };
2049 for (
unsigned I = 0, E = CPUFeatures.
size();
I != E; ++
I) {
2051#if defined(__aarch64__)
2052 .
Case(
"asimd",
"neon")
2053 .
Case(
"fp",
"fp-armv8")
2054 .
Case(
"crc32",
"crc")
2055 .
Case(
"atomics",
"lse")
2057 .
Case(
"sve2",
"sve2")
2059 .
Case(
"half",
"fp16")
2060 .
Case(
"neon",
"neon")
2061 .
Case(
"vfpv3",
"vfp3")
2062 .
Case(
"vfpv3d16",
"vfp3d16")
2063 .
Case(
"vfpv4",
"vfp4")
2064 .
Case(
"idiva",
"hwdiv-arm")
2065 .
Case(
"idivt",
"hwdiv")
2069#if defined(__aarch64__)
2072 if (CPUFeatures[
I] ==
"aes")
2074 else if (CPUFeatures[
I] ==
"pmull")
2075 crypto |= CAP_PMULL;
2076 else if (CPUFeatures[
I] ==
"sha1")
2078 else if (CPUFeatures[
I] ==
"sha2")
2082 if (LLVMFeatureStr !=
"")
2083 Features[LLVMFeatureStr] =
true;
2086#if defined(__aarch64__)
2090 uint32_t Aes = CAP_AES | CAP_PMULL;
2091 uint32_t Sha2 = CAP_SHA1 | CAP_SHA2;
2092 Features[
"aes"] = (crypto & Aes) == Aes;
2093 Features[
"sha2"] = (crypto & Sha2) == Sha2;
2098#elif defined(_WIN32) && (defined(__aarch64__) || defined(_M_ARM64))
2104 IsProcessorFeaturePresent(PF_ARM_NEON_INSTRUCTIONS_AVAILABLE);
2106 IsProcessorFeaturePresent(PF_ARM_V8_CRC32_INSTRUCTIONS_AVAILABLE);
2110 IsProcessorFeaturePresent(PF_ARM_V8_CRYPTO_INSTRUCTIONS_AVAILABLE);
2111 Features[
"aes"] = TradCrypto;
2112 Features[
"sha2"] = TradCrypto;
2116#elif defined(__linux__) && defined(__loongarch__)
2117#include <sys/auxv.h>
2119 unsigned long hwcap = getauxval(AT_HWCAP);
2120 bool HasFPU = hwcap & (1UL << 3);
2121 uint32_t cpucfg2 = 0x2, cpucfg3 = 0x3;
2122 __asm__(
"cpucfg %[cpucfg2], %[cpucfg2]\n\t" : [cpucfg2]
"+r"(cpucfg2));
2123 __asm__(
"cpucfg %[cpucfg3], %[cpucfg3]\n\t" : [cpucfg3]
"+r"(cpucfg3));
2127 Features[
"f"] = HasFPU && (cpucfg2 & (1U << 1));
2128 Features[
"d"] = HasFPU && (cpucfg2 & (1U << 2));
2130 Features[
"lsx"] = hwcap & (1UL << 4);
2131 Features[
"lasx"] = hwcap & (1UL << 5);
2132 Features[
"lvz"] = hwcap & (1UL << 9);
2134 Features[
"frecipe"] = cpucfg2 & (1U << 25);
2135 Features[
"div32"] = cpucfg2 & (1U << 26);
2136 Features[
"lam-bh"] = cpucfg2 & (1U << 27);
2137 Features[
"lamcas"] = cpucfg2 & (1U << 28);
2139 Features[
"ld-seq-sa"] = cpucfg3 & (1U << 23);
2146#elif defined(__linux__) && defined(__riscv)
2148struct RISCVHwProbe {
2153 RISCVHwProbe Query[]{{3, 0},
2156 int Ret = syscall(258, Query,
2157 std::size(Query), 0,
2163 uint64_t BaseMask = Query[0].Value;
2166 Features[
"i"] =
true;
2167 Features[
"m"] =
true;
2168 Features[
"a"] =
true;
2172 Features[
"f"] = ExtMask & (1 << 0);
2173 Features[
"d"] = ExtMask & (1 << 0);
2174 Features[
"c"] = ExtMask & (1 << 1);
2175 Features[
"v"] = ExtMask & (1 << 2);
2176 Features[
"zba"] = ExtMask & (1 << 3);
2177 Features[
"zbb"] = ExtMask & (1 << 4);
2178 Features[
"zbs"] = ExtMask & (1 << 5);
2179 Features[
"zicboz"] = ExtMask & (1 << 6);
2180 Features[
"zbc"] = ExtMask & (1 << 7);
2181 Features[
"zbkb"] = ExtMask & (1 << 8);
2182 Features[
"zbkc"] = ExtMask & (1 << 9);
2183 Features[
"zbkx"] = ExtMask & (1 << 10);
2184 Features[
"zknd"] = ExtMask & (1 << 11);
2185 Features[
"zkne"] = ExtMask & (1 << 12);
2186 Features[
"zknh"] = ExtMask & (1 << 13);
2187 Features[
"zksed"] = ExtMask & (1 << 14);
2188 Features[
"zksh"] = ExtMask & (1 << 15);
2189 Features[
"zkt"] = ExtMask & (1 << 16);
2190 Features[
"zvbb"] = ExtMask & (1 << 17);
2191 Features[
"zvbc"] = ExtMask & (1 << 18);
2192 Features[
"zvkb"] = ExtMask & (1 << 19);
2193 Features[
"zvkg"] = ExtMask & (1 << 20);
2194 Features[
"zvkned"] = ExtMask & (1 << 21);
2195 Features[
"zvknha"] = ExtMask & (1 << 22);
2196 Features[
"zvknhb"] = ExtMask & (1 << 23);
2197 Features[
"zvksed"] = ExtMask & (1 << 24);
2198 Features[
"zvksh"] = ExtMask & (1 << 25);
2199 Features[
"zvkt"] = ExtMask & (1 << 26);
2200 Features[
"zfh"] = ExtMask & (1 << 27);
2201 Features[
"zfhmin"] = ExtMask & (1 << 28);
2202 Features[
"zihintntl"] = ExtMask & (1 << 29);
2203 Features[
"zvfh"] = ExtMask & (1 << 30);
2204 Features[
"zvfhmin"] = ExtMask & (1ULL << 31);
2205 Features[
"zfa"] = ExtMask & (1ULL << 32);
2206 Features[
"ztso"] = ExtMask & (1ULL << 33);
2207 Features[
"zacas"] = ExtMask & (1ULL << 34);
2208 Features[
"zicond"] = ExtMask & (1ULL << 35);
2209 Features[
"zihintpause"] =
2210 ExtMask & (1ULL << 36);
2211 Features[
"zve32x"] = ExtMask & (1ULL << 37);
2212 Features[
"zve32f"] = ExtMask & (1ULL << 38);
2213 Features[
"zve64x"] = ExtMask & (1ULL << 39);
2214 Features[
"zve64f"] = ExtMask & (1ULL << 40);
2215 Features[
"zve64d"] = ExtMask & (1ULL << 41);
2216 Features[
"zimop"] = ExtMask & (1ULL << 42);
2217 Features[
"zca"] = ExtMask & (1ULL << 43);
2218 Features[
"zcb"] = ExtMask & (1ULL << 44);
2219 Features[
"zcd"] = ExtMask & (1ULL << 45);
2220 Features[
"zcf"] = ExtMask & (1ULL << 46);
2221 Features[
"zcmop"] = ExtMask & (1ULL << 47);
2222 Features[
"zawrs"] = ExtMask & (1ULL << 48);
2228 if (Query[2].Key != -1 &&
2229 Query[2].
Value == 3)
2230 Features[
"unaligned-scalar-mem"] =
true;
2243 T.setArchName(
"arm");
2244#elif defined(__arm64e__)
2246 T.setArchName(
"arm64e");
2247#elif defined(__aarch64__)
2249 T.setArchName(
"arm64");
2250#elif defined(__x86_64h__)
2252 T.setArchName(
"x86_64h");
2253#elif defined(__x86_64__)
2255 T.setArchName(
"x86_64");
2256#elif defined(__i386__)
2258 T.setArchName(
"i386");
2259#elif defined(__powerpc__)
2261 T.setArchName(
"powerpc");
2263# error "Unimplemented host arch fixup"
2270 std::string TargetTripleString = updateTripleOSVersion(LLVM_HOST_TRIPLE);
2276 PT = withHostArch(PT);
2288#if LLVM_VERSION_PRINTER_SHOW_HOST_TARGET_INFO
2290 if (CPU ==
"generic")
2293 <<
" Host CPU: " << CPU <<
'\n';
This file defines the StringMap class.
#define LLVM_ATTRIBUTE_UNUSED
Given that RA is a live value
static std::unique_ptr< llvm::MemoryBuffer > LLVM_ATTRIBUTE_UNUSED getProcCpuinfoContent()
This file defines the SmallVector class.
This file implements the StringSwitch template, which mimics a switch() statement whose cases are str...
Represents either an error or a value T.
static ErrorOr< std::unique_ptr< MemoryBuffer > > getFileAsStream(const Twine &Filename)
Read all of the specified file into a MemoryBuffer as a stream (i.e.
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
StringMap - This is an unconventional map that is specialized for handling keys that are "strings",...
StringRef - Represent a constant reference to a string, i.e.
std::pair< StringRef, StringRef > split(char Separator) const
Split into two substrings around the first occurrence of a separator character.
constexpr bool empty() const
empty - Check if the string is empty.
bool ends_with(StringRef Suffix) const
Check if this string ends with the given Suffix.
static constexpr size_t npos
A switch()-like statement whose cases are string literals.
StringSwitch & Case(StringLiteral S, T Value)
StringSwitch & StartsWith(StringLiteral S, T Value)
Triple - Helper class for working with autoconf configuration names.
llvm::Triple get32BitArchVariant() const
Form a triple with a 32-bit variant of the current architecture.
llvm::Triple get64BitArchVariant() const
Form a triple with a 64-bit variant of the current architecture.
static std::string normalize(StringRef Str, CanonicalForm Form=CanonicalForm::ANY)
Turn an arbitrary machine specification into the canonical triple form (or something sensible that th...
const std::string & str() const
bool isArch64Bit() const
Test whether the architecture is 64-bit.
bool isArch32Bit() const
Test whether the architecture is 32-bit.
The instances of the Type class are immutable: once they are created, they are never changed.
LLVM Value Representation.
This class implements an extremely fast bulk output stream that can only output to a stream.
@ CPU_SUBTYPE_POWERPC_970
@ CPU_SUBTYPE_POWERPC_604e
@ CPU_SUBTYPE_POWERPC_603e
@ CPU_SUBTYPE_POWERPC_7400
@ CPU_SUBTYPE_POWERPC_604
@ CPU_SUBTYPE_POWERPC_750
@ CPU_SUBTYPE_POWERPC_601
@ CPU_SUBTYPE_POWERPC_620
@ CPU_SUBTYPE_POWERPC_603ev
@ CPU_SUBTYPE_POWERPC_603
@ CPU_SUBTYPE_POWERPC_7450
@ CPU_SUBTYPE_POWERPC_602
Helper functions to extract CPU details from CPUID on x86.
VendorSignatures getVendorSignature(unsigned *MaxLeaf=nullptr)
Returns the host CPU's vendor.
StringRef getHostCPUNameForS390x(StringRef ProcCpuinfoContent)
StringRef getHostCPUNameForPowerPC(StringRef ProcCpuinfoContent)
Helper functions to extract HostCPUName from /proc/cpuinfo on linux.
StringRef getHostCPUNameForBPF()
StringRef getHostCPUNameForARM(StringRef ProcCpuinfoContent)
StringRef getHostCPUNameForRISCV(StringRef ProcCpuinfoContent)
StringRef getHostCPUNameForSPARC(StringRef ProcCpuinfoContent)
const StringMap< bool, MallocAllocator > getHostCPUFeatures()
getHostCPUFeatures - Get the LLVM names for the host CPU features.
StringRef getHostCPUName()
getHostCPUName - Get the LLVM name for the host CPU.
void printDefaultTargetAndDetectedCPU(raw_ostream &OS)
This is a function compatible with cl::AddExtraVersionPrinter, which adds info about the current targ...
std::string getProcessTriple()
getProcessTriple() - Return an appropriate target triple for generating code to be loaded into the cu...
std::string getDefaultTargetTriple()
getDefaultTargetTriple() - Return the default target triple the compiler has been configured to produ...
This is an optimization pass for GlobalISel generic memory operations.
raw_fd_ostream & errs()
This returns a reference to a raw_ostream for standard error.