LLVM 19.0.0git
Host.cpp
Go to the documentation of this file.
1//===-- Host.cpp - Implement OS Host Detection ------------------*- C++ -*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file implements the operating system Host detection.
10//
11//===----------------------------------------------------------------------===//
12
15#include "llvm/ADT/StringMap.h"
16#include "llvm/ADT/StringRef.h"
18#include "llvm/Config/llvm-config.h"
23#include <string.h>
24
25// Include the platform-specific parts of this class.
26#ifdef LLVM_ON_UNIX
27#include "Unix/Host.inc"
28#include <sched.h>
29#endif
30#ifdef _WIN32
31#include "Windows/Host.inc"
32#endif
33#ifdef _MSC_VER
34#include <intrin.h>
35#endif
36#ifdef __MVS__
37#include "llvm/Support/BCD.h"
38#endif
39#if defined(__APPLE__)
40#include <mach/host_info.h>
41#include <mach/mach.h>
42#include <mach/mach_host.h>
43#include <mach/machine.h>
44#include <sys/param.h>
45#include <sys/sysctl.h>
46#endif
47#ifdef _AIX
48#include <sys/systemcfg.h>
49#endif
50#if defined(__sun__) && defined(__svr4__)
51#include <kstat.h>
52#endif
53
54#define DEBUG_TYPE "host-detection"
55
56//===----------------------------------------------------------------------===//
57//
58// Implementations of the CPU detection routines
59//
60//===----------------------------------------------------------------------===//
61
62using namespace llvm;
63
64static std::unique_ptr<llvm::MemoryBuffer>
68 if (std::error_code EC = Text.getError()) {
69 llvm::errs() << "Can't read "
70 << "/proc/cpuinfo: " << EC.message() << "\n";
71 return nullptr;
72 }
73 return std::move(*Text);
74}
75
77 // Access to the Processor Version Register (PVR) on PowerPC is privileged,
78 // and so we must use an operating-system interface to determine the current
79 // processor type. On Linux, this is exposed through the /proc/cpuinfo file.
80 const char *generic = "generic";
81
82 // The cpu line is second (after the 'processor: 0' line), so if this
83 // buffer is too small then something has changed (or is wrong).
84 StringRef::const_iterator CPUInfoStart = ProcCpuinfoContent.begin();
85 StringRef::const_iterator CPUInfoEnd = ProcCpuinfoContent.end();
86
87 StringRef::const_iterator CIP = CPUInfoStart;
88
89 StringRef::const_iterator CPUStart = nullptr;
90 size_t CPULen = 0;
91
92 // We need to find the first line which starts with cpu, spaces, and a colon.
93 // After the colon, there may be some additional spaces and then the cpu type.
94 while (CIP < CPUInfoEnd && CPUStart == nullptr) {
95 if (CIP < CPUInfoEnd && *CIP == '\n')
96 ++CIP;
97
98 if (CIP < CPUInfoEnd && *CIP == 'c') {
99 ++CIP;
100 if (CIP < CPUInfoEnd && *CIP == 'p') {
101 ++CIP;
102 if (CIP < CPUInfoEnd && *CIP == 'u') {
103 ++CIP;
104 while (CIP < CPUInfoEnd && (*CIP == ' ' || *CIP == '\t'))
105 ++CIP;
106
107 if (CIP < CPUInfoEnd && *CIP == ':') {
108 ++CIP;
109 while (CIP < CPUInfoEnd && (*CIP == ' ' || *CIP == '\t'))
110 ++CIP;
111
112 if (CIP < CPUInfoEnd) {
113 CPUStart = CIP;
114 while (CIP < CPUInfoEnd && (*CIP != ' ' && *CIP != '\t' &&
115 *CIP != ',' && *CIP != '\n'))
116 ++CIP;
117 CPULen = CIP - CPUStart;
118 }
119 }
120 }
121 }
122 }
123
124 if (CPUStart == nullptr)
125 while (CIP < CPUInfoEnd && *CIP != '\n')
126 ++CIP;
127 }
128
129 if (CPUStart == nullptr)
130 return generic;
131
132 return StringSwitch<const char *>(StringRef(CPUStart, CPULen))
133 .Case("604e", "604e")
134 .Case("604", "604")
135 .Case("7400", "7400")
136 .Case("7410", "7400")
137 .Case("7447", "7400")
138 .Case("7455", "7450")
139 .Case("G4", "g4")
140 .Case("POWER4", "970")
141 .Case("PPC970FX", "970")
142 .Case("PPC970MP", "970")
143 .Case("G5", "g5")
144 .Case("POWER5", "g5")
145 .Case("A2", "a2")
146 .Case("POWER6", "pwr6")
147 .Case("POWER7", "pwr7")
148 .Case("POWER8", "pwr8")
149 .Case("POWER8E", "pwr8")
150 .Case("POWER8NVL", "pwr8")
151 .Case("POWER9", "pwr9")
152 .Case("POWER10", "pwr10")
153 // FIXME: If we get a simulator or machine with the capabilities of
154 // mcpu=future, we should revisit this and add the name reported by the
155 // simulator/machine.
156 .Default(generic);
157}
158
160 // The cpuid register on arm is not accessible from user space. On Linux,
161 // it is exposed through the /proc/cpuinfo file.
162
163 // Read 32 lines from /proc/cpuinfo, which should contain the CPU part line
164 // in all cases.
166 ProcCpuinfoContent.split(Lines, "\n");
167
168 // Look for the CPU implementer line.
169 StringRef Implementer;
170 StringRef Hardware;
171 StringRef Part;
172 for (unsigned I = 0, E = Lines.size(); I != E; ++I) {
173 if (Lines[I].starts_with("CPU implementer"))
174 Implementer = Lines[I].substr(15).ltrim("\t :");
175 if (Lines[I].starts_with("Hardware"))
176 Hardware = Lines[I].substr(8).ltrim("\t :");
177 if (Lines[I].starts_with("CPU part"))
178 Part = Lines[I].substr(8).ltrim("\t :");
179 }
180
181 if (Implementer == "0x41") { // ARM Ltd.
182 // MSM8992/8994 may give cpu part for the core that the kernel is running on,
183 // which is undeterministic and wrong. Always return cortex-a53 for these SoC.
184 if (Hardware.ends_with("MSM8994") || Hardware.ends_with("MSM8996"))
185 return "cortex-a53";
186
187
188 // The CPU part is a 3 digit hexadecimal number with a 0x prefix. The
189 // values correspond to the "Part number" in the CP15/c0 register. The
190 // contents are specified in the various processor manuals.
191 // This corresponds to the Main ID Register in Technical Reference Manuals.
192 // and is used in programs like sys-utils
193 return StringSwitch<const char *>(Part)
194 .Case("0x926", "arm926ej-s")
195 .Case("0xb02", "mpcore")
196 .Case("0xb36", "arm1136j-s")
197 .Case("0xb56", "arm1156t2-s")
198 .Case("0xb76", "arm1176jz-s")
199 .Case("0xc05", "cortex-a5")
200 .Case("0xc07", "cortex-a7")
201 .Case("0xc08", "cortex-a8")
202 .Case("0xc09", "cortex-a9")
203 .Case("0xc0f", "cortex-a15")
204 .Case("0xc0e", "cortex-a17")
205 .Case("0xc20", "cortex-m0")
206 .Case("0xc23", "cortex-m3")
207 .Case("0xc24", "cortex-m4")
208 .Case("0xc27", "cortex-m7")
209 .Case("0xd20", "cortex-m23")
210 .Case("0xd21", "cortex-m33")
211 .Case("0xd24", "cortex-m52")
212 .Case("0xd22", "cortex-m55")
213 .Case("0xd23", "cortex-m85")
214 .Case("0xc18", "cortex-r8")
215 .Case("0xd13", "cortex-r52")
216 .Case("0xd15", "cortex-r82")
217 .Case("0xd02", "cortex-a34")
218 .Case("0xd04", "cortex-a35")
219 .Case("0xd03", "cortex-a53")
220 .Case("0xd05", "cortex-a55")
221 .Case("0xd46", "cortex-a510")
222 .Case("0xd80", "cortex-a520")
223 .Case("0xd88", "cortex-a520ae")
224 .Case("0xd07", "cortex-a57")
225 .Case("0xd06", "cortex-a65")
226 .Case("0xd43", "cortex-a65ae")
227 .Case("0xd08", "cortex-a72")
228 .Case("0xd09", "cortex-a73")
229 .Case("0xd0a", "cortex-a75")
230 .Case("0xd0b", "cortex-a76")
231 .Case("0xd0e", "cortex-a76ae")
232 .Case("0xd0d", "cortex-a77")
233 .Case("0xd41", "cortex-a78")
234 .Case("0xd42", "cortex-a78ae")
235 .Case("0xd4b", "cortex-a78c")
236 .Case("0xd47", "cortex-a710")
237 .Case("0xd4d", "cortex-a715")
238 .Case("0xd81", "cortex-a720")
239 .Case("0xd89", "cortex-a720ae")
240 .Case("0xd44", "cortex-x1")
241 .Case("0xd4c", "cortex-x1c")
242 .Case("0xd48", "cortex-x2")
243 .Case("0xd4e", "cortex-x3")
244 .Case("0xd82", "cortex-x4")
245 .Case("0xd4a", "neoverse-e1")
246 .Case("0xd0c", "neoverse-n1")
247 .Case("0xd49", "neoverse-n2")
248 .Case("0xd40", "neoverse-v1")
249 .Case("0xd4f", "neoverse-v2")
250 .Default("generic");
251 }
252
253 if (Implementer == "0x42" || Implementer == "0x43") { // Broadcom | Cavium.
254 return StringSwitch<const char *>(Part)
255 .Case("0x516", "thunderx2t99")
256 .Case("0x0516", "thunderx2t99")
257 .Case("0xaf", "thunderx2t99")
258 .Case("0x0af", "thunderx2t99")
259 .Case("0xa1", "thunderxt88")
260 .Case("0x0a1", "thunderxt88")
261 .Default("generic");
262 }
263
264 if (Implementer == "0x46") { // Fujitsu Ltd.
265 return StringSwitch<const char *>(Part)
266 .Case("0x001", "a64fx")
267 .Default("generic");
268 }
269
270 if (Implementer == "0x4e") { // NVIDIA Corporation
271 return StringSwitch<const char *>(Part)
272 .Case("0x004", "carmel")
273 .Default("generic");
274 }
275
276 if (Implementer == "0x48") // HiSilicon Technologies, Inc.
277 // The CPU part is a 3 digit hexadecimal number with a 0x prefix. The
278 // values correspond to the "Part number" in the CP15/c0 register. The
279 // contents are specified in the various processor manuals.
280 return StringSwitch<const char *>(Part)
281 .Case("0xd01", "tsv110")
282 .Default("generic");
283
284 if (Implementer == "0x51") // Qualcomm Technologies, Inc.
285 // The CPU part is a 3 digit hexadecimal number with a 0x prefix. The
286 // values correspond to the "Part number" in the CP15/c0 register. The
287 // contents are specified in the various processor manuals.
288 return StringSwitch<const char *>(Part)
289 .Case("0x06f", "krait") // APQ8064
290 .Case("0x201", "kryo")
291 .Case("0x205", "kryo")
292 .Case("0x211", "kryo")
293 .Case("0x800", "cortex-a73") // Kryo 2xx Gold
294 .Case("0x801", "cortex-a73") // Kryo 2xx Silver
295 .Case("0x802", "cortex-a75") // Kryo 3xx Gold
296 .Case("0x803", "cortex-a75") // Kryo 3xx Silver
297 .Case("0x804", "cortex-a76") // Kryo 4xx Gold
298 .Case("0x805", "cortex-a76") // Kryo 4xx/5xx Silver
299 .Case("0xc00", "falkor")
300 .Case("0xc01", "saphira")
301 .Default("generic");
302 if (Implementer == "0x53") { // Samsung Electronics Co., Ltd.
303 // The Exynos chips have a convoluted ID scheme that doesn't seem to follow
304 // any predictive pattern across variants and parts.
305 unsigned Variant = 0, Part = 0;
306
307 // Look for the CPU variant line, whose value is a 1 digit hexadecimal
308 // number, corresponding to the Variant bits in the CP15/C0 register.
309 for (auto I : Lines)
310 if (I.consume_front("CPU variant"))
311 I.ltrim("\t :").getAsInteger(0, Variant);
312
313 // Look for the CPU part line, whose value is a 3 digit hexadecimal
314 // number, corresponding to the PartNum bits in the CP15/C0 register.
315 for (auto I : Lines)
316 if (I.consume_front("CPU part"))
317 I.ltrim("\t :").getAsInteger(0, Part);
318
319 unsigned Exynos = (Variant << 12) | Part;
320 switch (Exynos) {
321 default:
322 // Default by falling through to Exynos M3.
323 [[fallthrough]];
324 case 0x1002:
325 return "exynos-m3";
326 case 0x1003:
327 return "exynos-m4";
328 }
329 }
330
331 if (Implementer == "0x6d") { // Microsoft Corporation.
332 // The Microsoft Azure Cobalt 100 CPU is handled as a Neoverse N2.
333 return StringSwitch<const char *>(Part)
334 .Case("0xd49", "neoverse-n2")
335 .Default("generic");
336 }
337
338 if (Implementer == "0xc0") { // Ampere Computing
339 return StringSwitch<const char *>(Part)
340 .Case("0xac3", "ampere1")
341 .Case("0xac4", "ampere1a")
342 .Case("0xac5", "ampere1b")
343 .Default("generic");
344 }
345
346 return "generic";
347}
348
349namespace {
350StringRef getCPUNameFromS390Model(unsigned int Id, bool HaveVectorSupport) {
351 switch (Id) {
352 case 2064: // z900 not supported by LLVM
353 case 2066:
354 case 2084: // z990 not supported by LLVM
355 case 2086:
356 case 2094: // z9-109 not supported by LLVM
357 case 2096:
358 return "generic";
359 case 2097:
360 case 2098:
361 return "z10";
362 case 2817:
363 case 2818:
364 return "z196";
365 case 2827:
366 case 2828:
367 return "zEC12";
368 case 2964:
369 case 2965:
370 return HaveVectorSupport? "z13" : "zEC12";
371 case 3906:
372 case 3907:
373 return HaveVectorSupport? "z14" : "zEC12";
374 case 8561:
375 case 8562:
376 return HaveVectorSupport? "z15" : "zEC12";
377 case 3931:
378 case 3932:
379 default:
380 return HaveVectorSupport? "z16" : "zEC12";
381 }
382}
383} // end anonymous namespace
384
386 // STIDP is a privileged operation, so use /proc/cpuinfo instead.
387
388 // The "processor 0:" line comes after a fair amount of other information,
389 // including a cache breakdown, but this should be plenty.
391 ProcCpuinfoContent.split(Lines, "\n");
392
393 // Look for the CPU features.
394 SmallVector<StringRef, 32> CPUFeatures;
395 for (unsigned I = 0, E = Lines.size(); I != E; ++I)
396 if (Lines[I].starts_with("features")) {
397 size_t Pos = Lines[I].find(':');
398 if (Pos != StringRef::npos) {
399 Lines[I].drop_front(Pos + 1).split(CPUFeatures, ' ');
400 break;
401 }
402 }
403
404 // We need to check for the presence of vector support independently of
405 // the machine type, since we may only use the vector register set when
406 // supported by the kernel (and hypervisor).
407 bool HaveVectorSupport = false;
408 for (unsigned I = 0, E = CPUFeatures.size(); I != E; ++I) {
409 if (CPUFeatures[I] == "vx")
410 HaveVectorSupport = true;
411 }
412
413 // Now check the processor machine type.
414 for (unsigned I = 0, E = Lines.size(); I != E; ++I) {
415 if (Lines[I].starts_with("processor ")) {
416 size_t Pos = Lines[I].find("machine = ");
417 if (Pos != StringRef::npos) {
418 Pos += sizeof("machine = ") - 1;
419 unsigned int Id;
420 if (!Lines[I].drop_front(Pos).getAsInteger(10, Id))
421 return getCPUNameFromS390Model(Id, HaveVectorSupport);
422 }
423 break;
424 }
425 }
426
427 return "generic";
428}
429
431 // There are 24 lines in /proc/cpuinfo
433 ProcCpuinfoContent.split(Lines, "\n");
434
435 // Look for uarch line to determine cpu name
436 StringRef UArch;
437 for (unsigned I = 0, E = Lines.size(); I != E; ++I) {
438 if (Lines[I].starts_with("uarch")) {
439 UArch = Lines[I].substr(5).ltrim("\t :");
440 break;
441 }
442 }
443
444 return StringSwitch<const char *>(UArch)
445 .Case("sifive,u74-mc", "sifive-u74")
446 .Case("sifive,bullet0", "sifive-u74")
447 .Default("generic");
448}
449
451#if !defined(__linux__) || !defined(__x86_64__)
452 return "generic";
453#else
454 uint8_t v3_insns[40] __attribute__ ((aligned (8))) =
455 /* BPF_MOV64_IMM(BPF_REG_0, 0) */
456 { 0xb7, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0,
457 /* BPF_MOV64_IMM(BPF_REG_2, 1) */
458 0xb7, 0x2, 0x0, 0x0, 0x1, 0x0, 0x0, 0x0,
459 /* BPF_JMP32_REG(BPF_JLT, BPF_REG_0, BPF_REG_2, 1) */
460 0xae, 0x20, 0x1, 0x0, 0x0, 0x0, 0x0, 0x0,
461 /* BPF_MOV64_IMM(BPF_REG_0, 1) */
462 0xb7, 0x0, 0x0, 0x0, 0x1, 0x0, 0x0, 0x0,
463 /* BPF_EXIT_INSN() */
464 0x95, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0 };
465
466 uint8_t v2_insns[40] __attribute__ ((aligned (8))) =
467 /* BPF_MOV64_IMM(BPF_REG_0, 0) */
468 { 0xb7, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0,
469 /* BPF_MOV64_IMM(BPF_REG_2, 1) */
470 0xb7, 0x2, 0x0, 0x0, 0x1, 0x0, 0x0, 0x0,
471 /* BPF_JMP_REG(BPF_JLT, BPF_REG_0, BPF_REG_2, 1) */
472 0xad, 0x20, 0x1, 0x0, 0x0, 0x0, 0x0, 0x0,
473 /* BPF_MOV64_IMM(BPF_REG_0, 1) */
474 0xb7, 0x0, 0x0, 0x0, 0x1, 0x0, 0x0, 0x0,
475 /* BPF_EXIT_INSN() */
476 0x95, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0 };
477
478 struct bpf_prog_load_attr {
479 uint32_t prog_type;
480 uint32_t insn_cnt;
481 uint64_t insns;
482 uint64_t license;
483 uint32_t log_level;
484 uint32_t log_size;
485 uint64_t log_buf;
486 uint32_t kern_version;
487 uint32_t prog_flags;
488 } attr = {};
489 attr.prog_type = 1; /* BPF_PROG_TYPE_SOCKET_FILTER */
490 attr.insn_cnt = 5;
491 attr.insns = (uint64_t)v3_insns;
492 attr.license = (uint64_t)"DUMMY";
493
494 int fd = syscall(321 /* __NR_bpf */, 5 /* BPF_PROG_LOAD */, &attr,
495 sizeof(attr));
496 if (fd >= 0) {
497 close(fd);
498 return "v3";
499 }
500
501 /* Clear the whole attr in case its content changed by syscall. */
502 memset(&attr, 0, sizeof(attr));
503 attr.prog_type = 1; /* BPF_PROG_TYPE_SOCKET_FILTER */
504 attr.insn_cnt = 5;
505 attr.insns = (uint64_t)v2_insns;
506 attr.license = (uint64_t)"DUMMY";
507 fd = syscall(321 /* __NR_bpf */, 5 /* BPF_PROG_LOAD */, &attr, sizeof(attr));
508 if (fd >= 0) {
509 close(fd);
510 return "v2";
511 }
512 return "v1";
513#endif
514}
515
516#if defined(__i386__) || defined(_M_IX86) || \
517 defined(__x86_64__) || defined(_M_X64)
518
519// The check below for i386 was copied from clang's cpuid.h (__get_cpuid_max).
520// Check motivated by bug reports for OpenSSL crashing on CPUs without CPUID
521// support. Consequently, for i386, the presence of CPUID is checked first
522// via the corresponding eflags bit.
523// Removal of cpuid.h header motivated by PR30384
524// Header cpuid.h and method __get_cpuid_max are not used in llvm, clang, openmp
525// or test-suite, but are used in external projects e.g. libstdcxx
526static bool isCpuIdSupported() {
527#if defined(__GNUC__) || defined(__clang__)
528#if defined(__i386__)
529 int __cpuid_supported;
530 __asm__(" pushfl\n"
531 " popl %%eax\n"
532 " movl %%eax,%%ecx\n"
533 " xorl $0x00200000,%%eax\n"
534 " pushl %%eax\n"
535 " popfl\n"
536 " pushfl\n"
537 " popl %%eax\n"
538 " movl $0,%0\n"
539 " cmpl %%eax,%%ecx\n"
540 " je 1f\n"
541 " movl $1,%0\n"
542 "1:"
543 : "=r"(__cpuid_supported)
544 :
545 : "eax", "ecx");
546 if (!__cpuid_supported)
547 return false;
548#endif
549 return true;
550#endif
551 return true;
552}
553
554/// getX86CpuIDAndInfo - Execute the specified cpuid and return the 4 values in
555/// the specified arguments. If we can't run cpuid on the host, return true.
556static bool getX86CpuIDAndInfo(unsigned value, unsigned *rEAX, unsigned *rEBX,
557 unsigned *rECX, unsigned *rEDX) {
558#if defined(__GNUC__) || defined(__clang__)
559#if defined(__x86_64__)
560 // gcc doesn't know cpuid would clobber ebx/rbx. Preserve it manually.
561 // FIXME: should we save this for Clang?
562 __asm__("movq\t%%rbx, %%rsi\n\t"
563 "cpuid\n\t"
564 "xchgq\t%%rbx, %%rsi\n\t"
565 : "=a"(*rEAX), "=S"(*rEBX), "=c"(*rECX), "=d"(*rEDX)
566 : "a"(value));
567 return false;
568#elif defined(__i386__)
569 __asm__("movl\t%%ebx, %%esi\n\t"
570 "cpuid\n\t"
571 "xchgl\t%%ebx, %%esi\n\t"
572 : "=a"(*rEAX), "=S"(*rEBX), "=c"(*rECX), "=d"(*rEDX)
573 : "a"(value));
574 return false;
575#else
576 return true;
577#endif
578#elif defined(_MSC_VER)
579 // The MSVC intrinsic is portable across x86 and x64.
580 int registers[4];
581 __cpuid(registers, value);
582 *rEAX = registers[0];
583 *rEBX = registers[1];
584 *rECX = registers[2];
585 *rEDX = registers[3];
586 return false;
587#else
588 return true;
589#endif
590}
591
592namespace llvm {
593namespace sys {
594namespace detail {
595namespace x86 {
596
597VendorSignatures getVendorSignature(unsigned *MaxLeaf) {
598 unsigned EAX = 0, EBX = 0, ECX = 0, EDX = 0;
599 if (MaxLeaf == nullptr)
600 MaxLeaf = &EAX;
601 else
602 *MaxLeaf = 0;
603
604 if (!isCpuIdSupported())
605 return VendorSignatures::UNKNOWN;
606
607 if (getX86CpuIDAndInfo(0, MaxLeaf, &EBX, &ECX, &EDX) || *MaxLeaf < 1)
608 return VendorSignatures::UNKNOWN;
609
610 // "Genu ineI ntel"
611 if (EBX == 0x756e6547 && EDX == 0x49656e69 && ECX == 0x6c65746e)
612 return VendorSignatures::GENUINE_INTEL;
613
614 // "Auth enti cAMD"
615 if (EBX == 0x68747541 && EDX == 0x69746e65 && ECX == 0x444d4163)
616 return VendorSignatures::AUTHENTIC_AMD;
617
618 return VendorSignatures::UNKNOWN;
619}
620
621} // namespace x86
622} // namespace detail
623} // namespace sys
624} // namespace llvm
625
626using namespace llvm::sys::detail::x86;
627
628/// getX86CpuIDAndInfoEx - Execute the specified cpuid with subleaf and return
629/// the 4 values in the specified arguments. If we can't run cpuid on the host,
630/// return true.
631static bool getX86CpuIDAndInfoEx(unsigned value, unsigned subleaf,
632 unsigned *rEAX, unsigned *rEBX, unsigned *rECX,
633 unsigned *rEDX) {
634#if defined(__GNUC__) || defined(__clang__)
635#if defined(__x86_64__)
636 // gcc doesn't know cpuid would clobber ebx/rbx. Preserve it manually.
637 // FIXME: should we save this for Clang?
638 __asm__("movq\t%%rbx, %%rsi\n\t"
639 "cpuid\n\t"
640 "xchgq\t%%rbx, %%rsi\n\t"
641 : "=a"(*rEAX), "=S"(*rEBX), "=c"(*rECX), "=d"(*rEDX)
642 : "a"(value), "c"(subleaf));
643 return false;
644#elif defined(__i386__)
645 __asm__("movl\t%%ebx, %%esi\n\t"
646 "cpuid\n\t"
647 "xchgl\t%%ebx, %%esi\n\t"
648 : "=a"(*rEAX), "=S"(*rEBX), "=c"(*rECX), "=d"(*rEDX)
649 : "a"(value), "c"(subleaf));
650 return false;
651#else
652 return true;
653#endif
654#elif defined(_MSC_VER)
655 int registers[4];
656 __cpuidex(registers, value, subleaf);
657 *rEAX = registers[0];
658 *rEBX = registers[1];
659 *rECX = registers[2];
660 *rEDX = registers[3];
661 return false;
662#else
663 return true;
664#endif
665}
666
667// Read control register 0 (XCR0). Used to detect features such as AVX.
668static bool getX86XCR0(unsigned *rEAX, unsigned *rEDX) {
669#if defined(__GNUC__) || defined(__clang__)
670 // Check xgetbv; this uses a .byte sequence instead of the instruction
671 // directly because older assemblers do not include support for xgetbv and
672 // there is no easy way to conditionally compile based on the assembler used.
673 __asm__(".byte 0x0f, 0x01, 0xd0" : "=a"(*rEAX), "=d"(*rEDX) : "c"(0));
674 return false;
675#elif defined(_MSC_FULL_VER) && defined(_XCR_XFEATURE_ENABLED_MASK)
676 unsigned long long Result = _xgetbv(_XCR_XFEATURE_ENABLED_MASK);
677 *rEAX = Result;
678 *rEDX = Result >> 32;
679 return false;
680#else
681 return true;
682#endif
683}
684
685static void detectX86FamilyModel(unsigned EAX, unsigned *Family,
686 unsigned *Model) {
687 *Family = (EAX >> 8) & 0xf; // Bits 8 - 11
688 *Model = (EAX >> 4) & 0xf; // Bits 4 - 7
689 if (*Family == 6 || *Family == 0xf) {
690 if (*Family == 0xf)
691 // Examine extended family ID if family ID is F.
692 *Family += (EAX >> 20) & 0xff; // Bits 20 - 27
693 // Examine extended model ID if family ID is 6 or F.
694 *Model += ((EAX >> 16) & 0xf) << 4; // Bits 16 - 19
695 }
696}
697
698static StringRef
699getIntelProcessorTypeAndSubtype(unsigned Family, unsigned Model,
700 const unsigned *Features,
701 unsigned *Type, unsigned *Subtype) {
702 auto testFeature = [&](unsigned F) {
703 return (Features[F / 32] & (1U << (F % 32))) != 0;
704 };
705
706 StringRef CPU;
707
708 switch (Family) {
709 case 3:
710 CPU = "i386";
711 break;
712 case 4:
713 CPU = "i486";
714 break;
715 case 5:
716 if (testFeature(X86::FEATURE_MMX)) {
717 CPU = "pentium-mmx";
718 break;
719 }
720 CPU = "pentium";
721 break;
722 case 6:
723 switch (Model) {
724 case 0x0f: // Intel Core 2 Duo processor, Intel Core 2 Duo mobile
725 // processor, Intel Core 2 Quad processor, Intel Core 2 Quad
726 // mobile processor, Intel Core 2 Extreme processor, Intel
727 // Pentium Dual-Core processor, Intel Xeon processor, model
728 // 0Fh. All processors are manufactured using the 65 nm process.
729 case 0x16: // Intel Celeron processor model 16h. All processors are
730 // manufactured using the 65 nm process
731 CPU = "core2";
732 *Type = X86::INTEL_CORE2;
733 break;
734 case 0x17: // Intel Core 2 Extreme processor, Intel Xeon processor, model
735 // 17h. All processors are manufactured using the 45 nm process.
736 //
737 // 45nm: Penryn , Wolfdale, Yorkfield (XE)
738 case 0x1d: // Intel Xeon processor MP. All processors are manufactured using
739 // the 45 nm process.
740 CPU = "penryn";
741 *Type = X86::INTEL_CORE2;
742 break;
743 case 0x1a: // Intel Core i7 processor and Intel Xeon processor. All
744 // processors are manufactured using the 45 nm process.
745 case 0x1e: // Intel(R) Core(TM) i7 CPU 870 @ 2.93GHz.
746 // As found in a Summer 2010 model iMac.
747 case 0x1f:
748 case 0x2e: // Nehalem EX
749 CPU = "nehalem";
750 *Type = X86::INTEL_COREI7;
751 *Subtype = X86::INTEL_COREI7_NEHALEM;
752 break;
753 case 0x25: // Intel Core i7, laptop version.
754 case 0x2c: // Intel Core i7 processor and Intel Xeon processor. All
755 // processors are manufactured using the 32 nm process.
756 case 0x2f: // Westmere EX
757 CPU = "westmere";
758 *Type = X86::INTEL_COREI7;
759 *Subtype = X86::INTEL_COREI7_WESTMERE;
760 break;
761 case 0x2a: // Intel Core i7 processor. All processors are manufactured
762 // using the 32 nm process.
763 case 0x2d:
764 CPU = "sandybridge";
765 *Type = X86::INTEL_COREI7;
766 *Subtype = X86::INTEL_COREI7_SANDYBRIDGE;
767 break;
768 case 0x3a:
769 case 0x3e: // Ivy Bridge EP
770 CPU = "ivybridge";
771 *Type = X86::INTEL_COREI7;
772 *Subtype = X86::INTEL_COREI7_IVYBRIDGE;
773 break;
774
775 // Haswell:
776 case 0x3c:
777 case 0x3f:
778 case 0x45:
779 case 0x46:
780 CPU = "haswell";
781 *Type = X86::INTEL_COREI7;
782 *Subtype = X86::INTEL_COREI7_HASWELL;
783 break;
784
785 // Broadwell:
786 case 0x3d:
787 case 0x47:
788 case 0x4f:
789 case 0x56:
790 CPU = "broadwell";
791 *Type = X86::INTEL_COREI7;
792 *Subtype = X86::INTEL_COREI7_BROADWELL;
793 break;
794
795 // Skylake:
796 case 0x4e: // Skylake mobile
797 case 0x5e: // Skylake desktop
798 case 0x8e: // Kaby Lake mobile
799 case 0x9e: // Kaby Lake desktop
800 case 0xa5: // Comet Lake-H/S
801 case 0xa6: // Comet Lake-U
802 CPU = "skylake";
803 *Type = X86::INTEL_COREI7;
804 *Subtype = X86::INTEL_COREI7_SKYLAKE;
805 break;
806
807 // Rocketlake:
808 case 0xa7:
809 CPU = "rocketlake";
810 *Type = X86::INTEL_COREI7;
811 *Subtype = X86::INTEL_COREI7_ROCKETLAKE;
812 break;
813
814 // Skylake Xeon:
815 case 0x55:
816 *Type = X86::INTEL_COREI7;
817 if (testFeature(X86::FEATURE_AVX512BF16)) {
818 CPU = "cooperlake";
819 *Subtype = X86::INTEL_COREI7_COOPERLAKE;
820 } else if (testFeature(X86::FEATURE_AVX512VNNI)) {
821 CPU = "cascadelake";
822 *Subtype = X86::INTEL_COREI7_CASCADELAKE;
823 } else {
824 CPU = "skylake-avx512";
825 *Subtype = X86::INTEL_COREI7_SKYLAKE_AVX512;
826 }
827 break;
828
829 // Cannonlake:
830 case 0x66:
831 CPU = "cannonlake";
832 *Type = X86::INTEL_COREI7;
833 *Subtype = X86::INTEL_COREI7_CANNONLAKE;
834 break;
835
836 // Icelake:
837 case 0x7d:
838 case 0x7e:
839 CPU = "icelake-client";
840 *Type = X86::INTEL_COREI7;
841 *Subtype = X86::INTEL_COREI7_ICELAKE_CLIENT;
842 break;
843
844 // Tigerlake:
845 case 0x8c:
846 case 0x8d:
847 CPU = "tigerlake";
848 *Type = X86::INTEL_COREI7;
849 *Subtype = X86::INTEL_COREI7_TIGERLAKE;
850 break;
851
852 // Alderlake:
853 case 0x97:
854 case 0x9a:
855 // Gracemont
856 case 0xbe:
857 // Raptorlake:
858 case 0xb7:
859 case 0xba:
860 case 0xbf:
861 // Meteorlake:
862 case 0xaa:
863 case 0xac:
864 CPU = "alderlake";
865 *Type = X86::INTEL_COREI7;
866 *Subtype = X86::INTEL_COREI7_ALDERLAKE;
867 break;
868
869 // Arrowlake:
870 case 0xc5:
871 CPU = "arrowlake";
872 *Type = X86::INTEL_COREI7;
873 *Subtype = X86::INTEL_COREI7_ARROWLAKE;
874 break;
875
876 // Arrowlake S:
877 case 0xc6:
878 // Lunarlake:
879 case 0xbd:
880 CPU = "arrowlake-s";
881 *Type = X86::INTEL_COREI7;
882 *Subtype = X86::INTEL_COREI7_ARROWLAKE_S;
883 break;
884
885 // Pantherlake:
886 case 0xcc:
887 CPU = "pantherlake";
888 *Type = X86::INTEL_COREI7;
889 *Subtype = X86::INTEL_COREI7_PANTHERLAKE;
890 break;
891
892 // Graniterapids:
893 case 0xad:
894 CPU = "graniterapids";
895 *Type = X86::INTEL_COREI7;
896 *Subtype = X86::INTEL_COREI7_GRANITERAPIDS;
897 break;
898
899 // Granite Rapids D:
900 case 0xae:
901 CPU = "graniterapids-d";
902 *Type = X86::INTEL_COREI7;
903 *Subtype = X86::INTEL_COREI7_GRANITERAPIDS_D;
904 break;
905
906 // Icelake Xeon:
907 case 0x6a:
908 case 0x6c:
909 CPU = "icelake-server";
910 *Type = X86::INTEL_COREI7;
911 *Subtype = X86::INTEL_COREI7_ICELAKE_SERVER;
912 break;
913
914 // Emerald Rapids:
915 case 0xcf:
916 // Sapphire Rapids:
917 case 0x8f:
918 CPU = "sapphirerapids";
919 *Type = X86::INTEL_COREI7;
920 *Subtype = X86::INTEL_COREI7_SAPPHIRERAPIDS;
921 break;
922
923 case 0x1c: // Most 45 nm Intel Atom processors
924 case 0x26: // 45 nm Atom Lincroft
925 case 0x27: // 32 nm Atom Medfield
926 case 0x35: // 32 nm Atom Midview
927 case 0x36: // 32 nm Atom Midview
928 CPU = "bonnell";
929 *Type = X86::INTEL_BONNELL;
930 break;
931
932 // Atom Silvermont codes from the Intel software optimization guide.
933 case 0x37:
934 case 0x4a:
935 case 0x4d:
936 case 0x5a:
937 case 0x5d:
938 case 0x4c: // really airmont
939 CPU = "silvermont";
940 *Type = X86::INTEL_SILVERMONT;
941 break;
942 // Goldmont:
943 case 0x5c: // Apollo Lake
944 case 0x5f: // Denverton
945 CPU = "goldmont";
946 *Type = X86::INTEL_GOLDMONT;
947 break;
948 case 0x7a:
949 CPU = "goldmont-plus";
950 *Type = X86::INTEL_GOLDMONT_PLUS;
951 break;
952 case 0x86:
953 case 0x8a: // Lakefield
954 case 0x96: // Elkhart Lake
955 case 0x9c: // Jasper Lake
956 CPU = "tremont";
957 *Type = X86::INTEL_TREMONT;
958 break;
959
960 // Sierraforest:
961 case 0xaf:
962 CPU = "sierraforest";
963 *Type = X86::INTEL_SIERRAFOREST;
964 break;
965
966 // Grandridge:
967 case 0xb6:
968 CPU = "grandridge";
969 *Type = X86::INTEL_GRANDRIDGE;
970 break;
971
972 // Clearwaterforest:
973 case 0xdd:
974 CPU = "clearwaterforest";
975 *Type = X86::INTEL_CLEARWATERFOREST;
976 break;
977
978 // Xeon Phi (Knights Landing + Knights Mill):
979 case 0x57:
980 CPU = "knl";
981 *Type = X86::INTEL_KNL;
982 break;
983 case 0x85:
984 CPU = "knm";
985 *Type = X86::INTEL_KNM;
986 break;
987
988 default: // Unknown family 6 CPU, try to guess.
989 // Don't both with Type/Subtype here, they aren't used by the caller.
990 // They're used above to keep the code in sync with compiler-rt.
991 // TODO detect tigerlake host from model
992 if (testFeature(X86::FEATURE_AVX512VP2INTERSECT)) {
993 CPU = "tigerlake";
994 } else if (testFeature(X86::FEATURE_AVX512VBMI2)) {
995 CPU = "icelake-client";
996 } else if (testFeature(X86::FEATURE_AVX512VBMI)) {
997 CPU = "cannonlake";
998 } else if (testFeature(X86::FEATURE_AVX512BF16)) {
999 CPU = "cooperlake";
1000 } else if (testFeature(X86::FEATURE_AVX512VNNI)) {
1001 CPU = "cascadelake";
1002 } else if (testFeature(X86::FEATURE_AVX512VL)) {
1003 CPU = "skylake-avx512";
1004 } else if (testFeature(X86::FEATURE_AVX512ER)) {
1005 CPU = "knl";
1006 } else if (testFeature(X86::FEATURE_CLFLUSHOPT)) {
1007 if (testFeature(X86::FEATURE_SHA))
1008 CPU = "goldmont";
1009 else
1010 CPU = "skylake";
1011 } else if (testFeature(X86::FEATURE_ADX)) {
1012 CPU = "broadwell";
1013 } else if (testFeature(X86::FEATURE_AVX2)) {
1014 CPU = "haswell";
1015 } else if (testFeature(X86::FEATURE_AVX)) {
1016 CPU = "sandybridge";
1017 } else if (testFeature(X86::FEATURE_SSE4_2)) {
1018 if (testFeature(X86::FEATURE_MOVBE))
1019 CPU = "silvermont";
1020 else
1021 CPU = "nehalem";
1022 } else if (testFeature(X86::FEATURE_SSE4_1)) {
1023 CPU = "penryn";
1024 } else if (testFeature(X86::FEATURE_SSSE3)) {
1025 if (testFeature(X86::FEATURE_MOVBE))
1026 CPU = "bonnell";
1027 else
1028 CPU = "core2";
1029 } else if (testFeature(X86::FEATURE_64BIT)) {
1030 CPU = "core2";
1031 } else if (testFeature(X86::FEATURE_SSE3)) {
1032 CPU = "yonah";
1033 } else if (testFeature(X86::FEATURE_SSE2)) {
1034 CPU = "pentium-m";
1035 } else if (testFeature(X86::FEATURE_SSE)) {
1036 CPU = "pentium3";
1037 } else if (testFeature(X86::FEATURE_MMX)) {
1038 CPU = "pentium2";
1039 } else {
1040 CPU = "pentiumpro";
1041 }
1042 break;
1043 }
1044 break;
1045 case 15: {
1046 if (testFeature(X86::FEATURE_64BIT)) {
1047 CPU = "nocona";
1048 break;
1049 }
1050 if (testFeature(X86::FEATURE_SSE3)) {
1051 CPU = "prescott";
1052 break;
1053 }
1054 CPU = "pentium4";
1055 break;
1056 }
1057 default:
1058 break; // Unknown.
1059 }
1060
1061 return CPU;
1062}
1063
1064static StringRef
1065getAMDProcessorTypeAndSubtype(unsigned Family, unsigned Model,
1066 const unsigned *Features,
1067 unsigned *Type, unsigned *Subtype) {
1068 auto testFeature = [&](unsigned F) {
1069 return (Features[F / 32] & (1U << (F % 32))) != 0;
1070 };
1071
1072 StringRef CPU;
1073
1074 switch (Family) {
1075 case 4:
1076 CPU = "i486";
1077 break;
1078 case 5:
1079 CPU = "pentium";
1080 switch (Model) {
1081 case 6:
1082 case 7:
1083 CPU = "k6";
1084 break;
1085 case 8:
1086 CPU = "k6-2";
1087 break;
1088 case 9:
1089 case 13:
1090 CPU = "k6-3";
1091 break;
1092 case 10:
1093 CPU = "geode";
1094 break;
1095 }
1096 break;
1097 case 6:
1098 if (testFeature(X86::FEATURE_SSE)) {
1099 CPU = "athlon-xp";
1100 break;
1101 }
1102 CPU = "athlon";
1103 break;
1104 case 15:
1105 if (testFeature(X86::FEATURE_SSE3)) {
1106 CPU = "k8-sse3";
1107 break;
1108 }
1109 CPU = "k8";
1110 break;
1111 case 16:
1112 CPU = "amdfam10";
1113 *Type = X86::AMDFAM10H; // "amdfam10"
1114 switch (Model) {
1115 case 2:
1116 *Subtype = X86::AMDFAM10H_BARCELONA;
1117 break;
1118 case 4:
1119 *Subtype = X86::AMDFAM10H_SHANGHAI;
1120 break;
1121 case 8:
1122 *Subtype = X86::AMDFAM10H_ISTANBUL;
1123 break;
1124 }
1125 break;
1126 case 20:
1127 CPU = "btver1";
1128 *Type = X86::AMD_BTVER1;
1129 break;
1130 case 21:
1131 CPU = "bdver1";
1132 *Type = X86::AMDFAM15H;
1133 if (Model >= 0x60 && Model <= 0x7f) {
1134 CPU = "bdver4";
1135 *Subtype = X86::AMDFAM15H_BDVER4;
1136 break; // 60h-7Fh: Excavator
1137 }
1138 if (Model >= 0x30 && Model <= 0x3f) {
1139 CPU = "bdver3";
1140 *Subtype = X86::AMDFAM15H_BDVER3;
1141 break; // 30h-3Fh: Steamroller
1142 }
1143 if ((Model >= 0x10 && Model <= 0x1f) || Model == 0x02) {
1144 CPU = "bdver2";
1145 *Subtype = X86::AMDFAM15H_BDVER2;
1146 break; // 02h, 10h-1Fh: Piledriver
1147 }
1148 if (Model <= 0x0f) {
1149 *Subtype = X86::AMDFAM15H_BDVER1;
1150 break; // 00h-0Fh: Bulldozer
1151 }
1152 break;
1153 case 22:
1154 CPU = "btver2";
1155 *Type = X86::AMD_BTVER2;
1156 break;
1157 case 23:
1158 CPU = "znver1";
1159 *Type = X86::AMDFAM17H;
1160 if ((Model >= 0x30 && Model <= 0x3f) || (Model == 0x47) ||
1161 (Model >= 0x60 && Model <= 0x67) || (Model >= 0x68 && Model <= 0x6f) ||
1162 (Model >= 0x70 && Model <= 0x7f) || (Model >= 0x84 && Model <= 0x87) ||
1163 (Model >= 0x90 && Model <= 0x97) || (Model >= 0x98 && Model <= 0x9f) ||
1164 (Model >= 0xa0 && Model <= 0xaf)) {
1165 // Family 17h Models 30h-3Fh (Starship) Zen 2
1166 // Family 17h Models 47h (Cardinal) Zen 2
1167 // Family 17h Models 60h-67h (Renoir) Zen 2
1168 // Family 17h Models 68h-6Fh (Lucienne) Zen 2
1169 // Family 17h Models 70h-7Fh (Matisse) Zen 2
1170 // Family 17h Models 84h-87h (ProjectX) Zen 2
1171 // Family 17h Models 90h-97h (VanGogh) Zen 2
1172 // Family 17h Models 98h-9Fh (Mero) Zen 2
1173 // Family 17h Models A0h-AFh (Mendocino) Zen 2
1174 CPU = "znver2";
1175 *Subtype = X86::AMDFAM17H_ZNVER2;
1176 break;
1177 }
1178 if ((Model >= 0x10 && Model <= 0x1f) || (Model >= 0x20 && Model <= 0x2f)) {
1179 // Family 17h Models 10h-1Fh (Raven1) Zen
1180 // Family 17h Models 10h-1Fh (Picasso) Zen+
1181 // Family 17h Models 20h-2Fh (Raven2 x86) Zen
1182 *Subtype = X86::AMDFAM17H_ZNVER1;
1183 break;
1184 }
1185 break;
1186 case 25:
1187 CPU = "znver3";
1188 *Type = X86::AMDFAM19H;
1189 if (Model <= 0x0f || (Model >= 0x20 && Model <= 0x2f) ||
1190 (Model >= 0x30 && Model <= 0x3f) || (Model >= 0x40 && Model <= 0x4f) ||
1191 (Model >= 0x50 && Model <= 0x5f)) {
1192 // Family 19h Models 00h-0Fh (Genesis, Chagall) Zen 3
1193 // Family 19h Models 20h-2Fh (Vermeer) Zen 3
1194 // Family 19h Models 30h-3Fh (Badami) Zen 3
1195 // Family 19h Models 40h-4Fh (Rembrandt) Zen 3+
1196 // Family 19h Models 50h-5Fh (Cezanne) Zen 3
1197 *Subtype = X86::AMDFAM19H_ZNVER3;
1198 break;
1199 }
1200 if ((Model >= 0x10 && Model <= 0x1f) || (Model >= 0x60 && Model <= 0x6f) ||
1201 (Model >= 0x70 && Model <= 0x77) || (Model >= 0x78 && Model <= 0x7f) ||
1202 (Model >= 0xa0 && Model <= 0xaf)) {
1203 // Family 19h Models 10h-1Fh (Stones; Storm Peak) Zen 4
1204 // Family 19h Models 60h-6Fh (Raphael) Zen 4
1205 // Family 19h Models 70h-77h (Phoenix, Hawkpoint1) Zen 4
1206 // Family 19h Models 78h-7Fh (Phoenix 2, Hawkpoint2) Zen 4
1207 // Family 19h Models A0h-AFh (Stones-Dense) Zen 4
1208 CPU = "znver4";
1209 *Subtype = X86::AMDFAM19H_ZNVER4;
1210 break; // "znver4"
1211 }
1212 break;
1213 default:
1214 break; // Unknown AMD CPU.
1215 }
1216
1217 return CPU;
1218}
1219
1220static void getAvailableFeatures(unsigned ECX, unsigned EDX, unsigned MaxLeaf,
1221 unsigned *Features) {
1222 unsigned EAX, EBX;
1223
1224 auto setFeature = [&](unsigned F) {
1225 Features[F / 32] |= 1U << (F % 32);
1226 };
1227
1228 if ((EDX >> 15) & 1)
1229 setFeature(X86::FEATURE_CMOV);
1230 if ((EDX >> 23) & 1)
1231 setFeature(X86::FEATURE_MMX);
1232 if ((EDX >> 25) & 1)
1233 setFeature(X86::FEATURE_SSE);
1234 if ((EDX >> 26) & 1)
1235 setFeature(X86::FEATURE_SSE2);
1236
1237 if ((ECX >> 0) & 1)
1238 setFeature(X86::FEATURE_SSE3);
1239 if ((ECX >> 1) & 1)
1240 setFeature(X86::FEATURE_PCLMUL);
1241 if ((ECX >> 9) & 1)
1242 setFeature(X86::FEATURE_SSSE3);
1243 if ((ECX >> 12) & 1)
1244 setFeature(X86::FEATURE_FMA);
1245 if ((ECX >> 19) & 1)
1246 setFeature(X86::FEATURE_SSE4_1);
1247 if ((ECX >> 20) & 1) {
1248 setFeature(X86::FEATURE_SSE4_2);
1249 setFeature(X86::FEATURE_CRC32);
1250 }
1251 if ((ECX >> 23) & 1)
1252 setFeature(X86::FEATURE_POPCNT);
1253 if ((ECX >> 25) & 1)
1254 setFeature(X86::FEATURE_AES);
1255
1256 if ((ECX >> 22) & 1)
1257 setFeature(X86::FEATURE_MOVBE);
1258
1259 // If CPUID indicates support for XSAVE, XRESTORE and AVX, and XGETBV
1260 // indicates that the AVX registers will be saved and restored on context
1261 // switch, then we have full AVX support.
1262 const unsigned AVXBits = (1 << 27) | (1 << 28);
1263 bool HasAVX = ((ECX & AVXBits) == AVXBits) && !getX86XCR0(&EAX, &EDX) &&
1264 ((EAX & 0x6) == 0x6);
1265#if defined(__APPLE__)
1266 // Darwin lazily saves the AVX512 context on first use: trust that the OS will
1267 // save the AVX512 context if we use AVX512 instructions, even the bit is not
1268 // set right now.
1269 bool HasAVX512Save = true;
1270#else
1271 // AVX512 requires additional context to be saved by the OS.
1272 bool HasAVX512Save = HasAVX && ((EAX & 0xe0) == 0xe0);
1273#endif
1274
1275 if (HasAVX)
1276 setFeature(X86::FEATURE_AVX);
1277
1278 bool HasLeaf7 =
1279 MaxLeaf >= 0x7 && !getX86CpuIDAndInfoEx(0x7, 0x0, &EAX, &EBX, &ECX, &EDX);
1280
1281 if (HasLeaf7 && ((EBX >> 3) & 1))
1282 setFeature(X86::FEATURE_BMI);
1283 if (HasLeaf7 && ((EBX >> 5) & 1) && HasAVX)
1284 setFeature(X86::FEATURE_AVX2);
1285 if (HasLeaf7 && ((EBX >> 8) & 1))
1286 setFeature(X86::FEATURE_BMI2);
1287 if (HasLeaf7 && ((EBX >> 16) & 1) && HasAVX512Save)
1288 setFeature(X86::FEATURE_AVX512F);
1289 if (HasLeaf7 && ((EBX >> 17) & 1) && HasAVX512Save)
1290 setFeature(X86::FEATURE_AVX512DQ);
1291 if (HasLeaf7 && ((EBX >> 19) & 1))
1292 setFeature(X86::FEATURE_ADX);
1293 if (HasLeaf7 && ((EBX >> 21) & 1) && HasAVX512Save)
1294 setFeature(X86::FEATURE_AVX512IFMA);
1295 if (HasLeaf7 && ((EBX >> 23) & 1))
1296 setFeature(X86::FEATURE_CLFLUSHOPT);
1297 if (HasLeaf7 && ((EBX >> 26) & 1) && HasAVX512Save)
1298 setFeature(X86::FEATURE_AVX512PF);
1299 if (HasLeaf7 && ((EBX >> 27) & 1) && HasAVX512Save)
1300 setFeature(X86::FEATURE_AVX512ER);
1301 if (HasLeaf7 && ((EBX >> 28) & 1) && HasAVX512Save)
1302 setFeature(X86::FEATURE_AVX512CD);
1303 if (HasLeaf7 && ((EBX >> 29) & 1))
1304 setFeature(X86::FEATURE_SHA);
1305 if (HasLeaf7 && ((EBX >> 30) & 1) && HasAVX512Save)
1306 setFeature(X86::FEATURE_AVX512BW);
1307 if (HasLeaf7 && ((EBX >> 31) & 1) && HasAVX512Save)
1308 setFeature(X86::FEATURE_AVX512VL);
1309
1310 if (HasLeaf7 && ((ECX >> 1) & 1) && HasAVX512Save)
1311 setFeature(X86::FEATURE_AVX512VBMI);
1312 if (HasLeaf7 && ((ECX >> 6) & 1) && HasAVX512Save)
1313 setFeature(X86::FEATURE_AVX512VBMI2);
1314 if (HasLeaf7 && ((ECX >> 8) & 1))
1315 setFeature(X86::FEATURE_GFNI);
1316 if (HasLeaf7 && ((ECX >> 10) & 1) && HasAVX)
1317 setFeature(X86::FEATURE_VPCLMULQDQ);
1318 if (HasLeaf7 && ((ECX >> 11) & 1) && HasAVX512Save)
1319 setFeature(X86::FEATURE_AVX512VNNI);
1320 if (HasLeaf7 && ((ECX >> 12) & 1) && HasAVX512Save)
1321 setFeature(X86::FEATURE_AVX512BITALG);
1322 if (HasLeaf7 && ((ECX >> 14) & 1) && HasAVX512Save)
1323 setFeature(X86::FEATURE_AVX512VPOPCNTDQ);
1324
1325 if (HasLeaf7 && ((EDX >> 2) & 1) && HasAVX512Save)
1326 setFeature(X86::FEATURE_AVX5124VNNIW);
1327 if (HasLeaf7 && ((EDX >> 3) & 1) && HasAVX512Save)
1328 setFeature(X86::FEATURE_AVX5124FMAPS);
1329 if (HasLeaf7 && ((EDX >> 8) & 1) && HasAVX512Save)
1330 setFeature(X86::FEATURE_AVX512VP2INTERSECT);
1331
1332 // EAX from subleaf 0 is the maximum subleaf supported. Some CPUs don't
1333 // return all 0s for invalid subleaves so check the limit.
1334 bool HasLeaf7Subleaf1 =
1335 HasLeaf7 && EAX >= 1 &&
1336 !getX86CpuIDAndInfoEx(0x7, 0x1, &EAX, &EBX, &ECX, &EDX);
1337 if (HasLeaf7Subleaf1 && ((EAX >> 5) & 1) && HasAVX512Save)
1338 setFeature(X86::FEATURE_AVX512BF16);
1339
1340 unsigned MaxExtLevel;
1341 getX86CpuIDAndInfo(0x80000000, &MaxExtLevel, &EBX, &ECX, &EDX);
1342
1343 bool HasExtLeaf1 = MaxExtLevel >= 0x80000001 &&
1344 !getX86CpuIDAndInfo(0x80000001, &EAX, &EBX, &ECX, &EDX);
1345 if (HasExtLeaf1 && ((ECX >> 6) & 1))
1346 setFeature(X86::FEATURE_SSE4_A);
1347 if (HasExtLeaf1 && ((ECX >> 11) & 1))
1348 setFeature(X86::FEATURE_XOP);
1349 if (HasExtLeaf1 && ((ECX >> 16) & 1))
1350 setFeature(X86::FEATURE_FMA4);
1351
1352 if (HasExtLeaf1 && ((EDX >> 29) & 1))
1353 setFeature(X86::FEATURE_64BIT);
1354}
1355
1357 unsigned MaxLeaf = 0;
1358 const VendorSignatures Vendor = getVendorSignature(&MaxLeaf);
1359 if (Vendor == VendorSignatures::UNKNOWN)
1360 return "generic";
1361
1362 unsigned EAX = 0, EBX = 0, ECX = 0, EDX = 0;
1363 getX86CpuIDAndInfo(0x1, &EAX, &EBX, &ECX, &EDX);
1364
1365 unsigned Family = 0, Model = 0;
1366 unsigned Features[(X86::CPU_FEATURE_MAX + 31) / 32] = {0};
1367 detectX86FamilyModel(EAX, &Family, &Model);
1368 getAvailableFeatures(ECX, EDX, MaxLeaf, Features);
1369
1370 // These aren't consumed in this file, but we try to keep some source code the
1371 // same or similar to compiler-rt.
1372 unsigned Type = 0;
1373 unsigned Subtype = 0;
1374
1375 StringRef CPU;
1376
1377 if (Vendor == VendorSignatures::GENUINE_INTEL) {
1378 CPU = getIntelProcessorTypeAndSubtype(Family, Model, Features, &Type,
1379 &Subtype);
1380 } else if (Vendor == VendorSignatures::AUTHENTIC_AMD) {
1381 CPU = getAMDProcessorTypeAndSubtype(Family, Model, Features, &Type,
1382 &Subtype);
1383 }
1384
1385 if (!CPU.empty())
1386 return CPU;
1387
1388 return "generic";
1389}
1390
1391#elif defined(__APPLE__) && defined(__powerpc__)
1393 host_basic_info_data_t hostInfo;
1394 mach_msg_type_number_t infoCount;
1395
1396 infoCount = HOST_BASIC_INFO_COUNT;
1397 mach_port_t hostPort = mach_host_self();
1398 host_info(hostPort, HOST_BASIC_INFO, (host_info_t)&hostInfo,
1399 &infoCount);
1400 mach_port_deallocate(mach_task_self(), hostPort);
1401
1402 if (hostInfo.cpu_type != CPU_TYPE_POWERPC)
1403 return "generic";
1404
1405 switch (hostInfo.cpu_subtype) {
1407 return "601";
1409 return "602";
1411 return "603";
1413 return "603e";
1415 return "603ev";
1417 return "604";
1419 return "604e";
1421 return "620";
1423 return "750";
1425 return "7400";
1427 return "7450";
1429 return "970";
1430 default:;
1431 }
1432
1433 return "generic";
1434}
1435#elif defined(__linux__) && defined(__powerpc__)
1437 std::unique_ptr<llvm::MemoryBuffer> P = getProcCpuinfoContent();
1438 StringRef Content = P ? P->getBuffer() : "";
1439 return detail::getHostCPUNameForPowerPC(Content);
1440}
1441#elif defined(__linux__) && (defined(__arm__) || defined(__aarch64__))
1443 std::unique_ptr<llvm::MemoryBuffer> P = getProcCpuinfoContent();
1444 StringRef Content = P ? P->getBuffer() : "";
1445 return detail::getHostCPUNameForARM(Content);
1446}
1447#elif defined(__linux__) && defined(__s390x__)
1449 std::unique_ptr<llvm::MemoryBuffer> P = getProcCpuinfoContent();
1450 StringRef Content = P ? P->getBuffer() : "";
1451 return detail::getHostCPUNameForS390x(Content);
1452}
1453#elif defined(__MVS__)
1455 // Get pointer to Communications Vector Table (CVT).
1456 // The pointer is located at offset 16 of the Prefixed Save Area (PSA).
1457 // It is stored as 31 bit pointer and will be zero-extended to 64 bit.
1458 int *StartToCVTOffset = reinterpret_cast<int *>(0x10);
1459 // Since its stored as a 31-bit pointer, get the 4 bytes from the start
1460 // of address.
1461 int ReadValue = *StartToCVTOffset;
1462 // Explicitly clear the high order bit.
1463 ReadValue = (ReadValue & 0x7FFFFFFF);
1464 char *CVT = reinterpret_cast<char *>(ReadValue);
1465 // The model number is located in the CVT prefix at offset -6 and stored as
1466 // signless packed decimal.
1467 uint16_t Id = *(uint16_t *)&CVT[-6];
1468 // Convert number to integer.
1469 Id = decodePackedBCD<uint16_t>(Id, false);
1470 // Check for vector support. It's stored in field CVTFLAG5 (offset 244),
1471 // bit CVTVEF (X'80'). The facilities list is part of the PSA but the vector
1472 // extension can only be used if bit CVTVEF is on.
1473 bool HaveVectorSupport = CVT[244] & 0x80;
1474 return getCPUNameFromS390Model(Id, HaveVectorSupport);
1475}
1476#elif defined(__APPLE__) && (defined(__arm__) || defined(__aarch64__))
1477#define CPUFAMILY_ARM_SWIFT 0x1e2d6381
1478#define CPUFAMILY_ARM_CYCLONE 0x37a09642
1479#define CPUFAMILY_ARM_TYPHOON 0x2c91a47e
1480#define CPUFAMILY_ARM_TWISTER 0x92fb37c8
1481#define CPUFAMILY_ARM_HURRICANE 0x67ceee93
1482#define CPUFAMILY_ARM_MONSOON_MISTRAL 0xe81e7ef6
1483#define CPUFAMILY_ARM_VORTEX_TEMPEST 0x07d34b9f
1484#define CPUFAMILY_ARM_LIGHTNING_THUNDER 0x462504d2
1485#define CPUFAMILY_ARM_FIRESTORM_ICESTORM 0x1b588bb3
1486#define CPUFAMILY_ARM_BLIZZARD_AVALANCHE 0xda33d83d
1487#define CPUFAMILY_ARM_EVEREST_SAWTOOTH 0x8765edea
1488
1490 uint32_t Family;
1491 size_t Length = sizeof(Family);
1492 sysctlbyname("hw.cpufamily", &Family, &Length, NULL, 0);
1493
1494 switch (Family) {
1495 case CPUFAMILY_ARM_SWIFT:
1496 return "swift";
1497 case CPUFAMILY_ARM_CYCLONE:
1498 return "apple-a7";
1499 case CPUFAMILY_ARM_TYPHOON:
1500 return "apple-a8";
1501 case CPUFAMILY_ARM_TWISTER:
1502 return "apple-a9";
1503 case CPUFAMILY_ARM_HURRICANE:
1504 return "apple-a10";
1505 case CPUFAMILY_ARM_MONSOON_MISTRAL:
1506 return "apple-a11";
1507 case CPUFAMILY_ARM_VORTEX_TEMPEST:
1508 return "apple-a12";
1509 case CPUFAMILY_ARM_LIGHTNING_THUNDER:
1510 return "apple-a13";
1511 case CPUFAMILY_ARM_FIRESTORM_ICESTORM:
1512 return "apple-m1";
1513 case CPUFAMILY_ARM_BLIZZARD_AVALANCHE:
1514 return "apple-m2";
1515 case CPUFAMILY_ARM_EVEREST_SAWTOOTH:
1516 return "apple-m3";
1517 default:
1518 // Default to the newest CPU we know about.
1519 return "apple-m3";
1520 }
1521}
1522#elif defined(_AIX)
1524 switch (_system_configuration.implementation) {
1525 case POWER_4:
1526 if (_system_configuration.version == PV_4_3)
1527 return "970";
1528 return "pwr4";
1529 case POWER_5:
1530 if (_system_configuration.version == PV_5)
1531 return "pwr5";
1532 return "pwr5x";
1533 case POWER_6:
1534 if (_system_configuration.version == PV_6_Compat)
1535 return "pwr6";
1536 return "pwr6x";
1537 case POWER_7:
1538 return "pwr7";
1539 case POWER_8:
1540 return "pwr8";
1541 case POWER_9:
1542 return "pwr9";
1543// TODO: simplify this once the macro is available in all OS levels.
1544#ifdef POWER_10
1545 case POWER_10:
1546#else
1547 case 0x40000:
1548#endif
1549 return "pwr10";
1550 default:
1551 return "generic";
1552 }
1553}
1554#elif defined(__loongarch__)
1556 // Use processor id to detect cpu name.
1557 uint32_t processor_id;
1558 __asm__("cpucfg %[prid], $zero\n\t" : [prid] "=r"(processor_id));
1559 // Refer PRID_SERIES_MASK in linux kernel: arch/loongarch/include/asm/cpu.h.
1560 switch (processor_id & 0xf000) {
1561 case 0xc000: // Loongson 64bit, 4-issue
1562 return "la464";
1563 // TODO: Others.
1564 default:
1565 break;
1566 }
1567 return "generic";
1568}
1569#elif defined(__riscv)
1571#if defined(__linux__)
1572 std::unique_ptr<llvm::MemoryBuffer> P = getProcCpuinfoContent();
1573 StringRef Content = P ? P->getBuffer() : "";
1574 return detail::getHostCPUNameForRISCV(Content);
1575#else
1576#if __riscv_xlen == 64
1577 return "generic-rv64";
1578#elif __riscv_xlen == 32
1579 return "generic-rv32";
1580#else
1581#error "Unhandled value of __riscv_xlen"
1582#endif
1583#endif
1584}
1585#elif defined(__sparc__)
1586#if defined(__linux__)
1589 ProcCpuinfoContent.split(Lines, "\n");
1590
1591 // Look for cpu line to determine cpu name
1592 StringRef Cpu;
1593 for (unsigned I = 0, E = Lines.size(); I != E; ++I) {
1594 if (Lines[I].starts_with("cpu")) {
1595 Cpu = Lines[I].substr(5).ltrim("\t :");
1596 break;
1597 }
1598 }
1599
1600 return StringSwitch<const char *>(Cpu)
1601 .StartsWith("SuperSparc", "supersparc")
1602 .StartsWith("HyperSparc", "hypersparc")
1603 .StartsWith("SpitFire", "ultrasparc")
1604 .StartsWith("BlackBird", "ultrasparc")
1605 .StartsWith("Sabre", " ultrasparc")
1606 .StartsWith("Hummingbird", "ultrasparc")
1607 .StartsWith("Cheetah", "ultrasparc3")
1608 .StartsWith("Jalapeno", "ultrasparc3")
1609 .StartsWith("Jaguar", "ultrasparc3")
1610 .StartsWith("Panther", "ultrasparc3")
1611 .StartsWith("Serrano", "ultrasparc3")
1612 .StartsWith("UltraSparc T1", "niagara")
1613 .StartsWith("UltraSparc T2", "niagara2")
1614 .StartsWith("UltraSparc T3", "niagara3")
1615 .StartsWith("UltraSparc T4", "niagara4")
1616 .StartsWith("UltraSparc T5", "niagara4")
1617 .StartsWith("LEON", "leon3")
1618 // niagara7/m8 not supported by LLVM yet.
1619 .StartsWith("SPARC-M7", "niagara4" /* "niagara7" */)
1620 .StartsWith("SPARC-S7", "niagara4" /* "niagara7" */)
1621 .StartsWith("SPARC-M8", "niagara4" /* "m8" */)
1622 .Default("generic");
1623}
1624#endif
1625
1627#if defined(__linux__)
1628 std::unique_ptr<llvm::MemoryBuffer> P = getProcCpuinfoContent();
1629 StringRef Content = P ? P->getBuffer() : "";
1630 return detail::getHostCPUNameForSPARC(Content);
1631#elif defined(__sun__) && defined(__svr4__)
1632 char *buf = NULL;
1633 kstat_ctl_t *kc;
1634 kstat_t *ksp;
1635 kstat_named_t *brand = NULL;
1636
1637 kc = kstat_open();
1638 if (kc != NULL) {
1639 ksp = kstat_lookup(kc, const_cast<char *>("cpu_info"), -1, NULL);
1640 if (ksp != NULL && kstat_read(kc, ksp, NULL) != -1 &&
1641 ksp->ks_type == KSTAT_TYPE_NAMED)
1642 brand =
1643 (kstat_named_t *)kstat_data_lookup(ksp, const_cast<char *>("brand"));
1644 if (brand != NULL && brand->data_type == KSTAT_DATA_STRING)
1645 buf = KSTAT_NAMED_STR_PTR(brand);
1646 }
1647 kstat_close(kc);
1648
1649 return StringSwitch<const char *>(buf)
1650 .Case("TMS390S10", "supersparc") // Texas Instruments microSPARC I
1651 .Case("TMS390Z50", "supersparc") // Texas Instruments SuperSPARC I
1652 .Case("TMS390Z55",
1653 "supersparc") // Texas Instruments SuperSPARC I with SuperCache
1654 .Case("MB86904", "supersparc") // Fujitsu microSPARC II
1655 .Case("MB86907", "supersparc") // Fujitsu TurboSPARC
1656 .Case("RT623", "hypersparc") // Ross hyperSPARC
1657 .Case("RT625", "hypersparc")
1658 .Case("RT626", "hypersparc")
1659 .Case("UltraSPARC-I", "ultrasparc")
1660 .Case("UltraSPARC-II", "ultrasparc")
1661 .Case("UltraSPARC-IIe", "ultrasparc")
1662 .Case("UltraSPARC-IIi", "ultrasparc")
1663 .Case("SPARC64-III", "ultrasparc")
1664 .Case("SPARC64-IV", "ultrasparc")
1665 .Case("UltraSPARC-III", "ultrasparc3")
1666 .Case("UltraSPARC-III+", "ultrasparc3")
1667 .Case("UltraSPARC-IIIi", "ultrasparc3")
1668 .Case("UltraSPARC-IIIi+", "ultrasparc3")
1669 .Case("UltraSPARC-IV", "ultrasparc3")
1670 .Case("UltraSPARC-IV+", "ultrasparc3")
1671 .Case("SPARC64-V", "ultrasparc3")
1672 .Case("SPARC64-VI", "ultrasparc3")
1673 .Case("SPARC64-VII", "ultrasparc3")
1674 .Case("UltraSPARC-T1", "niagara")
1675 .Case("UltraSPARC-T2", "niagara2")
1676 .Case("UltraSPARC-T2", "niagara2")
1677 .Case("UltraSPARC-T2+", "niagara2")
1678 .Case("SPARC-T3", "niagara3")
1679 .Case("SPARC-T4", "niagara4")
1680 .Case("SPARC-T5", "niagara4")
1681 // niagara7/m8 not supported by LLVM yet.
1682 .Case("SPARC-M7", "niagara4" /* "niagara7" */)
1683 .Case("SPARC-S7", "niagara4" /* "niagara7" */)
1684 .Case("SPARC-M8", "niagara4" /* "m8" */)
1685 .Default("generic");
1686#else
1687 return "generic";
1688#endif
1689}
1690#else
1691StringRef sys::getHostCPUName() { return "generic"; }
1692namespace llvm {
1693namespace sys {
1694namespace detail {
1695namespace x86 {
1696
1699}
1700
1701} // namespace x86
1702} // namespace detail
1703} // namespace sys
1704} // namespace llvm
1705#endif
1706
1707#if defined(__i386__) || defined(_M_IX86) || \
1708 defined(__x86_64__) || defined(_M_X64)
1710 unsigned EAX = 0, EBX = 0, ECX = 0, EDX = 0;
1711 unsigned MaxLevel;
1712
1713 if (getX86CpuIDAndInfo(0, &MaxLevel, &EBX, &ECX, &EDX) || MaxLevel < 1)
1714 return false;
1715
1716 getX86CpuIDAndInfo(1, &EAX, &EBX, &ECX, &EDX);
1717
1718 Features["cx8"] = (EDX >> 8) & 1;
1719 Features["cmov"] = (EDX >> 15) & 1;
1720 Features["mmx"] = (EDX >> 23) & 1;
1721 Features["fxsr"] = (EDX >> 24) & 1;
1722 Features["sse"] = (EDX >> 25) & 1;
1723 Features["sse2"] = (EDX >> 26) & 1;
1724
1725 Features["sse3"] = (ECX >> 0) & 1;
1726 Features["pclmul"] = (ECX >> 1) & 1;
1727 Features["ssse3"] = (ECX >> 9) & 1;
1728 Features["cx16"] = (ECX >> 13) & 1;
1729 Features["sse4.1"] = (ECX >> 19) & 1;
1730 Features["sse4.2"] = (ECX >> 20) & 1;
1731 Features["crc32"] = Features["sse4.2"];
1732 Features["movbe"] = (ECX >> 22) & 1;
1733 Features["popcnt"] = (ECX >> 23) & 1;
1734 Features["aes"] = (ECX >> 25) & 1;
1735 Features["rdrnd"] = (ECX >> 30) & 1;
1736
1737 // If CPUID indicates support for XSAVE, XRESTORE and AVX, and XGETBV
1738 // indicates that the AVX registers will be saved and restored on context
1739 // switch, then we have full AVX support.
1740 bool HasXSave = ((ECX >> 27) & 1) && !getX86XCR0(&EAX, &EDX);
1741 bool HasAVXSave = HasXSave && ((ECX >> 28) & 1) && ((EAX & 0x6) == 0x6);
1742#if defined(__APPLE__)
1743 // Darwin lazily saves the AVX512 context on first use: trust that the OS will
1744 // save the AVX512 context if we use AVX512 instructions, even the bit is not
1745 // set right now.
1746 bool HasAVX512Save = true;
1747#else
1748 // AVX512 requires additional context to be saved by the OS.
1749 bool HasAVX512Save = HasAVXSave && ((EAX & 0xe0) == 0xe0);
1750#endif
1751 // AMX requires additional context to be saved by the OS.
1752 const unsigned AMXBits = (1 << 17) | (1 << 18);
1753 bool HasAMXSave = HasXSave && ((EAX & AMXBits) == AMXBits);
1754
1755 Features["avx"] = HasAVXSave;
1756 Features["fma"] = ((ECX >> 12) & 1) && HasAVXSave;
1757 // Only enable XSAVE if OS has enabled support for saving YMM state.
1758 Features["xsave"] = ((ECX >> 26) & 1) && HasAVXSave;
1759 Features["f16c"] = ((ECX >> 29) & 1) && HasAVXSave;
1760
1761 unsigned MaxExtLevel;
1762 getX86CpuIDAndInfo(0x80000000, &MaxExtLevel, &EBX, &ECX, &EDX);
1763
1764 bool HasExtLeaf1 = MaxExtLevel >= 0x80000001 &&
1765 !getX86CpuIDAndInfo(0x80000001, &EAX, &EBX, &ECX, &EDX);
1766 Features["sahf"] = HasExtLeaf1 && ((ECX >> 0) & 1);
1767 Features["lzcnt"] = HasExtLeaf1 && ((ECX >> 5) & 1);
1768 Features["sse4a"] = HasExtLeaf1 && ((ECX >> 6) & 1);
1769 Features["prfchw"] = HasExtLeaf1 && ((ECX >> 8) & 1);
1770 Features["xop"] = HasExtLeaf1 && ((ECX >> 11) & 1) && HasAVXSave;
1771 Features["lwp"] = HasExtLeaf1 && ((ECX >> 15) & 1);
1772 Features["fma4"] = HasExtLeaf1 && ((ECX >> 16) & 1) && HasAVXSave;
1773 Features["tbm"] = HasExtLeaf1 && ((ECX >> 21) & 1);
1774 Features["mwaitx"] = HasExtLeaf1 && ((ECX >> 29) & 1);
1775
1776 Features["64bit"] = HasExtLeaf1 && ((EDX >> 29) & 1);
1777
1778 // Miscellaneous memory related features, detected by
1779 // using the 0x80000008 leaf of the CPUID instruction
1780 bool HasExtLeaf8 = MaxExtLevel >= 0x80000008 &&
1781 !getX86CpuIDAndInfo(0x80000008, &EAX, &EBX, &ECX, &EDX);
1782 Features["clzero"] = HasExtLeaf8 && ((EBX >> 0) & 1);
1783 Features["rdpru"] = HasExtLeaf8 && ((EBX >> 4) & 1);
1784 Features["wbnoinvd"] = HasExtLeaf8 && ((EBX >> 9) & 1);
1785
1786 bool HasLeaf7 =
1787 MaxLevel >= 7 && !getX86CpuIDAndInfoEx(0x7, 0x0, &EAX, &EBX, &ECX, &EDX);
1788
1789 Features["fsgsbase"] = HasLeaf7 && ((EBX >> 0) & 1);
1790 Features["sgx"] = HasLeaf7 && ((EBX >> 2) & 1);
1791 Features["bmi"] = HasLeaf7 && ((EBX >> 3) & 1);
1792 // AVX2 is only supported if we have the OS save support from AVX.
1793 Features["avx2"] = HasLeaf7 && ((EBX >> 5) & 1) && HasAVXSave;
1794 Features["bmi2"] = HasLeaf7 && ((EBX >> 8) & 1);
1795 Features["invpcid"] = HasLeaf7 && ((EBX >> 10) & 1);
1796 Features["rtm"] = HasLeaf7 && ((EBX >> 11) & 1);
1797 // AVX512 is only supported if the OS supports the context save for it.
1798 Features["avx512f"] = HasLeaf7 && ((EBX >> 16) & 1) && HasAVX512Save;
1799 Features["avx512dq"] = HasLeaf7 && ((EBX >> 17) & 1) && HasAVX512Save;
1800 Features["rdseed"] = HasLeaf7 && ((EBX >> 18) & 1);
1801 Features["adx"] = HasLeaf7 && ((EBX >> 19) & 1);
1802 Features["avx512ifma"] = HasLeaf7 && ((EBX >> 21) & 1) && HasAVX512Save;
1803 Features["clflushopt"] = HasLeaf7 && ((EBX >> 23) & 1);
1804 Features["clwb"] = HasLeaf7 && ((EBX >> 24) & 1);
1805 Features["avx512pf"] = HasLeaf7 && ((EBX >> 26) & 1) && HasAVX512Save;
1806 Features["avx512er"] = HasLeaf7 && ((EBX >> 27) & 1) && HasAVX512Save;
1807 Features["avx512cd"] = HasLeaf7 && ((EBX >> 28) & 1) && HasAVX512Save;
1808 Features["sha"] = HasLeaf7 && ((EBX >> 29) & 1);
1809 Features["avx512bw"] = HasLeaf7 && ((EBX >> 30) & 1) && HasAVX512Save;
1810 Features["avx512vl"] = HasLeaf7 && ((EBX >> 31) & 1) && HasAVX512Save;
1811
1812 Features["prefetchwt1"] = HasLeaf7 && ((ECX >> 0) & 1);
1813 Features["avx512vbmi"] = HasLeaf7 && ((ECX >> 1) & 1) && HasAVX512Save;
1814 Features["pku"] = HasLeaf7 && ((ECX >> 4) & 1);
1815 Features["waitpkg"] = HasLeaf7 && ((ECX >> 5) & 1);
1816 Features["avx512vbmi2"] = HasLeaf7 && ((ECX >> 6) & 1) && HasAVX512Save;
1817 Features["shstk"] = HasLeaf7 && ((ECX >> 7) & 1);
1818 Features["gfni"] = HasLeaf7 && ((ECX >> 8) & 1);
1819 Features["vaes"] = HasLeaf7 && ((ECX >> 9) & 1) && HasAVXSave;
1820 Features["vpclmulqdq"] = HasLeaf7 && ((ECX >> 10) & 1) && HasAVXSave;
1821 Features["avx512vnni"] = HasLeaf7 && ((ECX >> 11) & 1) && HasAVX512Save;
1822 Features["avx512bitalg"] = HasLeaf7 && ((ECX >> 12) & 1) && HasAVX512Save;
1823 Features["avx512vpopcntdq"] = HasLeaf7 && ((ECX >> 14) & 1) && HasAVX512Save;
1824 Features["rdpid"] = HasLeaf7 && ((ECX >> 22) & 1);
1825 Features["kl"] = HasLeaf7 && ((ECX >> 23) & 1); // key locker
1826 Features["cldemote"] = HasLeaf7 && ((ECX >> 25) & 1);
1827 Features["movdiri"] = HasLeaf7 && ((ECX >> 27) & 1);
1828 Features["movdir64b"] = HasLeaf7 && ((ECX >> 28) & 1);
1829 Features["enqcmd"] = HasLeaf7 && ((ECX >> 29) & 1);
1830
1831 Features["uintr"] = HasLeaf7 && ((EDX >> 5) & 1);
1832 Features["avx512vp2intersect"] =
1833 HasLeaf7 && ((EDX >> 8) & 1) && HasAVX512Save;
1834 Features["serialize"] = HasLeaf7 && ((EDX >> 14) & 1);
1835 Features["tsxldtrk"] = HasLeaf7 && ((EDX >> 16) & 1);
1836 // There are two CPUID leafs which information associated with the pconfig
1837 // instruction:
1838 // EAX=0x7, ECX=0x0 indicates the availability of the instruction (via the 18th
1839 // bit of EDX), while the EAX=0x1b leaf returns information on the
1840 // availability of specific pconfig leafs.
1841 // The target feature here only refers to the the first of these two.
1842 // Users might need to check for the availability of specific pconfig
1843 // leaves using cpuid, since that information is ignored while
1844 // detecting features using the "-march=native" flag.
1845 // For more info, see X86 ISA docs.
1846 Features["pconfig"] = HasLeaf7 && ((EDX >> 18) & 1);
1847 Features["amx-bf16"] = HasLeaf7 && ((EDX >> 22) & 1) && HasAMXSave;
1848 Features["avx512fp16"] = HasLeaf7 && ((EDX >> 23) & 1) && HasAVX512Save;
1849 Features["amx-tile"] = HasLeaf7 && ((EDX >> 24) & 1) && HasAMXSave;
1850 Features["amx-int8"] = HasLeaf7 && ((EDX >> 25) & 1) && HasAMXSave;
1851 // EAX from subleaf 0 is the maximum subleaf supported. Some CPUs don't
1852 // return all 0s for invalid subleaves so check the limit.
1853 bool HasLeaf7Subleaf1 =
1854 HasLeaf7 && EAX >= 1 &&
1855 !getX86CpuIDAndInfoEx(0x7, 0x1, &EAX, &EBX, &ECX, &EDX);
1856 Features["sha512"] = HasLeaf7Subleaf1 && ((EAX >> 0) & 1);
1857 Features["sm3"] = HasLeaf7Subleaf1 && ((EAX >> 1) & 1);
1858 Features["sm4"] = HasLeaf7Subleaf1 && ((EAX >> 2) & 1);
1859 Features["raoint"] = HasLeaf7Subleaf1 && ((EAX >> 3) & 1);
1860 Features["avxvnni"] = HasLeaf7Subleaf1 && ((EAX >> 4) & 1) && HasAVXSave;
1861 Features["avx512bf16"] = HasLeaf7Subleaf1 && ((EAX >> 5) & 1) && HasAVX512Save;
1862 Features["amx-fp16"] = HasLeaf7Subleaf1 && ((EAX >> 21) & 1) && HasAMXSave;
1863 Features["cmpccxadd"] = HasLeaf7Subleaf1 && ((EAX >> 7) & 1);
1864 Features["hreset"] = HasLeaf7Subleaf1 && ((EAX >> 22) & 1);
1865 Features["avxifma"] = HasLeaf7Subleaf1 && ((EAX >> 23) & 1) && HasAVXSave;
1866 Features["avxvnniint8"] = HasLeaf7Subleaf1 && ((EDX >> 4) & 1) && HasAVXSave;
1867 Features["avxneconvert"] = HasLeaf7Subleaf1 && ((EDX >> 5) & 1) && HasAVXSave;
1868 Features["amx-complex"] = HasLeaf7Subleaf1 && ((EDX >> 8) & 1) && HasAMXSave;
1869 Features["avxvnniint16"] = HasLeaf7Subleaf1 && ((EDX >> 10) & 1) && HasAVXSave;
1870 Features["prefetchi"] = HasLeaf7Subleaf1 && ((EDX >> 14) & 1);
1871 Features["usermsr"] = HasLeaf7Subleaf1 && ((EDX >> 15) & 1);
1872 Features["avx10.1-256"] = HasLeaf7Subleaf1 && ((EDX >> 19) & 1);
1873 bool HasAPXF = HasLeaf7Subleaf1 && ((EDX >> 21) & 1);
1874 Features["egpr"] = HasAPXF;
1875 Features["push2pop2"] = HasAPXF;
1876 Features["ppx"] = HasAPXF;
1877 Features["ndd"] = HasAPXF;
1878 Features["ccmp"] = HasAPXF;
1879 Features["cf"] = HasAPXF;
1880
1881 bool HasLeafD = MaxLevel >= 0xd &&
1882 !getX86CpuIDAndInfoEx(0xd, 0x1, &EAX, &EBX, &ECX, &EDX);
1883
1884 // Only enable XSAVE if OS has enabled support for saving YMM state.
1885 Features["xsaveopt"] = HasLeafD && ((EAX >> 0) & 1) && HasAVXSave;
1886 Features["xsavec"] = HasLeafD && ((EAX >> 1) & 1) && HasAVXSave;
1887 Features["xsaves"] = HasLeafD && ((EAX >> 3) & 1) && HasAVXSave;
1888
1889 bool HasLeaf14 = MaxLevel >= 0x14 &&
1890 !getX86CpuIDAndInfoEx(0x14, 0x0, &EAX, &EBX, &ECX, &EDX);
1891
1892 Features["ptwrite"] = HasLeaf14 && ((EBX >> 4) & 1);
1893
1894 bool HasLeaf19 =
1895 MaxLevel >= 0x19 && !getX86CpuIDAndInfo(0x19, &EAX, &EBX, &ECX, &EDX);
1896 Features["widekl"] = HasLeaf7 && HasLeaf19 && ((EBX >> 2) & 1);
1897
1898 bool HasLeaf24 =
1899 MaxLevel >= 0x24 && !getX86CpuIDAndInfo(0x24, &EAX, &EBX, &ECX, &EDX);
1900 Features["avx10.1-512"] =
1901 Features["avx10.1-256"] && HasLeaf24 && ((EBX >> 18) & 1);
1902
1903 return true;
1904}
1905#elif defined(__linux__) && (defined(__arm__) || defined(__aarch64__))
1907 std::unique_ptr<llvm::MemoryBuffer> P = getProcCpuinfoContent();
1908 if (!P)
1909 return false;
1910
1912 P->getBuffer().split(Lines, "\n");
1913
1915
1916 // Look for the CPU features.
1917 for (unsigned I = 0, E = Lines.size(); I != E; ++I)
1918 if (Lines[I].starts_with("Features")) {
1919 Lines[I].split(CPUFeatures, ' ');
1920 break;
1921 }
1922
1923#if defined(__aarch64__)
1924 // Keep track of which crypto features we have seen
1925 enum { CAP_AES = 0x1, CAP_PMULL = 0x2, CAP_SHA1 = 0x4, CAP_SHA2 = 0x8 };
1926 uint32_t crypto = 0;
1927#endif
1928
1929 for (unsigned I = 0, E = CPUFeatures.size(); I != E; ++I) {
1930 StringRef LLVMFeatureStr = StringSwitch<StringRef>(CPUFeatures[I])
1931#if defined(__aarch64__)
1932 .Case("asimd", "neon")
1933 .Case("fp", "fp-armv8")
1934 .Case("crc32", "crc")
1935 .Case("atomics", "lse")
1936 .Case("sve", "sve")
1937 .Case("sve2", "sve2")
1938#else
1939 .Case("half", "fp16")
1940 .Case("neon", "neon")
1941 .Case("vfpv3", "vfp3")
1942 .Case("vfpv3d16", "vfp3d16")
1943 .Case("vfpv4", "vfp4")
1944 .Case("idiva", "hwdiv-arm")
1945 .Case("idivt", "hwdiv")
1946#endif
1947 .Default("");
1948
1949#if defined(__aarch64__)
1950 // We need to check crypto separately since we need all of the crypto
1951 // extensions to enable the subtarget feature
1952 if (CPUFeatures[I] == "aes")
1953 crypto |= CAP_AES;
1954 else if (CPUFeatures[I] == "pmull")
1955 crypto |= CAP_PMULL;
1956 else if (CPUFeatures[I] == "sha1")
1957 crypto |= CAP_SHA1;
1958 else if (CPUFeatures[I] == "sha2")
1959 crypto |= CAP_SHA2;
1960#endif
1961
1962 if (LLVMFeatureStr != "")
1963 Features[LLVMFeatureStr] = true;
1964 }
1965
1966#if defined(__aarch64__)
1967 // If we have all crypto bits we can add the feature
1968 if (crypto == (CAP_AES | CAP_PMULL | CAP_SHA1 | CAP_SHA2))
1969 Features["crypto"] = true;
1970#endif
1971
1972 return true;
1973}
1974#elif defined(_WIN32) && (defined(__aarch64__) || defined(_M_ARM64))
1976 if (IsProcessorFeaturePresent(PF_ARM_NEON_INSTRUCTIONS_AVAILABLE))
1977 Features["neon"] = true;
1978 if (IsProcessorFeaturePresent(PF_ARM_V8_CRC32_INSTRUCTIONS_AVAILABLE))
1979 Features["crc"] = true;
1980 if (IsProcessorFeaturePresent(PF_ARM_V8_CRYPTO_INSTRUCTIONS_AVAILABLE))
1981 Features["crypto"] = true;
1982
1983 return true;
1984}
1985#elif defined(__linux__) && defined(__loongarch__)
1986#include <sys/auxv.h>
1988 unsigned long hwcap = getauxval(AT_HWCAP);
1989 bool HasFPU = hwcap & (1UL << 3); // HWCAP_LOONGARCH_FPU
1990 uint32_t cpucfg2 = 0x2;
1991 __asm__("cpucfg %[cpucfg2], %[cpucfg2]\n\t" : [cpucfg2] "+r"(cpucfg2));
1992
1993 Features["f"] = HasFPU && (cpucfg2 & (1U << 1)); // CPUCFG.2.FP_SP
1994 Features["d"] = HasFPU && (cpucfg2 & (1U << 2)); // CPUCFG.2.FP_DP
1995
1996 Features["lsx"] = hwcap & (1UL << 4); // HWCAP_LOONGARCH_LSX
1997 Features["lasx"] = hwcap & (1UL << 5); // HWCAP_LOONGARCH_LASX
1998 Features["lvz"] = hwcap & (1UL << 9); // HWCAP_LOONGARCH_LVZ
1999
2000 return true;
2001}
2002#else
2003bool sys::getHostCPUFeatures(StringMap<bool> &Features) { return false; }
2004#endif
2005
2006#if __APPLE__
2007/// \returns the \p triple, but with the Host's arch spliced in.
2008static Triple withHostArch(Triple T) {
2009#if defined(__arm__)
2010 T.setArch(Triple::arm);
2011 T.setArchName("arm");
2012#elif defined(__arm64e__)
2014 T.setArchName("arm64e");
2015#elif defined(__aarch64__)
2016 T.setArch(Triple::aarch64);
2017 T.setArchName("arm64");
2018#elif defined(__x86_64h__)
2019 T.setArch(Triple::x86_64);
2020 T.setArchName("x86_64h");
2021#elif defined(__x86_64__)
2022 T.setArch(Triple::x86_64);
2023 T.setArchName("x86_64");
2024#elif defined(__i386__)
2025 T.setArch(Triple::x86);
2026 T.setArchName("i386");
2027#elif defined(__powerpc__)
2028 T.setArch(Triple::ppc);
2029 T.setArchName("powerpc");
2030#else
2031# error "Unimplemented host arch fixup"
2032#endif
2033 return T;
2034}
2035#endif
2036
2038 std::string TargetTripleString = updateTripleOSVersion(LLVM_HOST_TRIPLE);
2039 Triple PT(Triple::normalize(TargetTripleString));
2040
2041#if __APPLE__
2042 /// In Universal builds, LLVM_HOST_TRIPLE will have the wrong arch in one of
2043 /// the slices. This fixes that up.
2044 PT = withHostArch(PT);
2045#endif
2046
2047 if (sizeof(void *) == 8 && PT.isArch32Bit())
2048 PT = PT.get64BitArchVariant();
2049 if (sizeof(void *) == 4 && PT.isArch64Bit())
2050 PT = PT.get32BitArchVariant();
2051
2052 return PT.str();
2053}
2054
2056#if LLVM_VERSION_PRINTER_SHOW_HOST_TARGET_INFO
2057 std::string CPU = std::string(sys::getHostCPUName());
2058 if (CPU == "generic")
2059 CPU = "(unknown)";
2060 OS << " Default target: " << sys::getDefaultTargetTriple() << '\n'
2061 << " Host CPU: " << CPU << '\n';
2062#endif
2063}
This file defines the StringMap class.
#define LLVM_ATTRIBUTE_UNUSED
Definition: Compiler.h:203
Given that RA is a live value
T Content
static std::unique_ptr< llvm::MemoryBuffer > LLVM_ATTRIBUTE_UNUSED getProcCpuinfoContent()
Definition: Host.cpp:65
#define F(x, y, z)
Definition: MD5.cpp:55
#define I(x, y, z)
Definition: MD5.cpp:58
#define P(N)
raw_pwrite_stream & OS
This file defines the SmallVector class.
This file implements the StringSwitch template, which mimics a switch() statement whose cases are str...
DEMANGLE_NAMESPACE_BEGIN bool starts_with(std::string_view self, char C) noexcept
Represents either an error or a value T.
Definition: ErrorOr.h:56
static ErrorOr< std::unique_ptr< MemoryBuffer > > getFileAsStream(const Twine &Filename)
Read all of the specified file into a MemoryBuffer as a stream (i.e.
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1209
StringMap - This is an unconventional map that is specialized for handling keys that are "strings",...
Definition: StringMap.h:127
StringRef - Represent a constant reference to a string, i.e.
Definition: StringRef.h:50
std::pair< StringRef, StringRef > split(char Separator) const
Split into two substrings around the first occurrence of a separator character.
Definition: StringRef.h:696
constexpr bool empty() const
empty - Check if the string is empty.
Definition: StringRef.h:134
iterator begin() const
Definition: StringRef.h:111
iterator end() const
Definition: StringRef.h:113
bool ends_with(StringRef Suffix) const
Check if this string ends with the given Suffix.
Definition: StringRef.h:271
static constexpr size_t npos
Definition: StringRef.h:52
A switch()-like statement whose cases are string literals.
Definition: StringSwitch.h:44
StringSwitch & Case(StringLiteral S, T Value)
Definition: StringSwitch.h:69
R Default(T Value)
Definition: StringSwitch.h:182
StringSwitch & StartsWith(StringLiteral S, T Value)
Definition: StringSwitch.h:83
Triple - Helper class for working with autoconf configuration names.
Definition: Triple.h:44
llvm::Triple get32BitArchVariant() const
Form a triple with a 32-bit variant of the current architecture.
Definition: Triple.cpp:1550
std::string normalize() const
Return the normalized form of this triple's string.
Definition: Triple.h:354
llvm::Triple get64BitArchVariant() const
Form a triple with a 64-bit variant of the current architecture.
Definition: Triple.cpp:1631
const std::string & str() const
Definition: Triple.h:424
bool isArch64Bit() const
Test whether the architecture is 64-bit.
Definition: Triple.cpp:1538
@ AArch64SubArch_arm64e
Definition: Triple.h:149
bool isArch32Bit() const
Test whether the architecture is 32-bit.
Definition: Triple.cpp:1542
The instances of the Type class are immutable: once they are created, they are never changed.
Definition: Type.h:45
This class implements an extremely fast bulk output stream that can only output to a stream.
Definition: raw_ostream.h:52
@ CPU_SUBTYPE_POWERPC_970
Definition: MachO.h:1663
@ CPU_SUBTYPE_POWERPC_604e
Definition: MachO.h:1658
@ CPU_SUBTYPE_POWERPC_603e
Definition: MachO.h:1655
@ CPU_SUBTYPE_POWERPC_7400
Definition: MachO.h:1661
@ CPU_SUBTYPE_POWERPC_604
Definition: MachO.h:1657
@ CPU_SUBTYPE_POWERPC_750
Definition: MachO.h:1660
@ CPU_SUBTYPE_POWERPC_601
Definition: MachO.h:1652
@ CPU_SUBTYPE_POWERPC_620
Definition: MachO.h:1659
@ CPU_SUBTYPE_POWERPC_603ev
Definition: MachO.h:1656
@ CPU_SUBTYPE_POWERPC_603
Definition: MachO.h:1654
@ CPU_SUBTYPE_POWERPC_7450
Definition: MachO.h:1662
@ CPU_SUBTYPE_POWERPC_602
Definition: MachO.h:1653
Helper functions to extract CPU details from CPUID on x86.
Definition: Host.h:72
VendorSignatures getVendorSignature(unsigned *MaxLeaf=nullptr)
Returns the host CPU's vendor.
Definition: Host.cpp:1697
StringRef getHostCPUNameForS390x(StringRef ProcCpuinfoContent)
Definition: Host.cpp:385
StringRef getHostCPUNameForPowerPC(StringRef ProcCpuinfoContent)
Helper functions to extract HostCPUName from /proc/cpuinfo on linux.
Definition: Host.cpp:76
StringRef getHostCPUNameForBPF()
Definition: Host.cpp:450
StringRef getHostCPUNameForARM(StringRef ProcCpuinfoContent)
Definition: Host.cpp:159
StringRef getHostCPUNameForRISCV(StringRef ProcCpuinfoContent)
Definition: Host.cpp:430
StringRef getHostCPUNameForSPARC(StringRef ProcCpuinfoContent)
StringRef getHostCPUName()
getHostCPUName - Get the LLVM name for the host CPU.
Definition: Host.cpp:1691
void printDefaultTargetAndDetectedCPU(raw_ostream &OS)
This is a function compatible with cl::AddExtraVersionPrinter, which adds info about the current targ...
Definition: Host.cpp:2055
bool getHostCPUFeatures(StringMap< bool, MallocAllocator > &Features)
getHostCPUFeatures - Get the LLVM names for the host CPU features.
std::string getProcessTriple()
getProcessTriple() - Return an appropriate target triple for generating code to be loaded into the cu...
Definition: Host.cpp:2037
std::string getDefaultTargetTriple()
getDefaultTargetTriple() - Return the default target triple the compiler has been configured to produ...
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18
@ Length
Definition: DWP.cpp:456
raw_fd_ostream & errs()
This returns a reference to a raw_ostream for standard error.