blob: 2fb0c254165241a7f6b17444a10fee75b3d0f619 [file] [log] [blame]
Simon Pilgrima271c542017-05-03 15:42:29 +00001//===-- Host.cpp - Implement OS Host Concept --------------------*- C++ -*-===//
2//
Chandler Carruth2946cd72019-01-19 08:50:56 +00003// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
Simon Pilgrima271c542017-05-03 15:42:29 +00006//
7//===----------------------------------------------------------------------===//
8//
9// This file implements the operating system Host concept.
10//
11//===----------------------------------------------------------------------===//
12
13#include "llvm/Support/Host.h"
Craig Topperc77d00e2017-11-10 17:10:57 +000014#include "llvm/Support/TargetParser.h"
Simon Pilgrima271c542017-05-03 15:42:29 +000015#include "llvm/ADT/SmallSet.h"
16#include "llvm/ADT/SmallVector.h"
17#include "llvm/ADT/StringRef.h"
18#include "llvm/ADT/StringSwitch.h"
19#include "llvm/ADT/Triple.h"
Nico Weber432a3882018-04-30 14:59:11 +000020#include "llvm/Config/llvm-config.h"
Simon Pilgrima271c542017-05-03 15:42:29 +000021#include "llvm/Support/Debug.h"
22#include "llvm/Support/FileSystem.h"
23#include "llvm/Support/MemoryBuffer.h"
24#include "llvm/Support/raw_ostream.h"
25#include <assert.h>
26#include <string.h>
27
28// Include the platform-specific parts of this class.
29#ifdef LLVM_ON_UNIX
30#include "Unix/Host.inc"
31#endif
Nico Weber712e8d22018-04-29 00:45:03 +000032#ifdef _WIN32
Simon Pilgrima271c542017-05-03 15:42:29 +000033#include "Windows/Host.inc"
34#endif
35#ifdef _MSC_VER
36#include <intrin.h>
37#endif
Chris Bieneman34688fa2019-10-30 12:50:04 -070038#if defined(__APPLE__) && (!defined(__x86_64__))
Simon Pilgrima271c542017-05-03 15:42:29 +000039#include <mach/host_info.h>
40#include <mach/mach.h>
41#include <mach/mach_host.h>
42#include <mach/machine.h>
43#endif
44
45#define DEBUG_TYPE "host-detection"
46
47//===----------------------------------------------------------------------===//
48//
49// Implementations of the CPU detection routines
50//
51//===----------------------------------------------------------------------===//
52
53using namespace llvm;
54
55static std::unique_ptr<llvm::MemoryBuffer>
56 LLVM_ATTRIBUTE_UNUSED getProcCpuinfoContent() {
57 llvm::ErrorOr<std::unique_ptr<llvm::MemoryBuffer>> Text =
58 llvm::MemoryBuffer::getFileAsStream("/proc/cpuinfo");
59 if (std::error_code EC = Text.getError()) {
60 llvm::errs() << "Can't read "
61 << "/proc/cpuinfo: " << EC.message() << "\n";
62 return nullptr;
63 }
64 return std::move(*Text);
65}
66
Craig Topper8665f592018-03-07 17:53:16 +000067StringRef sys::detail::getHostCPUNameForPowerPC(StringRef ProcCpuinfoContent) {
Simon Pilgrima271c542017-05-03 15:42:29 +000068 // Access to the Processor Version Register (PVR) on PowerPC is privileged,
69 // and so we must use an operating-system interface to determine the current
70 // processor type. On Linux, this is exposed through the /proc/cpuinfo file.
71 const char *generic = "generic";
72
73 // The cpu line is second (after the 'processor: 0' line), so if this
74 // buffer is too small then something has changed (or is wrong).
75 StringRef::const_iterator CPUInfoStart = ProcCpuinfoContent.begin();
76 StringRef::const_iterator CPUInfoEnd = ProcCpuinfoContent.end();
77
78 StringRef::const_iterator CIP = CPUInfoStart;
79
80 StringRef::const_iterator CPUStart = 0;
81 size_t CPULen = 0;
82
83 // We need to find the first line which starts with cpu, spaces, and a colon.
84 // After the colon, there may be some additional spaces and then the cpu type.
85 while (CIP < CPUInfoEnd && CPUStart == 0) {
86 if (CIP < CPUInfoEnd && *CIP == '\n')
87 ++CIP;
88
89 if (CIP < CPUInfoEnd && *CIP == 'c') {
90 ++CIP;
91 if (CIP < CPUInfoEnd && *CIP == 'p') {
92 ++CIP;
93 if (CIP < CPUInfoEnd && *CIP == 'u') {
94 ++CIP;
95 while (CIP < CPUInfoEnd && (*CIP == ' ' || *CIP == '\t'))
96 ++CIP;
97
98 if (CIP < CPUInfoEnd && *CIP == ':') {
99 ++CIP;
100 while (CIP < CPUInfoEnd && (*CIP == ' ' || *CIP == '\t'))
101 ++CIP;
102
103 if (CIP < CPUInfoEnd) {
104 CPUStart = CIP;
105 while (CIP < CPUInfoEnd && (*CIP != ' ' && *CIP != '\t' &&
106 *CIP != ',' && *CIP != '\n'))
107 ++CIP;
108 CPULen = CIP - CPUStart;
109 }
110 }
111 }
112 }
113 }
114
115 if (CPUStart == 0)
116 while (CIP < CPUInfoEnd && *CIP != '\n')
117 ++CIP;
118 }
119
120 if (CPUStart == 0)
121 return generic;
122
123 return StringSwitch<const char *>(StringRef(CPUStart, CPULen))
124 .Case("604e", "604e")
125 .Case("604", "604")
126 .Case("7400", "7400")
127 .Case("7410", "7400")
128 .Case("7447", "7400")
129 .Case("7455", "7450")
130 .Case("G4", "g4")
131 .Case("POWER4", "970")
132 .Case("PPC970FX", "970")
133 .Case("PPC970MP", "970")
134 .Case("G5", "g5")
135 .Case("POWER5", "g5")
136 .Case("A2", "a2")
137 .Case("POWER6", "pwr6")
138 .Case("POWER7", "pwr7")
139 .Case("POWER8", "pwr8")
140 .Case("POWER8E", "pwr8")
141 .Case("POWER8NVL", "pwr8")
142 .Case("POWER9", "pwr9")
Stefan Pintiliedcceab12019-11-27 12:50:23 -0600143 // FIXME: If we get a simulator or machine with the capabilities of
144 // mcpu=future, we should revisit this and add the name reported by the
145 // simulator/machine.
Simon Pilgrima271c542017-05-03 15:42:29 +0000146 .Default(generic);
147}
148
Craig Topper8665f592018-03-07 17:53:16 +0000149StringRef sys::detail::getHostCPUNameForARM(StringRef ProcCpuinfoContent) {
Simon Pilgrima271c542017-05-03 15:42:29 +0000150 // The cpuid register on arm is not accessible from user space. On Linux,
151 // it is exposed through the /proc/cpuinfo file.
152
153 // Read 32 lines from /proc/cpuinfo, which should contain the CPU part line
154 // in all cases.
155 SmallVector<StringRef, 32> Lines;
156 ProcCpuinfoContent.split(Lines, "\n");
157
158 // Look for the CPU implementer line.
159 StringRef Implementer;
160 StringRef Hardware;
161 for (unsigned I = 0, E = Lines.size(); I != E; ++I) {
162 if (Lines[I].startswith("CPU implementer"))
163 Implementer = Lines[I].substr(15).ltrim("\t :");
164 if (Lines[I].startswith("Hardware"))
165 Hardware = Lines[I].substr(8).ltrim("\t :");
166 }
167
168 if (Implementer == "0x41") { // ARM Ltd.
169 // MSM8992/8994 may give cpu part for the core that the kernel is running on,
170 // which is undeterministic and wrong. Always return cortex-a53 for these SoC.
171 if (Hardware.endswith("MSM8994") || Hardware.endswith("MSM8996"))
172 return "cortex-a53";
173
174
175 // Look for the CPU part line.
176 for (unsigned I = 0, E = Lines.size(); I != E; ++I)
177 if (Lines[I].startswith("CPU part"))
178 // The CPU part is a 3 digit hexadecimal number with a 0x prefix. The
179 // values correspond to the "Part number" in the CP15/c0 register. The
180 // contents are specified in the various processor manuals.
Luke Geeson4518aab2020-02-11 16:57:25 +0000181 // This corresponds to the Main ID Register in Technical Reference Manuals.
182 // and is used in programs like sys-utils
Simon Pilgrima271c542017-05-03 15:42:29 +0000183 return StringSwitch<const char *>(Lines[I].substr(8).ltrim("\t :"))
184 .Case("0x926", "arm926ej-s")
185 .Case("0xb02", "mpcore")
186 .Case("0xb36", "arm1136j-s")
187 .Case("0xb56", "arm1156t2-s")
188 .Case("0xb76", "arm1176jz-s")
189 .Case("0xc08", "cortex-a8")
190 .Case("0xc09", "cortex-a9")
191 .Case("0xc0f", "cortex-a15")
192 .Case("0xc20", "cortex-m0")
193 .Case("0xc23", "cortex-m3")
194 .Case("0xc24", "cortex-m4")
Luke Geeson7d594cf2020-02-14 13:33:32 +0000195 .Case("0xd22", "cortex-m55")
Luke Geeson4518aab2020-02-11 16:57:25 +0000196 .Case("0xd02", "cortex-a34")
Simon Pilgrima271c542017-05-03 15:42:29 +0000197 .Case("0xd04", "cortex-a35")
198 .Case("0xd03", "cortex-a53")
199 .Case("0xd07", "cortex-a57")
200 .Case("0xd08", "cortex-a72")
201 .Case("0xd09", "cortex-a73")
Yi Kong432f48f2019-06-11 00:05:36 +0000202 .Case("0xd0a", "cortex-a75")
203 .Case("0xd0b", "cortex-a76")
Simon Pilgrima271c542017-05-03 15:42:29 +0000204 .Default("generic");
205 }
206
Joel Jones0a6c0002018-10-05 22:23:21 +0000207 if (Implementer == "0x42" || Implementer == "0x43") { // Broadcom | Cavium.
208 for (unsigned I = 0, E = Lines.size(); I != E; ++I) {
209 if (Lines[I].startswith("CPU part")) {
210 return StringSwitch<const char *>(Lines[I].substr(8).ltrim("\t :"))
211 .Case("0x516", "thunderx2t99")
212 .Case("0x0516", "thunderx2t99")
213 .Case("0xaf", "thunderx2t99")
214 .Case("0x0af", "thunderx2t99")
215 .Case("0xa1", "thunderxt88")
216 .Case("0x0a1", "thunderxt88")
217 .Default("generic");
218 }
219 }
220 }
221
KAWASHIMA Takahiroc8cd1a92020-03-03 21:52:27 +0900222 if (Implementer == "0x46") { // Fujitsu Ltd.
223 for (unsigned I = 0, E = Lines.size(); I != E; ++I) {
224 if (Lines[I].startswith("CPU part")) {
225 return StringSwitch<const char *>(Lines[I].substr(8).ltrim("\t :"))
226 .Case("0x001", "a64fx")
227 .Default("generic");
228 }
229 }
230 }
231
Bryan Chan12355392018-11-09 19:32:08 +0000232 if (Implementer == "0x48") // HiSilicon Technologies, Inc.
233 // Look for the CPU part line.
234 for (unsigned I = 0, E = Lines.size(); I != E; ++I)
235 if (Lines[I].startswith("CPU part"))
236 // The CPU part is a 3 digit hexadecimal number with a 0x prefix. The
237 // values correspond to the "Part number" in the CP15/c0 register. The
238 // contents are specified in the various processor manuals.
239 return StringSwitch<const char *>(Lines[I].substr(8).ltrim("\t :"))
240 .Case("0xd01", "tsv110")
241 .Default("generic");
242
Simon Pilgrima271c542017-05-03 15:42:29 +0000243 if (Implementer == "0x51") // Qualcomm Technologies, Inc.
244 // Look for the CPU part line.
245 for (unsigned I = 0, E = Lines.size(); I != E; ++I)
246 if (Lines[I].startswith("CPU part"))
247 // The CPU part is a 3 digit hexadecimal number with a 0x prefix. The
248 // values correspond to the "Part number" in the CP15/c0 register. The
249 // contents are specified in the various processor manuals.
250 return StringSwitch<const char *>(Lines[I].substr(8).ltrim("\t :"))
251 .Case("0x06f", "krait") // APQ8064
252 .Case("0x201", "kryo")
253 .Case("0x205", "kryo")
Eli Friedmanbde9fc72017-09-13 21:48:00 +0000254 .Case("0x211", "kryo")
255 .Case("0x800", "cortex-a73")
256 .Case("0x801", "cortex-a73")
Yi Kong432f48f2019-06-11 00:05:36 +0000257 .Case("0x802", "cortex-a73")
258 .Case("0x803", "cortex-a73")
259 .Case("0x804", "cortex-a73")
260 .Case("0x805", "cortex-a73")
Balaram Makama1e7ecc72017-09-22 17:46:36 +0000261 .Case("0xc00", "falkor")
Chad Rosier71070852017-09-25 14:05:00 +0000262 .Case("0xc01", "saphira")
Simon Pilgrima271c542017-05-03 15:42:29 +0000263 .Default("generic");
264
Evandro Menezes5d7a9e62017-12-08 21:09:59 +0000265 if (Implementer == "0x53") { // Samsung Electronics Co., Ltd.
266 // The Exynos chips have a convoluted ID scheme that doesn't seem to follow
267 // any predictive pattern across variants and parts.
268 unsigned Variant = 0, Part = 0;
269
270 // Look for the CPU variant line, whose value is a 1 digit hexadecimal
271 // number, corresponding to the Variant bits in the CP15/C0 register.
272 for (auto I : Lines)
273 if (I.consume_front("CPU variant"))
274 I.ltrim("\t :").getAsInteger(0, Variant);
275
276 // Look for the CPU part line, whose value is a 3 digit hexadecimal
277 // number, corresponding to the PartNum bits in the CP15/C0 register.
278 for (auto I : Lines)
279 if (I.consume_front("CPU part"))
280 I.ltrim("\t :").getAsInteger(0, Part);
281
282 unsigned Exynos = (Variant << 12) | Part;
283 switch (Exynos) {
284 default:
Evandro Menezes215da662019-10-02 16:26:40 -0500285 // Default by falling through to Exynos M3.
Evandro Menezes5d7a9e62017-12-08 21:09:59 +0000286 LLVM_FALLTHROUGH;
Evandro Menezes215da662019-10-02 16:26:40 -0500287 case 0x1002:
288 return "exynos-m3";
289 case 0x1003:
290 return "exynos-m4";
Evandro Menezes5d7a9e62017-12-08 21:09:59 +0000291 }
292 }
293
Simon Pilgrima271c542017-05-03 15:42:29 +0000294 return "generic";
295}
296
Craig Topper8665f592018-03-07 17:53:16 +0000297StringRef sys::detail::getHostCPUNameForS390x(StringRef ProcCpuinfoContent) {
Simon Pilgrima271c542017-05-03 15:42:29 +0000298 // STIDP is a privileged operation, so use /proc/cpuinfo instead.
299
300 // The "processor 0:" line comes after a fair amount of other information,
301 // including a cache breakdown, but this should be plenty.
302 SmallVector<StringRef, 32> Lines;
303 ProcCpuinfoContent.split(Lines, "\n");
304
305 // Look for the CPU features.
306 SmallVector<StringRef, 32> CPUFeatures;
307 for (unsigned I = 0, E = Lines.size(); I != E; ++I)
308 if (Lines[I].startswith("features")) {
309 size_t Pos = Lines[I].find(":");
310 if (Pos != StringRef::npos) {
311 Lines[I].drop_front(Pos + 1).split(CPUFeatures, ' ');
312 break;
313 }
314 }
315
316 // We need to check for the presence of vector support independently of
317 // the machine type, since we may only use the vector register set when
318 // supported by the kernel (and hypervisor).
319 bool HaveVectorSupport = false;
320 for (unsigned I = 0, E = CPUFeatures.size(); I != E; ++I) {
321 if (CPUFeatures[I] == "vx")
322 HaveVectorSupport = true;
323 }
324
325 // Now check the processor machine type.
326 for (unsigned I = 0, E = Lines.size(); I != E; ++I) {
327 if (Lines[I].startswith("processor ")) {
328 size_t Pos = Lines[I].find("machine = ");
329 if (Pos != StringRef::npos) {
330 Pos += sizeof("machine = ") - 1;
331 unsigned int Id;
332 if (!Lines[I].drop_front(Pos).getAsInteger(10, Id)) {
Ulrich Weigand0f0a8b72019-07-12 18:13:16 +0000333 if (Id >= 8561 && HaveVectorSupport)
Ulrich Weigand819c1652019-09-20 23:04:45 +0000334 return "z15";
Ulrich Weigand2b3482f2017-07-17 17:41:11 +0000335 if (Id >= 3906 && HaveVectorSupport)
336 return "z14";
Simon Pilgrima271c542017-05-03 15:42:29 +0000337 if (Id >= 2964 && HaveVectorSupport)
338 return "z13";
339 if (Id >= 2827)
340 return "zEC12";
341 if (Id >= 2817)
342 return "z196";
343 }
344 }
345 break;
346 }
347 }
348
349 return "generic";
350}
351
Yonghong Songdc1dbf62017-08-23 04:25:57 +0000352StringRef sys::detail::getHostCPUNameForBPF() {
353#if !defined(__linux__) || !defined(__x86_64__)
354 return "generic";
355#else
Jiong Wang66b18e52019-02-07 10:43:09 +0000356 uint8_t v3_insns[40] __attribute__ ((aligned (8))) =
357 /* BPF_MOV64_IMM(BPF_REG_0, 0) */
358 { 0xb7, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0,
359 /* BPF_MOV64_IMM(BPF_REG_2, 1) */
360 0xb7, 0x2, 0x0, 0x0, 0x1, 0x0, 0x0, 0x0,
361 /* BPF_JMP32_REG(BPF_JLT, BPF_REG_0, BPF_REG_2, 1) */
362 0xae, 0x20, 0x1, 0x0, 0x0, 0x0, 0x0, 0x0,
363 /* BPF_MOV64_IMM(BPF_REG_0, 1) */
364 0xb7, 0x0, 0x0, 0x0, 0x1, 0x0, 0x0, 0x0,
365 /* BPF_EXIT_INSN() */
366 0x95, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0 };
367
368 uint8_t v2_insns[40] __attribute__ ((aligned (8))) =
Yonghong Songdc1dbf62017-08-23 04:25:57 +0000369 /* BPF_MOV64_IMM(BPF_REG_0, 0) */
370 { 0xb7, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0,
371 /* BPF_MOV64_IMM(BPF_REG_2, 1) */
372 0xb7, 0x2, 0x0, 0x0, 0x1, 0x0, 0x0, 0x0,
373 /* BPF_JMP_REG(BPF_JLT, BPF_REG_0, BPF_REG_2, 1) */
374 0xad, 0x20, 0x1, 0x0, 0x0, 0x0, 0x0, 0x0,
375 /* BPF_MOV64_IMM(BPF_REG_0, 1) */
376 0xb7, 0x0, 0x0, 0x0, 0x1, 0x0, 0x0, 0x0,
377 /* BPF_EXIT_INSN() */
378 0x95, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0 };
379
380 struct bpf_prog_load_attr {
381 uint32_t prog_type;
382 uint32_t insn_cnt;
383 uint64_t insns;
384 uint64_t license;
385 uint32_t log_level;
386 uint32_t log_size;
387 uint64_t log_buf;
388 uint32_t kern_version;
389 uint32_t prog_flags;
390 } attr = {};
391 attr.prog_type = 1; /* BPF_PROG_TYPE_SOCKET_FILTER */
392 attr.insn_cnt = 5;
Jiong Wang66b18e52019-02-07 10:43:09 +0000393 attr.insns = (uint64_t)v3_insns;
Yonghong Songdc1dbf62017-08-23 04:25:57 +0000394 attr.license = (uint64_t)"DUMMY";
395
Jiong Wang66b18e52019-02-07 10:43:09 +0000396 int fd = syscall(321 /* __NR_bpf */, 5 /* BPF_PROG_LOAD */, &attr,
397 sizeof(attr));
398 if (fd >= 0) {
399 close(fd);
400 return "v3";
401 }
402
403 /* Clear the whole attr in case its content changed by syscall. */
404 memset(&attr, 0, sizeof(attr));
405 attr.prog_type = 1; /* BPF_PROG_TYPE_SOCKET_FILTER */
406 attr.insn_cnt = 5;
407 attr.insns = (uint64_t)v2_insns;
408 attr.license = (uint64_t)"DUMMY";
409 fd = syscall(321 /* __NR_bpf */, 5 /* BPF_PROG_LOAD */, &attr, sizeof(attr));
Yonghong Songc6d25712017-08-23 16:24:31 +0000410 if (fd >= 0) {
411 close(fd);
412 return "v2";
413 }
414 return "v1";
Yonghong Songdc1dbf62017-08-23 04:25:57 +0000415#endif
416}
417
Simon Pilgrima271c542017-05-03 15:42:29 +0000418#if defined(__i386__) || defined(_M_IX86) || \
419 defined(__x86_64__) || defined(_M_X64)
420
421enum VendorSignatures {
422 SIG_INTEL = 0x756e6547 /* Genu */,
423 SIG_AMD = 0x68747541 /* Auth */
424};
425
Simon Pilgrima271c542017-05-03 15:42:29 +0000426// The check below for i386 was copied from clang's cpuid.h (__get_cpuid_max).
427// Check motivated by bug reports for OpenSSL crashing on CPUs without CPUID
428// support. Consequently, for i386, the presence of CPUID is checked first
429// via the corresponding eflags bit.
430// Removal of cpuid.h header motivated by PR30384
431// Header cpuid.h and method __get_cpuid_max are not used in llvm, clang, openmp
432// or test-suite, but are used in external projects e.g. libstdcxx
433static bool isCpuIdSupported() {
434#if defined(__GNUC__) || defined(__clang__)
435#if defined(__i386__)
436 int __cpuid_supported;
437 __asm__(" pushfl\n"
438 " popl %%eax\n"
439 " movl %%eax,%%ecx\n"
440 " xorl $0x00200000,%%eax\n"
441 " pushl %%eax\n"
442 " popfl\n"
443 " pushfl\n"
444 " popl %%eax\n"
445 " movl $0,%0\n"
446 " cmpl %%eax,%%ecx\n"
447 " je 1f\n"
448 " movl $1,%0\n"
449 "1:"
450 : "=r"(__cpuid_supported)
451 :
452 : "eax", "ecx");
453 if (!__cpuid_supported)
454 return false;
455#endif
456 return true;
457#endif
458 return true;
459}
460
461/// getX86CpuIDAndInfo - Execute the specified cpuid and return the 4 values in
462/// the specified arguments. If we can't run cpuid on the host, return true.
463static bool getX86CpuIDAndInfo(unsigned value, unsigned *rEAX, unsigned *rEBX,
464 unsigned *rECX, unsigned *rEDX) {
Simon Pilgrima271c542017-05-03 15:42:29 +0000465#if defined(__GNUC__) || defined(__clang__)
466#if defined(__x86_64__)
467 // gcc doesn't know cpuid would clobber ebx/rbx. Preserve it manually.
468 // FIXME: should we save this for Clang?
469 __asm__("movq\t%%rbx, %%rsi\n\t"
470 "cpuid\n\t"
471 "xchgq\t%%rbx, %%rsi\n\t"
472 : "=a"(*rEAX), "=S"(*rEBX), "=c"(*rECX), "=d"(*rEDX)
473 : "a"(value));
Craig Topper1efd10a2017-07-10 06:04:11 +0000474 return false;
Simon Pilgrima271c542017-05-03 15:42:29 +0000475#elif defined(__i386__)
476 __asm__("movl\t%%ebx, %%esi\n\t"
477 "cpuid\n\t"
478 "xchgl\t%%ebx, %%esi\n\t"
479 : "=a"(*rEAX), "=S"(*rEBX), "=c"(*rECX), "=d"(*rEDX)
480 : "a"(value));
Craig Topper1efd10a2017-07-10 06:04:11 +0000481 return false;
Simon Pilgrima271c542017-05-03 15:42:29 +0000482#else
Craig Topper1efd10a2017-07-10 06:04:11 +0000483 return true;
Simon Pilgrima271c542017-05-03 15:42:29 +0000484#endif
485#elif defined(_MSC_VER)
486 // The MSVC intrinsic is portable across x86 and x64.
487 int registers[4];
488 __cpuid(registers, value);
489 *rEAX = registers[0];
490 *rEBX = registers[1];
491 *rECX = registers[2];
492 *rEDX = registers[3];
Simon Pilgrima271c542017-05-03 15:42:29 +0000493 return false;
494#else
495 return true;
496#endif
497}
498
499/// getX86CpuIDAndInfoEx - Execute the specified cpuid with subleaf and return
500/// the 4 values in the specified arguments. If we can't run cpuid on the host,
501/// return true.
502static bool getX86CpuIDAndInfoEx(unsigned value, unsigned subleaf,
503 unsigned *rEAX, unsigned *rEBX, unsigned *rECX,
504 unsigned *rEDX) {
Simon Pilgrima271c542017-05-03 15:42:29 +0000505#if defined(__GNUC__) || defined(__clang__)
Craig Topper828cf302017-07-17 05:16:16 +0000506#if defined(__x86_64__)
Craig Topperada983a2017-07-10 06:09:22 +0000507 // gcc doesn't know cpuid would clobber ebx/rbx. Preserve it manually.
Simon Pilgrima271c542017-05-03 15:42:29 +0000508 // FIXME: should we save this for Clang?
509 __asm__("movq\t%%rbx, %%rsi\n\t"
510 "cpuid\n\t"
511 "xchgq\t%%rbx, %%rsi\n\t"
512 : "=a"(*rEAX), "=S"(*rEBX), "=c"(*rECX), "=d"(*rEDX)
513 : "a"(value), "c"(subleaf));
Craig Topper1efd10a2017-07-10 06:04:11 +0000514 return false;
Craig Topper828cf302017-07-17 05:16:16 +0000515#elif defined(__i386__)
516 __asm__("movl\t%%ebx, %%esi\n\t"
517 "cpuid\n\t"
518 "xchgl\t%%ebx, %%esi\n\t"
519 : "=a"(*rEAX), "=S"(*rEBX), "=c"(*rECX), "=d"(*rEDX)
520 : "a"(value), "c"(subleaf));
521 return false;
522#else
523 return true;
524#endif
Simon Pilgrima271c542017-05-03 15:42:29 +0000525#elif defined(_MSC_VER)
526 int registers[4];
527 __cpuidex(registers, value, subleaf);
528 *rEAX = registers[0];
529 *rEBX = registers[1];
530 *rECX = registers[2];
531 *rEDX = registers[3];
Craig Topper1efd10a2017-07-10 06:04:11 +0000532 return false;
533#else
534 return true;
Simon Pilgrima271c542017-05-03 15:42:29 +0000535#endif
Simon Pilgrima271c542017-05-03 15:42:29 +0000536}
537
Craig Topperf3af64e2017-07-12 06:49:57 +0000538// Read control register 0 (XCR0). Used to detect features such as AVX.
Simon Pilgrima271c542017-05-03 15:42:29 +0000539static bool getX86XCR0(unsigned *rEAX, unsigned *rEDX) {
540#if defined(__GNUC__) || defined(__clang__)
541 // Check xgetbv; this uses a .byte sequence instead of the instruction
542 // directly because older assemblers do not include support for xgetbv and
543 // there is no easy way to conditionally compile based on the assembler used.
544 __asm__(".byte 0x0f, 0x01, 0xd0" : "=a"(*rEAX), "=d"(*rEDX) : "c"(0));
545 return false;
546#elif defined(_MSC_FULL_VER) && defined(_XCR_XFEATURE_ENABLED_MASK)
547 unsigned long long Result = _xgetbv(_XCR_XFEATURE_ENABLED_MASK);
548 *rEAX = Result;
549 *rEDX = Result >> 32;
550 return false;
551#else
552 return true;
553#endif
554}
555
556static void detectX86FamilyModel(unsigned EAX, unsigned *Family,
557 unsigned *Model) {
558 *Family = (EAX >> 8) & 0xf; // Bits 8 - 11
559 *Model = (EAX >> 4) & 0xf; // Bits 4 - 7
560 if (*Family == 6 || *Family == 0xf) {
561 if (*Family == 0xf)
562 // Examine extended family ID if family ID is F.
563 *Family += (EAX >> 20) & 0xff; // Bits 20 - 27
564 // Examine extended model ID if family ID is 6 or F.
565 *Model += ((EAX >> 16) & 0xf) << 4; // Bits 16 - 19
566 }
567}
568
569static void
Craig Topperc6bbe4b2017-07-08 05:16:14 +0000570getIntelProcessorTypeAndSubtype(unsigned Family, unsigned Model,
571 unsigned Brand_id, unsigned Features,
Craig Topper0aca35d2018-10-20 03:51:43 +0000572 unsigned Features2, unsigned Features3,
573 unsigned *Type, unsigned *Subtype) {
Simon Pilgrima271c542017-05-03 15:42:29 +0000574 if (Brand_id != 0)
575 return;
576 switch (Family) {
577 case 3:
Craig Topperc77d00e2017-11-10 17:10:57 +0000578 *Type = X86::INTEL_i386;
Simon Pilgrima271c542017-05-03 15:42:29 +0000579 break;
580 case 4:
Craig Topperc77d00e2017-11-10 17:10:57 +0000581 *Type = X86::INTEL_i486;
Simon Pilgrima271c542017-05-03 15:42:29 +0000582 break;
583 case 5:
Craig Topper47c87392017-11-21 23:36:42 +0000584 if (Features & (1 << X86::FEATURE_MMX)) {
Craig Topperc77d00e2017-11-10 17:10:57 +0000585 *Type = X86::INTEL_PENTIUM_MMX;
Simon Pilgrima271c542017-05-03 15:42:29 +0000586 break;
587 }
Craig Topperc77d00e2017-11-10 17:10:57 +0000588 *Type = X86::INTEL_PENTIUM;
Simon Pilgrima271c542017-05-03 15:42:29 +0000589 break;
590 case 6:
591 switch (Model) {
592 case 0x01: // Pentium Pro processor
Craig Topperc77d00e2017-11-10 17:10:57 +0000593 *Type = X86::INTEL_PENTIUM_PRO;
Simon Pilgrima271c542017-05-03 15:42:29 +0000594 break;
595 case 0x03: // Intel Pentium II OverDrive processor, Pentium II processor,
596 // model 03
597 case 0x05: // Pentium II processor, model 05, Pentium II Xeon processor,
598 // model 05, and Intel Celeron processor, model 05
599 case 0x06: // Celeron processor, model 06
Craig Topperc77d00e2017-11-10 17:10:57 +0000600 *Type = X86::INTEL_PENTIUM_II;
Simon Pilgrima271c542017-05-03 15:42:29 +0000601 break;
602 case 0x07: // Pentium III processor, model 07, and Pentium III Xeon
603 // processor, model 07
604 case 0x08: // Pentium III processor, model 08, Pentium III Xeon processor,
605 // model 08, and Celeron processor, model 08
606 case 0x0a: // Pentium III Xeon processor, model 0Ah
607 case 0x0b: // Pentium III processor, model 0Bh
Craig Topperc77d00e2017-11-10 17:10:57 +0000608 *Type = X86::INTEL_PENTIUM_III;
Simon Pilgrima271c542017-05-03 15:42:29 +0000609 break;
610 case 0x09: // Intel Pentium M processor, Intel Celeron M processor model 09.
611 case 0x0d: // Intel Pentium M processor, Intel Celeron M processor, model
612 // 0Dh. All processors are manufactured using the 90 nm process.
613 case 0x15: // Intel EP80579 Integrated Processor and Intel EP80579
614 // Integrated Processor with Intel QuickAssist Technology
Craig Topperc77d00e2017-11-10 17:10:57 +0000615 *Type = X86::INTEL_PENTIUM_M;
Simon Pilgrima271c542017-05-03 15:42:29 +0000616 break;
617 case 0x0e: // Intel Core Duo processor, Intel Core Solo processor, model
618 // 0Eh. All processors are manufactured using the 65 nm process.
Craig Topperc77d00e2017-11-10 17:10:57 +0000619 *Type = X86::INTEL_CORE_DUO;
Simon Pilgrima271c542017-05-03 15:42:29 +0000620 break; // yonah
621 case 0x0f: // Intel Core 2 Duo processor, Intel Core 2 Duo mobile
622 // processor, Intel Core 2 Quad processor, Intel Core 2 Quad
623 // mobile processor, Intel Core 2 Extreme processor, Intel
624 // Pentium Dual-Core processor, Intel Xeon processor, model
625 // 0Fh. All processors are manufactured using the 65 nm process.
626 case 0x16: // Intel Celeron processor model 16h. All processors are
627 // manufactured using the 65 nm process
Craig Topperc77d00e2017-11-10 17:10:57 +0000628 *Type = X86::INTEL_CORE2; // "core2"
629 *Subtype = X86::INTEL_CORE2_65;
Simon Pilgrima271c542017-05-03 15:42:29 +0000630 break;
631 case 0x17: // Intel Core 2 Extreme processor, Intel Xeon processor, model
632 // 17h. All processors are manufactured using the 45 nm process.
633 //
634 // 45nm: Penryn , Wolfdale, Yorkfield (XE)
635 case 0x1d: // Intel Xeon processor MP. All processors are manufactured using
636 // the 45 nm process.
Craig Topperc77d00e2017-11-10 17:10:57 +0000637 *Type = X86::INTEL_CORE2; // "penryn"
638 *Subtype = X86::INTEL_CORE2_45;
Simon Pilgrima271c542017-05-03 15:42:29 +0000639 break;
640 case 0x1a: // Intel Core i7 processor and Intel Xeon processor. All
641 // processors are manufactured using the 45 nm process.
642 case 0x1e: // Intel(R) Core(TM) i7 CPU 870 @ 2.93GHz.
643 // As found in a Summer 2010 model iMac.
644 case 0x1f:
645 case 0x2e: // Nehalem EX
Craig Topperc77d00e2017-11-10 17:10:57 +0000646 *Type = X86::INTEL_COREI7; // "nehalem"
647 *Subtype = X86::INTEL_COREI7_NEHALEM;
Simon Pilgrima271c542017-05-03 15:42:29 +0000648 break;
649 case 0x25: // Intel Core i7, laptop version.
650 case 0x2c: // Intel Core i7 processor and Intel Xeon processor. All
651 // processors are manufactured using the 32 nm process.
652 case 0x2f: // Westmere EX
Craig Topperc77d00e2017-11-10 17:10:57 +0000653 *Type = X86::INTEL_COREI7; // "westmere"
654 *Subtype = X86::INTEL_COREI7_WESTMERE;
Simon Pilgrima271c542017-05-03 15:42:29 +0000655 break;
656 case 0x2a: // Intel Core i7 processor. All processors are manufactured
657 // using the 32 nm process.
658 case 0x2d:
Craig Topperc77d00e2017-11-10 17:10:57 +0000659 *Type = X86::INTEL_COREI7; //"sandybridge"
660 *Subtype = X86::INTEL_COREI7_SANDYBRIDGE;
Simon Pilgrima271c542017-05-03 15:42:29 +0000661 break;
662 case 0x3a:
663 case 0x3e: // Ivy Bridge EP
Craig Topperc77d00e2017-11-10 17:10:57 +0000664 *Type = X86::INTEL_COREI7; // "ivybridge"
665 *Subtype = X86::INTEL_COREI7_IVYBRIDGE;
Simon Pilgrima271c542017-05-03 15:42:29 +0000666 break;
667
668 // Haswell:
669 case 0x3c:
670 case 0x3f:
671 case 0x45:
672 case 0x46:
Craig Topperc77d00e2017-11-10 17:10:57 +0000673 *Type = X86::INTEL_COREI7; // "haswell"
674 *Subtype = X86::INTEL_COREI7_HASWELL;
Simon Pilgrima271c542017-05-03 15:42:29 +0000675 break;
676
677 // Broadwell:
678 case 0x3d:
679 case 0x47:
680 case 0x4f:
681 case 0x56:
Craig Topperc77d00e2017-11-10 17:10:57 +0000682 *Type = X86::INTEL_COREI7; // "broadwell"
683 *Subtype = X86::INTEL_COREI7_BROADWELL;
Simon Pilgrima271c542017-05-03 15:42:29 +0000684 break;
685
686 // Skylake:
Craig Topperc6696292019-05-31 19:18:07 +0000687 case 0x4e: // Skylake mobile
688 case 0x5e: // Skylake desktop
689 case 0x8e: // Kaby Lake mobile
690 case 0x9e: // Kaby Lake desktop
Craig Topperc77d00e2017-11-10 17:10:57 +0000691 *Type = X86::INTEL_COREI7; // "skylake"
692 *Subtype = X86::INTEL_COREI7_SKYLAKE;
Simon Pilgrima271c542017-05-03 15:42:29 +0000693 break;
694
695 // Skylake Xeon:
696 case 0x55:
Craig Topperc77d00e2017-11-10 17:10:57 +0000697 *Type = X86::INTEL_COREI7;
Craig Topper54658752019-09-04 16:01:43 +0000698 if (Features2 & (1 << (X86::FEATURE_AVX512BF16 - 32)))
Pengfei Wangf8b28932019-06-07 08:31:35 +0000699 *Subtype = X86::INTEL_COREI7_COOPERLAKE; // "cooperlake"
700 else if (Features2 & (1 << (X86::FEATURE_AVX512VNNI - 32)))
Craig Topperc6696292019-05-31 19:18:07 +0000701 *Subtype = X86::INTEL_COREI7_CASCADELAKE; // "cascadelake"
702 else
703 *Subtype = X86::INTEL_COREI7_SKYLAKE_AVX512; // "skylake-avx512"
Simon Pilgrima271c542017-05-03 15:42:29 +0000704 break;
705
Craig Topper07491862017-11-15 06:02:42 +0000706 // Cannonlake:
707 case 0x66:
708 *Type = X86::INTEL_COREI7;
709 *Subtype = X86::INTEL_COREI7_CANNONLAKE; // "cannonlake"
710 break;
711
Craig Toppercac6b762019-05-20 16:58:23 +0000712 // Icelake:
Craig Topper2f1895e2019-05-22 19:51:35 +0000713 case 0x7d:
Craig Toppercac6b762019-05-20 16:58:23 +0000714 case 0x7e:
715 *Type = X86::INTEL_COREI7;
716 *Subtype = X86::INTEL_COREI7_ICELAKE_CLIENT; // "icelake-client"
717 break;
718
Craig Topper2f1895e2019-05-22 19:51:35 +0000719 // Icelake Xeon:
720 case 0x6a:
721 case 0x6c:
722 *Type = X86::INTEL_COREI7;
723 *Subtype = X86::INTEL_COREI7_ICELAKE_SERVER; // "icelake-server"
724 break;
725
Simon Pilgrima271c542017-05-03 15:42:29 +0000726 case 0x1c: // Most 45 nm Intel Atom processors
727 case 0x26: // 45 nm Atom Lincroft
728 case 0x27: // 32 nm Atom Medfield
729 case 0x35: // 32 nm Atom Midview
730 case 0x36: // 32 nm Atom Midview
Craig Topperc77d00e2017-11-10 17:10:57 +0000731 *Type = X86::INTEL_BONNELL;
Simon Pilgrima271c542017-05-03 15:42:29 +0000732 break; // "bonnell"
733
734 // Atom Silvermont codes from the Intel software optimization guide.
735 case 0x37:
736 case 0x4a:
737 case 0x4d:
738 case 0x5a:
739 case 0x5d:
740 case 0x4c: // really airmont
Craig Topperc77d00e2017-11-10 17:10:57 +0000741 *Type = X86::INTEL_SILVERMONT;
Simon Pilgrima271c542017-05-03 15:42:29 +0000742 break; // "silvermont"
Michael Zuckerman4bcb9c32017-06-29 10:00:33 +0000743 // Goldmont:
Craig Topper0dadfe32017-11-15 06:02:43 +0000744 case 0x5c: // Apollo Lake
745 case 0x5f: // Denverton
Craig Topperc77d00e2017-11-10 17:10:57 +0000746 *Type = X86::INTEL_GOLDMONT;
Michael Zuckerman4bcb9c32017-06-29 10:00:33 +0000747 break; // "goldmont"
Gabor Buella8f1646b2018-04-16 07:47:35 +0000748 case 0x7a:
749 *Type = X86::INTEL_GOLDMONT_PLUS;
750 break;
Craig Toppercac6b762019-05-20 16:58:23 +0000751 case 0x86:
752 *Type = X86::INTEL_TREMONT;
753 break;
Craig Topperc6696292019-05-31 19:18:07 +0000754
Simon Pilgrima271c542017-05-03 15:42:29 +0000755 case 0x57:
Craig Topperc77d00e2017-11-10 17:10:57 +0000756 *Type = X86::INTEL_KNL; // knl
Simon Pilgrima271c542017-05-03 15:42:29 +0000757 break;
Craig Topperc6696292019-05-31 19:18:07 +0000758
Craig Topper5d692912017-10-13 18:10:17 +0000759 case 0x85:
Craig Topperc77d00e2017-11-10 17:10:57 +0000760 *Type = X86::INTEL_KNM; // knm
Craig Topper5d692912017-10-13 18:10:17 +0000761 break;
Simon Pilgrima271c542017-05-03 15:42:29 +0000762
763 default: // Unknown family 6 CPU, try to guess.
Pengfei Wange28cbbd2019-08-12 01:29:46 +0000764 // TODO detect tigerlake host
765 if (Features3 & (1 << (X86::FEATURE_AVX512VP2INTERSECT - 64))) {
766 *Type = X86::INTEL_COREI7;
767 *Subtype = X86::INTEL_COREI7_TIGERLAKE;
768 break;
769 }
770
Craig Topperaa3f2492018-11-15 18:11:52 +0000771 if (Features & (1 << X86::FEATURE_AVX512VBMI2)) {
772 *Type = X86::INTEL_COREI7;
773 *Subtype = X86::INTEL_COREI7_ICELAKE_CLIENT;
774 break;
775 }
776
Craig Topper47c87392017-11-21 23:36:42 +0000777 if (Features & (1 << X86::FEATURE_AVX512VBMI)) {
Craig Topper07491862017-11-15 06:02:42 +0000778 *Type = X86::INTEL_COREI7;
779 *Subtype = X86::INTEL_COREI7_CANNONLAKE;
Craig Topper4eda7562017-07-27 03:26:52 +0000780 break;
781 }
Craig Topper07491862017-11-15 06:02:42 +0000782
Craig Topper54658752019-09-04 16:01:43 +0000783 if (Features2 & (1 << (X86::FEATURE_AVX512BF16 - 32))) {
Pengfei Wangf8b28932019-06-07 08:31:35 +0000784 *Type = X86::INTEL_COREI7;
785 *Subtype = X86::INTEL_COREI7_COOPERLAKE;
786 break;
787 }
788
Craig Topper5fb34b52018-11-27 18:05:00 +0000789 if (Features2 & (1 << (X86::FEATURE_AVX512VNNI - 32))) {
790 *Type = X86::INTEL_COREI7;
791 *Subtype = X86::INTEL_COREI7_CASCADELAKE;
792 break;
793 }
794
Craig Topper47c87392017-11-21 23:36:42 +0000795 if (Features & (1 << X86::FEATURE_AVX512VL)) {
Craig Topper07491862017-11-15 06:02:42 +0000796 *Type = X86::INTEL_COREI7;
797 *Subtype = X86::INTEL_COREI7_SKYLAKE_AVX512;
798 break;
799 }
800
Craig Topper47c87392017-11-21 23:36:42 +0000801 if (Features & (1 << X86::FEATURE_AVX512ER)) {
Craig Topper07491862017-11-15 06:02:42 +0000802 *Type = X86::INTEL_KNL; // knl
803 break;
804 }
805
Craig Topper0aca35d2018-10-20 03:51:43 +0000806 if (Features3 & (1 << (X86::FEATURE_CLFLUSHOPT - 64))) {
807 if (Features3 & (1 << (X86::FEATURE_SHA - 64))) {
Craig Topperc77d00e2017-11-10 17:10:57 +0000808 *Type = X86::INTEL_GOLDMONT;
Craig Topper4eda7562017-07-27 03:26:52 +0000809 } else {
Craig Topperc77d00e2017-11-10 17:10:57 +0000810 *Type = X86::INTEL_COREI7;
811 *Subtype = X86::INTEL_COREI7_SKYLAKE;
Craig Topper4eda7562017-07-27 03:26:52 +0000812 }
Simon Pilgrima271c542017-05-03 15:42:29 +0000813 break;
814 }
Craig Topper0aca35d2018-10-20 03:51:43 +0000815 if (Features3 & (1 << (X86::FEATURE_ADX - 64))) {
Craig Topperc77d00e2017-11-10 17:10:57 +0000816 *Type = X86::INTEL_COREI7;
817 *Subtype = X86::INTEL_COREI7_BROADWELL;
Simon Pilgrima271c542017-05-03 15:42:29 +0000818 break;
819 }
Craig Topper47c87392017-11-21 23:36:42 +0000820 if (Features & (1 << X86::FEATURE_AVX2)) {
Craig Topperc77d00e2017-11-10 17:10:57 +0000821 *Type = X86::INTEL_COREI7;
822 *Subtype = X86::INTEL_COREI7_HASWELL;
Simon Pilgrima271c542017-05-03 15:42:29 +0000823 break;
824 }
Craig Topper47c87392017-11-21 23:36:42 +0000825 if (Features & (1 << X86::FEATURE_AVX)) {
Craig Topperc77d00e2017-11-10 17:10:57 +0000826 *Type = X86::INTEL_COREI7;
827 *Subtype = X86::INTEL_COREI7_SANDYBRIDGE;
Simon Pilgrima271c542017-05-03 15:42:29 +0000828 break;
829 }
Craig Topper47c87392017-11-21 23:36:42 +0000830 if (Features & (1 << X86::FEATURE_SSE4_2)) {
Craig Topper0aca35d2018-10-20 03:51:43 +0000831 if (Features3 & (1 << (X86::FEATURE_MOVBE - 64))) {
Craig Topperc77d00e2017-11-10 17:10:57 +0000832 *Type = X86::INTEL_SILVERMONT;
Simon Pilgrima271c542017-05-03 15:42:29 +0000833 } else {
Craig Topperc77d00e2017-11-10 17:10:57 +0000834 *Type = X86::INTEL_COREI7;
835 *Subtype = X86::INTEL_COREI7_NEHALEM;
Simon Pilgrima271c542017-05-03 15:42:29 +0000836 }
837 break;
838 }
Craig Topper47c87392017-11-21 23:36:42 +0000839 if (Features & (1 << X86::FEATURE_SSE4_1)) {
Craig Topperc77d00e2017-11-10 17:10:57 +0000840 *Type = X86::INTEL_CORE2; // "penryn"
841 *Subtype = X86::INTEL_CORE2_45;
Simon Pilgrima271c542017-05-03 15:42:29 +0000842 break;
843 }
Craig Topper47c87392017-11-21 23:36:42 +0000844 if (Features & (1 << X86::FEATURE_SSSE3)) {
Craig Topper0aca35d2018-10-20 03:51:43 +0000845 if (Features3 & (1 << (X86::FEATURE_MOVBE - 64))) {
Craig Topperc77d00e2017-11-10 17:10:57 +0000846 *Type = X86::INTEL_BONNELL; // "bonnell"
Simon Pilgrima271c542017-05-03 15:42:29 +0000847 } else {
Craig Topperc77d00e2017-11-10 17:10:57 +0000848 *Type = X86::INTEL_CORE2; // "core2"
849 *Subtype = X86::INTEL_CORE2_65;
Simon Pilgrima271c542017-05-03 15:42:29 +0000850 }
851 break;
852 }
Craig Topper0aca35d2018-10-20 03:51:43 +0000853 if (Features3 & (1 << (X86::FEATURE_EM64T - 64))) {
Craig Topperc77d00e2017-11-10 17:10:57 +0000854 *Type = X86::INTEL_CORE2; // "core2"
855 *Subtype = X86::INTEL_CORE2_65;
Craig Toppera233e162017-11-02 19:13:32 +0000856 break;
857 }
Craig Topper47c87392017-11-21 23:36:42 +0000858 if (Features & (1 << X86::FEATURE_SSE3)) {
Craig Topperc77d00e2017-11-10 17:10:57 +0000859 *Type = X86::INTEL_CORE_DUO;
Craig Toppera233e162017-11-02 19:13:32 +0000860 break;
Simon Pilgrima271c542017-05-03 15:42:29 +0000861 }
Craig Topper47c87392017-11-21 23:36:42 +0000862 if (Features & (1 << X86::FEATURE_SSE2)) {
Craig Topperc77d00e2017-11-10 17:10:57 +0000863 *Type = X86::INTEL_PENTIUM_M;
Simon Pilgrima271c542017-05-03 15:42:29 +0000864 break;
865 }
Craig Topper47c87392017-11-21 23:36:42 +0000866 if (Features & (1 << X86::FEATURE_SSE)) {
Craig Topperc77d00e2017-11-10 17:10:57 +0000867 *Type = X86::INTEL_PENTIUM_III;
Simon Pilgrima271c542017-05-03 15:42:29 +0000868 break;
869 }
Craig Topper47c87392017-11-21 23:36:42 +0000870 if (Features & (1 << X86::FEATURE_MMX)) {
Craig Topperc77d00e2017-11-10 17:10:57 +0000871 *Type = X86::INTEL_PENTIUM_II;
Simon Pilgrima271c542017-05-03 15:42:29 +0000872 break;
873 }
Craig Topperc77d00e2017-11-10 17:10:57 +0000874 *Type = X86::INTEL_PENTIUM_PRO;
Simon Pilgrima271c542017-05-03 15:42:29 +0000875 break;
876 }
877 break;
878 case 15: {
Craig Topper0aca35d2018-10-20 03:51:43 +0000879 if (Features3 & (1 << (X86::FEATURE_EM64T - 64))) {
Craig Topperc77d00e2017-11-10 17:10:57 +0000880 *Type = X86::INTEL_NOCONA;
Simon Pilgrima271c542017-05-03 15:42:29 +0000881 break;
882 }
Craig Topper47c87392017-11-21 23:36:42 +0000883 if (Features & (1 << X86::FEATURE_SSE3)) {
Craig Topperc77d00e2017-11-10 17:10:57 +0000884 *Type = X86::INTEL_PRESCOTT;
Craig Topper14949152017-11-02 19:13:34 +0000885 break;
886 }
Craig Topperc77d00e2017-11-10 17:10:57 +0000887 *Type = X86::INTEL_PENTIUM_IV;
Simon Pilgrima271c542017-05-03 15:42:29 +0000888 break;
889 }
890 default:
891 break; /*"generic"*/
892 }
893}
894
Craig Topper2ace1532017-07-08 06:44:34 +0000895static void getAMDProcessorTypeAndSubtype(unsigned Family, unsigned Model,
896 unsigned Features, unsigned *Type,
Simon Pilgrima271c542017-05-03 15:42:29 +0000897 unsigned *Subtype) {
898 // FIXME: this poorly matches the generated SubtargetFeatureKV table. There
899 // appears to be no way to generate the wide variety of AMD-specific targets
900 // from the information returned from CPUID.
901 switch (Family) {
902 case 4:
Craig Topperc77d00e2017-11-10 17:10:57 +0000903 *Type = X86::AMD_i486;
Simon Pilgrima271c542017-05-03 15:42:29 +0000904 break;
905 case 5:
Craig Topperc77d00e2017-11-10 17:10:57 +0000906 *Type = X86::AMDPENTIUM;
Simon Pilgrima271c542017-05-03 15:42:29 +0000907 switch (Model) {
908 case 6:
909 case 7:
Craig Topperc77d00e2017-11-10 17:10:57 +0000910 *Subtype = X86::AMDPENTIUM_K6;
Simon Pilgrima271c542017-05-03 15:42:29 +0000911 break; // "k6"
912 case 8:
Craig Topperc77d00e2017-11-10 17:10:57 +0000913 *Subtype = X86::AMDPENTIUM_K62;
Simon Pilgrima271c542017-05-03 15:42:29 +0000914 break; // "k6-2"
915 case 9:
916 case 13:
Craig Topperc77d00e2017-11-10 17:10:57 +0000917 *Subtype = X86::AMDPENTIUM_K63;
Simon Pilgrima271c542017-05-03 15:42:29 +0000918 break; // "k6-3"
919 case 10:
Craig Topperc77d00e2017-11-10 17:10:57 +0000920 *Subtype = X86::AMDPENTIUM_GEODE;
Simon Pilgrima271c542017-05-03 15:42:29 +0000921 break; // "geode"
922 }
923 break;
924 case 6:
Craig Topper47c87392017-11-21 23:36:42 +0000925 if (Features & (1 << X86::FEATURE_SSE)) {
Craig Topperc77d00e2017-11-10 17:10:57 +0000926 *Type = X86::AMD_ATHLON_XP;
Simon Pilgrima271c542017-05-03 15:42:29 +0000927 break; // "athlon-xp"
928 }
Craig Topperc77d00e2017-11-10 17:10:57 +0000929 *Type = X86::AMD_ATHLON;
Craig Topperf3de5eb2017-07-13 06:34:10 +0000930 break; // "athlon"
Simon Pilgrima271c542017-05-03 15:42:29 +0000931 case 15:
Craig Topper47c87392017-11-21 23:36:42 +0000932 if (Features & (1 << X86::FEATURE_SSE3)) {
Craig Topperc77d00e2017-11-10 17:10:57 +0000933 *Type = X86::AMD_K8SSE3;
Simon Pilgrima271c542017-05-03 15:42:29 +0000934 break; // "k8-sse3"
935 }
Craig Topperc77d00e2017-11-10 17:10:57 +0000936 *Type = X86::AMD_K8;
Craig Topperf3de5eb2017-07-13 06:34:10 +0000937 break; // "k8"
Simon Pilgrima271c542017-05-03 15:42:29 +0000938 case 16:
Craig Topperc77d00e2017-11-10 17:10:57 +0000939 *Type = X86::AMDFAM10H; // "amdfam10"
Simon Pilgrima271c542017-05-03 15:42:29 +0000940 switch (Model) {
941 case 2:
Craig Topperc77d00e2017-11-10 17:10:57 +0000942 *Subtype = X86::AMDFAM10H_BARCELONA;
Simon Pilgrima271c542017-05-03 15:42:29 +0000943 break;
944 case 4:
Craig Topperc77d00e2017-11-10 17:10:57 +0000945 *Subtype = X86::AMDFAM10H_SHANGHAI;
Simon Pilgrima271c542017-05-03 15:42:29 +0000946 break;
947 case 8:
Craig Topperc77d00e2017-11-10 17:10:57 +0000948 *Subtype = X86::AMDFAM10H_ISTANBUL;
Simon Pilgrima271c542017-05-03 15:42:29 +0000949 break;
950 }
951 break;
952 case 20:
Craig Topperc77d00e2017-11-10 17:10:57 +0000953 *Type = X86::AMD_BTVER1;
Simon Pilgrima271c542017-05-03 15:42:29 +0000954 break; // "btver1";
955 case 21:
Craig Topperc77d00e2017-11-10 17:10:57 +0000956 *Type = X86::AMDFAM15H;
Craig Topper1f9d3c02017-07-08 06:44:35 +0000957 if (Model >= 0x60 && Model <= 0x7f) {
Craig Topperc77d00e2017-11-10 17:10:57 +0000958 *Subtype = X86::AMDFAM15H_BDVER4;
Craig Topper3db11702017-07-12 06:49:56 +0000959 break; // "bdver4"; 60h-7Fh: Excavator
Simon Pilgrima271c542017-05-03 15:42:29 +0000960 }
961 if (Model >= 0x30 && Model <= 0x3f) {
Craig Topperc77d00e2017-11-10 17:10:57 +0000962 *Subtype = X86::AMDFAM15H_BDVER3;
Simon Pilgrima271c542017-05-03 15:42:29 +0000963 break; // "bdver3"; 30h-3Fh: Steamroller
964 }
Roman Lebedevbc1a9242018-05-01 18:39:31 +0000965 if ((Model >= 0x10 && Model <= 0x1f) || Model == 0x02) {
Craig Topperc77d00e2017-11-10 17:10:57 +0000966 *Subtype = X86::AMDFAM15H_BDVER2;
Roman Lebedevbc1a9242018-05-01 18:39:31 +0000967 break; // "bdver2"; 02h, 10h-1Fh: Piledriver
Simon Pilgrima271c542017-05-03 15:42:29 +0000968 }
969 if (Model <= 0x0f) {
Craig Topperc77d00e2017-11-10 17:10:57 +0000970 *Subtype = X86::AMDFAM15H_BDVER1;
Simon Pilgrima271c542017-05-03 15:42:29 +0000971 break; // "bdver1"; 00h-0Fh: Bulldozer
972 }
973 break;
974 case 22:
Craig Topperc77d00e2017-11-10 17:10:57 +0000975 *Type = X86::AMD_BTVER2;
Simon Pilgrima271c542017-05-03 15:42:29 +0000976 break; // "btver2"
977 case 23:
Craig Topperc77d00e2017-11-10 17:10:57 +0000978 *Type = X86::AMDFAM17H;
Craig Topperff75bf62019-11-18 11:31:17 -0800979 if ((Model >= 0x30 && Model <= 0x3f) || Model == 0x71) {
Ganesh Gopalasubramaniane172d7002019-02-26 16:55:10 +0000980 *Subtype = X86::AMDFAM17H_ZNVER2;
Craig Topperff75bf62019-11-18 11:31:17 -0800981 break; // "znver2"; 30h-3fh, 71h: Zen2
Ganesh Gopalasubramaniane172d7002019-02-26 16:55:10 +0000982 }
983 if (Model <= 0x0f) {
984 *Subtype = X86::AMDFAM17H_ZNVER1;
985 break; // "znver1"; 00h-0Fh: Zen1
986 }
Simon Pilgrima271c542017-05-03 15:42:29 +0000987 break;
988 default:
989 break; // "generic"
990 }
991}
992
Craig Topper3a5d0822017-07-12 06:49:58 +0000993static void getAvailableFeatures(unsigned ECX, unsigned EDX, unsigned MaxLeaf,
Craig Topper0aca35d2018-10-20 03:51:43 +0000994 unsigned *FeaturesOut, unsigned *Features2Out,
995 unsigned *Features3Out) {
Simon Pilgrima271c542017-05-03 15:42:29 +0000996 unsigned Features = 0;
Craig Topper3a5d0822017-07-12 06:49:58 +0000997 unsigned Features2 = 0;
Craig Topper0aca35d2018-10-20 03:51:43 +0000998 unsigned Features3 = 0;
Craig Topperc6bbe4b2017-07-08 05:16:14 +0000999 unsigned EAX, EBX;
Craig Topper3a5d0822017-07-12 06:49:58 +00001000
Simon Pilgrima7d1a7c2018-10-20 13:16:31 +00001001 auto setFeature = [&](unsigned F) {
1002 if (F < 32)
Craig Topper28659f52018-11-24 20:26:11 +00001003 Features |= 1U << (F & 0x1f);
Simon Pilgrima7d1a7c2018-10-20 13:16:31 +00001004 else if (F < 64)
Craig Topper28659f52018-11-24 20:26:11 +00001005 Features2 |= 1U << ((F - 32) & 0x1f);
Simon Pilgrima7d1a7c2018-10-20 13:16:31 +00001006 else if (F < 96)
Craig Topper28659f52018-11-24 20:26:11 +00001007 Features3 |= 1U << ((F - 64) & 0x1f);
Simon Pilgrima7d1a7c2018-10-20 13:16:31 +00001008 else
1009 llvm_unreachable("Unexpected FeatureBit");
1010 };
Craig Topper0aca35d2018-10-20 03:51:43 +00001011
Craig Topper3a5d0822017-07-12 06:49:58 +00001012 if ((EDX >> 15) & 1)
Craig Topper0aca35d2018-10-20 03:51:43 +00001013 setFeature(X86::FEATURE_CMOV);
Craig Topper3a5d0822017-07-12 06:49:58 +00001014 if ((EDX >> 23) & 1)
Craig Topper0aca35d2018-10-20 03:51:43 +00001015 setFeature(X86::FEATURE_MMX);
Craig Topper3a5d0822017-07-12 06:49:58 +00001016 if ((EDX >> 25) & 1)
Craig Topper0aca35d2018-10-20 03:51:43 +00001017 setFeature(X86::FEATURE_SSE);
Craig Topper3a5d0822017-07-12 06:49:58 +00001018 if ((EDX >> 26) & 1)
Craig Topper0aca35d2018-10-20 03:51:43 +00001019 setFeature(X86::FEATURE_SSE2);
Craig Topper3a5d0822017-07-12 06:49:58 +00001020
1021 if ((ECX >> 0) & 1)
Craig Topper0aca35d2018-10-20 03:51:43 +00001022 setFeature(X86::FEATURE_SSE3);
Craig Topper3a5d0822017-07-12 06:49:58 +00001023 if ((ECX >> 1) & 1)
Craig Topper0aca35d2018-10-20 03:51:43 +00001024 setFeature(X86::FEATURE_PCLMUL);
Craig Topper3a5d0822017-07-12 06:49:58 +00001025 if ((ECX >> 9) & 1)
Craig Topper0aca35d2018-10-20 03:51:43 +00001026 setFeature(X86::FEATURE_SSSE3);
Craig Topper3a5d0822017-07-12 06:49:58 +00001027 if ((ECX >> 12) & 1)
Craig Topper0aca35d2018-10-20 03:51:43 +00001028 setFeature(X86::FEATURE_FMA);
Craig Topper3a5d0822017-07-12 06:49:58 +00001029 if ((ECX >> 19) & 1)
Craig Topper0aca35d2018-10-20 03:51:43 +00001030 setFeature(X86::FEATURE_SSE4_1);
Craig Topper3a5d0822017-07-12 06:49:58 +00001031 if ((ECX >> 20) & 1)
Craig Topper0aca35d2018-10-20 03:51:43 +00001032 setFeature(X86::FEATURE_SSE4_2);
Craig Topper3a5d0822017-07-12 06:49:58 +00001033 if ((ECX >> 23) & 1)
Craig Topper0aca35d2018-10-20 03:51:43 +00001034 setFeature(X86::FEATURE_POPCNT);
Craig Topper3a5d0822017-07-12 06:49:58 +00001035 if ((ECX >> 25) & 1)
Craig Topper0aca35d2018-10-20 03:51:43 +00001036 setFeature(X86::FEATURE_AES);
Craig Topper3a5d0822017-07-12 06:49:58 +00001037
1038 if ((ECX >> 22) & 1)
Craig Topper0aca35d2018-10-20 03:51:43 +00001039 setFeature(X86::FEATURE_MOVBE);
Simon Pilgrima271c542017-05-03 15:42:29 +00001040
1041 // If CPUID indicates support for XSAVE, XRESTORE and AVX, and XGETBV
1042 // indicates that the AVX registers will be saved and restored on context
1043 // switch, then we have full AVX support.
1044 const unsigned AVXBits = (1 << 27) | (1 << 28);
1045 bool HasAVX = ((ECX & AVXBits) == AVXBits) && !getX86XCR0(&EAX, &EDX) &&
1046 ((EAX & 0x6) == 0x6);
Florian Hahn82921bf2019-11-21 09:03:16 +00001047#if defined(__APPLE__)
1048 // Darwin lazily saves the AVX512 context on first use: trust that the OS will
1049 // save the AVX512 context if we use AVX512 instructions, even the bit is not
1050 // set right now.
1051 bool HasAVX512Save = true;
1052#else
1053 // AVX512 requires additional context to be saved by the OS.
Simon Pilgrima271c542017-05-03 15:42:29 +00001054 bool HasAVX512Save = HasAVX && ((EAX & 0xe0) == 0xe0);
Florian Hahn82921bf2019-11-21 09:03:16 +00001055#endif
Craig Topper3a5d0822017-07-12 06:49:58 +00001056
1057 if (HasAVX)
Craig Topper0aca35d2018-10-20 03:51:43 +00001058 setFeature(X86::FEATURE_AVX);
Craig Topper3a5d0822017-07-12 06:49:58 +00001059
Simon Pilgrima271c542017-05-03 15:42:29 +00001060 bool HasLeaf7 =
1061 MaxLeaf >= 0x7 && !getX86CpuIDAndInfoEx(0x7, 0x0, &EAX, &EBX, &ECX, &EDX);
Craig Topper3a5d0822017-07-12 06:49:58 +00001062
1063 if (HasLeaf7 && ((EBX >> 3) & 1))
Craig Topper0aca35d2018-10-20 03:51:43 +00001064 setFeature(X86::FEATURE_BMI);
Craig Topper3a5d0822017-07-12 06:49:58 +00001065 if (HasLeaf7 && ((EBX >> 5) & 1) && HasAVX)
Craig Topper0aca35d2018-10-20 03:51:43 +00001066 setFeature(X86::FEATURE_AVX2);
Eric Christopher1d73e222019-08-05 21:25:59 +00001067 if (HasLeaf7 && ((EBX >> 8) & 1))
Craig Topper0aca35d2018-10-20 03:51:43 +00001068 setFeature(X86::FEATURE_BMI2);
Craig Topper3a5d0822017-07-12 06:49:58 +00001069 if (HasLeaf7 && ((EBX >> 16) & 1) && HasAVX512Save)
Craig Topper0aca35d2018-10-20 03:51:43 +00001070 setFeature(X86::FEATURE_AVX512F);
Craig Topper3a5d0822017-07-12 06:49:58 +00001071 if (HasLeaf7 && ((EBX >> 17) & 1) && HasAVX512Save)
Craig Topper0aca35d2018-10-20 03:51:43 +00001072 setFeature(X86::FEATURE_AVX512DQ);
Craig Topper3a5d0822017-07-12 06:49:58 +00001073 if (HasLeaf7 && ((EBX >> 19) & 1))
Craig Topper0aca35d2018-10-20 03:51:43 +00001074 setFeature(X86::FEATURE_ADX);
Craig Topper3a5d0822017-07-12 06:49:58 +00001075 if (HasLeaf7 && ((EBX >> 21) & 1) && HasAVX512Save)
Craig Topper0aca35d2018-10-20 03:51:43 +00001076 setFeature(X86::FEATURE_AVX512IFMA);
Craig Topper4eda7562017-07-27 03:26:52 +00001077 if (HasLeaf7 && ((EBX >> 23) & 1))
Craig Topper0aca35d2018-10-20 03:51:43 +00001078 setFeature(X86::FEATURE_CLFLUSHOPT);
Craig Topper3a5d0822017-07-12 06:49:58 +00001079 if (HasLeaf7 && ((EBX >> 26) & 1) && HasAVX512Save)
Craig Topper0aca35d2018-10-20 03:51:43 +00001080 setFeature(X86::FEATURE_AVX512PF);
Craig Topper3a5d0822017-07-12 06:49:58 +00001081 if (HasLeaf7 && ((EBX >> 27) & 1) && HasAVX512Save)
Craig Topper0aca35d2018-10-20 03:51:43 +00001082 setFeature(X86::FEATURE_AVX512ER);
Craig Topper3a5d0822017-07-12 06:49:58 +00001083 if (HasLeaf7 && ((EBX >> 28) & 1) && HasAVX512Save)
Craig Topper0aca35d2018-10-20 03:51:43 +00001084 setFeature(X86::FEATURE_AVX512CD);
Craig Topper4eda7562017-07-27 03:26:52 +00001085 if (HasLeaf7 && ((EBX >> 29) & 1))
Craig Topper0aca35d2018-10-20 03:51:43 +00001086 setFeature(X86::FEATURE_SHA);
Craig Topper3a5d0822017-07-12 06:49:58 +00001087 if (HasLeaf7 && ((EBX >> 30) & 1) && HasAVX512Save)
Craig Topper0aca35d2018-10-20 03:51:43 +00001088 setFeature(X86::FEATURE_AVX512BW);
Craig Topper3a5d0822017-07-12 06:49:58 +00001089 if (HasLeaf7 && ((EBX >> 31) & 1) && HasAVX512Save)
Craig Topper0aca35d2018-10-20 03:51:43 +00001090 setFeature(X86::FEATURE_AVX512VL);
Craig Topper3a5d0822017-07-12 06:49:58 +00001091
1092 if (HasLeaf7 && ((ECX >> 1) & 1) && HasAVX512Save)
Craig Topper0aca35d2018-10-20 03:51:43 +00001093 setFeature(X86::FEATURE_AVX512VBMI);
1094 if (HasLeaf7 && ((ECX >> 6) & 1) && HasAVX512Save)
1095 setFeature(X86::FEATURE_AVX512VBMI2);
1096 if (HasLeaf7 && ((ECX >> 8) & 1))
1097 setFeature(X86::FEATURE_GFNI);
1098 if (HasLeaf7 && ((ECX >> 10) & 1) && HasAVX)
1099 setFeature(X86::FEATURE_VPCLMULQDQ);
1100 if (HasLeaf7 && ((ECX >> 11) & 1) && HasAVX512Save)
1101 setFeature(X86::FEATURE_AVX512VNNI);
1102 if (HasLeaf7 && ((ECX >> 12) & 1) && HasAVX512Save)
1103 setFeature(X86::FEATURE_AVX512BITALG);
Craig Topper3a5d0822017-07-12 06:49:58 +00001104 if (HasLeaf7 && ((ECX >> 14) & 1) && HasAVX512Save)
Craig Topper0aca35d2018-10-20 03:51:43 +00001105 setFeature(X86::FEATURE_AVX512VPOPCNTDQ);
Craig Topper3a5d0822017-07-12 06:49:58 +00001106
1107 if (HasLeaf7 && ((EDX >> 2) & 1) && HasAVX512Save)
Craig Topper0aca35d2018-10-20 03:51:43 +00001108 setFeature(X86::FEATURE_AVX5124VNNIW);
Craig Topper3a5d0822017-07-12 06:49:58 +00001109 if (HasLeaf7 && ((EDX >> 3) & 1) && HasAVX512Save)
Craig Topper0aca35d2018-10-20 03:51:43 +00001110 setFeature(X86::FEATURE_AVX5124FMAPS);
Pengfei Wange28cbbd2019-08-12 01:29:46 +00001111 if (HasLeaf7 && ((EDX >> 8) & 1) && HasAVX512Save)
1112 setFeature(X86::FEATURE_AVX512VP2INTERSECT);
Simon Pilgrima271c542017-05-03 15:42:29 +00001113
Craig Topper54658752019-09-04 16:01:43 +00001114 bool HasLeaf7Subleaf1 =
1115 MaxLeaf >= 7 && !getX86CpuIDAndInfoEx(0x7, 0x1, &EAX, &EBX, &ECX, &EDX);
1116 if (HasLeaf7Subleaf1 && ((EAX >> 5) & 1) && HasAVX512Save)
1117 setFeature(X86::FEATURE_AVX512BF16);
1118
Craig Topperbb8c7992017-07-08 05:16:13 +00001119 unsigned MaxExtLevel;
1120 getX86CpuIDAndInfo(0x80000000, &MaxExtLevel, &EBX, &ECX, &EDX);
1121
1122 bool HasExtLeaf1 = MaxExtLevel >= 0x80000001 &&
1123 !getX86CpuIDAndInfo(0x80000001, &EAX, &EBX, &ECX, &EDX);
Craig Topper3a5d0822017-07-12 06:49:58 +00001124 if (HasExtLeaf1 && ((ECX >> 6) & 1))
Craig Topper0aca35d2018-10-20 03:51:43 +00001125 setFeature(X86::FEATURE_SSE4_A);
Craig Topper3a5d0822017-07-12 06:49:58 +00001126 if (HasExtLeaf1 && ((ECX >> 11) & 1))
Craig Topper0aca35d2018-10-20 03:51:43 +00001127 setFeature(X86::FEATURE_XOP);
Craig Topper3a5d0822017-07-12 06:49:58 +00001128 if (HasExtLeaf1 && ((ECX >> 16) & 1))
Craig Topper0aca35d2018-10-20 03:51:43 +00001129 setFeature(X86::FEATURE_FMA4);
Craig Topperbb8c7992017-07-08 05:16:13 +00001130
Craig Topper3a5d0822017-07-12 06:49:58 +00001131 if (HasExtLeaf1 && ((EDX >> 29) & 1))
Craig Topper0aca35d2018-10-20 03:51:43 +00001132 setFeature(X86::FEATURE_EM64T);
Craig Topper3a5d0822017-07-12 06:49:58 +00001133
1134 *FeaturesOut = Features;
1135 *Features2Out = Features2;
Craig Topper0aca35d2018-10-20 03:51:43 +00001136 *Features3Out = Features3;
Simon Pilgrima271c542017-05-03 15:42:29 +00001137}
1138
1139StringRef sys::getHostCPUName() {
1140 unsigned EAX = 0, EBX = 0, ECX = 0, EDX = 0;
1141 unsigned MaxLeaf, Vendor;
1142
1143#if defined(__GNUC__) || defined(__clang__)
1144 //FIXME: include cpuid.h from clang or copy __get_cpuid_max here
1145 // and simplify it to not invoke __cpuid (like cpu_model.c in
1146 // compiler-rt/lib/builtins/cpu_model.c?
1147 // Opting for the second option.
1148 if(!isCpuIdSupported())
1149 return "generic";
1150#endif
Craig Topperbb8c7992017-07-08 05:16:13 +00001151 if (getX86CpuIDAndInfo(0, &MaxLeaf, &Vendor, &ECX, &EDX) || MaxLeaf < 1)
Simon Pilgrima271c542017-05-03 15:42:29 +00001152 return "generic";
Craig Topperbb8c7992017-07-08 05:16:13 +00001153 getX86CpuIDAndInfo(0x1, &EAX, &EBX, &ECX, &EDX);
Simon Pilgrima271c542017-05-03 15:42:29 +00001154
1155 unsigned Brand_id = EBX & 0xff;
1156 unsigned Family = 0, Model = 0;
Craig Topper0aca35d2018-10-20 03:51:43 +00001157 unsigned Features = 0, Features2 = 0, Features3 = 0;
Simon Pilgrima271c542017-05-03 15:42:29 +00001158 detectX86FamilyModel(EAX, &Family, &Model);
Craig Topper0aca35d2018-10-20 03:51:43 +00001159 getAvailableFeatures(ECX, EDX, MaxLeaf, &Features, &Features2, &Features3);
Simon Pilgrima271c542017-05-03 15:42:29 +00001160
Craig Topper741e7e62017-11-03 18:02:44 +00001161 unsigned Type = 0;
1162 unsigned Subtype = 0;
Simon Pilgrima271c542017-05-03 15:42:29 +00001163
1164 if (Vendor == SIG_INTEL) {
Craig Topper3a5d0822017-07-12 06:49:58 +00001165 getIntelProcessorTypeAndSubtype(Family, Model, Brand_id, Features,
Craig Topper0aca35d2018-10-20 03:51:43 +00001166 Features2, Features3, &Type, &Subtype);
Simon Pilgrima271c542017-05-03 15:42:29 +00001167 } else if (Vendor == SIG_AMD) {
1168 getAMDProcessorTypeAndSubtype(Family, Model, Features, &Type, &Subtype);
Simon Pilgrima271c542017-05-03 15:42:29 +00001169 }
Craig Topperc77d00e2017-11-10 17:10:57 +00001170
1171 // Check subtypes first since those are more specific.
1172#define X86_CPU_SUBTYPE(ARCHNAME, ENUM) \
1173 if (Subtype == X86::ENUM) \
1174 return ARCHNAME;
1175#include "llvm/Support/X86TargetParser.def"
1176
1177 // Now check types.
Craig Topper55ad3292018-03-06 22:45:31 +00001178#define X86_CPU_TYPE(ARCHNAME, ENUM) \
Craig Topperc77d00e2017-11-10 17:10:57 +00001179 if (Type == X86::ENUM) \
1180 return ARCHNAME;
1181#include "llvm/Support/X86TargetParser.def"
1182
Simon Pilgrima271c542017-05-03 15:42:29 +00001183 return "generic";
1184}
1185
1186#elif defined(__APPLE__) && (defined(__ppc__) || defined(__powerpc__))
1187StringRef sys::getHostCPUName() {
1188 host_basic_info_data_t hostInfo;
1189 mach_msg_type_number_t infoCount;
1190
1191 infoCount = HOST_BASIC_INFO_COUNT;
Kristina Brooks51ae9342018-09-04 10:54:09 +00001192 mach_port_t hostPort = mach_host_self();
1193 host_info(hostPort, HOST_BASIC_INFO, (host_info_t)&hostInfo,
Simon Pilgrima271c542017-05-03 15:42:29 +00001194 &infoCount);
Kristina Brooks51ae9342018-09-04 10:54:09 +00001195 mach_port_deallocate(mach_task_self(), hostPort);
Simon Pilgrima271c542017-05-03 15:42:29 +00001196
1197 if (hostInfo.cpu_type != CPU_TYPE_POWERPC)
1198 return "generic";
1199
1200 switch (hostInfo.cpu_subtype) {
1201 case CPU_SUBTYPE_POWERPC_601:
1202 return "601";
1203 case CPU_SUBTYPE_POWERPC_602:
1204 return "602";
1205 case CPU_SUBTYPE_POWERPC_603:
1206 return "603";
1207 case CPU_SUBTYPE_POWERPC_603e:
1208 return "603e";
1209 case CPU_SUBTYPE_POWERPC_603ev:
1210 return "603ev";
1211 case CPU_SUBTYPE_POWERPC_604:
1212 return "604";
1213 case CPU_SUBTYPE_POWERPC_604e:
1214 return "604e";
1215 case CPU_SUBTYPE_POWERPC_620:
1216 return "620";
1217 case CPU_SUBTYPE_POWERPC_750:
1218 return "750";
1219 case CPU_SUBTYPE_POWERPC_7400:
1220 return "7400";
1221 case CPU_SUBTYPE_POWERPC_7450:
1222 return "7450";
1223 case CPU_SUBTYPE_POWERPC_970:
1224 return "970";
1225 default:;
1226 }
1227
1228 return "generic";
1229}
1230#elif defined(__linux__) && (defined(__ppc__) || defined(__powerpc__))
1231StringRef sys::getHostCPUName() {
1232 std::unique_ptr<llvm::MemoryBuffer> P = getProcCpuinfoContent();
Craig Topper8665f592018-03-07 17:53:16 +00001233 StringRef Content = P ? P->getBuffer() : "";
Simon Pilgrima271c542017-05-03 15:42:29 +00001234 return detail::getHostCPUNameForPowerPC(Content);
1235}
1236#elif defined(__linux__) && (defined(__arm__) || defined(__aarch64__))
1237StringRef sys::getHostCPUName() {
1238 std::unique_ptr<llvm::MemoryBuffer> P = getProcCpuinfoContent();
Craig Topper8665f592018-03-07 17:53:16 +00001239 StringRef Content = P ? P->getBuffer() : "";
Simon Pilgrima271c542017-05-03 15:42:29 +00001240 return detail::getHostCPUNameForARM(Content);
1241}
1242#elif defined(__linux__) && defined(__s390x__)
1243StringRef sys::getHostCPUName() {
1244 std::unique_ptr<llvm::MemoryBuffer> P = getProcCpuinfoContent();
Craig Topper8665f592018-03-07 17:53:16 +00001245 StringRef Content = P ? P->getBuffer() : "";
Simon Pilgrima271c542017-05-03 15:42:29 +00001246 return detail::getHostCPUNameForS390x(Content);
1247}
Chris Bieneman34688fa2019-10-30 12:50:04 -07001248#elif defined(__APPLE__) && defined(__aarch64__)
1249StringRef sys::getHostCPUName() {
1250 return "cyclone";
1251}
1252#elif defined(__APPLE__) && defined(__arm__)
1253StringRef sys::getHostCPUName() {
1254 host_basic_info_data_t hostInfo;
1255 mach_msg_type_number_t infoCount;
1256
1257 infoCount = HOST_BASIC_INFO_COUNT;
1258 mach_port_t hostPort = mach_host_self();
1259 host_info(hostPort, HOST_BASIC_INFO, (host_info_t)&hostInfo,
1260 &infoCount);
1261 mach_port_deallocate(mach_task_self(), hostPort);
1262
1263 if (hostInfo.cpu_type != CPU_TYPE_ARM) {
1264 assert(false && "CPUType not equal to ARM should not be possible on ARM");
1265 return "generic";
1266 }
1267 switch (hostInfo.cpu_subtype) {
1268 case CPU_SUBTYPE_ARM_V7S:
1269 return "swift";
1270 default:;
1271 }
Jim Lin466f8842020-02-18 10:48:38 +08001272
Chris Bieneman34688fa2019-10-30 12:50:04 -07001273 return "generic";
1274}
Simon Pilgrima271c542017-05-03 15:42:29 +00001275#else
1276StringRef sys::getHostCPUName() { return "generic"; }
1277#endif
1278
1279#if defined(__linux__) && defined(__x86_64__)
1280// On Linux, the number of physical cores can be computed from /proc/cpuinfo,
1281// using the number of unique physical/core id pairs. The following
1282// implementation reads the /proc/cpuinfo format on an x86_64 system.
Alexandre Ganea8404aeb2020-02-13 22:49:57 -05001283int computeHostNumPhysicalCores() {
Simon Pilgrima271c542017-05-03 15:42:29 +00001284 // Read /proc/cpuinfo as a stream (until EOF reached). It cannot be
1285 // mmapped because it appears to have 0 size.
1286 llvm::ErrorOr<std::unique_ptr<llvm::MemoryBuffer>> Text =
1287 llvm::MemoryBuffer::getFileAsStream("/proc/cpuinfo");
1288 if (std::error_code EC = Text.getError()) {
1289 llvm::errs() << "Can't read "
1290 << "/proc/cpuinfo: " << EC.message() << "\n";
1291 return -1;
1292 }
1293 SmallVector<StringRef, 8> strs;
1294 (*Text)->getBuffer().split(strs, "\n", /*MaxSplit=*/-1,
1295 /*KeepEmpty=*/false);
1296 int CurPhysicalId = -1;
1297 int CurCoreId = -1;
1298 SmallSet<std::pair<int, int>, 32> UniqueItems;
1299 for (auto &Line : strs) {
1300 Line = Line.trim();
1301 if (!Line.startswith("physical id") && !Line.startswith("core id"))
1302 continue;
1303 std::pair<StringRef, StringRef> Data = Line.split(':');
1304 auto Name = Data.first.trim();
1305 auto Val = Data.second.trim();
1306 if (Name == "physical id") {
1307 assert(CurPhysicalId == -1 &&
1308 "Expected a core id before seeing another physical id");
1309 Val.getAsInteger(10, CurPhysicalId);
1310 }
1311 if (Name == "core id") {
1312 assert(CurCoreId == -1 &&
1313 "Expected a physical id before seeing another core id");
1314 Val.getAsInteger(10, CurCoreId);
1315 }
1316 if (CurPhysicalId != -1 && CurCoreId != -1) {
1317 UniqueItems.insert(std::make_pair(CurPhysicalId, CurCoreId));
1318 CurPhysicalId = -1;
1319 CurCoreId = -1;
1320 }
1321 }
1322 return UniqueItems.size();
1323}
1324#elif defined(__APPLE__) && defined(__x86_64__)
1325#include <sys/param.h>
1326#include <sys/sysctl.h>
1327
1328// Gets the number of *physical cores* on the machine.
Alexandre Ganea8404aeb2020-02-13 22:49:57 -05001329int computeHostNumPhysicalCores() {
Simon Pilgrima271c542017-05-03 15:42:29 +00001330 uint32_t count;
1331 size_t len = sizeof(count);
1332 sysctlbyname("hw.physicalcpu", &count, &len, NULL, 0);
1333 if (count < 1) {
1334 int nm[2];
1335 nm[0] = CTL_HW;
1336 nm[1] = HW_AVAILCPU;
1337 sysctl(nm, 2, &count, &len, NULL, 0);
1338 if (count < 1)
1339 return -1;
1340 }
1341 return count;
1342}
Amy Huangcb36bfa2020-02-14 15:31:45 -08001343#elif defined(_WIN32) && LLVM_ENABLE_THREADS != 0
Alexandre Ganea8404aeb2020-02-13 22:49:57 -05001344// Defined in llvm/lib/Support/Windows/Threading.inc
1345int computeHostNumPhysicalCores();
Simon Pilgrima271c542017-05-03 15:42:29 +00001346#else
1347// On other systems, return -1 to indicate unknown.
1348static int computeHostNumPhysicalCores() { return -1; }
1349#endif
1350
1351int sys::getHostNumPhysicalCores() {
1352 static int NumCores = computeHostNumPhysicalCores();
1353 return NumCores;
1354}
1355
1356#if defined(__i386__) || defined(_M_IX86) || \
1357 defined(__x86_64__) || defined(_M_X64)
1358bool sys::getHostCPUFeatures(StringMap<bool> &Features) {
1359 unsigned EAX = 0, EBX = 0, ECX = 0, EDX = 0;
1360 unsigned MaxLevel;
1361 union {
1362 unsigned u[3];
1363 char c[12];
1364 } text;
1365
1366 if (getX86CpuIDAndInfo(0, &MaxLevel, text.u + 0, text.u + 2, text.u + 1) ||
1367 MaxLevel < 1)
1368 return false;
1369
1370 getX86CpuIDAndInfo(1, &EAX, &EBX, &ECX, &EDX);
1371
Craig Topper8d464032019-03-20 23:35:49 +00001372 Features["cx8"] = (EDX >> 8) & 1;
Craig Topper1af7e442017-11-19 23:30:22 +00001373 Features["cmov"] = (EDX >> 15) & 1;
1374 Features["mmx"] = (EDX >> 23) & 1;
Craig Topper6829ca92019-02-13 18:21:36 +00001375 Features["fxsr"] = (EDX >> 24) & 1;
Craig Topper1af7e442017-11-19 23:30:22 +00001376 Features["sse"] = (EDX >> 25) & 1;
1377 Features["sse2"] = (EDX >> 26) & 1;
1378
1379 Features["sse3"] = (ECX >> 0) & 1;
1380 Features["pclmul"] = (ECX >> 1) & 1;
1381 Features["ssse3"] = (ECX >> 9) & 1;
1382 Features["cx16"] = (ECX >> 13) & 1;
Simon Pilgrima271c542017-05-03 15:42:29 +00001383 Features["sse4.1"] = (ECX >> 19) & 1;
1384 Features["sse4.2"] = (ECX >> 20) & 1;
Craig Topper1af7e442017-11-19 23:30:22 +00001385 Features["movbe"] = (ECX >> 22) & 1;
Simon Pilgrima271c542017-05-03 15:42:29 +00001386 Features["popcnt"] = (ECX >> 23) & 1;
Craig Topper1af7e442017-11-19 23:30:22 +00001387 Features["aes"] = (ECX >> 25) & 1;
1388 Features["rdrnd"] = (ECX >> 30) & 1;
Simon Pilgrima271c542017-05-03 15:42:29 +00001389
1390 // If CPUID indicates support for XSAVE, XRESTORE and AVX, and XGETBV
1391 // indicates that the AVX registers will be saved and restored on context
1392 // switch, then we have full AVX support.
1393 bool HasAVXSave = ((ECX >> 27) & 1) && ((ECX >> 28) & 1) &&
1394 !getX86XCR0(&EAX, &EDX) && ((EAX & 0x6) == 0x6);
Florian Hahn82921bf2019-11-21 09:03:16 +00001395#if defined(__APPLE__)
1396 // Darwin lazily saves the AVX512 context on first use: trust that the OS will
1397 // save the AVX512 context if we use AVX512 instructions, even the bit is not
1398 // set right now.
1399 bool HasAVX512Save = true;
1400#else
Simon Pilgrima271c542017-05-03 15:42:29 +00001401 // AVX512 requires additional context to be saved by the OS.
1402 bool HasAVX512Save = HasAVXSave && ((EAX & 0xe0) == 0xe0);
Florian Hahn82921bf2019-11-21 09:03:16 +00001403#endif
Simon Pilgrima271c542017-05-03 15:42:29 +00001404
Craig Topper1af7e442017-11-19 23:30:22 +00001405 Features["avx"] = HasAVXSave;
1406 Features["fma"] = ((ECX >> 12) & 1) && HasAVXSave;
1407 // Only enable XSAVE if OS has enabled support for saving YMM state.
1408 Features["xsave"] = ((ECX >> 26) & 1) && HasAVXSave;
1409 Features["f16c"] = ((ECX >> 29) & 1) && HasAVXSave;
1410
Simon Pilgrima271c542017-05-03 15:42:29 +00001411 unsigned MaxExtLevel;
1412 getX86CpuIDAndInfo(0x80000000, &MaxExtLevel, &EBX, &ECX, &EDX);
1413
1414 bool HasExtLeaf1 = MaxExtLevel >= 0x80000001 &&
1415 !getX86CpuIDAndInfo(0x80000001, &EAX, &EBX, &ECX, &EDX);
Craig Topper8d02be32018-02-17 16:52:49 +00001416 Features["sahf"] = HasExtLeaf1 && ((ECX >> 0) & 1);
Craig Topper1af7e442017-11-19 23:30:22 +00001417 Features["lzcnt"] = HasExtLeaf1 && ((ECX >> 5) & 1);
1418 Features["sse4a"] = HasExtLeaf1 && ((ECX >> 6) & 1);
1419 Features["prfchw"] = HasExtLeaf1 && ((ECX >> 8) & 1);
1420 Features["xop"] = HasExtLeaf1 && ((ECX >> 11) & 1) && HasAVXSave;
1421 Features["lwp"] = HasExtLeaf1 && ((ECX >> 15) & 1);
1422 Features["fma4"] = HasExtLeaf1 && ((ECX >> 16) & 1) && HasAVXSave;
1423 Features["tbm"] = HasExtLeaf1 && ((ECX >> 21) & 1);
Simon Pilgrima271c542017-05-03 15:42:29 +00001424 Features["mwaitx"] = HasExtLeaf1 && ((ECX >> 29) & 1);
1425
Craig Topper6cdab202018-09-24 18:55:41 +00001426 Features["64bit"] = HasExtLeaf1 && ((EDX >> 29) & 1);
1427
Gabor Buella2ef36f32018-04-11 20:01:57 +00001428 // Miscellaneous memory related features, detected by
1429 // using the 0x80000008 leaf of the CPUID instruction
Simon Pilgrima271c542017-05-03 15:42:29 +00001430 bool HasExtLeaf8 = MaxExtLevel >= 0x80000008 &&
Craig Topperdcd69792017-11-19 23:49:19 +00001431 !getX86CpuIDAndInfo(0x80000008, &EAX, &EBX, &ECX, &EDX);
Gabor Buella2ef36f32018-04-11 20:01:57 +00001432 Features["clzero"] = HasExtLeaf8 && ((EBX >> 0) & 1);
1433 Features["wbnoinvd"] = HasExtLeaf8 && ((EBX >> 9) & 1);
Simon Pilgrima271c542017-05-03 15:42:29 +00001434
1435 bool HasLeaf7 =
1436 MaxLevel >= 7 && !getX86CpuIDAndInfoEx(0x7, 0x0, &EAX, &EBX, &ECX, &EDX);
1437
Craig Topper1af7e442017-11-19 23:30:22 +00001438 Features["fsgsbase"] = HasLeaf7 && ((EBX >> 0) & 1);
1439 Features["sgx"] = HasLeaf7 && ((EBX >> 2) & 1);
1440 Features["bmi"] = HasLeaf7 && ((EBX >> 3) & 1);
Simon Pilgrima271c542017-05-03 15:42:29 +00001441 // AVX2 is only supported if we have the OS save support from AVX.
Craig Topper1af7e442017-11-19 23:30:22 +00001442 Features["avx2"] = HasLeaf7 && ((EBX >> 5) & 1) && HasAVXSave;
1443 Features["bmi2"] = HasLeaf7 && ((EBX >> 8) & 1);
Gabor Buellad2f1ab12018-05-25 06:32:05 +00001444 Features["invpcid"] = HasLeaf7 && ((EBX >> 10) & 1);
Craig Topper1af7e442017-11-19 23:30:22 +00001445 Features["rtm"] = HasLeaf7 && ((EBX >> 11) & 1);
Simon Pilgrima271c542017-05-03 15:42:29 +00001446 // AVX512 is only supported if the OS supports the context save for it.
Craig Topper1af7e442017-11-19 23:30:22 +00001447 Features["avx512f"] = HasLeaf7 && ((EBX >> 16) & 1) && HasAVX512Save;
1448 Features["avx512dq"] = HasLeaf7 && ((EBX >> 17) & 1) && HasAVX512Save;
1449 Features["rdseed"] = HasLeaf7 && ((EBX >> 18) & 1);
1450 Features["adx"] = HasLeaf7 && ((EBX >> 19) & 1);
Simon Pilgrima271c542017-05-03 15:42:29 +00001451 Features["avx512ifma"] = HasLeaf7 && ((EBX >> 21) & 1) && HasAVX512Save;
Craig Topper1af7e442017-11-19 23:30:22 +00001452 Features["clflushopt"] = HasLeaf7 && ((EBX >> 23) & 1);
1453 Features["clwb"] = HasLeaf7 && ((EBX >> 24) & 1);
1454 Features["avx512pf"] = HasLeaf7 && ((EBX >> 26) & 1) && HasAVX512Save;
1455 Features["avx512er"] = HasLeaf7 && ((EBX >> 27) & 1) && HasAVX512Save;
1456 Features["avx512cd"] = HasLeaf7 && ((EBX >> 28) & 1) && HasAVX512Save;
1457 Features["sha"] = HasLeaf7 && ((EBX >> 29) & 1);
1458 Features["avx512bw"] = HasLeaf7 && ((EBX >> 30) & 1) && HasAVX512Save;
1459 Features["avx512vl"] = HasLeaf7 && ((EBX >> 31) & 1) && HasAVX512Save;
Simon Pilgrima271c542017-05-03 15:42:29 +00001460
Craig Topper1af7e442017-11-19 23:30:22 +00001461 Features["prefetchwt1"] = HasLeaf7 && ((ECX >> 0) & 1);
1462 Features["avx512vbmi"] = HasLeaf7 && ((ECX >> 1) & 1) && HasAVX512Save;
Craig Topper9b03f672017-11-21 18:50:41 +00001463 Features["pku"] = HasLeaf7 && ((ECX >> 4) & 1);
Gabor Buella31fa8022018-04-20 18:42:47 +00001464 Features["waitpkg"] = HasLeaf7 && ((ECX >> 5) & 1);
Coby Tayree71e37cc2017-11-21 09:48:44 +00001465 Features["avx512vbmi2"] = HasLeaf7 && ((ECX >> 6) & 1) && HasAVX512Save;
Oren Ben Simhonfa582b02017-11-26 13:02:45 +00001466 Features["shstk"] = HasLeaf7 && ((ECX >> 7) & 1);
Coby Tayreed8b17be2017-11-26 09:36:41 +00001467 Features["gfni"] = HasLeaf7 && ((ECX >> 8) & 1);
Craig Topper9b03f672017-11-21 18:50:41 +00001468 Features["vaes"] = HasLeaf7 && ((ECX >> 9) & 1) && HasAVXSave;
1469 Features["vpclmulqdq"] = HasLeaf7 && ((ECX >> 10) & 1) && HasAVXSave;
1470 Features["avx512vnni"] = HasLeaf7 && ((ECX >> 11) & 1) && HasAVX512Save;
1471 Features["avx512bitalg"] = HasLeaf7 && ((ECX >> 12) & 1) && HasAVX512Save;
Yonghong Songdc1dbf62017-08-23 04:25:57 +00001472 Features["avx512vpopcntdq"] = HasLeaf7 && ((ECX >> 14) & 1) && HasAVX512Save;
Craig Topper84b26b92018-01-18 23:52:31 +00001473 Features["rdpid"] = HasLeaf7 && ((ECX >> 22) & 1);
Gabor Buella604be442018-04-13 07:35:08 +00001474 Features["cldemote"] = HasLeaf7 && ((ECX >> 25) & 1);
Gabor Buellac8ded042018-05-01 10:01:16 +00001475 Features["movdiri"] = HasLeaf7 && ((ECX >> 27) & 1);
1476 Features["movdir64b"] = HasLeaf7 && ((ECX >> 28) & 1);
Pengfei Wang1f67d942019-05-30 03:59:16 +00001477 Features["enqcmd"] = HasLeaf7 && ((ECX >> 29) & 1);
Craig Topper84b26b92018-01-18 23:52:31 +00001478
Gabor Buella2b5e9602018-05-08 06:47:36 +00001479 // There are two CPUID leafs which information associated with the pconfig
1480 // instruction:
1481 // EAX=0x7, ECX=0x0 indicates the availability of the instruction (via the 18th
1482 // bit of EDX), while the EAX=0x1b leaf returns information on the
1483 // availability of specific pconfig leafs.
1484 // The target feature here only refers to the the first of these two.
1485 // Users might need to check for the availability of specific pconfig
1486 // leaves using cpuid, since that information is ignored while
1487 // detecting features using the "-march=native" flag.
1488 // For more info, see X86 ISA docs.
1489 Features["pconfig"] = HasLeaf7 && ((EDX >> 18) & 1);
Luo, Yuankebeec41c2019-05-06 08:22:37 +00001490 bool HasLeaf7Subleaf1 =
1491 MaxLevel >= 7 && !getX86CpuIDAndInfoEx(0x7, 0x1, &EAX, &EBX, &ECX, &EDX);
1492 Features["avx512bf16"] = HasLeaf7Subleaf1 && ((EAX >> 5) & 1) && HasAVX512Save;
Gabor Buella2b5e9602018-05-08 06:47:36 +00001493
Simon Pilgrima271c542017-05-03 15:42:29 +00001494 bool HasLeafD = MaxLevel >= 0xd &&
1495 !getX86CpuIDAndInfoEx(0xd, 0x1, &EAX, &EBX, &ECX, &EDX);
1496
1497 // Only enable XSAVE if OS has enabled support for saving YMM state.
Craig Topper1af7e442017-11-19 23:30:22 +00001498 Features["xsaveopt"] = HasLeafD && ((EAX >> 0) & 1) && HasAVXSave;
1499 Features["xsavec"] = HasLeafD && ((EAX >> 1) & 1) && HasAVXSave;
1500 Features["xsaves"] = HasLeafD && ((EAX >> 3) & 1) && HasAVXSave;
Simon Pilgrima271c542017-05-03 15:42:29 +00001501
Gabor Buellaa832b222018-05-10 07:26:05 +00001502 bool HasLeaf14 = MaxLevel >= 0x14 &&
1503 !getX86CpuIDAndInfoEx(0x14, 0x0, &EAX, &EBX, &ECX, &EDX);
1504
1505 Features["ptwrite"] = HasLeaf14 && ((EBX >> 4) & 1);
1506
Simon Pilgrima271c542017-05-03 15:42:29 +00001507 return true;
1508}
1509#elif defined(__linux__) && (defined(__arm__) || defined(__aarch64__))
1510bool sys::getHostCPUFeatures(StringMap<bool> &Features) {
1511 std::unique_ptr<llvm::MemoryBuffer> P = getProcCpuinfoContent();
1512 if (!P)
1513 return false;
1514
1515 SmallVector<StringRef, 32> Lines;
1516 P->getBuffer().split(Lines, "\n");
1517
1518 SmallVector<StringRef, 32> CPUFeatures;
1519
1520 // Look for the CPU features.
1521 for (unsigned I = 0, E = Lines.size(); I != E; ++I)
1522 if (Lines[I].startswith("Features")) {
1523 Lines[I].split(CPUFeatures, ' ');
1524 break;
1525 }
1526
1527#if defined(__aarch64__)
1528 // Keep track of which crypto features we have seen
1529 enum { CAP_AES = 0x1, CAP_PMULL = 0x2, CAP_SHA1 = 0x4, CAP_SHA2 = 0x8 };
1530 uint32_t crypto = 0;
1531#endif
1532
1533 for (unsigned I = 0, E = CPUFeatures.size(); I != E; ++I) {
1534 StringRef LLVMFeatureStr = StringSwitch<StringRef>(CPUFeatures[I])
1535#if defined(__aarch64__)
1536 .Case("asimd", "neon")
1537 .Case("fp", "fp-armv8")
1538 .Case("crc32", "crc")
1539#else
1540 .Case("half", "fp16")
1541 .Case("neon", "neon")
1542 .Case("vfpv3", "vfp3")
1543 .Case("vfpv3d16", "d16")
1544 .Case("vfpv4", "vfp4")
1545 .Case("idiva", "hwdiv-arm")
1546 .Case("idivt", "hwdiv")
1547#endif
1548 .Default("");
1549
1550#if defined(__aarch64__)
1551 // We need to check crypto separately since we need all of the crypto
1552 // extensions to enable the subtarget feature
1553 if (CPUFeatures[I] == "aes")
1554 crypto |= CAP_AES;
1555 else if (CPUFeatures[I] == "pmull")
1556 crypto |= CAP_PMULL;
1557 else if (CPUFeatures[I] == "sha1")
1558 crypto |= CAP_SHA1;
1559 else if (CPUFeatures[I] == "sha2")
1560 crypto |= CAP_SHA2;
1561#endif
1562
1563 if (LLVMFeatureStr != "")
1564 Features[LLVMFeatureStr] = true;
1565 }
1566
1567#if defined(__aarch64__)
1568 // If we have all crypto bits we can add the feature
1569 if (crypto == (CAP_AES | CAP_PMULL | CAP_SHA1 | CAP_SHA2))
1570 Features["crypto"] = true;
1571#endif
1572
1573 return true;
1574}
Martin Storsjo353ac422019-10-02 11:04:55 +00001575#elif defined(_WIN32) && (defined(__aarch64__) || defined(_M_ARM64))
1576bool sys::getHostCPUFeatures(StringMap<bool> &Features) {
1577 if (IsProcessorFeaturePresent(PF_ARM_NEON_INSTRUCTIONS_AVAILABLE))
1578 Features["neon"] = true;
1579 if (IsProcessorFeaturePresent(PF_ARM_V8_CRC32_INSTRUCTIONS_AVAILABLE))
1580 Features["crc"] = true;
1581 if (IsProcessorFeaturePresent(PF_ARM_V8_CRYPTO_INSTRUCTIONS_AVAILABLE))
1582 Features["crypto"] = true;
1583
1584 return true;
1585}
Simon Pilgrima271c542017-05-03 15:42:29 +00001586#else
1587bool sys::getHostCPUFeatures(StringMap<bool> &Features) { return false; }
1588#endif
1589
1590std::string sys::getProcessTriple() {
Alex Lorenz3803df32017-07-07 09:53:47 +00001591 std::string TargetTripleString = updateTripleOSVersion(LLVM_HOST_TRIPLE);
1592 Triple PT(Triple::normalize(TargetTripleString));
Simon Pilgrima271c542017-05-03 15:42:29 +00001593
1594 if (sizeof(void *) == 8 && PT.isArch32Bit())
1595 PT = PT.get64BitArchVariant();
1596 if (sizeof(void *) == 4 && PT.isArch64Bit())
1597 PT = PT.get32BitArchVariant();
1598
1599 return PT.str();
1600}