blob: ffad1d79ad02026540fa600a1982a7e37a6d874c [file] [log] [blame]
Daniel Dunbare52e6bf2008-10-02 01:17:28 +00001//===-- Host.cpp - Implement OS Host Concept --------------------*- C++ -*-===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
Hans Wennborgcfe341f2014-06-20 01:36:00 +000010// This file implements the operating system Host concept.
Daniel Dunbare52e6bf2008-10-02 01:17:28 +000011//
12//===----------------------------------------------------------------------===//
13
Chandler Carruthed0881b2012-12-03 16:50:05 +000014#include "llvm/Support/Host.h"
Benjamin Kramerefe40282012-06-26 21:36:32 +000015#include "llvm/ADT/SmallVector.h"
Hal Finkel59b0ee82012-06-12 03:03:13 +000016#include "llvm/ADT/StringRef.h"
17#include "llvm/ADT/StringSwitch.h"
Peter Collingbournea51c6ed2013-01-16 17:27:22 +000018#include "llvm/ADT/Triple.h"
Chandler Carruthed0881b2012-12-03 16:50:05 +000019#include "llvm/Config/config.h"
Hal Finkel59b0ee82012-06-12 03:03:13 +000020#include "llvm/Support/Debug.h"
Rafael Espindola97935a92014-12-17 02:32:44 +000021#include "llvm/Support/FileSystem.h"
Hal Finkel59b0ee82012-06-12 03:03:13 +000022#include "llvm/Support/raw_ostream.h"
Daniel Dunbar241d01b2009-11-14 10:09:12 +000023#include <string.h>
Daniel Dunbare52e6bf2008-10-02 01:17:28 +000024
25// Include the platform-specific parts of this class.
26#ifdef LLVM_ON_UNIX
27#include "Unix/Host.inc"
28#endif
29#ifdef LLVM_ON_WIN32
Michael J. Spencer447762d2010-11-29 18:16:10 +000030#include "Windows/Host.inc"
Daniel Dunbare52e6bf2008-10-02 01:17:28 +000031#endif
Benjamin Kramer38465062009-11-19 12:17:31 +000032#ifdef _MSC_VER
33#include <intrin.h>
34#endif
Hal Finkel59b0ee82012-06-12 03:03:13 +000035#if defined(__APPLE__) && (defined(__ppc__) || defined(__powerpc__))
36#include <mach/mach.h>
37#include <mach/mach_host.h>
38#include <mach/host_info.h>
39#include <mach/machine.h>
40#endif
Daniel Dunbare52e6bf2008-10-02 01:17:28 +000041
Chandler Carruth66f38db2014-04-21 23:58:10 +000042#define DEBUG_TYPE "host-detection"
43
Daniel Dunbar241d01b2009-11-14 10:09:12 +000044//===----------------------------------------------------------------------===//
45//
46// Implementations of the CPU detection routines
47//
48//===----------------------------------------------------------------------===//
49
50using namespace llvm;
51
Rafael Espindola81adfb52014-12-17 02:42:20 +000052#if defined(__linux__)
Rafael Espindola97935a92014-12-17 02:32:44 +000053static ssize_t LLVM_ATTRIBUTE_UNUSED readCpuInfo(void *Buf, size_t Size) {
Rafael Espindola97935a92014-12-17 02:32:44 +000054 // Note: We cannot mmap /proc/cpuinfo here and then process the resulting
55 // memory buffer because the 'file' has 0 size (it can be read from only
56 // as a stream).
57
58 int FD;
59 std::error_code EC = sys::fs::openFileForRead("/proc/cpuinfo", FD);
60 if (EC) {
61 DEBUG(dbgs() << "Unable to open /proc/cpuinfo: " << EC.message() << "\n");
62 return -1;
63 }
64 int Ret = read(FD, Buf, Size);
65 int CloseStatus = close(FD);
66 if (CloseStatus)
67 return -1;
68 return Ret;
69}
Rafael Espindola81adfb52014-12-17 02:42:20 +000070#endif
Rafael Espindola97935a92014-12-17 02:32:44 +000071
Daniel Dunbar241d01b2009-11-14 10:09:12 +000072#if defined(i386) || defined(__i386__) || defined(__x86__) || defined(_M_IX86)\
73 || defined(__x86_64__) || defined(_M_AMD64) || defined (_M_X64)
74
75/// GetX86CpuIDAndInfo - Execute the specified cpuid and return the 4 values in the
76/// specified arguments. If we can't run cpuid on the host, return true.
Reid Klecknerbe85cb92013-08-14 18:21:51 +000077static bool GetX86CpuIDAndInfo(unsigned value, unsigned *rEAX, unsigned *rEBX,
78 unsigned *rECX, unsigned *rEDX) {
Reid Klecknerbf4f9eb2013-08-16 22:42:42 +000079#if defined(__GNUC__) || defined(__clang__)
Reid Klecknerbe85cb92013-08-14 18:21:51 +000080 #if defined(__x86_64__) || defined(_M_AMD64) || defined (_M_X64)
Daniel Dunbar241d01b2009-11-14 10:09:12 +000081 // gcc doesn't know cpuid would clobber ebx/rbx. Preseve it manually.
82 asm ("movq\t%%rbx, %%rsi\n\t"
83 "cpuid\n\t"
84 "xchgq\t%%rbx, %%rsi\n\t"
85 : "=a" (*rEAX),
86 "=S" (*rEBX),
87 "=c" (*rECX),
88 "=d" (*rEDX)
89 : "a" (value));
90 return false;
Reid Klecknerbe85cb92013-08-14 18:21:51 +000091 #elif defined(i386) || defined(__i386__) || defined(__x86__) || defined(_M_IX86)
Daniel Dunbar241d01b2009-11-14 10:09:12 +000092 asm ("movl\t%%ebx, %%esi\n\t"
93 "cpuid\n\t"
94 "xchgl\t%%ebx, %%esi\n\t"
95 : "=a" (*rEAX),
96 "=S" (*rEBX),
97 "=c" (*rECX),
98 "=d" (*rEDX)
99 : "a" (value));
100 return false;
David Blaikieb48ed1a2012-01-17 04:43:56 +0000101// pedantic #else returns to appease -Wunreachable-code (so we don't generate
102// postprocessed code that looks like "return true; return false;")
103 #else
104 return true;
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000105 #endif
Reid Klecknerbf4f9eb2013-08-16 22:42:42 +0000106#elif defined(_MSC_VER)
107 // The MSVC intrinsic is portable across x86 and x64.
108 int registers[4];
109 __cpuid(registers, value);
110 *rEAX = registers[0];
111 *rEBX = registers[1];
112 *rECX = registers[2];
113 *rEDX = registers[3];
114 return false;
David Blaikieb48ed1a2012-01-17 04:43:56 +0000115#else
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000116 return true;
David Blaikieb48ed1a2012-01-17 04:43:56 +0000117#endif
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000118}
119
Tim Northover89ccb612013-11-25 09:52:59 +0000120/// GetX86CpuIDAndInfoEx - Execute the specified cpuid with subleaf and return the
121/// 4 values in the specified arguments. If we can't run cpuid on the host,
122/// return true.
Benjamin Kramer583b00e2013-11-25 15:40:24 +0000123static bool GetX86CpuIDAndInfoEx(unsigned value, unsigned subleaf,
124 unsigned *rEAX, unsigned *rEBX, unsigned *rECX,
125 unsigned *rEDX) {
Tim Northover89ccb612013-11-25 09:52:59 +0000126#if defined(__x86_64__) || defined(_M_AMD64) || defined (_M_X64)
127 #if defined(__GNUC__)
128 // gcc doesn't know cpuid would clobber ebx/rbx. Preseve it manually.
129 asm ("movq\t%%rbx, %%rsi\n\t"
130 "cpuid\n\t"
131 "xchgq\t%%rbx, %%rsi\n\t"
132 : "=a" (*rEAX),
133 "=S" (*rEBX),
134 "=c" (*rECX),
135 "=d" (*rEDX)
136 : "a" (value),
137 "c" (subleaf));
138 return false;
139 #elif defined(_MSC_VER)
Aaron Ballmanb664e2a2015-02-16 18:23:00 +0000140 int registers[4];
141 __cpuidex(registers, value, subleaf);
142 *rEAX = registers[0];
143 *rEBX = registers[1];
144 *rECX = registers[2];
145 *rEDX = registers[3];
146 return false;
Tim Northover89ccb612013-11-25 09:52:59 +0000147 #else
148 return true;
149 #endif
150#elif defined(i386) || defined(__i386__) || defined(__x86__) || defined(_M_IX86)
151 #if defined(__GNUC__)
152 asm ("movl\t%%ebx, %%esi\n\t"
153 "cpuid\n\t"
154 "xchgl\t%%ebx, %%esi\n\t"
155 : "=a" (*rEAX),
156 "=S" (*rEBX),
157 "=c" (*rECX),
158 "=d" (*rEDX)
159 : "a" (value),
160 "c" (subleaf));
161 return false;
162 #elif defined(_MSC_VER)
163 __asm {
164 mov eax,value
165 mov ecx,subleaf
166 cpuid
167 mov esi,rEAX
168 mov dword ptr [esi],eax
169 mov esi,rEBX
170 mov dword ptr [esi],ebx
171 mov esi,rECX
172 mov dword ptr [esi],ecx
173 mov esi,rEDX
174 mov dword ptr [esi],edx
175 }
176 return false;
177 #else
178 return true;
179 #endif
180#else
181 return true;
182#endif
183}
184
Craig Topper798a2602015-03-29 01:00:23 +0000185static bool GetX86XCR0(unsigned *rEAX, unsigned *rEDX) {
Craig Topper7af39d72013-04-22 05:38:01 +0000186#if defined(__GNUC__)
187 // Check xgetbv; this uses a .byte sequence instead of the instruction
188 // directly because older assemblers do not include support for xgetbv and
189 // there is no easy way to conditionally compile based on the assembler used.
Craig Topper798a2602015-03-29 01:00:23 +0000190 __asm__ (".byte 0x0f, 0x01, 0xd0" : "=a" (*rEAX), "=d" (*rEDX) : "c" (0));
191 return false;
Aaron Ballman31c0adc2013-04-23 17:38:44 +0000192#elif defined(_MSC_FULL_VER) && defined(_XCR_XFEATURE_ENABLED_MASK)
Craig Topper798a2602015-03-29 01:00:23 +0000193 unsigned long long Result = _xgetbv(_XCR_XFEATURE_ENABLED_MASK);
Craig Topper7db49fd2015-03-29 01:07:57 +0000194 *rEAX = Result;
195 *rEDX = Result >> 32;
Craig Topper798a2602015-03-29 01:00:23 +0000196 return false;
Craig Topper7af39d72013-04-22 05:38:01 +0000197#else
Craig Topper798a2602015-03-29 01:00:23 +0000198 return true;
Craig Topper7af39d72013-04-22 05:38:01 +0000199#endif
Aaron Ballman5f7c6802013-04-03 12:25:06 +0000200}
201
Chris Lattner963debc2010-09-06 05:19:44 +0000202static void DetectX86FamilyModel(unsigned EAX, unsigned &Family,
203 unsigned &Model) {
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000204 Family = (EAX >> 8) & 0xf; // Bits 8 - 11
205 Model = (EAX >> 4) & 0xf; // Bits 4 - 7
206 if (Family == 6 || Family == 0xf) {
207 if (Family == 0xf)
208 // Examine extended family ID if family ID is F.
209 Family += (EAX >> 20) & 0xff; // Bits 20 - 27
210 // Examine extended model ID if family ID is 6 or F.
211 Model += ((EAX >> 16) & 0xf) << 4; // Bits 16 - 19
212 }
213}
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000214
Rafael Espindola74f444c2013-12-12 15:45:32 +0000215StringRef sys::getHostCPUName() {
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000216 unsigned EAX = 0, EBX = 0, ECX = 0, EDX = 0;
217 if (GetX86CpuIDAndInfo(0x1, &EAX, &EBX, &ECX, &EDX))
218 return "generic";
219 unsigned Family = 0;
220 unsigned Model = 0;
221 DetectX86FamilyModel(EAX, Family, Model);
222
Tim Northover89ccb612013-11-25 09:52:59 +0000223 union {
224 unsigned u[3];
225 char c[12];
226 } text;
227
Craig Topper1214bdc2015-03-31 05:42:45 +0000228 unsigned MaxLeaf;
229 GetX86CpuIDAndInfo(0, &MaxLeaf, text.u+0, text.u+2, text.u+1);
Tim Northover89ccb612013-11-25 09:52:59 +0000230
Craig Topper1214bdc2015-03-31 05:42:45 +0000231 bool HasMMX = (EDX >> 23) & 1;
232 bool HasSSE = (EDX >> 25) & 1;
233 bool HasSSE2 = (EDX >> 26) & 1;
234 bool HasSSE3 = (ECX >> 0) & 1;
235 bool HasSSSE3 = (ECX >> 9) & 1;
236 bool HasSSE41 = (ECX >> 19) & 1;
237 bool HasSSE42 = (ECX >> 20) & 1;
238 bool HasMOVBE = (ECX >> 22) & 1;
239 // If CPUID indicates support for XSAVE, XRESTORE and AVX, and XGETBV
Aaron Ballman5f7c6802013-04-03 12:25:06 +0000240 // indicates that the AVX registers will be saved and restored on context
241 // switch, then we have full AVX support.
Aaron Ballman5e6d2052013-04-03 18:00:22 +0000242 const unsigned AVXBits = (1 << 27) | (1 << 28);
Craig Topper798a2602015-03-29 01:00:23 +0000243 bool HasAVX = ((ECX & AVXBits) == AVXBits) && !GetX86XCR0(&EAX, &EDX) &&
244 ((EAX & 0x6) == 0x6);
Craig Topper1214bdc2015-03-31 05:42:45 +0000245 bool HasAVX512Save = HasAVX && ((EAX & 0xe0) == 0xe0);
246 bool HasLeaf7 = MaxLeaf >= 0x7 &&
247 !GetX86CpuIDAndInfoEx(0x7, 0x0, &EAX, &EBX, &ECX, &EDX);
248 bool HasADX = HasLeaf7 && ((EBX >> 19) & 1);
249 bool HasAVX2 = HasAVX && HasLeaf7 && (EBX & 0x20);
250 bool HasAVX512 = HasLeaf7 && HasAVX512Save && ((EBX >> 16) & 1);
251
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000252 GetX86CpuIDAndInfo(0x80000001, &EAX, &EBX, &ECX, &EDX);
253 bool Em64T = (EDX >> 29) & 0x1;
Kaelyn Takataa39d2a02014-05-05 16:32:10 +0000254 bool HasTBM = (ECX >> 21) & 0x1;
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000255
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000256 if (memcmp(text.c, "GenuineIntel", 12) == 0) {
257 switch (Family) {
Daniel Dunbar397235f2009-11-14 21:36:19 +0000258 case 3:
259 return "i386";
260 case 4:
261 switch (Model) {
NAKAMURA Takumi19e11f12010-09-09 13:30:48 +0000262 case 0: // Intel486 DX processors
263 case 1: // Intel486 DX processors
Daniel Dunbar397235f2009-11-14 21:36:19 +0000264 case 2: // Intel486 SX processors
NAKAMURA Takumi19e11f12010-09-09 13:30:48 +0000265 case 3: // Intel487 processors, IntelDX2 OverDrive processors,
266 // IntelDX2 processors
Daniel Dunbar397235f2009-11-14 21:36:19 +0000267 case 4: // Intel486 SL processor
NAKAMURA Takumi19e11f12010-09-09 13:30:48 +0000268 case 5: // IntelSX2 processors
Daniel Dunbar397235f2009-11-14 21:36:19 +0000269 case 7: // Write-Back Enhanced IntelDX2 processors
NAKAMURA Takumi19e11f12010-09-09 13:30:48 +0000270 case 8: // IntelDX4 OverDrive processors, IntelDX4 processors
Daniel Dunbar397235f2009-11-14 21:36:19 +0000271 default: return "i486";
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000272 }
Daniel Dunbar397235f2009-11-14 21:36:19 +0000273 case 5:
274 switch (Model) {
275 case 1: // Pentium OverDrive processor for Pentium processor (60, 66),
NAKAMURA Takumi19e11f12010-09-09 13:30:48 +0000276 // Pentium processors (60, 66)
Daniel Dunbar397235f2009-11-14 21:36:19 +0000277 case 2: // Pentium OverDrive processor for Pentium processor (75, 90,
278 // 100, 120, 133), Pentium processors (75, 90, 100, 120, 133,
279 // 150, 166, 200)
280 case 3: // Pentium OverDrive processors for Intel486 processor-based
281 // systems
282 return "pentium";
283
NAKAMURA Takumi19e11f12010-09-09 13:30:48 +0000284 case 4: // Pentium OverDrive processor with MMX technology for Pentium
Daniel Dunbar397235f2009-11-14 21:36:19 +0000285 // processor (75, 90, 100, 120, 133), Pentium processor with
NAKAMURA Takumi19e11f12010-09-09 13:30:48 +0000286 // MMX technology (166, 200)
Daniel Dunbar397235f2009-11-14 21:36:19 +0000287 return "pentium-mmx";
288
289 default: return "pentium";
290 }
291 case 6:
292 switch (Model) {
293 case 1: // Pentium Pro processor
294 return "pentiumpro";
295
296 case 3: // Intel Pentium II OverDrive processor, Pentium II processor,
297 // model 03
298 case 5: // Pentium II processor, model 05, Pentium II Xeon processor,
NAKAMURA Takumi19e11f12010-09-09 13:30:48 +0000299 // model 05, and Intel Celeron processor, model 05
Daniel Dunbar397235f2009-11-14 21:36:19 +0000300 case 6: // Celeron processor, model 06
301 return "pentium2";
302
303 case 7: // Pentium III processor, model 07, and Pentium III Xeon
304 // processor, model 07
305 case 8: // Pentium III processor, model 08, Pentium III Xeon processor,
306 // model 08, and Celeron processor, model 08
307 case 10: // Pentium III Xeon processor, model 0Ah
308 case 11: // Pentium III processor, model 0Bh
309 return "pentium3";
310
311 case 9: // Intel Pentium M processor, Intel Celeron M processor model 09.
312 case 13: // Intel Pentium M processor, Intel Celeron M processor, model
313 // 0Dh. All processors are manufactured using the 90 nm process.
Craig Topper06682852015-03-30 06:31:06 +0000314 case 21: // Intel EP80579 Integrated Processor and Intel EP80579
315 // Integrated Processor with Intel QuickAssist Technology
Daniel Dunbar397235f2009-11-14 21:36:19 +0000316 return "pentium-m";
317
NAKAMURA Takumi19e11f12010-09-09 13:30:48 +0000318 case 14: // Intel Core Duo processor, Intel Core Solo processor, model
Daniel Dunbar397235f2009-11-14 21:36:19 +0000319 // 0Eh. All processors are manufactured using the 65 nm process.
320 return "yonah";
321
NAKAMURA Takumi19e11f12010-09-09 13:30:48 +0000322 case 15: // Intel Core 2 Duo processor, Intel Core 2 Duo mobile
323 // processor, Intel Core 2 Quad processor, Intel Core 2 Quad
324 // mobile processor, Intel Core 2 Extreme processor, Intel
Daniel Dunbar397235f2009-11-14 21:36:19 +0000325 // Pentium Dual-Core processor, Intel Xeon processor, model
326 // 0Fh. All processors are manufactured using the 65 nm process.
327 case 22: // Intel Celeron processor model 16h. All processors are
328 // manufactured using the 65 nm process
329 return "core2";
330
NAKAMURA Takumi19e11f12010-09-09 13:30:48 +0000331 case 23: // Intel Core 2 Extreme processor, Intel Xeon processor, model
Daniel Dunbar397235f2009-11-14 21:36:19 +0000332 // 17h. All processors are manufactured using the 45 nm process.
333 //
334 // 45nm: Penryn , Wolfdale, Yorkfield (XE)
Craig Topper4e78a922015-03-30 06:31:03 +0000335 case 29: // Intel Xeon processor MP. All processors are manufactured using
336 // the 45 nm process.
Craig Topper545b9512015-03-31 06:18:31 +0000337 return "penryn";
Daniel Dunbar397235f2009-11-14 21:36:19 +0000338
339 case 26: // Intel Core i7 processor and Intel Xeon processor. All
340 // processors are manufactured using the 45 nm process.
Jakob Stoklund Olesen49e58a92010-09-19 17:54:28 +0000341 case 30: // Intel(R) Core(TM) i7 CPU 870 @ 2.93GHz.
342 // As found in a Summer 2010 model iMac.
Craig Topper3c2e7582015-03-30 06:31:09 +0000343 case 46: // Nehalem EX
344 return "nehalem";
Chris Lattnerb737bac2010-09-19 00:31:58 +0000345 case 37: // Intel Core i7, laptop version.
Benjamin Kramer5a122f32011-08-25 18:05:56 +0000346 case 44: // Intel Core i7 processor and Intel Xeon processor. All
347 // processors are manufactured using the 32 nm process.
Benjamin Kramer9d6063a2012-09-26 18:21:47 +0000348 case 47: // Westmere EX
Craig Topper3c2e7582015-03-30 06:31:09 +0000349 return "westmere";
Bob Wilsond0f06002011-07-08 22:33:59 +0000350
351 // SandyBridge:
352 case 42: // Intel Core i7 processor. All processors are manufactured
353 // using the 32 nm process.
Chris Lattner889c40e2011-06-09 06:38:17 +0000354 case 45:
Craig Topper545b9512015-03-31 06:18:31 +0000355 return "sandybridge";
Daniel Dunbar397235f2009-11-14 21:36:19 +0000356
Evan Cheng7fd16072012-04-23 22:41:39 +0000357 // Ivy Bridge:
358 case 58:
Tim Northover89ccb612013-11-25 09:52:59 +0000359 case 62: // Ivy Bridge EP
Craig Topper545b9512015-03-31 06:18:31 +0000360 return "ivybridge";
Evan Cheng7fd16072012-04-23 22:41:39 +0000361
Tim Northover89ccb612013-11-25 09:52:59 +0000362 // Haswell:
363 case 60:
364 case 63:
365 case 69:
366 case 70:
Craig Topper545b9512015-03-31 06:18:31 +0000367 return "haswell";
Tim Northover89ccb612013-11-25 09:52:59 +0000368
Craig Topper1e1b0f72015-03-23 00:15:06 +0000369 // Broadwell:
370 case 61:
Craig Topper68ba18f2015-08-08 01:29:15 +0000371 case 71:
Craig Topper545b9512015-03-31 06:18:31 +0000372 return "broadwell";
Craig Topper1e1b0f72015-03-23 00:15:06 +0000373
Craig Topper68ba18f2015-08-08 01:29:15 +0000374 // Skylake:
375 case 78:
376 case 94:
377 return "skylake";
378
Preston Gurdc0b976c2012-05-02 21:38:46 +0000379 case 28: // Most 45 nm Intel Atom processors
380 case 38: // 45 nm Atom Lincroft
381 case 39: // 32 nm Atom Medfield
Preston Gurd8e082682012-07-19 19:05:37 +0000382 case 53: // 32 nm Atom Midview
383 case 54: // 32 nm Atom Midview
Craig Topper3c2e7582015-03-30 06:31:09 +0000384 return "bonnell";
Daniel Dunbar397235f2009-11-14 21:36:19 +0000385
Preston Gurd3fe264d2013-09-13 19:23:28 +0000386 // Atom Silvermont codes from the Intel software optimization guide.
387 case 55:
Benjamin Kramer8f429382013-08-30 14:05:32 +0000388 case 74:
389 case 77:
Craig Toppera3db7d22015-08-07 20:09:42 +0000390 case 90:
Craig Topperf7ce7542015-08-08 01:16:05 +0000391 case 93:
Craig Topper3c2e7582015-03-30 06:31:09 +0000392 return "silvermont";
Benjamin Kramer8f429382013-08-30 14:05:32 +0000393
Craig Topper1214bdc2015-03-31 05:42:45 +0000394 default: // Unknown family 6 CPU, try to guess.
395 if (HasAVX512)
396 return "knl";
397 if (HasADX)
398 return "broadwell";
399 if (HasAVX2)
400 return "haswell";
401 if (HasAVX)
402 return "sandybridge";
403 if (HasSSE42)
404 return HasMOVBE ? "silvermont" : "nehalem";
405 if (HasSSE41)
406 return "penryn";
407 if (HasSSSE3)
408 return HasMOVBE ? "bonnell" : "core2";
409 if (Em64T)
410 return "x86-64";
411 if (HasSSE2)
412 return "pentium-m";
413 if (HasSSE)
414 return "pentium3";
415 if (HasMMX)
416 return "pentium2";
417 return "pentiumpro";
Daniel Dunbar397235f2009-11-14 21:36:19 +0000418 }
419 case 15: {
420 switch (Model) {
421 case 0: // Pentium 4 processor, Intel Xeon processor. All processors are
422 // model 00h and manufactured using the 0.18 micron process.
423 case 1: // Pentium 4 processor, Intel Xeon processor, Intel Xeon
424 // processor MP, and Intel Celeron processor. All processors are
425 // model 01h and manufactured using the 0.18 micron process.
NAKAMURA Takumi19e11f12010-09-09 13:30:48 +0000426 case 2: // Pentium 4 processor, Mobile Intel Pentium 4 processor - M,
Daniel Dunbar397235f2009-11-14 21:36:19 +0000427 // Intel Xeon processor, Intel Xeon processor MP, Intel Celeron
428 // processor, and Mobile Intel Celeron processor. All processors
429 // are model 02h and manufactured using the 0.13 micron process.
430 return (Em64T) ? "x86-64" : "pentium4";
431
432 case 3: // Pentium 4 processor, Intel Xeon processor, Intel Celeron D
433 // processor. All processors are model 03h and manufactured using
434 // the 90 nm process.
435 case 4: // Pentium 4 processor, Pentium 4 processor Extreme Edition,
436 // Pentium D processor, Intel Xeon processor, Intel Xeon
437 // processor MP, Intel Celeron D processor. All processors are
438 // model 04h and manufactured using the 90 nm process.
439 case 6: // Pentium 4 processor, Pentium D processor, Pentium processor
440 // Extreme Edition, Intel Xeon processor, Intel Xeon processor
441 // MP, Intel Celeron D processor. All processors are model 06h
442 // and manufactured using the 65 nm process.
443 return (Em64T) ? "nocona" : "prescott";
444
Daniel Dunbar397235f2009-11-14 21:36:19 +0000445 default:
446 return (Em64T) ? "x86-64" : "pentium4";
447 }
448 }
449
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000450 default:
Benjamin Kramer713fd352009-11-17 17:57:04 +0000451 return "generic";
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000452 }
453 } else if (memcmp(text.c, "AuthenticAMD", 12) == 0) {
454 // FIXME: this poorly matches the generated SubtargetFeatureKV table. There
455 // appears to be no way to generate the wide variety of AMD-specific targets
456 // from the information returned from CPUID.
457 switch (Family) {
458 case 4:
459 return "i486";
460 case 5:
461 switch (Model) {
462 case 6:
463 case 7: return "k6";
464 case 8: return "k6-2";
465 case 9:
466 case 13: return "k6-3";
Roman Divackyfd690092012-09-12 14:36:02 +0000467 case 10: return "geode";
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000468 default: return "pentium";
469 }
470 case 6:
471 switch (Model) {
472 case 4: return "athlon-tbird";
473 case 6:
474 case 7:
475 case 8: return "athlon-mp";
476 case 10: return "athlon-xp";
477 default: return "athlon";
478 }
479 case 15:
Chris Lattner963debc2010-09-06 05:19:44 +0000480 if (HasSSE3)
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000481 return "k8-sse3";
Chris Lattner963debc2010-09-06 05:19:44 +0000482 switch (Model) {
483 case 1: return "opteron";
484 case 5: return "athlon-fx"; // also opteron
485 default: return "athlon64";
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000486 }
487 case 16:
488 return "amdfam10";
Benjamin Kramer077ae1d2012-01-10 11:50:02 +0000489 case 20:
490 return "btver1";
Benjamin Kramer3ced5452011-12-01 18:24:17 +0000491 case 21:
Benjamin Kramerb44c4272013-05-03 10:20:08 +0000492 if (!HasAVX) // If the OS doesn't support AVX provide a sane fallback.
493 return "btver1";
Benjamin Kramer60045732014-05-02 15:47:07 +0000494 if (Model >= 0x50)
495 return "bdver4"; // 50h-6Fh: Excavator
Benjamin Kramerd114def2013-11-04 10:29:20 +0000496 if (Model >= 0x30)
497 return "bdver3"; // 30h-3Fh: Steamroller
Kaelyn Takataa39d2a02014-05-05 16:32:10 +0000498 if (Model >= 0x10 || HasTBM)
Benjamin Kramerd114def2013-11-04 10:29:20 +0000499 return "bdver2"; // 10h-1Fh: Piledriver
500 return "bdver1"; // 00h-0Fh: Bulldozer
Benjamin Kramerb44c4272013-05-03 10:20:08 +0000501 case 22:
502 if (!HasAVX) // If the OS doesn't support AVX provide a sane fallback.
503 return "btver1";
504 return "btver2";
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000505 default:
Benjamin Kramer713fd352009-11-17 17:57:04 +0000506 return "generic";
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000507 }
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000508 }
Torok Edwin022336a2009-12-14 12:38:18 +0000509 return "generic";
Torok Edwinabdc1c22009-12-13 08:59:40 +0000510}
Hal Finkel59b0ee82012-06-12 03:03:13 +0000511#elif defined(__APPLE__) && (defined(__ppc__) || defined(__powerpc__))
Rafael Espindola1f58e4d2013-12-12 16:10:48 +0000512StringRef sys::getHostCPUName() {
Hal Finkel59b0ee82012-06-12 03:03:13 +0000513 host_basic_info_data_t hostInfo;
514 mach_msg_type_number_t infoCount;
515
516 infoCount = HOST_BASIC_INFO_COUNT;
517 host_info(mach_host_self(), HOST_BASIC_INFO, (host_info_t)&hostInfo,
518 &infoCount);
519
520 if (hostInfo.cpu_type != CPU_TYPE_POWERPC) return "generic";
521
522 switch(hostInfo.cpu_subtype) {
523 case CPU_SUBTYPE_POWERPC_601: return "601";
524 case CPU_SUBTYPE_POWERPC_602: return "602";
525 case CPU_SUBTYPE_POWERPC_603: return "603";
526 case CPU_SUBTYPE_POWERPC_603e: return "603e";
527 case CPU_SUBTYPE_POWERPC_603ev: return "603ev";
528 case CPU_SUBTYPE_POWERPC_604: return "604";
529 case CPU_SUBTYPE_POWERPC_604e: return "604e";
530 case CPU_SUBTYPE_POWERPC_620: return "620";
531 case CPU_SUBTYPE_POWERPC_750: return "750";
532 case CPU_SUBTYPE_POWERPC_7400: return "7400";
533 case CPU_SUBTYPE_POWERPC_7450: return "7450";
534 case CPU_SUBTYPE_POWERPC_970: return "970";
535 default: ;
536 }
537
538 return "generic";
539}
540#elif defined(__linux__) && (defined(__ppc__) || defined(__powerpc__))
Rafael Espindolab75ea012013-12-12 16:17:40 +0000541StringRef sys::getHostCPUName() {
Hal Finkel59b0ee82012-06-12 03:03:13 +0000542 // Access to the Processor Version Register (PVR) on PowerPC is privileged,
543 // and so we must use an operating-system interface to determine the current
544 // processor type. On Linux, this is exposed through the /proc/cpuinfo file.
545 const char *generic = "generic";
546
Hal Finkel59b0ee82012-06-12 03:03:13 +0000547 // The cpu line is second (after the 'processor: 0' line), so if this
548 // buffer is too small then something has changed (or is wrong).
549 char buffer[1024];
Rafael Espindola97935a92014-12-17 02:32:44 +0000550 ssize_t CPUInfoSize = readCpuInfo(buffer, sizeof(buffer));
551 if (CPUInfoSize == -1)
552 return generic;
Hal Finkel59b0ee82012-06-12 03:03:13 +0000553
554 const char *CPUInfoStart = buffer;
555 const char *CPUInfoEnd = buffer + CPUInfoSize;
556
557 const char *CIP = CPUInfoStart;
558
559 const char *CPUStart = 0;
560 size_t CPULen = 0;
561
562 // We need to find the first line which starts with cpu, spaces, and a colon.
563 // After the colon, there may be some additional spaces and then the cpu type.
564 while (CIP < CPUInfoEnd && CPUStart == 0) {
565 if (CIP < CPUInfoEnd && *CIP == '\n')
566 ++CIP;
567
568 if (CIP < CPUInfoEnd && *CIP == 'c') {
569 ++CIP;
570 if (CIP < CPUInfoEnd && *CIP == 'p') {
571 ++CIP;
572 if (CIP < CPUInfoEnd && *CIP == 'u') {
573 ++CIP;
574 while (CIP < CPUInfoEnd && (*CIP == ' ' || *CIP == '\t'))
575 ++CIP;
576
577 if (CIP < CPUInfoEnd && *CIP == ':') {
578 ++CIP;
579 while (CIP < CPUInfoEnd && (*CIP == ' ' || *CIP == '\t'))
580 ++CIP;
581
582 if (CIP < CPUInfoEnd) {
583 CPUStart = CIP;
584 while (CIP < CPUInfoEnd && (*CIP != ' ' && *CIP != '\t' &&
585 *CIP != ',' && *CIP != '\n'))
586 ++CIP;
587 CPULen = CIP - CPUStart;
588 }
589 }
590 }
591 }
592 }
593
594 if (CPUStart == 0)
595 while (CIP < CPUInfoEnd && *CIP != '\n')
596 ++CIP;
597 }
598
599 if (CPUStart == 0)
600 return generic;
601
602 return StringSwitch<const char *>(StringRef(CPUStart, CPULen))
603 .Case("604e", "604e")
604 .Case("604", "604")
605 .Case("7400", "7400")
606 .Case("7410", "7400")
607 .Case("7447", "7400")
608 .Case("7455", "7450")
609 .Case("G4", "g4")
Hal Finkelf1cc96a2012-06-12 16:39:23 +0000610 .Case("POWER4", "970")
Hal Finkel59b0ee82012-06-12 03:03:13 +0000611 .Case("PPC970FX", "970")
612 .Case("PPC970MP", "970")
613 .Case("G5", "g5")
614 .Case("POWER5", "g5")
615 .Case("A2", "a2")
616 .Case("POWER6", "pwr6")
617 .Case("POWER7", "pwr7")
Will Schmidt579e4022014-06-26 13:37:03 +0000618 .Case("POWER8", "pwr8")
619 .Case("POWER8E", "pwr8")
Hal Finkel59b0ee82012-06-12 03:03:13 +0000620 .Default(generic);
621}
Benjamin Kramerefe40282012-06-26 21:36:32 +0000622#elif defined(__linux__) && defined(__arm__)
Rafael Espindola1f58e4d2013-12-12 16:10:48 +0000623StringRef sys::getHostCPUName() {
Benjamin Kramerefe40282012-06-26 21:36:32 +0000624 // The cpuid register on arm is not accessible from user space. On Linux,
625 // it is exposed through the /proc/cpuinfo file.
Benjamin Kramerefe40282012-06-26 21:36:32 +0000626
627 // Read 1024 bytes from /proc/cpuinfo, which should contain the CPU part line
628 // in all cases.
629 char buffer[1024];
Rafael Espindola97935a92014-12-17 02:32:44 +0000630 ssize_t CPUInfoSize = readCpuInfo(buffer, sizeof(buffer));
631 if (CPUInfoSize == -1)
632 return "generic";
Benjamin Kramerefe40282012-06-26 21:36:32 +0000633
634 StringRef Str(buffer, CPUInfoSize);
635
636 SmallVector<StringRef, 32> Lines;
637 Str.split(Lines, "\n");
638
639 // Look for the CPU implementer line.
640 StringRef Implementer;
641 for (unsigned I = 0, E = Lines.size(); I != E; ++I)
642 if (Lines[I].startswith("CPU implementer"))
643 Implementer = Lines[I].substr(15).ltrim("\t :");
644
645 if (Implementer == "0x41") // ARM Ltd.
646 // Look for the CPU part line.
647 for (unsigned I = 0, E = Lines.size(); I != E; ++I)
648 if (Lines[I].startswith("CPU part"))
649 // The CPU part is a 3 digit hexadecimal number with a 0x prefix. The
650 // values correspond to the "Part number" in the CP15/c0 register. The
651 // contents are specified in the various processor manuals.
652 return StringSwitch<const char *>(Lines[I].substr(8).ltrim("\t :"))
653 .Case("0x926", "arm926ej-s")
654 .Case("0xb02", "mpcore")
655 .Case("0xb36", "arm1136j-s")
656 .Case("0xb56", "arm1156t2-s")
657 .Case("0xb76", "arm1176jz-s")
658 .Case("0xc08", "cortex-a8")
659 .Case("0xc09", "cortex-a9")
James Molloy3ebe7a52012-10-31 09:07:37 +0000660 .Case("0xc0f", "cortex-a15")
Benjamin Kramerefe40282012-06-26 21:36:32 +0000661 .Case("0xc20", "cortex-m0")
662 .Case("0xc23", "cortex-m3")
663 .Case("0xc24", "cortex-m4")
664 .Default("generic");
665
Kai Nackeb38bf962013-12-20 09:24:13 +0000666 if (Implementer == "0x51") // Qualcomm Technologies, Inc.
667 // Look for the CPU part line.
668 for (unsigned I = 0, E = Lines.size(); I != E; ++I)
669 if (Lines[I].startswith("CPU part"))
670 // The CPU part is a 3 digit hexadecimal number with a 0x prefix. The
671 // values correspond to the "Part number" in the CP15/c0 register. The
672 // contents are specified in the various processor manuals.
673 return StringSwitch<const char *>(Lines[I].substr(8).ltrim("\t :"))
674 .Case("0x06f", "krait") // APQ8064
675 .Default("generic");
676
Benjamin Kramerefe40282012-06-26 21:36:32 +0000677 return "generic";
678}
Richard Sandifordf834ea12013-10-31 12:14:17 +0000679#elif defined(__linux__) && defined(__s390x__)
Rafael Espindola1f58e4d2013-12-12 16:10:48 +0000680StringRef sys::getHostCPUName() {
Richard Sandifordf834ea12013-10-31 12:14:17 +0000681 // STIDP is a privileged operation, so use /proc/cpuinfo instead.
Richard Sandifordf834ea12013-10-31 12:14:17 +0000682
683 // The "processor 0:" line comes after a fair amount of other information,
684 // including a cache breakdown, but this should be plenty.
685 char buffer[2048];
Rafael Espindola97935a92014-12-17 02:32:44 +0000686 ssize_t CPUInfoSize = readCpuInfo(buffer, sizeof(buffer));
687 if (CPUInfoSize == -1)
688 return "generic";
Richard Sandifordf834ea12013-10-31 12:14:17 +0000689
690 StringRef Str(buffer, CPUInfoSize);
691 SmallVector<StringRef, 32> Lines;
692 Str.split(Lines, "\n");
Ulrich Weiganda8b04e12015-05-05 19:23:40 +0000693
694 // Look for the CPU features.
695 SmallVector<StringRef, 32> CPUFeatures;
696 for (unsigned I = 0, E = Lines.size(); I != E; ++I)
697 if (Lines[I].startswith("features")) {
698 size_t Pos = Lines[I].find(":");
699 if (Pos != StringRef::npos) {
Chandler Carruthe4405e92015-09-10 06:12:31 +0000700 Lines[I].drop_front(Pos + 1).split(CPUFeatures, ' ');
Ulrich Weiganda8b04e12015-05-05 19:23:40 +0000701 break;
702 }
703 }
704
705 // We need to check for the presence of vector support independently of
706 // the machine type, since we may only use the vector register set when
707 // supported by the kernel (and hypervisor).
708 bool HaveVectorSupport = false;
709 for (unsigned I = 0, E = CPUFeatures.size(); I != E; ++I) {
710 if (CPUFeatures[I] == "vx")
711 HaveVectorSupport = true;
712 }
713
714 // Now check the processor machine type.
Richard Sandifordf834ea12013-10-31 12:14:17 +0000715 for (unsigned I = 0, E = Lines.size(); I != E; ++I) {
716 if (Lines[I].startswith("processor ")) {
717 size_t Pos = Lines[I].find("machine = ");
718 if (Pos != StringRef::npos) {
719 Pos += sizeof("machine = ") - 1;
720 unsigned int Id;
721 if (!Lines[I].drop_front(Pos).getAsInteger(10, Id)) {
Ulrich Weiganda8b04e12015-05-05 19:23:40 +0000722 if (Id >= 2964 && HaveVectorSupport)
723 return "z13";
Richard Sandifordf834ea12013-10-31 12:14:17 +0000724 if (Id >= 2827)
725 return "zEC12";
726 if (Id >= 2817)
727 return "z196";
728 }
729 }
730 break;
731 }
732 }
733
734 return "generic";
735}
Torok Edwinabdc1c22009-12-13 08:59:40 +0000736#else
Rafael Espindola1f58e4d2013-12-12 16:10:48 +0000737StringRef sys::getHostCPUName() {
Benjamin Kramer713fd352009-11-17 17:57:04 +0000738 return "generic";
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000739}
Torok Edwinabdc1c22009-12-13 08:59:40 +0000740#endif
Xerxes Ranby17dc3a02010-01-19 21:26:05 +0000741
Craig Topper798a2602015-03-29 01:00:23 +0000742#if defined(i386) || defined(__i386__) || defined(__x86__) || defined(_M_IX86)\
743 || defined(__x86_64__) || defined(_M_AMD64) || defined (_M_X64)
744bool sys::getHostCPUFeatures(StringMap<bool> &Features) {
745 unsigned EAX = 0, EBX = 0, ECX = 0, EDX = 0;
746 unsigned MaxLevel;
747 union {
748 unsigned u[3];
749 char c[12];
750 } text;
751
752 if (GetX86CpuIDAndInfo(0, &MaxLevel, text.u+0, text.u+2, text.u+1) ||
753 MaxLevel < 1)
754 return false;
755
756 GetX86CpuIDAndInfo(1, &EAX, &EBX, &ECX, &EDX);
757
758 Features["cmov"] = (EDX >> 15) & 1;
759 Features["mmx"] = (EDX >> 23) & 1;
760 Features["sse"] = (EDX >> 25) & 1;
761 Features["sse2"] = (EDX >> 26) & 1;
762 Features["sse3"] = (ECX >> 0) & 1;
763 Features["ssse3"] = (ECX >> 9) & 1;
764 Features["sse4.1"] = (ECX >> 19) & 1;
765 Features["sse4.2"] = (ECX >> 20) & 1;
766
767 Features["pclmul"] = (ECX >> 1) & 1;
Craig Topper798a2602015-03-29 01:00:23 +0000768 Features["cx16"] = (ECX >> 13) & 1;
769 Features["movbe"] = (ECX >> 22) & 1;
770 Features["popcnt"] = (ECX >> 23) & 1;
771 Features["aes"] = (ECX >> 25) & 1;
Craig Topper798a2602015-03-29 01:00:23 +0000772 Features["rdrnd"] = (ECX >> 30) & 1;
773
774 // If CPUID indicates support for XSAVE, XRESTORE and AVX, and XGETBV
775 // indicates that the AVX registers will be saved and restored on context
776 // switch, then we have full AVX support.
Craig Topperb84b1262015-10-14 05:37:42 +0000777 bool HasAVXSave = ((ECX >> 27) & 1) && ((ECX >> 28) & 1) &&
778 !GetX86XCR0(&EAX, &EDX) && ((EAX & 0x6) == 0x6);
779 Features["avx"] = HasAVXSave;
780 Features["fma"] = HasAVXSave && (ECX >> 12) & 1;
781 Features["f16c"] = HasAVXSave && (ECX >> 29) & 1;
782
783 // Only enable XSAVE if OS has enabled support for saving YMM state.
784 Features["xsave"] = HasAVXSave && (ECX >> 26) & 1;
Craig Topper798a2602015-03-29 01:00:23 +0000785
786 // AVX512 requires additional context to be saved by the OS.
Craig Topperb84b1262015-10-14 05:37:42 +0000787 bool HasAVX512Save = HasAVXSave && ((EAX & 0xe0) == 0xe0);
Craig Topper798a2602015-03-29 01:00:23 +0000788
789 unsigned MaxExtLevel;
790 GetX86CpuIDAndInfo(0x80000000, &MaxExtLevel, &EBX, &ECX, &EDX);
791
792 bool HasExtLeaf1 = MaxExtLevel >= 0x80000001 &&
793 !GetX86CpuIDAndInfo(0x80000001, &EAX, &EBX, &ECX, &EDX);
794 Features["lzcnt"] = HasExtLeaf1 && ((ECX >> 5) & 1);
795 Features["sse4a"] = HasExtLeaf1 && ((ECX >> 6) & 1);
796 Features["prfchw"] = HasExtLeaf1 && ((ECX >> 8) & 1);
Craig Topperb84b1262015-10-14 05:37:42 +0000797 Features["xop"] = HasExtLeaf1 && ((ECX >> 11) & 1) && HasAVXSave;
798 Features["fma4"] = HasExtLeaf1 && ((ECX >> 16) & 1) && HasAVXSave;
Craig Topper798a2602015-03-29 01:00:23 +0000799 Features["tbm"] = HasExtLeaf1 && ((ECX >> 21) & 1);
800
801 bool HasLeaf7 = MaxLevel >= 7 &&
802 !GetX86CpuIDAndInfoEx(0x7, 0x0, &EAX, &EBX, &ECX, &EDX);
803
804 // AVX2 is only supported if we have the OS save support from AVX.
Craig Topperb84b1262015-10-14 05:37:42 +0000805 Features["avx2"] = HasAVXSave && HasLeaf7 && ((EBX >> 5) & 1);
Craig Topper798a2602015-03-29 01:00:23 +0000806
807 Features["fsgsbase"] = HasLeaf7 && ((EBX >> 0) & 1);
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000808 Features["sgx"] = HasLeaf7 && ((EBX >> 2) & 1);
Craig Topper798a2602015-03-29 01:00:23 +0000809 Features["bmi"] = HasLeaf7 && ((EBX >> 3) & 1);
810 Features["hle"] = HasLeaf7 && ((EBX >> 4) & 1);
811 Features["bmi2"] = HasLeaf7 && ((EBX >> 8) & 1);
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000812 Features["invpcid"] = HasLeaf7 && ((EBX >> 10) & 1);
Craig Topper798a2602015-03-29 01:00:23 +0000813 Features["rtm"] = HasLeaf7 && ((EBX >> 11) & 1);
814 Features["rdseed"] = HasLeaf7 && ((EBX >> 18) & 1);
815 Features["adx"] = HasLeaf7 && ((EBX >> 19) & 1);
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000816 Features["smap"] = HasLeaf7 && ((EBX >> 20) & 1);
817 Features["pcommit"] = HasLeaf7 && ((EBX >> 22) & 1);
818 Features["clflushopt"] = HasLeaf7 && ((EBX >> 23) & 1);
819 Features["clwb"] = HasLeaf7 && ((EBX >> 24) & 1);
Craig Topper798a2602015-03-29 01:00:23 +0000820 Features["sha"] = HasLeaf7 && ((EBX >> 29) & 1);
821
822 // AVX512 is only supported if the OS supports the context save for it.
823 Features["avx512f"] = HasLeaf7 && ((EBX >> 16) & 1) && HasAVX512Save;
824 Features["avx512dq"] = HasLeaf7 && ((EBX >> 17) & 1) && HasAVX512Save;
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000825 Features["avx512ifma"] = HasLeaf7 && ((EBX >> 21) & 1) && HasAVX512Save;
Craig Topper798a2602015-03-29 01:00:23 +0000826 Features["avx512pf"] = HasLeaf7 && ((EBX >> 26) & 1) && HasAVX512Save;
827 Features["avx512er"] = HasLeaf7 && ((EBX >> 27) & 1) && HasAVX512Save;
828 Features["avx512cd"] = HasLeaf7 && ((EBX >> 28) & 1) && HasAVX512Save;
829 Features["avx512bw"] = HasLeaf7 && ((EBX >> 30) & 1) && HasAVX512Save;
830 Features["avx512vl"] = HasLeaf7 && ((EBX >> 31) & 1) && HasAVX512Save;
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000831
832 Features["prefetchwt1"] = HasLeaf7 && (ECX & 1);
833 Features["avx512vbmi"] = HasLeaf7 && ((ECX >> 1) & 1) && HasAVX512Save;
834 // Enable protection keys
835 Features["pku"] = HasLeaf7 && ((ECX >> 4) & 1);
Craig Topper798a2602015-03-29 01:00:23 +0000836
Amjad Aboud1db6d7a2015-10-12 11:47:46 +0000837 bool HasLeafD = MaxLevel >= 0xd &&
838 !GetX86CpuIDAndInfoEx(0xd, 0x1, &EAX, &EBX, &ECX, &EDX);
839
Craig Topperb84b1262015-10-14 05:37:42 +0000840 // Only enable XSAVE if OS has enabled support for saving YMM state.
841 Features["xsaveopt"] = HasAVXSave && HasLeafD && ((EAX >> 0) & 1);
842 Features["xsavec"] = HasAVXSave && HasLeafD && ((EAX >> 1) & 1);
843 Features["xsaves"] = HasAVXSave && HasLeafD && ((EAX >> 3) & 1);
Amjad Aboud1db6d7a2015-10-12 11:47:46 +0000844
Craig Topper798a2602015-03-29 01:00:23 +0000845 return true;
846}
847#elif defined(__linux__) && (defined(__arm__) || defined(__aarch64__))
Hao Liu10be3b22012-12-13 02:40:20 +0000848bool sys::getHostCPUFeatures(StringMap<bool> &Features) {
Hao Liu10be3b22012-12-13 02:40:20 +0000849 // Read 1024 bytes from /proc/cpuinfo, which should contain the Features line
850 // in all cases.
851 char buffer[1024];
Rafael Espindola97935a92014-12-17 02:32:44 +0000852 ssize_t CPUInfoSize = readCpuInfo(buffer, sizeof(buffer));
853 if (CPUInfoSize == -1)
854 return false;
Hao Liu10be3b22012-12-13 02:40:20 +0000855
856 StringRef Str(buffer, CPUInfoSize);
857
858 SmallVector<StringRef, 32> Lines;
859 Str.split(Lines, "\n");
860
Tobias Grosserbd9e5492013-06-11 21:45:01 +0000861 SmallVector<StringRef, 32> CPUFeatures;
862
863 // Look for the CPU features.
Hao Liu10be3b22012-12-13 02:40:20 +0000864 for (unsigned I = 0, E = Lines.size(); I != E; ++I)
Tobias Grosserbd9e5492013-06-11 21:45:01 +0000865 if (Lines[I].startswith("Features")) {
Chandler Carruthe4405e92015-09-10 06:12:31 +0000866 Lines[I].split(CPUFeatures, ' ');
Tobias Grosserbd9e5492013-06-11 21:45:01 +0000867 break;
Hao Liu10be3b22012-12-13 02:40:20 +0000868 }
869
Bradley Smith9288b212014-05-22 11:44:34 +0000870#if defined(__aarch64__)
871 // Keep track of which crypto features we have seen
872 enum {
Bradley Smith63c8b1b2014-05-23 10:14:13 +0000873 CAP_AES = 0x1,
874 CAP_PMULL = 0x2,
875 CAP_SHA1 = 0x4,
876 CAP_SHA2 = 0x8
Bradley Smith9288b212014-05-22 11:44:34 +0000877 };
878 uint32_t crypto = 0;
879#endif
880
Tobias Grosserbd9e5492013-06-11 21:45:01 +0000881 for (unsigned I = 0, E = CPUFeatures.size(); I != E; ++I) {
882 StringRef LLVMFeatureStr = StringSwitch<StringRef>(CPUFeatures[I])
Bradley Smith9288b212014-05-22 11:44:34 +0000883#if defined(__aarch64__)
884 .Case("asimd", "neon")
885 .Case("fp", "fp-armv8")
886 .Case("crc32", "crc")
887#else
Tobias Grosserbd9e5492013-06-11 21:45:01 +0000888 .Case("half", "fp16")
889 .Case("neon", "neon")
890 .Case("vfpv3", "vfp3")
891 .Case("vfpv3d16", "d16")
892 .Case("vfpv4", "vfp4")
893 .Case("idiva", "hwdiv-arm")
894 .Case("idivt", "hwdiv")
Bradley Smith9288b212014-05-22 11:44:34 +0000895#endif
Tobias Grosserbd9e5492013-06-11 21:45:01 +0000896 .Default("");
897
Bradley Smith9288b212014-05-22 11:44:34 +0000898#if defined(__aarch64__)
Alp Tokerda0c7932014-05-31 21:26:28 +0000899 // We need to check crypto separately since we need all of the crypto
Bradley Smith9288b212014-05-22 11:44:34 +0000900 // extensions to enable the subtarget feature
901 if (CPUFeatures[I] == "aes")
Bradley Smith63c8b1b2014-05-23 10:14:13 +0000902 crypto |= CAP_AES;
Bradley Smith9288b212014-05-22 11:44:34 +0000903 else if (CPUFeatures[I] == "pmull")
Bradley Smith63c8b1b2014-05-23 10:14:13 +0000904 crypto |= CAP_PMULL;
Bradley Smith9288b212014-05-22 11:44:34 +0000905 else if (CPUFeatures[I] == "sha1")
Bradley Smith63c8b1b2014-05-23 10:14:13 +0000906 crypto |= CAP_SHA1;
Bradley Smith9288b212014-05-22 11:44:34 +0000907 else if (CPUFeatures[I] == "sha2")
Bradley Smith63c8b1b2014-05-23 10:14:13 +0000908 crypto |= CAP_SHA2;
Bradley Smith9288b212014-05-22 11:44:34 +0000909#endif
910
Tobias Grosserbd9e5492013-06-11 21:45:01 +0000911 if (LLVMFeatureStr != "")
David Blaikie5106ce72014-11-19 05:49:42 +0000912 Features[LLVMFeatureStr] = true;
Hao Liu10be3b22012-12-13 02:40:20 +0000913 }
914
Bradley Smith9288b212014-05-22 11:44:34 +0000915#if defined(__aarch64__)
916 // If we have all crypto bits we can add the feature
Bradley Smith63c8b1b2014-05-23 10:14:13 +0000917 if (crypto == (CAP_AES | CAP_PMULL | CAP_SHA1 | CAP_SHA2))
David Blaikie5106ce72014-11-19 05:49:42 +0000918 Features["crypto"] = true;
Bradley Smith9288b212014-05-22 11:44:34 +0000919#endif
920
Tobias Grosserbd9e5492013-06-11 21:45:01 +0000921 return true;
Hao Liu10be3b22012-12-13 02:40:20 +0000922}
923#else
Xerxes Ranby17dc3a02010-01-19 21:26:05 +0000924bool sys::getHostCPUFeatures(StringMap<bool> &Features){
925 return false;
926}
Hao Liu10be3b22012-12-13 02:40:20 +0000927#endif
Peter Collingbournea51c6ed2013-01-16 17:27:22 +0000928
929std::string sys::getProcessTriple() {
Duncan Sandse2cd1392013-07-17 11:01:05 +0000930 Triple PT(Triple::normalize(LLVM_HOST_TRIPLE));
Peter Collingbournea51c6ed2013-01-16 17:27:22 +0000931
932 if (sizeof(void *) == 8 && PT.isArch32Bit())
933 PT = PT.get64BitArchVariant();
934 if (sizeof(void *) == 4 && PT.isArch64Bit())
935 PT = PT.get32BitArchVariant();
936
937 return PT.str();
938}