blob: 5962e5ee1df9e09cc7283d49d0008343d06a09b8 [file] [log] [blame]
Daniel Dunbare52e6bf2008-10-02 01:17:28 +00001//===-- Host.cpp - Implement OS Host Concept --------------------*- C++ -*-===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
Hans Wennborgcfe341f2014-06-20 01:36:00 +000010// This file implements the operating system Host concept.
Daniel Dunbare52e6bf2008-10-02 01:17:28 +000011//
12//===----------------------------------------------------------------------===//
13
Chandler Carruthed0881b2012-12-03 16:50:05 +000014#include "llvm/Support/Host.h"
Benjamin Kramerefe40282012-06-26 21:36:32 +000015#include "llvm/ADT/SmallVector.h"
Hal Finkel59b0ee82012-06-12 03:03:13 +000016#include "llvm/ADT/StringRef.h"
17#include "llvm/ADT/StringSwitch.h"
Peter Collingbournea51c6ed2013-01-16 17:27:22 +000018#include "llvm/ADT/Triple.h"
Chandler Carruthed0881b2012-12-03 16:50:05 +000019#include "llvm/Config/config.h"
Hal Finkel59b0ee82012-06-12 03:03:13 +000020#include "llvm/Support/Debug.h"
Rafael Espindola97935a92014-12-17 02:32:44 +000021#include "llvm/Support/FileSystem.h"
Eugene Zelenko1760dc22016-04-05 20:19:49 +000022#include <cstring>
23#include <string>
Daniel Dunbare52e6bf2008-10-02 01:17:28 +000024
25// Include the platform-specific parts of this class.
26#ifdef LLVM_ON_UNIX
27#include "Unix/Host.inc"
28#endif
29#ifdef LLVM_ON_WIN32
Michael J. Spencer447762d2010-11-29 18:16:10 +000030#include "Windows/Host.inc"
Daniel Dunbare52e6bf2008-10-02 01:17:28 +000031#endif
Benjamin Kramer38465062009-11-19 12:17:31 +000032#ifdef _MSC_VER
33#include <intrin.h>
34#endif
Hal Finkel59b0ee82012-06-12 03:03:13 +000035#if defined(__APPLE__) && (defined(__ppc__) || defined(__powerpc__))
36#include <mach/mach.h>
37#include <mach/mach_host.h>
38#include <mach/host_info.h>
39#include <mach/machine.h>
40#endif
Daniel Dunbare52e6bf2008-10-02 01:17:28 +000041
Chandler Carruth66f38db2014-04-21 23:58:10 +000042#define DEBUG_TYPE "host-detection"
43
Daniel Dunbar241d01b2009-11-14 10:09:12 +000044//===----------------------------------------------------------------------===//
45//
46// Implementations of the CPU detection routines
47//
48//===----------------------------------------------------------------------===//
49
50using namespace llvm;
51
Eugene Zelenko1760dc22016-04-05 20:19:49 +000052namespace {
53
Rafael Espindola81adfb52014-12-17 02:42:20 +000054#if defined(__linux__)
Eugene Zelenko1760dc22016-04-05 20:19:49 +000055ssize_t LLVM_ATTRIBUTE_UNUSED readCpuInfo(void *Buf, size_t Size) {
Rafael Espindola97935a92014-12-17 02:32:44 +000056 // Note: We cannot mmap /proc/cpuinfo here and then process the resulting
57 // memory buffer because the 'file' has 0 size (it can be read from only
58 // as a stream).
59
60 int FD;
61 std::error_code EC = sys::fs::openFileForRead("/proc/cpuinfo", FD);
62 if (EC) {
63 DEBUG(dbgs() << "Unable to open /proc/cpuinfo: " << EC.message() << "\n");
64 return -1;
65 }
66 int Ret = read(FD, Buf, Size);
67 int CloseStatus = close(FD);
68 if (CloseStatus)
69 return -1;
70 return Ret;
71}
Rafael Espindola81adfb52014-12-17 02:42:20 +000072#endif
Rafael Espindola97935a92014-12-17 02:32:44 +000073
Daniel Dunbar241d01b2009-11-14 10:09:12 +000074#if defined(i386) || defined(__i386__) || defined(__x86__) || defined(_M_IX86)\
75 || defined(__x86_64__) || defined(_M_AMD64) || defined (_M_X64)
76
77/// GetX86CpuIDAndInfo - Execute the specified cpuid and return the 4 values in the
78/// specified arguments. If we can't run cpuid on the host, return true.
Eugene Zelenko1760dc22016-04-05 20:19:49 +000079bool GetX86CpuIDAndInfo(unsigned value, unsigned *rEAX, unsigned *rEBX,
80 unsigned *rECX, unsigned *rEDX) {
Reid Klecknerbf4f9eb2013-08-16 22:42:42 +000081#if defined(__GNUC__) || defined(__clang__)
Reid Klecknerbe85cb92013-08-14 18:21:51 +000082 #if defined(__x86_64__) || defined(_M_AMD64) || defined (_M_X64)
Daniel Dunbar241d01b2009-11-14 10:09:12 +000083 // gcc doesn't know cpuid would clobber ebx/rbx. Preseve it manually.
84 asm ("movq\t%%rbx, %%rsi\n\t"
85 "cpuid\n\t"
86 "xchgq\t%%rbx, %%rsi\n\t"
87 : "=a" (*rEAX),
88 "=S" (*rEBX),
89 "=c" (*rECX),
90 "=d" (*rEDX)
91 : "a" (value));
92 return false;
Reid Klecknerbe85cb92013-08-14 18:21:51 +000093 #elif defined(i386) || defined(__i386__) || defined(__x86__) || defined(_M_IX86)
Daniel Dunbar241d01b2009-11-14 10:09:12 +000094 asm ("movl\t%%ebx, %%esi\n\t"
95 "cpuid\n\t"
96 "xchgl\t%%ebx, %%esi\n\t"
97 : "=a" (*rEAX),
98 "=S" (*rEBX),
99 "=c" (*rECX),
100 "=d" (*rEDX)
101 : "a" (value));
102 return false;
David Blaikieb48ed1a2012-01-17 04:43:56 +0000103// pedantic #else returns to appease -Wunreachable-code (so we don't generate
104// postprocessed code that looks like "return true; return false;")
105 #else
106 return true;
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000107 #endif
Reid Klecknerbf4f9eb2013-08-16 22:42:42 +0000108#elif defined(_MSC_VER)
109 // The MSVC intrinsic is portable across x86 and x64.
110 int registers[4];
111 __cpuid(registers, value);
112 *rEAX = registers[0];
113 *rEBX = registers[1];
114 *rECX = registers[2];
115 *rEDX = registers[3];
116 return false;
David Blaikieb48ed1a2012-01-17 04:43:56 +0000117#else
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000118 return true;
David Blaikieb48ed1a2012-01-17 04:43:56 +0000119#endif
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000120}
121
Tim Northover89ccb612013-11-25 09:52:59 +0000122/// GetX86CpuIDAndInfoEx - Execute the specified cpuid with subleaf and return the
123/// 4 values in the specified arguments. If we can't run cpuid on the host,
124/// return true.
Eugene Zelenko1760dc22016-04-05 20:19:49 +0000125bool GetX86CpuIDAndInfoEx(unsigned value, unsigned subleaf, unsigned *rEAX,
126 unsigned *rEBX, unsigned *rECX, unsigned *rEDX) {
Tim Northover89ccb612013-11-25 09:52:59 +0000127#if defined(__x86_64__) || defined(_M_AMD64) || defined (_M_X64)
128 #if defined(__GNUC__)
129 // gcc doesn't know cpuid would clobber ebx/rbx. Preseve it manually.
130 asm ("movq\t%%rbx, %%rsi\n\t"
131 "cpuid\n\t"
132 "xchgq\t%%rbx, %%rsi\n\t"
133 : "=a" (*rEAX),
134 "=S" (*rEBX),
135 "=c" (*rECX),
136 "=d" (*rEDX)
137 : "a" (value),
138 "c" (subleaf));
139 return false;
140 #elif defined(_MSC_VER)
Aaron Ballmanb664e2a2015-02-16 18:23:00 +0000141 int registers[4];
142 __cpuidex(registers, value, subleaf);
143 *rEAX = registers[0];
144 *rEBX = registers[1];
145 *rECX = registers[2];
146 *rEDX = registers[3];
147 return false;
Tim Northover89ccb612013-11-25 09:52:59 +0000148 #else
149 return true;
150 #endif
151#elif defined(i386) || defined(__i386__) || defined(__x86__) || defined(_M_IX86)
152 #if defined(__GNUC__)
153 asm ("movl\t%%ebx, %%esi\n\t"
154 "cpuid\n\t"
155 "xchgl\t%%ebx, %%esi\n\t"
156 : "=a" (*rEAX),
157 "=S" (*rEBX),
158 "=c" (*rECX),
159 "=d" (*rEDX)
160 : "a" (value),
161 "c" (subleaf));
162 return false;
163 #elif defined(_MSC_VER)
164 __asm {
165 mov eax,value
166 mov ecx,subleaf
167 cpuid
168 mov esi,rEAX
169 mov dword ptr [esi],eax
170 mov esi,rEBX
171 mov dword ptr [esi],ebx
172 mov esi,rECX
173 mov dword ptr [esi],ecx
174 mov esi,rEDX
175 mov dword ptr [esi],edx
176 }
177 return false;
178 #else
179 return true;
180 #endif
181#else
182 return true;
183#endif
184}
185
Eugene Zelenko1760dc22016-04-05 20:19:49 +0000186bool GetX86XCR0(unsigned *rEAX, unsigned *rEDX) {
Craig Topper7af39d72013-04-22 05:38:01 +0000187#if defined(__GNUC__)
188 // Check xgetbv; this uses a .byte sequence instead of the instruction
189 // directly because older assemblers do not include support for xgetbv and
190 // there is no easy way to conditionally compile based on the assembler used.
Craig Topper798a2602015-03-29 01:00:23 +0000191 __asm__ (".byte 0x0f, 0x01, 0xd0" : "=a" (*rEAX), "=d" (*rEDX) : "c" (0));
192 return false;
Aaron Ballman31c0adc2013-04-23 17:38:44 +0000193#elif defined(_MSC_FULL_VER) && defined(_XCR_XFEATURE_ENABLED_MASK)
Craig Topper798a2602015-03-29 01:00:23 +0000194 unsigned long long Result = _xgetbv(_XCR_XFEATURE_ENABLED_MASK);
Craig Topper7db49fd2015-03-29 01:07:57 +0000195 *rEAX = Result;
196 *rEDX = Result >> 32;
Craig Topper798a2602015-03-29 01:00:23 +0000197 return false;
Craig Topper7af39d72013-04-22 05:38:01 +0000198#else
Craig Topper798a2602015-03-29 01:00:23 +0000199 return true;
Craig Topper7af39d72013-04-22 05:38:01 +0000200#endif
Aaron Ballman5f7c6802013-04-03 12:25:06 +0000201}
202
Eugene Zelenko1760dc22016-04-05 20:19:49 +0000203void DetectX86FamilyModel(unsigned EAX, unsigned &Family, unsigned &Model) {
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000204 Family = (EAX >> 8) & 0xf; // Bits 8 - 11
205 Model = (EAX >> 4) & 0xf; // Bits 4 - 7
206 if (Family == 6 || Family == 0xf) {
207 if (Family == 0xf)
208 // Examine extended family ID if family ID is F.
209 Family += (EAX >> 20) & 0xff; // Bits 20 - 27
210 // Examine extended model ID if family ID is 6 or F.
211 Model += ((EAX >> 16) & 0xf) << 4; // Bits 16 - 19
212 }
213}
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000214
Eugene Zelenko1760dc22016-04-05 20:19:49 +0000215} // end anonymous namespace
216
Rafael Espindola74f444c2013-12-12 15:45:32 +0000217StringRef sys::getHostCPUName() {
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000218 unsigned EAX = 0, EBX = 0, ECX = 0, EDX = 0;
219 if (GetX86CpuIDAndInfo(0x1, &EAX, &EBX, &ECX, &EDX))
220 return "generic";
221 unsigned Family = 0;
222 unsigned Model = 0;
223 DetectX86FamilyModel(EAX, Family, Model);
224
Tim Northover89ccb612013-11-25 09:52:59 +0000225 union {
226 unsigned u[3];
227 char c[12];
228 } text;
229
Craig Topper1214bdc2015-03-31 05:42:45 +0000230 unsigned MaxLeaf;
231 GetX86CpuIDAndInfo(0, &MaxLeaf, text.u+0, text.u+2, text.u+1);
Tim Northover89ccb612013-11-25 09:52:59 +0000232
Craig Topper1214bdc2015-03-31 05:42:45 +0000233 bool HasMMX = (EDX >> 23) & 1;
234 bool HasSSE = (EDX >> 25) & 1;
235 bool HasSSE2 = (EDX >> 26) & 1;
236 bool HasSSE3 = (ECX >> 0) & 1;
237 bool HasSSSE3 = (ECX >> 9) & 1;
238 bool HasSSE41 = (ECX >> 19) & 1;
239 bool HasSSE42 = (ECX >> 20) & 1;
240 bool HasMOVBE = (ECX >> 22) & 1;
241 // If CPUID indicates support for XSAVE, XRESTORE and AVX, and XGETBV
Aaron Ballman5f7c6802013-04-03 12:25:06 +0000242 // indicates that the AVX registers will be saved and restored on context
243 // switch, then we have full AVX support.
Aaron Ballman5e6d2052013-04-03 18:00:22 +0000244 const unsigned AVXBits = (1 << 27) | (1 << 28);
Craig Topper798a2602015-03-29 01:00:23 +0000245 bool HasAVX = ((ECX & AVXBits) == AVXBits) && !GetX86XCR0(&EAX, &EDX) &&
246 ((EAX & 0x6) == 0x6);
Craig Topper1214bdc2015-03-31 05:42:45 +0000247 bool HasAVX512Save = HasAVX && ((EAX & 0xe0) == 0xe0);
248 bool HasLeaf7 = MaxLeaf >= 0x7 &&
249 !GetX86CpuIDAndInfoEx(0x7, 0x0, &EAX, &EBX, &ECX, &EDX);
250 bool HasADX = HasLeaf7 && ((EBX >> 19) & 1);
251 bool HasAVX2 = HasAVX && HasLeaf7 && (EBX & 0x20);
252 bool HasAVX512 = HasLeaf7 && HasAVX512Save && ((EBX >> 16) & 1);
253
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000254 GetX86CpuIDAndInfo(0x80000001, &EAX, &EBX, &ECX, &EDX);
255 bool Em64T = (EDX >> 29) & 0x1;
Kaelyn Takataa39d2a02014-05-05 16:32:10 +0000256 bool HasTBM = (ECX >> 21) & 0x1;
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000257
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000258 if (memcmp(text.c, "GenuineIntel", 12) == 0) {
259 switch (Family) {
Daniel Dunbar397235f2009-11-14 21:36:19 +0000260 case 3:
261 return "i386";
262 case 4:
263 switch (Model) {
NAKAMURA Takumi19e11f12010-09-09 13:30:48 +0000264 case 0: // Intel486 DX processors
265 case 1: // Intel486 DX processors
Daniel Dunbar397235f2009-11-14 21:36:19 +0000266 case 2: // Intel486 SX processors
NAKAMURA Takumi19e11f12010-09-09 13:30:48 +0000267 case 3: // Intel487 processors, IntelDX2 OverDrive processors,
268 // IntelDX2 processors
Daniel Dunbar397235f2009-11-14 21:36:19 +0000269 case 4: // Intel486 SL processor
NAKAMURA Takumi19e11f12010-09-09 13:30:48 +0000270 case 5: // IntelSX2 processors
Daniel Dunbar397235f2009-11-14 21:36:19 +0000271 case 7: // Write-Back Enhanced IntelDX2 processors
NAKAMURA Takumi19e11f12010-09-09 13:30:48 +0000272 case 8: // IntelDX4 OverDrive processors, IntelDX4 processors
Daniel Dunbar397235f2009-11-14 21:36:19 +0000273 default: return "i486";
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000274 }
Daniel Dunbar397235f2009-11-14 21:36:19 +0000275 case 5:
276 switch (Model) {
277 case 1: // Pentium OverDrive processor for Pentium processor (60, 66),
NAKAMURA Takumi19e11f12010-09-09 13:30:48 +0000278 // Pentium processors (60, 66)
Daniel Dunbar397235f2009-11-14 21:36:19 +0000279 case 2: // Pentium OverDrive processor for Pentium processor (75, 90,
280 // 100, 120, 133), Pentium processors (75, 90, 100, 120, 133,
281 // 150, 166, 200)
282 case 3: // Pentium OverDrive processors for Intel486 processor-based
283 // systems
284 return "pentium";
285
NAKAMURA Takumi19e11f12010-09-09 13:30:48 +0000286 case 4: // Pentium OverDrive processor with MMX technology for Pentium
Daniel Dunbar397235f2009-11-14 21:36:19 +0000287 // processor (75, 90, 100, 120, 133), Pentium processor with
NAKAMURA Takumi19e11f12010-09-09 13:30:48 +0000288 // MMX technology (166, 200)
Daniel Dunbar397235f2009-11-14 21:36:19 +0000289 return "pentium-mmx";
290
291 default: return "pentium";
292 }
293 case 6:
294 switch (Model) {
295 case 1: // Pentium Pro processor
296 return "pentiumpro";
297
298 case 3: // Intel Pentium II OverDrive processor, Pentium II processor,
299 // model 03
300 case 5: // Pentium II processor, model 05, Pentium II Xeon processor,
NAKAMURA Takumi19e11f12010-09-09 13:30:48 +0000301 // model 05, and Intel Celeron processor, model 05
Daniel Dunbar397235f2009-11-14 21:36:19 +0000302 case 6: // Celeron processor, model 06
303 return "pentium2";
304
305 case 7: // Pentium III processor, model 07, and Pentium III Xeon
306 // processor, model 07
307 case 8: // Pentium III processor, model 08, Pentium III Xeon processor,
308 // model 08, and Celeron processor, model 08
309 case 10: // Pentium III Xeon processor, model 0Ah
310 case 11: // Pentium III processor, model 0Bh
311 return "pentium3";
312
313 case 9: // Intel Pentium M processor, Intel Celeron M processor model 09.
314 case 13: // Intel Pentium M processor, Intel Celeron M processor, model
315 // 0Dh. All processors are manufactured using the 90 nm process.
Craig Topper06682852015-03-30 06:31:06 +0000316 case 21: // Intel EP80579 Integrated Processor and Intel EP80579
317 // Integrated Processor with Intel QuickAssist Technology
Daniel Dunbar397235f2009-11-14 21:36:19 +0000318 return "pentium-m";
319
NAKAMURA Takumi19e11f12010-09-09 13:30:48 +0000320 case 14: // Intel Core Duo processor, Intel Core Solo processor, model
Daniel Dunbar397235f2009-11-14 21:36:19 +0000321 // 0Eh. All processors are manufactured using the 65 nm process.
322 return "yonah";
323
NAKAMURA Takumi19e11f12010-09-09 13:30:48 +0000324 case 15: // Intel Core 2 Duo processor, Intel Core 2 Duo mobile
325 // processor, Intel Core 2 Quad processor, Intel Core 2 Quad
326 // mobile processor, Intel Core 2 Extreme processor, Intel
Daniel Dunbar397235f2009-11-14 21:36:19 +0000327 // Pentium Dual-Core processor, Intel Xeon processor, model
328 // 0Fh. All processors are manufactured using the 65 nm process.
329 case 22: // Intel Celeron processor model 16h. All processors are
330 // manufactured using the 65 nm process
331 return "core2";
332
NAKAMURA Takumi19e11f12010-09-09 13:30:48 +0000333 case 23: // Intel Core 2 Extreme processor, Intel Xeon processor, model
Daniel Dunbar397235f2009-11-14 21:36:19 +0000334 // 17h. All processors are manufactured using the 45 nm process.
335 //
336 // 45nm: Penryn , Wolfdale, Yorkfield (XE)
Craig Topper4e78a922015-03-30 06:31:03 +0000337 case 29: // Intel Xeon processor MP. All processors are manufactured using
338 // the 45 nm process.
Craig Topper545b9512015-03-31 06:18:31 +0000339 return "penryn";
Daniel Dunbar397235f2009-11-14 21:36:19 +0000340
341 case 26: // Intel Core i7 processor and Intel Xeon processor. All
342 // processors are manufactured using the 45 nm process.
Jakob Stoklund Olesen49e58a92010-09-19 17:54:28 +0000343 case 30: // Intel(R) Core(TM) i7 CPU 870 @ 2.93GHz.
344 // As found in a Summer 2010 model iMac.
Craig Topper3c2e7582015-03-30 06:31:09 +0000345 case 46: // Nehalem EX
346 return "nehalem";
Chris Lattnerb737bac2010-09-19 00:31:58 +0000347 case 37: // Intel Core i7, laptop version.
Benjamin Kramer5a122f32011-08-25 18:05:56 +0000348 case 44: // Intel Core i7 processor and Intel Xeon processor. All
349 // processors are manufactured using the 32 nm process.
Benjamin Kramer9d6063a2012-09-26 18:21:47 +0000350 case 47: // Westmere EX
Craig Topper3c2e7582015-03-30 06:31:09 +0000351 return "westmere";
Bob Wilsond0f06002011-07-08 22:33:59 +0000352
353 // SandyBridge:
354 case 42: // Intel Core i7 processor. All processors are manufactured
355 // using the 32 nm process.
Chris Lattner889c40e2011-06-09 06:38:17 +0000356 case 45:
Craig Topper545b9512015-03-31 06:18:31 +0000357 return "sandybridge";
Daniel Dunbar397235f2009-11-14 21:36:19 +0000358
Evan Cheng7fd16072012-04-23 22:41:39 +0000359 // Ivy Bridge:
360 case 58:
Tim Northover89ccb612013-11-25 09:52:59 +0000361 case 62: // Ivy Bridge EP
Craig Topper545b9512015-03-31 06:18:31 +0000362 return "ivybridge";
Evan Cheng7fd16072012-04-23 22:41:39 +0000363
Tim Northover89ccb612013-11-25 09:52:59 +0000364 // Haswell:
365 case 60:
366 case 63:
367 case 69:
368 case 70:
Craig Topper545b9512015-03-31 06:18:31 +0000369 return "haswell";
Tim Northover89ccb612013-11-25 09:52:59 +0000370
Craig Topper1e1b0f72015-03-23 00:15:06 +0000371 // Broadwell:
372 case 61:
Craig Topper68ba18f2015-08-08 01:29:15 +0000373 case 71:
Craig Topper545b9512015-03-31 06:18:31 +0000374 return "broadwell";
Craig Topper1e1b0f72015-03-23 00:15:06 +0000375
Craig Topper68ba18f2015-08-08 01:29:15 +0000376 // Skylake:
377 case 78:
Sanjoy Dasaa63dc02016-02-21 17:12:03 +0000378 return "skylake-avx512";
Craig Topper68ba18f2015-08-08 01:29:15 +0000379 case 94:
380 return "skylake";
381
Preston Gurdc0b976c2012-05-02 21:38:46 +0000382 case 28: // Most 45 nm Intel Atom processors
383 case 38: // 45 nm Atom Lincroft
384 case 39: // 32 nm Atom Medfield
Preston Gurd8e082682012-07-19 19:05:37 +0000385 case 53: // 32 nm Atom Midview
386 case 54: // 32 nm Atom Midview
Craig Topper3c2e7582015-03-30 06:31:09 +0000387 return "bonnell";
Daniel Dunbar397235f2009-11-14 21:36:19 +0000388
Preston Gurd3fe264d2013-09-13 19:23:28 +0000389 // Atom Silvermont codes from the Intel software optimization guide.
390 case 55:
Benjamin Kramer8f429382013-08-30 14:05:32 +0000391 case 74:
392 case 77:
Craig Toppera3db7d22015-08-07 20:09:42 +0000393 case 90:
Craig Topperf7ce7542015-08-08 01:16:05 +0000394 case 93:
Craig Topper3c2e7582015-03-30 06:31:09 +0000395 return "silvermont";
Benjamin Kramer8f429382013-08-30 14:05:32 +0000396
Craig Topper1214bdc2015-03-31 05:42:45 +0000397 default: // Unknown family 6 CPU, try to guess.
398 if (HasAVX512)
399 return "knl";
400 if (HasADX)
401 return "broadwell";
402 if (HasAVX2)
403 return "haswell";
404 if (HasAVX)
405 return "sandybridge";
406 if (HasSSE42)
407 return HasMOVBE ? "silvermont" : "nehalem";
408 if (HasSSE41)
409 return "penryn";
410 if (HasSSSE3)
411 return HasMOVBE ? "bonnell" : "core2";
412 if (Em64T)
413 return "x86-64";
414 if (HasSSE2)
415 return "pentium-m";
416 if (HasSSE)
417 return "pentium3";
418 if (HasMMX)
419 return "pentium2";
420 return "pentiumpro";
Daniel Dunbar397235f2009-11-14 21:36:19 +0000421 }
422 case 15: {
423 switch (Model) {
424 case 0: // Pentium 4 processor, Intel Xeon processor. All processors are
425 // model 00h and manufactured using the 0.18 micron process.
426 case 1: // Pentium 4 processor, Intel Xeon processor, Intel Xeon
427 // processor MP, and Intel Celeron processor. All processors are
428 // model 01h and manufactured using the 0.18 micron process.
NAKAMURA Takumi19e11f12010-09-09 13:30:48 +0000429 case 2: // Pentium 4 processor, Mobile Intel Pentium 4 processor - M,
Daniel Dunbar397235f2009-11-14 21:36:19 +0000430 // Intel Xeon processor, Intel Xeon processor MP, Intel Celeron
431 // processor, and Mobile Intel Celeron processor. All processors
432 // are model 02h and manufactured using the 0.13 micron process.
433 return (Em64T) ? "x86-64" : "pentium4";
434
435 case 3: // Pentium 4 processor, Intel Xeon processor, Intel Celeron D
436 // processor. All processors are model 03h and manufactured using
437 // the 90 nm process.
438 case 4: // Pentium 4 processor, Pentium 4 processor Extreme Edition,
439 // Pentium D processor, Intel Xeon processor, Intel Xeon
440 // processor MP, Intel Celeron D processor. All processors are
441 // model 04h and manufactured using the 90 nm process.
442 case 6: // Pentium 4 processor, Pentium D processor, Pentium processor
443 // Extreme Edition, Intel Xeon processor, Intel Xeon processor
444 // MP, Intel Celeron D processor. All processors are model 06h
445 // and manufactured using the 65 nm process.
446 return (Em64T) ? "nocona" : "prescott";
447
Daniel Dunbar397235f2009-11-14 21:36:19 +0000448 default:
449 return (Em64T) ? "x86-64" : "pentium4";
450 }
451 }
452
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000453 default:
Benjamin Kramer713fd352009-11-17 17:57:04 +0000454 return "generic";
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000455 }
456 } else if (memcmp(text.c, "AuthenticAMD", 12) == 0) {
457 // FIXME: this poorly matches the generated SubtargetFeatureKV table. There
458 // appears to be no way to generate the wide variety of AMD-specific targets
459 // from the information returned from CPUID.
460 switch (Family) {
461 case 4:
462 return "i486";
463 case 5:
464 switch (Model) {
465 case 6:
466 case 7: return "k6";
467 case 8: return "k6-2";
468 case 9:
469 case 13: return "k6-3";
Roman Divackyfd690092012-09-12 14:36:02 +0000470 case 10: return "geode";
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000471 default: return "pentium";
472 }
473 case 6:
474 switch (Model) {
475 case 4: return "athlon-tbird";
476 case 6:
477 case 7:
478 case 8: return "athlon-mp";
479 case 10: return "athlon-xp";
480 default: return "athlon";
481 }
482 case 15:
Chris Lattner963debc2010-09-06 05:19:44 +0000483 if (HasSSE3)
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000484 return "k8-sse3";
Chris Lattner963debc2010-09-06 05:19:44 +0000485 switch (Model) {
486 case 1: return "opteron";
487 case 5: return "athlon-fx"; // also opteron
488 default: return "athlon64";
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000489 }
490 case 16:
491 return "amdfam10";
Benjamin Kramer077ae1d2012-01-10 11:50:02 +0000492 case 20:
493 return "btver1";
Benjamin Kramer3ced5452011-12-01 18:24:17 +0000494 case 21:
Benjamin Kramerb44c4272013-05-03 10:20:08 +0000495 if (!HasAVX) // If the OS doesn't support AVX provide a sane fallback.
496 return "btver1";
Benjamin Kramer60045732014-05-02 15:47:07 +0000497 if (Model >= 0x50)
498 return "bdver4"; // 50h-6Fh: Excavator
Benjamin Kramerd114def2013-11-04 10:29:20 +0000499 if (Model >= 0x30)
500 return "bdver3"; // 30h-3Fh: Steamroller
Kaelyn Takataa39d2a02014-05-05 16:32:10 +0000501 if (Model >= 0x10 || HasTBM)
Benjamin Kramerd114def2013-11-04 10:29:20 +0000502 return "bdver2"; // 10h-1Fh: Piledriver
503 return "bdver1"; // 00h-0Fh: Bulldozer
Benjamin Kramerb44c4272013-05-03 10:20:08 +0000504 case 22:
505 if (!HasAVX) // If the OS doesn't support AVX provide a sane fallback.
506 return "btver1";
507 return "btver2";
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000508 default:
Benjamin Kramer713fd352009-11-17 17:57:04 +0000509 return "generic";
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000510 }
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000511 }
Torok Edwin022336a2009-12-14 12:38:18 +0000512 return "generic";
Torok Edwinabdc1c22009-12-13 08:59:40 +0000513}
Hal Finkel59b0ee82012-06-12 03:03:13 +0000514#elif defined(__APPLE__) && (defined(__ppc__) || defined(__powerpc__))
Rafael Espindola1f58e4d2013-12-12 16:10:48 +0000515StringRef sys::getHostCPUName() {
Hal Finkel59b0ee82012-06-12 03:03:13 +0000516 host_basic_info_data_t hostInfo;
517 mach_msg_type_number_t infoCount;
518
519 infoCount = HOST_BASIC_INFO_COUNT;
520 host_info(mach_host_self(), HOST_BASIC_INFO, (host_info_t)&hostInfo,
521 &infoCount);
522
523 if (hostInfo.cpu_type != CPU_TYPE_POWERPC) return "generic";
524
525 switch(hostInfo.cpu_subtype) {
526 case CPU_SUBTYPE_POWERPC_601: return "601";
527 case CPU_SUBTYPE_POWERPC_602: return "602";
528 case CPU_SUBTYPE_POWERPC_603: return "603";
529 case CPU_SUBTYPE_POWERPC_603e: return "603e";
530 case CPU_SUBTYPE_POWERPC_603ev: return "603ev";
531 case CPU_SUBTYPE_POWERPC_604: return "604";
532 case CPU_SUBTYPE_POWERPC_604e: return "604e";
533 case CPU_SUBTYPE_POWERPC_620: return "620";
534 case CPU_SUBTYPE_POWERPC_750: return "750";
535 case CPU_SUBTYPE_POWERPC_7400: return "7400";
536 case CPU_SUBTYPE_POWERPC_7450: return "7450";
537 case CPU_SUBTYPE_POWERPC_970: return "970";
538 default: ;
539 }
540
541 return "generic";
542}
543#elif defined(__linux__) && (defined(__ppc__) || defined(__powerpc__))
Rafael Espindolab75ea012013-12-12 16:17:40 +0000544StringRef sys::getHostCPUName() {
Hal Finkel59b0ee82012-06-12 03:03:13 +0000545 // Access to the Processor Version Register (PVR) on PowerPC is privileged,
546 // and so we must use an operating-system interface to determine the current
547 // processor type. On Linux, this is exposed through the /proc/cpuinfo file.
548 const char *generic = "generic";
549
Hal Finkel59b0ee82012-06-12 03:03:13 +0000550 // The cpu line is second (after the 'processor: 0' line), so if this
551 // buffer is too small then something has changed (or is wrong).
552 char buffer[1024];
Rafael Espindola97935a92014-12-17 02:32:44 +0000553 ssize_t CPUInfoSize = readCpuInfo(buffer, sizeof(buffer));
554 if (CPUInfoSize == -1)
555 return generic;
Hal Finkel59b0ee82012-06-12 03:03:13 +0000556
557 const char *CPUInfoStart = buffer;
558 const char *CPUInfoEnd = buffer + CPUInfoSize;
559
560 const char *CIP = CPUInfoStart;
561
562 const char *CPUStart = 0;
563 size_t CPULen = 0;
564
565 // We need to find the first line which starts with cpu, spaces, and a colon.
566 // After the colon, there may be some additional spaces and then the cpu type.
567 while (CIP < CPUInfoEnd && CPUStart == 0) {
568 if (CIP < CPUInfoEnd && *CIP == '\n')
569 ++CIP;
570
571 if (CIP < CPUInfoEnd && *CIP == 'c') {
572 ++CIP;
573 if (CIP < CPUInfoEnd && *CIP == 'p') {
574 ++CIP;
575 if (CIP < CPUInfoEnd && *CIP == 'u') {
576 ++CIP;
577 while (CIP < CPUInfoEnd && (*CIP == ' ' || *CIP == '\t'))
578 ++CIP;
579
580 if (CIP < CPUInfoEnd && *CIP == ':') {
581 ++CIP;
582 while (CIP < CPUInfoEnd && (*CIP == ' ' || *CIP == '\t'))
583 ++CIP;
584
585 if (CIP < CPUInfoEnd) {
586 CPUStart = CIP;
587 while (CIP < CPUInfoEnd && (*CIP != ' ' && *CIP != '\t' &&
588 *CIP != ',' && *CIP != '\n'))
589 ++CIP;
590 CPULen = CIP - CPUStart;
591 }
592 }
593 }
594 }
595 }
596
597 if (CPUStart == 0)
598 while (CIP < CPUInfoEnd && *CIP != '\n')
599 ++CIP;
600 }
601
602 if (CPUStart == 0)
603 return generic;
604
605 return StringSwitch<const char *>(StringRef(CPUStart, CPULen))
606 .Case("604e", "604e")
607 .Case("604", "604")
608 .Case("7400", "7400")
609 .Case("7410", "7400")
610 .Case("7447", "7400")
611 .Case("7455", "7450")
612 .Case("G4", "g4")
Hal Finkelf1cc96a2012-06-12 16:39:23 +0000613 .Case("POWER4", "970")
Hal Finkel59b0ee82012-06-12 03:03:13 +0000614 .Case("PPC970FX", "970")
615 .Case("PPC970MP", "970")
616 .Case("G5", "g5")
617 .Case("POWER5", "g5")
618 .Case("A2", "a2")
619 .Case("POWER6", "pwr6")
620 .Case("POWER7", "pwr7")
Will Schmidt579e4022014-06-26 13:37:03 +0000621 .Case("POWER8", "pwr8")
622 .Case("POWER8E", "pwr8")
Hal Finkel59b0ee82012-06-12 03:03:13 +0000623 .Default(generic);
624}
Benjamin Kramerefe40282012-06-26 21:36:32 +0000625#elif defined(__linux__) && defined(__arm__)
Rafael Espindola1f58e4d2013-12-12 16:10:48 +0000626StringRef sys::getHostCPUName() {
Benjamin Kramerefe40282012-06-26 21:36:32 +0000627 // The cpuid register on arm is not accessible from user space. On Linux,
628 // it is exposed through the /proc/cpuinfo file.
Benjamin Kramerefe40282012-06-26 21:36:32 +0000629
630 // Read 1024 bytes from /proc/cpuinfo, which should contain the CPU part line
631 // in all cases.
632 char buffer[1024];
Rafael Espindola97935a92014-12-17 02:32:44 +0000633 ssize_t CPUInfoSize = readCpuInfo(buffer, sizeof(buffer));
634 if (CPUInfoSize == -1)
635 return "generic";
Benjamin Kramerefe40282012-06-26 21:36:32 +0000636
637 StringRef Str(buffer, CPUInfoSize);
638
639 SmallVector<StringRef, 32> Lines;
640 Str.split(Lines, "\n");
641
642 // Look for the CPU implementer line.
643 StringRef Implementer;
644 for (unsigned I = 0, E = Lines.size(); I != E; ++I)
645 if (Lines[I].startswith("CPU implementer"))
646 Implementer = Lines[I].substr(15).ltrim("\t :");
647
648 if (Implementer == "0x41") // ARM Ltd.
649 // Look for the CPU part line.
650 for (unsigned I = 0, E = Lines.size(); I != E; ++I)
651 if (Lines[I].startswith("CPU part"))
652 // The CPU part is a 3 digit hexadecimal number with a 0x prefix. The
653 // values correspond to the "Part number" in the CP15/c0 register. The
654 // contents are specified in the various processor manuals.
655 return StringSwitch<const char *>(Lines[I].substr(8).ltrim("\t :"))
656 .Case("0x926", "arm926ej-s")
657 .Case("0xb02", "mpcore")
658 .Case("0xb36", "arm1136j-s")
659 .Case("0xb56", "arm1156t2-s")
660 .Case("0xb76", "arm1176jz-s")
661 .Case("0xc08", "cortex-a8")
662 .Case("0xc09", "cortex-a9")
James Molloy3ebe7a52012-10-31 09:07:37 +0000663 .Case("0xc0f", "cortex-a15")
Benjamin Kramerefe40282012-06-26 21:36:32 +0000664 .Case("0xc20", "cortex-m0")
665 .Case("0xc23", "cortex-m3")
666 .Case("0xc24", "cortex-m4")
667 .Default("generic");
668
Kai Nackeb38bf962013-12-20 09:24:13 +0000669 if (Implementer == "0x51") // Qualcomm Technologies, Inc.
670 // Look for the CPU part line.
671 for (unsigned I = 0, E = Lines.size(); I != E; ++I)
672 if (Lines[I].startswith("CPU part"))
673 // The CPU part is a 3 digit hexadecimal number with a 0x prefix. The
674 // values correspond to the "Part number" in the CP15/c0 register. The
675 // contents are specified in the various processor manuals.
676 return StringSwitch<const char *>(Lines[I].substr(8).ltrim("\t :"))
677 .Case("0x06f", "krait") // APQ8064
678 .Default("generic");
679
Benjamin Kramerefe40282012-06-26 21:36:32 +0000680 return "generic";
681}
Richard Sandifordf834ea12013-10-31 12:14:17 +0000682#elif defined(__linux__) && defined(__s390x__)
Rafael Espindola1f58e4d2013-12-12 16:10:48 +0000683StringRef sys::getHostCPUName() {
Richard Sandifordf834ea12013-10-31 12:14:17 +0000684 // STIDP is a privileged operation, so use /proc/cpuinfo instead.
Richard Sandifordf834ea12013-10-31 12:14:17 +0000685
686 // The "processor 0:" line comes after a fair amount of other information,
687 // including a cache breakdown, but this should be plenty.
688 char buffer[2048];
Rafael Espindola97935a92014-12-17 02:32:44 +0000689 ssize_t CPUInfoSize = readCpuInfo(buffer, sizeof(buffer));
690 if (CPUInfoSize == -1)
691 return "generic";
Richard Sandifordf834ea12013-10-31 12:14:17 +0000692
693 StringRef Str(buffer, CPUInfoSize);
694 SmallVector<StringRef, 32> Lines;
695 Str.split(Lines, "\n");
Ulrich Weiganda8b04e12015-05-05 19:23:40 +0000696
697 // Look for the CPU features.
698 SmallVector<StringRef, 32> CPUFeatures;
699 for (unsigned I = 0, E = Lines.size(); I != E; ++I)
700 if (Lines[I].startswith("features")) {
701 size_t Pos = Lines[I].find(":");
702 if (Pos != StringRef::npos) {
Chandler Carruthe4405e92015-09-10 06:12:31 +0000703 Lines[I].drop_front(Pos + 1).split(CPUFeatures, ' ');
Ulrich Weiganda8b04e12015-05-05 19:23:40 +0000704 break;
705 }
706 }
707
708 // We need to check for the presence of vector support independently of
709 // the machine type, since we may only use the vector register set when
710 // supported by the kernel (and hypervisor).
711 bool HaveVectorSupport = false;
712 for (unsigned I = 0, E = CPUFeatures.size(); I != E; ++I) {
713 if (CPUFeatures[I] == "vx")
714 HaveVectorSupport = true;
715 }
716
717 // Now check the processor machine type.
Richard Sandifordf834ea12013-10-31 12:14:17 +0000718 for (unsigned I = 0, E = Lines.size(); I != E; ++I) {
719 if (Lines[I].startswith("processor ")) {
720 size_t Pos = Lines[I].find("machine = ");
721 if (Pos != StringRef::npos) {
722 Pos += sizeof("machine = ") - 1;
723 unsigned int Id;
724 if (!Lines[I].drop_front(Pos).getAsInteger(10, Id)) {
Ulrich Weiganda8b04e12015-05-05 19:23:40 +0000725 if (Id >= 2964 && HaveVectorSupport)
726 return "z13";
Richard Sandifordf834ea12013-10-31 12:14:17 +0000727 if (Id >= 2827)
728 return "zEC12";
729 if (Id >= 2817)
730 return "z196";
731 }
732 }
733 break;
734 }
735 }
736
737 return "generic";
738}
Torok Edwinabdc1c22009-12-13 08:59:40 +0000739#else
Rafael Espindola1f58e4d2013-12-12 16:10:48 +0000740StringRef sys::getHostCPUName() {
Benjamin Kramer713fd352009-11-17 17:57:04 +0000741 return "generic";
Daniel Dunbar241d01b2009-11-14 10:09:12 +0000742}
Torok Edwinabdc1c22009-12-13 08:59:40 +0000743#endif
Xerxes Ranby17dc3a02010-01-19 21:26:05 +0000744
Craig Topper798a2602015-03-29 01:00:23 +0000745#if defined(i386) || defined(__i386__) || defined(__x86__) || defined(_M_IX86)\
746 || defined(__x86_64__) || defined(_M_AMD64) || defined (_M_X64)
747bool sys::getHostCPUFeatures(StringMap<bool> &Features) {
748 unsigned EAX = 0, EBX = 0, ECX = 0, EDX = 0;
749 unsigned MaxLevel;
750 union {
751 unsigned u[3];
752 char c[12];
753 } text;
754
755 if (GetX86CpuIDAndInfo(0, &MaxLevel, text.u+0, text.u+2, text.u+1) ||
756 MaxLevel < 1)
757 return false;
758
759 GetX86CpuIDAndInfo(1, &EAX, &EBX, &ECX, &EDX);
760
761 Features["cmov"] = (EDX >> 15) & 1;
762 Features["mmx"] = (EDX >> 23) & 1;
763 Features["sse"] = (EDX >> 25) & 1;
764 Features["sse2"] = (EDX >> 26) & 1;
765 Features["sse3"] = (ECX >> 0) & 1;
766 Features["ssse3"] = (ECX >> 9) & 1;
767 Features["sse4.1"] = (ECX >> 19) & 1;
768 Features["sse4.2"] = (ECX >> 20) & 1;
769
770 Features["pclmul"] = (ECX >> 1) & 1;
Craig Topper798a2602015-03-29 01:00:23 +0000771 Features["cx16"] = (ECX >> 13) & 1;
772 Features["movbe"] = (ECX >> 22) & 1;
773 Features["popcnt"] = (ECX >> 23) & 1;
774 Features["aes"] = (ECX >> 25) & 1;
Craig Topper798a2602015-03-29 01:00:23 +0000775 Features["rdrnd"] = (ECX >> 30) & 1;
776
777 // If CPUID indicates support for XSAVE, XRESTORE and AVX, and XGETBV
778 // indicates that the AVX registers will be saved and restored on context
779 // switch, then we have full AVX support.
Craig Topperb84b1262015-10-14 05:37:42 +0000780 bool HasAVXSave = ((ECX >> 27) & 1) && ((ECX >> 28) & 1) &&
781 !GetX86XCR0(&EAX, &EDX) && ((EAX & 0x6) == 0x6);
782 Features["avx"] = HasAVXSave;
783 Features["fma"] = HasAVXSave && (ECX >> 12) & 1;
784 Features["f16c"] = HasAVXSave && (ECX >> 29) & 1;
785
786 // Only enable XSAVE if OS has enabled support for saving YMM state.
787 Features["xsave"] = HasAVXSave && (ECX >> 26) & 1;
Craig Topper798a2602015-03-29 01:00:23 +0000788
789 // AVX512 requires additional context to be saved by the OS.
Craig Topperb84b1262015-10-14 05:37:42 +0000790 bool HasAVX512Save = HasAVXSave && ((EAX & 0xe0) == 0xe0);
Craig Topper798a2602015-03-29 01:00:23 +0000791
792 unsigned MaxExtLevel;
793 GetX86CpuIDAndInfo(0x80000000, &MaxExtLevel, &EBX, &ECX, &EDX);
794
795 bool HasExtLeaf1 = MaxExtLevel >= 0x80000001 &&
796 !GetX86CpuIDAndInfo(0x80000001, &EAX, &EBX, &ECX, &EDX);
797 Features["lzcnt"] = HasExtLeaf1 && ((ECX >> 5) & 1);
798 Features["sse4a"] = HasExtLeaf1 && ((ECX >> 6) & 1);
799 Features["prfchw"] = HasExtLeaf1 && ((ECX >> 8) & 1);
Craig Topperb84b1262015-10-14 05:37:42 +0000800 Features["xop"] = HasExtLeaf1 && ((ECX >> 11) & 1) && HasAVXSave;
801 Features["fma4"] = HasExtLeaf1 && ((ECX >> 16) & 1) && HasAVXSave;
Craig Topper798a2602015-03-29 01:00:23 +0000802 Features["tbm"] = HasExtLeaf1 && ((ECX >> 21) & 1);
803
804 bool HasLeaf7 = MaxLevel >= 7 &&
805 !GetX86CpuIDAndInfoEx(0x7, 0x0, &EAX, &EBX, &ECX, &EDX);
806
807 // AVX2 is only supported if we have the OS save support from AVX.
Craig Topperb84b1262015-10-14 05:37:42 +0000808 Features["avx2"] = HasAVXSave && HasLeaf7 && ((EBX >> 5) & 1);
Craig Topper798a2602015-03-29 01:00:23 +0000809
810 Features["fsgsbase"] = HasLeaf7 && ((EBX >> 0) & 1);
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000811 Features["sgx"] = HasLeaf7 && ((EBX >> 2) & 1);
Craig Topper798a2602015-03-29 01:00:23 +0000812 Features["bmi"] = HasLeaf7 && ((EBX >> 3) & 1);
813 Features["hle"] = HasLeaf7 && ((EBX >> 4) & 1);
814 Features["bmi2"] = HasLeaf7 && ((EBX >> 8) & 1);
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000815 Features["invpcid"] = HasLeaf7 && ((EBX >> 10) & 1);
Craig Topper798a2602015-03-29 01:00:23 +0000816 Features["rtm"] = HasLeaf7 && ((EBX >> 11) & 1);
817 Features["rdseed"] = HasLeaf7 && ((EBX >> 18) & 1);
818 Features["adx"] = HasLeaf7 && ((EBX >> 19) & 1);
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000819 Features["smap"] = HasLeaf7 && ((EBX >> 20) & 1);
820 Features["pcommit"] = HasLeaf7 && ((EBX >> 22) & 1);
821 Features["clflushopt"] = HasLeaf7 && ((EBX >> 23) & 1);
822 Features["clwb"] = HasLeaf7 && ((EBX >> 24) & 1);
Craig Topper798a2602015-03-29 01:00:23 +0000823 Features["sha"] = HasLeaf7 && ((EBX >> 29) & 1);
824
825 // AVX512 is only supported if the OS supports the context save for it.
826 Features["avx512f"] = HasLeaf7 && ((EBX >> 16) & 1) && HasAVX512Save;
827 Features["avx512dq"] = HasLeaf7 && ((EBX >> 17) & 1) && HasAVX512Save;
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000828 Features["avx512ifma"] = HasLeaf7 && ((EBX >> 21) & 1) && HasAVX512Save;
Craig Topper798a2602015-03-29 01:00:23 +0000829 Features["avx512pf"] = HasLeaf7 && ((EBX >> 26) & 1) && HasAVX512Save;
830 Features["avx512er"] = HasLeaf7 && ((EBX >> 27) & 1) && HasAVX512Save;
831 Features["avx512cd"] = HasLeaf7 && ((EBX >> 28) & 1) && HasAVX512Save;
832 Features["avx512bw"] = HasLeaf7 && ((EBX >> 30) & 1) && HasAVX512Save;
833 Features["avx512vl"] = HasLeaf7 && ((EBX >> 31) & 1) && HasAVX512Save;
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000834
835 Features["prefetchwt1"] = HasLeaf7 && (ECX & 1);
836 Features["avx512vbmi"] = HasLeaf7 && ((ECX >> 1) & 1) && HasAVX512Save;
837 // Enable protection keys
838 Features["pku"] = HasLeaf7 && ((ECX >> 4) & 1);
Craig Topper798a2602015-03-29 01:00:23 +0000839
Amjad Aboud1db6d7a2015-10-12 11:47:46 +0000840 bool HasLeafD = MaxLevel >= 0xd &&
841 !GetX86CpuIDAndInfoEx(0xd, 0x1, &EAX, &EBX, &ECX, &EDX);
842
Craig Topperb84b1262015-10-14 05:37:42 +0000843 // Only enable XSAVE if OS has enabled support for saving YMM state.
844 Features["xsaveopt"] = HasAVXSave && HasLeafD && ((EAX >> 0) & 1);
845 Features["xsavec"] = HasAVXSave && HasLeafD && ((EAX >> 1) & 1);
846 Features["xsaves"] = HasAVXSave && HasLeafD && ((EAX >> 3) & 1);
Amjad Aboud1db6d7a2015-10-12 11:47:46 +0000847
Craig Topper798a2602015-03-29 01:00:23 +0000848 return true;
849}
850#elif defined(__linux__) && (defined(__arm__) || defined(__aarch64__))
Hao Liu10be3b22012-12-13 02:40:20 +0000851bool sys::getHostCPUFeatures(StringMap<bool> &Features) {
Hao Liu10be3b22012-12-13 02:40:20 +0000852 // Read 1024 bytes from /proc/cpuinfo, which should contain the Features line
853 // in all cases.
854 char buffer[1024];
Rafael Espindola97935a92014-12-17 02:32:44 +0000855 ssize_t CPUInfoSize = readCpuInfo(buffer, sizeof(buffer));
856 if (CPUInfoSize == -1)
857 return false;
Hao Liu10be3b22012-12-13 02:40:20 +0000858
859 StringRef Str(buffer, CPUInfoSize);
860
861 SmallVector<StringRef, 32> Lines;
862 Str.split(Lines, "\n");
863
Tobias Grosserbd9e5492013-06-11 21:45:01 +0000864 SmallVector<StringRef, 32> CPUFeatures;
865
866 // Look for the CPU features.
Hao Liu10be3b22012-12-13 02:40:20 +0000867 for (unsigned I = 0, E = Lines.size(); I != E; ++I)
Tobias Grosserbd9e5492013-06-11 21:45:01 +0000868 if (Lines[I].startswith("Features")) {
Chandler Carruthe4405e92015-09-10 06:12:31 +0000869 Lines[I].split(CPUFeatures, ' ');
Tobias Grosserbd9e5492013-06-11 21:45:01 +0000870 break;
Hao Liu10be3b22012-12-13 02:40:20 +0000871 }
872
Bradley Smith9288b212014-05-22 11:44:34 +0000873#if defined(__aarch64__)
874 // Keep track of which crypto features we have seen
875 enum {
Bradley Smith63c8b1b2014-05-23 10:14:13 +0000876 CAP_AES = 0x1,
877 CAP_PMULL = 0x2,
878 CAP_SHA1 = 0x4,
879 CAP_SHA2 = 0x8
Bradley Smith9288b212014-05-22 11:44:34 +0000880 };
881 uint32_t crypto = 0;
882#endif
883
Tobias Grosserbd9e5492013-06-11 21:45:01 +0000884 for (unsigned I = 0, E = CPUFeatures.size(); I != E; ++I) {
885 StringRef LLVMFeatureStr = StringSwitch<StringRef>(CPUFeatures[I])
Bradley Smith9288b212014-05-22 11:44:34 +0000886#if defined(__aarch64__)
887 .Case("asimd", "neon")
888 .Case("fp", "fp-armv8")
889 .Case("crc32", "crc")
890#else
Tobias Grosserbd9e5492013-06-11 21:45:01 +0000891 .Case("half", "fp16")
892 .Case("neon", "neon")
893 .Case("vfpv3", "vfp3")
894 .Case("vfpv3d16", "d16")
895 .Case("vfpv4", "vfp4")
896 .Case("idiva", "hwdiv-arm")
897 .Case("idivt", "hwdiv")
Bradley Smith9288b212014-05-22 11:44:34 +0000898#endif
Tobias Grosserbd9e5492013-06-11 21:45:01 +0000899 .Default("");
900
Bradley Smith9288b212014-05-22 11:44:34 +0000901#if defined(__aarch64__)
Alp Tokerda0c7932014-05-31 21:26:28 +0000902 // We need to check crypto separately since we need all of the crypto
Bradley Smith9288b212014-05-22 11:44:34 +0000903 // extensions to enable the subtarget feature
904 if (CPUFeatures[I] == "aes")
Bradley Smith63c8b1b2014-05-23 10:14:13 +0000905 crypto |= CAP_AES;
Bradley Smith9288b212014-05-22 11:44:34 +0000906 else if (CPUFeatures[I] == "pmull")
Bradley Smith63c8b1b2014-05-23 10:14:13 +0000907 crypto |= CAP_PMULL;
Bradley Smith9288b212014-05-22 11:44:34 +0000908 else if (CPUFeatures[I] == "sha1")
Bradley Smith63c8b1b2014-05-23 10:14:13 +0000909 crypto |= CAP_SHA1;
Bradley Smith9288b212014-05-22 11:44:34 +0000910 else if (CPUFeatures[I] == "sha2")
Bradley Smith63c8b1b2014-05-23 10:14:13 +0000911 crypto |= CAP_SHA2;
Bradley Smith9288b212014-05-22 11:44:34 +0000912#endif
913
Tobias Grosserbd9e5492013-06-11 21:45:01 +0000914 if (LLVMFeatureStr != "")
David Blaikie5106ce72014-11-19 05:49:42 +0000915 Features[LLVMFeatureStr] = true;
Hao Liu10be3b22012-12-13 02:40:20 +0000916 }
917
Bradley Smith9288b212014-05-22 11:44:34 +0000918#if defined(__aarch64__)
919 // If we have all crypto bits we can add the feature
Bradley Smith63c8b1b2014-05-23 10:14:13 +0000920 if (crypto == (CAP_AES | CAP_PMULL | CAP_SHA1 | CAP_SHA2))
David Blaikie5106ce72014-11-19 05:49:42 +0000921 Features["crypto"] = true;
Bradley Smith9288b212014-05-22 11:44:34 +0000922#endif
923
Tobias Grosserbd9e5492013-06-11 21:45:01 +0000924 return true;
Hao Liu10be3b22012-12-13 02:40:20 +0000925}
926#else
Xerxes Ranby17dc3a02010-01-19 21:26:05 +0000927bool sys::getHostCPUFeatures(StringMap<bool> &Features){
928 return false;
929}
Hao Liu10be3b22012-12-13 02:40:20 +0000930#endif
Peter Collingbournea51c6ed2013-01-16 17:27:22 +0000931
932std::string sys::getProcessTriple() {
Duncan Sandse2cd1392013-07-17 11:01:05 +0000933 Triple PT(Triple::normalize(LLVM_HOST_TRIPLE));
Peter Collingbournea51c6ed2013-01-16 17:27:22 +0000934
935 if (sizeof(void *) == 8 && PT.isArch32Bit())
936 PT = PT.get64BitArchVariant();
937 if (sizeof(void *) == 4 && PT.isArch64Bit())
938 PT = PT.get32BitArchVariant();
939
940 return PT.str();
941}