1 //===-- Host.cpp - Implement OS Host Concept --------------------*- C++ -*-===// 2 // 3 // The LLVM Compiler Infrastructure 4 // 5 // This file is distributed under the University of Illinois Open Source 6 // License. See LICENSE.TXT for details. 7 // 8 //===----------------------------------------------------------------------===// 9 // 10 // This file implements the operating system Host concept. 11 // 12 //===----------------------------------------------------------------------===// 13 14 #include "llvm/Support/Host.h" 15 #include "llvm/ADT/SmallVector.h" 16 #include "llvm/ADT/StringRef.h" 17 #include "llvm/ADT/StringSwitch.h" 18 #include "llvm/ADT/Triple.h" 19 #include "llvm/Config/config.h" 20 #include "llvm/Support/Debug.h" 21 #include "llvm/Support/FileSystem.h" 22 #include "llvm/Support/raw_ostream.h" 23 #include <string.h> 24 25 // Include the platform-specific parts of this class. 26 #ifdef LLVM_ON_UNIX 27 #include "Unix/Host.inc" 28 #endif 29 #ifdef LLVM_ON_WIN32 30 #include "Windows/Host.inc" 31 #endif 32 #ifdef _MSC_VER 33 #include <intrin.h> 34 #endif 35 #if defined(__APPLE__) && (defined(__ppc__) || defined(__powerpc__)) 36 #include <mach/mach.h> 37 #include <mach/mach_host.h> 38 #include <mach/host_info.h> 39 #include <mach/machine.h> 40 #endif 41 42 #define DEBUG_TYPE "host-detection" 43 44 //===----------------------------------------------------------------------===// 45 // 46 // Implementations of the CPU detection routines 47 // 48 //===----------------------------------------------------------------------===// 49 50 using namespace llvm; 51 52 #if defined(__linux__) 53 static ssize_t LLVM_ATTRIBUTE_UNUSED readCpuInfo(void *Buf, size_t Size) { 54 // Note: We cannot mmap /proc/cpuinfo here and then process the resulting 55 // memory buffer because the 'file' has 0 size (it can be read from only 56 // as a stream). 57 58 int FD; 59 std::error_code EC = sys::fs::openFileForRead("/proc/cpuinfo", FD); 60 if (EC) { 61 DEBUG(dbgs() << "Unable to open /proc/cpuinfo: " << EC.message() << "\n"); 62 return -1; 63 } 64 int Ret = read(FD, Buf, Size); 65 int CloseStatus = close(FD); 66 if (CloseStatus) 67 return -1; 68 return Ret; 69 } 70 #endif 71 72 #if defined(i386) || defined(__i386__) || defined(__x86__) || defined(_M_IX86)\ 73 || defined(__x86_64__) || defined(_M_AMD64) || defined (_M_X64) 74 75 /// GetX86CpuIDAndInfo - Execute the specified cpuid and return the 4 values in the 76 /// specified arguments. If we can't run cpuid on the host, return true. 77 static bool GetX86CpuIDAndInfo(unsigned value, unsigned *rEAX, unsigned *rEBX, 78 unsigned *rECX, unsigned *rEDX) { 79 #if defined(__GNUC__) || defined(__clang__) 80 #if defined(__x86_64__) || defined(_M_AMD64) || defined (_M_X64) 81 // gcc doesn't know cpuid would clobber ebx/rbx. Preseve it manually. 82 asm ("movq\t%%rbx, %%rsi\n\t" 83 "cpuid\n\t" 84 "xchgq\t%%rbx, %%rsi\n\t" 85 : "=a" (*rEAX), 86 "=S" (*rEBX), 87 "=c" (*rECX), 88 "=d" (*rEDX) 89 : "a" (value)); 90 return false; 91 #elif defined(i386) || defined(__i386__) || defined(__x86__) || defined(_M_IX86) 92 asm ("movl\t%%ebx, %%esi\n\t" 93 "cpuid\n\t" 94 "xchgl\t%%ebx, %%esi\n\t" 95 : "=a" (*rEAX), 96 "=S" (*rEBX), 97 "=c" (*rECX), 98 "=d" (*rEDX) 99 : "a" (value)); 100 return false; 101 // pedantic #else returns to appease -Wunreachable-code (so we don't generate 102 // postprocessed code that looks like "return true; return false;") 103 #else 104 return true; 105 #endif 106 #elif defined(_MSC_VER) 107 // The MSVC intrinsic is portable across x86 and x64. 108 int registers[4]; 109 __cpuid(registers, value); 110 *rEAX = registers[0]; 111 *rEBX = registers[1]; 112 *rECX = registers[2]; 113 *rEDX = registers[3]; 114 return false; 115 #else 116 return true; 117 #endif 118 } 119 120 /// GetX86CpuIDAndInfoEx - Execute the specified cpuid with subleaf and return the 121 /// 4 values in the specified arguments. If we can't run cpuid on the host, 122 /// return true. 123 static bool GetX86CpuIDAndInfoEx(unsigned value, unsigned subleaf, 124 unsigned *rEAX, unsigned *rEBX, unsigned *rECX, 125 unsigned *rEDX) { 126 #if defined(__x86_64__) || defined(_M_AMD64) || defined (_M_X64) 127 #if defined(__GNUC__) 128 // gcc doesn't know cpuid would clobber ebx/rbx. Preseve it manually. 129 asm ("movq\t%%rbx, %%rsi\n\t" 130 "cpuid\n\t" 131 "xchgq\t%%rbx, %%rsi\n\t" 132 : "=a" (*rEAX), 133 "=S" (*rEBX), 134 "=c" (*rECX), 135 "=d" (*rEDX) 136 : "a" (value), 137 "c" (subleaf)); 138 return false; 139 #elif defined(_MSC_VER) 140 int registers[4]; 141 __cpuidex(registers, value, subleaf); 142 *rEAX = registers[0]; 143 *rEBX = registers[1]; 144 *rECX = registers[2]; 145 *rEDX = registers[3]; 146 return false; 147 #else 148 return true; 149 #endif 150 #elif defined(i386) || defined(__i386__) || defined(__x86__) || defined(_M_IX86) 151 #if defined(__GNUC__) 152 asm ("movl\t%%ebx, %%esi\n\t" 153 "cpuid\n\t" 154 "xchgl\t%%ebx, %%esi\n\t" 155 : "=a" (*rEAX), 156 "=S" (*rEBX), 157 "=c" (*rECX), 158 "=d" (*rEDX) 159 : "a" (value), 160 "c" (subleaf)); 161 return false; 162 #elif defined(_MSC_VER) 163 __asm { 164 mov eax,value 165 mov ecx,subleaf 166 cpuid 167 mov esi,rEAX 168 mov dword ptr [esi],eax 169 mov esi,rEBX 170 mov dword ptr [esi],ebx 171 mov esi,rECX 172 mov dword ptr [esi],ecx 173 mov esi,rEDX 174 mov dword ptr [esi],edx 175 } 176 return false; 177 #else 178 return true; 179 #endif 180 #else 181 return true; 182 #endif 183 } 184 185 static bool OSHasAVXSupport() { 186 #if defined(__GNUC__) 187 // Check xgetbv; this uses a .byte sequence instead of the instruction 188 // directly because older assemblers do not include support for xgetbv and 189 // there is no easy way to conditionally compile based on the assembler used. 190 int rEAX, rEDX; 191 __asm__ (".byte 0x0f, 0x01, 0xd0" : "=a" (rEAX), "=d" (rEDX) : "c" (0)); 192 #elif defined(_MSC_FULL_VER) && defined(_XCR_XFEATURE_ENABLED_MASK) 193 unsigned long long rEAX = _xgetbv(_XCR_XFEATURE_ENABLED_MASK); 194 #else 195 int rEAX = 0; // Ensures we return false 196 #endif 197 return (rEAX & 6) == 6; 198 } 199 200 static void DetectX86FamilyModel(unsigned EAX, unsigned &Family, 201 unsigned &Model) { 202 Family = (EAX >> 8) & 0xf; // Bits 8 - 11 203 Model = (EAX >> 4) & 0xf; // Bits 4 - 7 204 if (Family == 6 || Family == 0xf) { 205 if (Family == 0xf) 206 // Examine extended family ID if family ID is F. 207 Family += (EAX >> 20) & 0xff; // Bits 20 - 27 208 // Examine extended model ID if family ID is 6 or F. 209 Model += ((EAX >> 16) & 0xf) << 4; // Bits 16 - 19 210 } 211 } 212 213 StringRef sys::getHostCPUName() { 214 unsigned EAX = 0, EBX = 0, ECX = 0, EDX = 0; 215 if (GetX86CpuIDAndInfo(0x1, &EAX, &EBX, &ECX, &EDX)) 216 return "generic"; 217 unsigned Family = 0; 218 unsigned Model = 0; 219 DetectX86FamilyModel(EAX, Family, Model); 220 221 union { 222 unsigned u[3]; 223 char c[12]; 224 } text; 225 226 GetX86CpuIDAndInfo(0, &EAX, text.u+0, text.u+2, text.u+1); 227 228 unsigned MaxLeaf = EAX; 229 bool HasSSE3 = (ECX & 0x1); 230 bool HasSSE41 = (ECX & 0x80000); 231 // If CPUID indicates support for XSAVE, XRESTORE and AVX, and XGETBV 232 // indicates that the AVX registers will be saved and restored on context 233 // switch, then we have full AVX support. 234 const unsigned AVXBits = (1 << 27) | (1 << 28); 235 bool HasAVX = ((ECX & AVXBits) == AVXBits) && OSHasAVXSupport(); 236 bool HasAVX2 = HasAVX && MaxLeaf >= 0x7 && 237 !GetX86CpuIDAndInfoEx(0x7, 0x0, &EAX, &EBX, &ECX, &EDX) && 238 (EBX & 0x20); 239 GetX86CpuIDAndInfo(0x80000001, &EAX, &EBX, &ECX, &EDX); 240 bool Em64T = (EDX >> 29) & 0x1; 241 bool HasTBM = (ECX >> 21) & 0x1; 242 243 if (memcmp(text.c, "GenuineIntel", 12) == 0) { 244 switch (Family) { 245 case 3: 246 return "i386"; 247 case 4: 248 switch (Model) { 249 case 0: // Intel486 DX processors 250 case 1: // Intel486 DX processors 251 case 2: // Intel486 SX processors 252 case 3: // Intel487 processors, IntelDX2 OverDrive processors, 253 // IntelDX2 processors 254 case 4: // Intel486 SL processor 255 case 5: // IntelSX2 processors 256 case 7: // Write-Back Enhanced IntelDX2 processors 257 case 8: // IntelDX4 OverDrive processors, IntelDX4 processors 258 default: return "i486"; 259 } 260 case 5: 261 switch (Model) { 262 case 1: // Pentium OverDrive processor for Pentium processor (60, 66), 263 // Pentium processors (60, 66) 264 case 2: // Pentium OverDrive processor for Pentium processor (75, 90, 265 // 100, 120, 133), Pentium processors (75, 90, 100, 120, 133, 266 // 150, 166, 200) 267 case 3: // Pentium OverDrive processors for Intel486 processor-based 268 // systems 269 return "pentium"; 270 271 case 4: // Pentium OverDrive processor with MMX technology for Pentium 272 // processor (75, 90, 100, 120, 133), Pentium processor with 273 // MMX technology (166, 200) 274 return "pentium-mmx"; 275 276 default: return "pentium"; 277 } 278 case 6: 279 switch (Model) { 280 case 1: // Pentium Pro processor 281 return "pentiumpro"; 282 283 case 3: // Intel Pentium II OverDrive processor, Pentium II processor, 284 // model 03 285 case 5: // Pentium II processor, model 05, Pentium II Xeon processor, 286 // model 05, and Intel Celeron processor, model 05 287 case 6: // Celeron processor, model 06 288 return "pentium2"; 289 290 case 7: // Pentium III processor, model 07, and Pentium III Xeon 291 // processor, model 07 292 case 8: // Pentium III processor, model 08, Pentium III Xeon processor, 293 // model 08, and Celeron processor, model 08 294 case 10: // Pentium III Xeon processor, model 0Ah 295 case 11: // Pentium III processor, model 0Bh 296 return "pentium3"; 297 298 case 9: // Intel Pentium M processor, Intel Celeron M processor model 09. 299 case 13: // Intel Pentium M processor, Intel Celeron M processor, model 300 // 0Dh. All processors are manufactured using the 90 nm process. 301 return "pentium-m"; 302 303 case 14: // Intel Core Duo processor, Intel Core Solo processor, model 304 // 0Eh. All processors are manufactured using the 65 nm process. 305 return "yonah"; 306 307 case 15: // Intel Core 2 Duo processor, Intel Core 2 Duo mobile 308 // processor, Intel Core 2 Quad processor, Intel Core 2 Quad 309 // mobile processor, Intel Core 2 Extreme processor, Intel 310 // Pentium Dual-Core processor, Intel Xeon processor, model 311 // 0Fh. All processors are manufactured using the 65 nm process. 312 case 22: // Intel Celeron processor model 16h. All processors are 313 // manufactured using the 65 nm process 314 return "core2"; 315 316 case 21: // Intel EP80579 Integrated Processor and Intel EP80579 317 // Integrated Processor with Intel QuickAssist Technology 318 return "i686"; // FIXME: ??? 319 320 case 23: // Intel Core 2 Extreme processor, Intel Xeon processor, model 321 // 17h. All processors are manufactured using the 45 nm process. 322 // 323 // 45nm: Penryn , Wolfdale, Yorkfield (XE) 324 // Not all Penryn processors support SSE 4.1 (such as the Pentium brand) 325 return HasSSE41 ? "penryn" : "core2"; 326 327 case 26: // Intel Core i7 processor and Intel Xeon processor. All 328 // processors are manufactured using the 45 nm process. 329 case 29: // Intel Xeon processor MP. All processors are manufactured using 330 // the 45 nm process. 331 case 30: // Intel(R) Core(TM) i7 CPU 870 @ 2.93GHz. 332 // As found in a Summer 2010 model iMac. 333 case 37: // Intel Core i7, laptop version. 334 case 44: // Intel Core i7 processor and Intel Xeon processor. All 335 // processors are manufactured using the 32 nm process. 336 case 46: // Nehalem EX 337 case 47: // Westmere EX 338 return "corei7"; 339 340 // SandyBridge: 341 case 42: // Intel Core i7 processor. All processors are manufactured 342 // using the 32 nm process. 343 case 45: 344 // Not all Sandy Bridge processors support AVX (such as the Pentium 345 // versions instead of the i7 versions). 346 return HasAVX ? "corei7-avx" : "corei7"; 347 348 // Ivy Bridge: 349 case 58: 350 case 62: // Ivy Bridge EP 351 // Not all Ivy Bridge processors support AVX (such as the Pentium 352 // versions instead of the i7 versions). 353 return HasAVX ? "core-avx-i" : "corei7"; 354 355 // Haswell: 356 case 60: 357 case 63: 358 case 69: 359 case 70: 360 // Not all Haswell processors support AVX too (such as the Pentium 361 // versions instead of the i7 versions). 362 return HasAVX2 ? "core-avx2" : "corei7"; 363 364 case 28: // Most 45 nm Intel Atom processors 365 case 38: // 45 nm Atom Lincroft 366 case 39: // 32 nm Atom Medfield 367 case 53: // 32 nm Atom Midview 368 case 54: // 32 nm Atom Midview 369 return "atom"; 370 371 // Atom Silvermont codes from the Intel software optimization guide. 372 case 55: 373 case 74: 374 case 77: 375 return "slm"; 376 377 default: return (Em64T) ? "x86-64" : "i686"; 378 } 379 case 15: { 380 switch (Model) { 381 case 0: // Pentium 4 processor, Intel Xeon processor. All processors are 382 // model 00h and manufactured using the 0.18 micron process. 383 case 1: // Pentium 4 processor, Intel Xeon processor, Intel Xeon 384 // processor MP, and Intel Celeron processor. All processors are 385 // model 01h and manufactured using the 0.18 micron process. 386 case 2: // Pentium 4 processor, Mobile Intel Pentium 4 processor - M, 387 // Intel Xeon processor, Intel Xeon processor MP, Intel Celeron 388 // processor, and Mobile Intel Celeron processor. All processors 389 // are model 02h and manufactured using the 0.13 micron process. 390 return (Em64T) ? "x86-64" : "pentium4"; 391 392 case 3: // Pentium 4 processor, Intel Xeon processor, Intel Celeron D 393 // processor. All processors are model 03h and manufactured using 394 // the 90 nm process. 395 case 4: // Pentium 4 processor, Pentium 4 processor Extreme Edition, 396 // Pentium D processor, Intel Xeon processor, Intel Xeon 397 // processor MP, Intel Celeron D processor. All processors are 398 // model 04h and manufactured using the 90 nm process. 399 case 6: // Pentium 4 processor, Pentium D processor, Pentium processor 400 // Extreme Edition, Intel Xeon processor, Intel Xeon processor 401 // MP, Intel Celeron D processor. All processors are model 06h 402 // and manufactured using the 65 nm process. 403 return (Em64T) ? "nocona" : "prescott"; 404 405 default: 406 return (Em64T) ? "x86-64" : "pentium4"; 407 } 408 } 409 410 default: 411 return "generic"; 412 } 413 } else if (memcmp(text.c, "AuthenticAMD", 12) == 0) { 414 // FIXME: this poorly matches the generated SubtargetFeatureKV table. There 415 // appears to be no way to generate the wide variety of AMD-specific targets 416 // from the information returned from CPUID. 417 switch (Family) { 418 case 4: 419 return "i486"; 420 case 5: 421 switch (Model) { 422 case 6: 423 case 7: return "k6"; 424 case 8: return "k6-2"; 425 case 9: 426 case 13: return "k6-3"; 427 case 10: return "geode"; 428 default: return "pentium"; 429 } 430 case 6: 431 switch (Model) { 432 case 4: return "athlon-tbird"; 433 case 6: 434 case 7: 435 case 8: return "athlon-mp"; 436 case 10: return "athlon-xp"; 437 default: return "athlon"; 438 } 439 case 15: 440 if (HasSSE3) 441 return "k8-sse3"; 442 switch (Model) { 443 case 1: return "opteron"; 444 case 5: return "athlon-fx"; // also opteron 445 default: return "athlon64"; 446 } 447 case 16: 448 return "amdfam10"; 449 case 20: 450 return "btver1"; 451 case 21: 452 if (!HasAVX) // If the OS doesn't support AVX provide a sane fallback. 453 return "btver1"; 454 if (Model >= 0x50) 455 return "bdver4"; // 50h-6Fh: Excavator 456 if (Model >= 0x30) 457 return "bdver3"; // 30h-3Fh: Steamroller 458 if (Model >= 0x10 || HasTBM) 459 return "bdver2"; // 10h-1Fh: Piledriver 460 return "bdver1"; // 00h-0Fh: Bulldozer 461 case 22: 462 if (!HasAVX) // If the OS doesn't support AVX provide a sane fallback. 463 return "btver1"; 464 return "btver2"; 465 default: 466 return "generic"; 467 } 468 } 469 return "generic"; 470 } 471 #elif defined(__APPLE__) && (defined(__ppc__) || defined(__powerpc__)) 472 StringRef sys::getHostCPUName() { 473 host_basic_info_data_t hostInfo; 474 mach_msg_type_number_t infoCount; 475 476 infoCount = HOST_BASIC_INFO_COUNT; 477 host_info(mach_host_self(), HOST_BASIC_INFO, (host_info_t)&hostInfo, 478 &infoCount); 479 480 if (hostInfo.cpu_type != CPU_TYPE_POWERPC) return "generic"; 481 482 switch(hostInfo.cpu_subtype) { 483 case CPU_SUBTYPE_POWERPC_601: return "601"; 484 case CPU_SUBTYPE_POWERPC_602: return "602"; 485 case CPU_SUBTYPE_POWERPC_603: return "603"; 486 case CPU_SUBTYPE_POWERPC_603e: return "603e"; 487 case CPU_SUBTYPE_POWERPC_603ev: return "603ev"; 488 case CPU_SUBTYPE_POWERPC_604: return "604"; 489 case CPU_SUBTYPE_POWERPC_604e: return "604e"; 490 case CPU_SUBTYPE_POWERPC_620: return "620"; 491 case CPU_SUBTYPE_POWERPC_750: return "750"; 492 case CPU_SUBTYPE_POWERPC_7400: return "7400"; 493 case CPU_SUBTYPE_POWERPC_7450: return "7450"; 494 case CPU_SUBTYPE_POWERPC_970: return "970"; 495 default: ; 496 } 497 498 return "generic"; 499 } 500 #elif defined(__linux__) && (defined(__ppc__) || defined(__powerpc__)) 501 StringRef sys::getHostCPUName() { 502 // Access to the Processor Version Register (PVR) on PowerPC is privileged, 503 // and so we must use an operating-system interface to determine the current 504 // processor type. On Linux, this is exposed through the /proc/cpuinfo file. 505 const char *generic = "generic"; 506 507 // The cpu line is second (after the 'processor: 0' line), so if this 508 // buffer is too small then something has changed (or is wrong). 509 char buffer[1024]; 510 ssize_t CPUInfoSize = readCpuInfo(buffer, sizeof(buffer)); 511 if (CPUInfoSize == -1) 512 return generic; 513 514 const char *CPUInfoStart = buffer; 515 const char *CPUInfoEnd = buffer + CPUInfoSize; 516 517 const char *CIP = CPUInfoStart; 518 519 const char *CPUStart = 0; 520 size_t CPULen = 0; 521 522 // We need to find the first line which starts with cpu, spaces, and a colon. 523 // After the colon, there may be some additional spaces and then the cpu type. 524 while (CIP < CPUInfoEnd && CPUStart == 0) { 525 if (CIP < CPUInfoEnd && *CIP == '\n') 526 ++CIP; 527 528 if (CIP < CPUInfoEnd && *CIP == 'c') { 529 ++CIP; 530 if (CIP < CPUInfoEnd && *CIP == 'p') { 531 ++CIP; 532 if (CIP < CPUInfoEnd && *CIP == 'u') { 533 ++CIP; 534 while (CIP < CPUInfoEnd && (*CIP == ' ' || *CIP == '\t')) 535 ++CIP; 536 537 if (CIP < CPUInfoEnd && *CIP == ':') { 538 ++CIP; 539 while (CIP < CPUInfoEnd && (*CIP == ' ' || *CIP == '\t')) 540 ++CIP; 541 542 if (CIP < CPUInfoEnd) { 543 CPUStart = CIP; 544 while (CIP < CPUInfoEnd && (*CIP != ' ' && *CIP != '\t' && 545 *CIP != ',' && *CIP != '\n')) 546 ++CIP; 547 CPULen = CIP - CPUStart; 548 } 549 } 550 } 551 } 552 } 553 554 if (CPUStart == 0) 555 while (CIP < CPUInfoEnd && *CIP != '\n') 556 ++CIP; 557 } 558 559 if (CPUStart == 0) 560 return generic; 561 562 return StringSwitch<const char *>(StringRef(CPUStart, CPULen)) 563 .Case("604e", "604e") 564 .Case("604", "604") 565 .Case("7400", "7400") 566 .Case("7410", "7400") 567 .Case("7447", "7400") 568 .Case("7455", "7450") 569 .Case("G4", "g4") 570 .Case("POWER4", "970") 571 .Case("PPC970FX", "970") 572 .Case("PPC970MP", "970") 573 .Case("G5", "g5") 574 .Case("POWER5", "g5") 575 .Case("A2", "a2") 576 .Case("POWER6", "pwr6") 577 .Case("POWER7", "pwr7") 578 .Case("POWER8", "pwr8") 579 .Case("POWER8E", "pwr8") 580 .Default(generic); 581 } 582 #elif defined(__linux__) && defined(__arm__) 583 StringRef sys::getHostCPUName() { 584 // The cpuid register on arm is not accessible from user space. On Linux, 585 // it is exposed through the /proc/cpuinfo file. 586 587 // Read 1024 bytes from /proc/cpuinfo, which should contain the CPU part line 588 // in all cases. 589 char buffer[1024]; 590 ssize_t CPUInfoSize = readCpuInfo(buffer, sizeof(buffer)); 591 if (CPUInfoSize == -1) 592 return "generic"; 593 594 StringRef Str(buffer, CPUInfoSize); 595 596 SmallVector<StringRef, 32> Lines; 597 Str.split(Lines, "\n"); 598 599 // Look for the CPU implementer line. 600 StringRef Implementer; 601 for (unsigned I = 0, E = Lines.size(); I != E; ++I) 602 if (Lines[I].startswith("CPU implementer")) 603 Implementer = Lines[I].substr(15).ltrim("\t :"); 604 605 if (Implementer == "0x41") // ARM Ltd. 606 // Look for the CPU part line. 607 for (unsigned I = 0, E = Lines.size(); I != E; ++I) 608 if (Lines[I].startswith("CPU part")) 609 // The CPU part is a 3 digit hexadecimal number with a 0x prefix. The 610 // values correspond to the "Part number" in the CP15/c0 register. The 611 // contents are specified in the various processor manuals. 612 return StringSwitch<const char *>(Lines[I].substr(8).ltrim("\t :")) 613 .Case("0x926", "arm926ej-s") 614 .Case("0xb02", "mpcore") 615 .Case("0xb36", "arm1136j-s") 616 .Case("0xb56", "arm1156t2-s") 617 .Case("0xb76", "arm1176jz-s") 618 .Case("0xc08", "cortex-a8") 619 .Case("0xc09", "cortex-a9") 620 .Case("0xc0f", "cortex-a15") 621 .Case("0xc20", "cortex-m0") 622 .Case("0xc23", "cortex-m3") 623 .Case("0xc24", "cortex-m4") 624 .Default("generic"); 625 626 if (Implementer == "0x51") // Qualcomm Technologies, Inc. 627 // Look for the CPU part line. 628 for (unsigned I = 0, E = Lines.size(); I != E; ++I) 629 if (Lines[I].startswith("CPU part")) 630 // The CPU part is a 3 digit hexadecimal number with a 0x prefix. The 631 // values correspond to the "Part number" in the CP15/c0 register. The 632 // contents are specified in the various processor manuals. 633 return StringSwitch<const char *>(Lines[I].substr(8).ltrim("\t :")) 634 .Case("0x06f", "krait") // APQ8064 635 .Default("generic"); 636 637 return "generic"; 638 } 639 #elif defined(__linux__) && defined(__s390x__) 640 StringRef sys::getHostCPUName() { 641 // STIDP is a privileged operation, so use /proc/cpuinfo instead. 642 643 // The "processor 0:" line comes after a fair amount of other information, 644 // including a cache breakdown, but this should be plenty. 645 char buffer[2048]; 646 ssize_t CPUInfoSize = readCpuInfo(buffer, sizeof(buffer)); 647 if (CPUInfoSize == -1) 648 return "generic"; 649 650 StringRef Str(buffer, CPUInfoSize); 651 SmallVector<StringRef, 32> Lines; 652 Str.split(Lines, "\n"); 653 for (unsigned I = 0, E = Lines.size(); I != E; ++I) { 654 if (Lines[I].startswith("processor ")) { 655 size_t Pos = Lines[I].find("machine = "); 656 if (Pos != StringRef::npos) { 657 Pos += sizeof("machine = ") - 1; 658 unsigned int Id; 659 if (!Lines[I].drop_front(Pos).getAsInteger(10, Id)) { 660 if (Id >= 2827) 661 return "zEC12"; 662 if (Id >= 2817) 663 return "z196"; 664 } 665 } 666 break; 667 } 668 } 669 670 return "generic"; 671 } 672 #else 673 StringRef sys::getHostCPUName() { 674 return "generic"; 675 } 676 #endif 677 678 #if defined(__linux__) && (defined(__arm__) || defined(__aarch64__)) 679 bool sys::getHostCPUFeatures(StringMap<bool> &Features) { 680 // Read 1024 bytes from /proc/cpuinfo, which should contain the Features line 681 // in all cases. 682 char buffer[1024]; 683 ssize_t CPUInfoSize = readCpuInfo(buffer, sizeof(buffer)); 684 if (CPUInfoSize == -1) 685 return false; 686 687 StringRef Str(buffer, CPUInfoSize); 688 689 SmallVector<StringRef, 32> Lines; 690 Str.split(Lines, "\n"); 691 692 SmallVector<StringRef, 32> CPUFeatures; 693 694 // Look for the CPU features. 695 for (unsigned I = 0, E = Lines.size(); I != E; ++I) 696 if (Lines[I].startswith("Features")) { 697 Lines[I].split(CPUFeatures, " "); 698 break; 699 } 700 701 #if defined(__aarch64__) 702 // Keep track of which crypto features we have seen 703 enum { 704 CAP_AES = 0x1, 705 CAP_PMULL = 0x2, 706 CAP_SHA1 = 0x4, 707 CAP_SHA2 = 0x8 708 }; 709 uint32_t crypto = 0; 710 #endif 711 712 for (unsigned I = 0, E = CPUFeatures.size(); I != E; ++I) { 713 StringRef LLVMFeatureStr = StringSwitch<StringRef>(CPUFeatures[I]) 714 #if defined(__aarch64__) 715 .Case("asimd", "neon") 716 .Case("fp", "fp-armv8") 717 .Case("crc32", "crc") 718 #else 719 .Case("half", "fp16") 720 .Case("neon", "neon") 721 .Case("vfpv3", "vfp3") 722 .Case("vfpv3d16", "d16") 723 .Case("vfpv4", "vfp4") 724 .Case("idiva", "hwdiv-arm") 725 .Case("idivt", "hwdiv") 726 #endif 727 .Default(""); 728 729 #if defined(__aarch64__) 730 // We need to check crypto separately since we need all of the crypto 731 // extensions to enable the subtarget feature 732 if (CPUFeatures[I] == "aes") 733 crypto |= CAP_AES; 734 else if (CPUFeatures[I] == "pmull") 735 crypto |= CAP_PMULL; 736 else if (CPUFeatures[I] == "sha1") 737 crypto |= CAP_SHA1; 738 else if (CPUFeatures[I] == "sha2") 739 crypto |= CAP_SHA2; 740 #endif 741 742 if (LLVMFeatureStr != "") 743 Features[LLVMFeatureStr] = true; 744 } 745 746 #if defined(__aarch64__) 747 // If we have all crypto bits we can add the feature 748 if (crypto == (CAP_AES | CAP_PMULL | CAP_SHA1 | CAP_SHA2)) 749 Features["crypto"] = true; 750 #endif 751 752 return true; 753 } 754 #else 755 bool sys::getHostCPUFeatures(StringMap<bool> &Features){ 756 return false; 757 } 758 #endif 759 760 std::string sys::getProcessTriple() { 761 Triple PT(Triple::normalize(LLVM_HOST_TRIPLE)); 762 763 if (sizeof(void *) == 8 && PT.isArch32Bit()) 764 PT = PT.get64BitArchVariant(); 765 if (sizeof(void *) == 4 && PT.isArch64Bit()) 766 PT = PT.get32BitArchVariant(); 767 768 return PT.str(); 769 } 770