1 //===-- AArch64Subtarget.cpp - AArch64 Subtarget Information ----*- C++ -*-===// 2 // 3 // The LLVM Compiler Infrastructure 4 // 5 // This file is distributed under the University of Illinois Open Source 6 // License. See LICENSE.TXT for details. 7 // 8 //===----------------------------------------------------------------------===// 9 // 10 // This file implements the AArch64 specific subclass of TargetSubtarget. 11 // 12 //===----------------------------------------------------------------------===// 13 14 #include "AArch64Subtarget.h" 15 #include "AArch64InstrInfo.h" 16 #include "AArch64PBQPRegAlloc.h" 17 #include "llvm/CodeGen/MachineScheduler.h" 18 #include "llvm/IR/GlobalValue.h" 19 #include "llvm/Support/TargetRegistry.h" 20 21 using namespace llvm; 22 23 #define DEBUG_TYPE "aarch64-subtarget" 24 25 #define GET_SUBTARGETINFO_CTOR 26 #define GET_SUBTARGETINFO_TARGET_DESC 27 #include "AArch64GenSubtargetInfo.inc" 28 29 static cl::opt<bool> 30 EnableEarlyIfConvert("aarch64-early-ifcvt", cl::desc("Enable the early if " 31 "converter pass"), cl::init(true), cl::Hidden); 32 33 // If OS supports TBI, use this flag to enable it. 34 static cl::opt<bool> 35 UseAddressTopByteIgnored("aarch64-use-tbi", cl::desc("Assume that top byte of " 36 "an address is ignored"), cl::init(false), cl::Hidden); 37 38 AArch64Subtarget & 39 AArch64Subtarget::initializeSubtargetDependencies(StringRef FS, 40 StringRef CPUString) { 41 // Determine default and user-specified characteristics 42 43 if (CPUString.empty()) 44 CPUString = "generic"; 45 46 ParseSubtargetFeatures(CPUString, FS); 47 initializeProperties(); 48 49 return *this; 50 } 51 52 void AArch64Subtarget::initializeProperties() { 53 // Initialize CPU specific properties. We should add a tablegen feature for 54 // this in the future so we can specify it together with the subtarget 55 // features. 56 switch (ARMProcFamily) { 57 case Cyclone: 58 CacheLineSize = 64; 59 PrefetchDistance = 280; 60 MinPrefetchStride = 2048; 61 MaxPrefetchIterationsAhead = 3; 62 break; 63 case CortexA57: 64 MaxInterleaveFactor = 4; 65 break; 66 case ExynosM1: 67 PrefFunctionAlignment = 4; 68 PrefLoopAlignment = 3; 69 MaxJumpTableSize = 12; 70 break; 71 case Kryo: 72 MaxInterleaveFactor = 4; 73 VectorInsertExtractBaseCost = 2; 74 CacheLineSize = 128; 75 PrefetchDistance = 740; 76 MinPrefetchStride = 1024; 77 MaxPrefetchIterationsAhead = 11; 78 break; 79 case Vulcan: 80 MaxInterleaveFactor = 4; 81 break; 82 case CortexA35: break; 83 case CortexA53: break; 84 case CortexA72: break; 85 case CortexA73: break; 86 case Others: break; 87 } 88 } 89 90 AArch64Subtarget::AArch64Subtarget(const Triple &TT, const std::string &CPU, 91 const std::string &FS, 92 const TargetMachine &TM, bool LittleEndian) 93 : AArch64GenSubtargetInfo(TT, CPU, FS), ReserveX18(TT.isOSDarwin()), 94 IsLittle(LittleEndian), TargetTriple(TT), FrameLowering(), 95 InstrInfo(initializeSubtargetDependencies(FS, CPU)), TSInfo(), 96 TLInfo(TM, *this), GISel() {} 97 98 const CallLowering *AArch64Subtarget::getCallLowering() const { 99 assert(GISel && "Access to GlobalISel APIs not set"); 100 return GISel->getCallLowering(); 101 } 102 103 const InstructionSelector *AArch64Subtarget::getInstructionSelector() const { 104 assert(GISel && "Access to GlobalISel APIs not set"); 105 return GISel->getInstructionSelector(); 106 } 107 108 const LegalizerInfo *AArch64Subtarget::getLegalizerInfo() const { 109 assert(GISel && "Access to GlobalISel APIs not set"); 110 return GISel->getLegalizerInfo(); 111 } 112 113 const RegisterBankInfo *AArch64Subtarget::getRegBankInfo() const { 114 assert(GISel && "Access to GlobalISel APIs not set"); 115 return GISel->getRegBankInfo(); 116 } 117 118 /// Find the target operand flags that describe how a global value should be 119 /// referenced for the current subtarget. 120 unsigned char 121 AArch64Subtarget::ClassifyGlobalReference(const GlobalValue *GV, 122 const TargetMachine &TM) const { 123 // MachO large model always goes via a GOT, simply to get a single 8-byte 124 // absolute relocation on all global addresses. 125 if (TM.getCodeModel() == CodeModel::Large && isTargetMachO()) 126 return AArch64II::MO_GOT; 127 128 if (!TM.shouldAssumeDSOLocal(*GV->getParent(), GV)) 129 return AArch64II::MO_GOT; 130 131 // The small code mode's direct accesses use ADRP, which cannot necessarily 132 // produce the value 0 (if the code is above 4GB). 133 if (TM.getCodeModel() == CodeModel::Small && GV->hasExternalWeakLinkage()) 134 return AArch64II::MO_GOT; 135 136 return AArch64II::MO_NO_FLAG; 137 } 138 139 /// This function returns the name of a function which has an interface 140 /// like the non-standard bzero function, if such a function exists on 141 /// the current subtarget and it is considered prefereable over 142 /// memset with zero passed as the second argument. Otherwise it 143 /// returns null. 144 const char *AArch64Subtarget::getBZeroEntry() const { 145 // Prefer bzero on Darwin only. 146 if(isTargetDarwin()) 147 return "bzero"; 148 149 return nullptr; 150 } 151 152 void AArch64Subtarget::overrideSchedPolicy(MachineSchedPolicy &Policy, 153 unsigned NumRegionInstrs) const { 154 // LNT run (at least on Cyclone) showed reasonably significant gains for 155 // bi-directional scheduling. 253.perlbmk. 156 Policy.OnlyTopDown = false; 157 Policy.OnlyBottomUp = false; 158 // Enabling or Disabling the latency heuristic is a close call: It seems to 159 // help nearly no benchmark on out-of-order architectures, on the other hand 160 // it regresses register pressure on a few benchmarking. 161 Policy.DisableLatencyHeuristic = DisableLatencySchedHeuristic; 162 } 163 164 bool AArch64Subtarget::enableEarlyIfConversion() const { 165 return EnableEarlyIfConvert; 166 } 167 168 bool AArch64Subtarget::supportsAddressTopByteIgnored() const { 169 if (!UseAddressTopByteIgnored) 170 return false; 171 172 if (TargetTriple.isiOS()) { 173 unsigned Major, Minor, Micro; 174 TargetTriple.getiOSVersion(Major, Minor, Micro); 175 return Major >= 8; 176 } 177 178 return false; 179 } 180 181 std::unique_ptr<PBQPRAConstraint> 182 AArch64Subtarget::getCustomPBQPConstraints() const { 183 return balanceFPOps() ? llvm::make_unique<A57ChainingConstraint>() : nullptr; 184 } 185