1 //===-- NVPTXTargetMachine.cpp - Define TargetMachine for NVPTX -----------===// 2 // 3 // The LLVM Compiler Infrastructure 4 // 5 // This file is distributed under the University of Illinois Open Source 6 // License. See LICENSE.TXT for details. 7 // 8 //===----------------------------------------------------------------------===// 9 // 10 // Top-level implementation for the NVPTX target. 11 // 12 //===----------------------------------------------------------------------===// 13 14 #include "NVPTXTargetMachine.h" 15 #include "MCTargetDesc/NVPTXMCAsmInfo.h" 16 #include "NVPTX.h" 17 #include "NVPTXAllocaHoisting.h" 18 #include "NVPTXLowerAggrCopies.h" 19 #include "llvm/Analysis/Passes.h" 20 #include "llvm/CodeGen/AsmPrinter.h" 21 #include "llvm/CodeGen/MachineFunctionAnalysis.h" 22 #include "llvm/CodeGen/MachineModuleInfo.h" 23 #include "llvm/CodeGen/Passes.h" 24 #include "llvm/IR/DataLayout.h" 25 #include "llvm/IR/IRPrintingPasses.h" 26 #include "llvm/IR/Verifier.h" 27 #include "llvm/MC/MCAsmInfo.h" 28 #include "llvm/MC/MCInstrInfo.h" 29 #include "llvm/MC/MCStreamer.h" 30 #include "llvm/MC/MCSubtargetInfo.h" 31 #include "llvm/PassManager.h" 32 #include "llvm/Support/CommandLine.h" 33 #include "llvm/Support/Debug.h" 34 #include "llvm/Support/FormattedStream.h" 35 #include "llvm/Support/TargetRegistry.h" 36 #include "llvm/Support/raw_ostream.h" 37 #include "llvm/Target/TargetInstrInfo.h" 38 #include "llvm/Target/TargetLowering.h" 39 #include "llvm/Target/TargetLoweringObjectFile.h" 40 #include "llvm/Target/TargetMachine.h" 41 #include "llvm/Target/TargetOptions.h" 42 #include "llvm/Target/TargetRegisterInfo.h" 43 #include "llvm/Target/TargetSubtargetInfo.h" 44 #include "llvm/Transforms/Scalar.h" 45 46 using namespace llvm; 47 48 namespace llvm { 49 void initializeNVVMReflectPass(PassRegistry&); 50 void initializeGenericToNVVMPass(PassRegistry&); 51 void initializeNVPTXAssignValidGlobalNamesPass(PassRegistry&); 52 void initializeNVPTXFavorNonGenericAddrSpacesPass(PassRegistry &); 53 } 54 55 extern "C" void LLVMInitializeNVPTXTarget() { 56 // Register the target. 57 RegisterTargetMachine<NVPTXTargetMachine32> X(TheNVPTXTarget32); 58 RegisterTargetMachine<NVPTXTargetMachine64> Y(TheNVPTXTarget64); 59 60 // FIXME: This pass is really intended to be invoked during IR optimization, 61 // but it's very NVPTX-specific. 62 initializeNVVMReflectPass(*PassRegistry::getPassRegistry()); 63 initializeGenericToNVVMPass(*PassRegistry::getPassRegistry()); 64 initializeNVPTXAssignValidGlobalNamesPass(*PassRegistry::getPassRegistry()); 65 initializeNVPTXFavorNonGenericAddrSpacesPass( 66 *PassRegistry::getPassRegistry()); 67 } 68 69 static std::string computeDataLayout(const NVPTXSubtarget &ST) { 70 std::string Ret = "e"; 71 72 if (!ST.is64Bit()) 73 Ret += "-p:32:32"; 74 75 Ret += "-i64:64-v16:16-v32:32-n16:32:64"; 76 77 return Ret; 78 } 79 80 NVPTXTargetMachine::NVPTXTargetMachine( 81 const Target &T, StringRef TT, StringRef CPU, StringRef FS, 82 const TargetOptions &Options, Reloc::Model RM, CodeModel::Model CM, 83 CodeGenOpt::Level OL, bool is64bit) 84 : LLVMTargetMachine(T, TT, CPU, FS, Options, RM, CM, OL), 85 Subtarget(TT, CPU, FS, is64bit), DL(computeDataLayout(Subtarget)), 86 InstrInfo(*this), TLInfo(*this), TSInfo(*this), 87 FrameLowering( 88 *this, is64bit) /*FrameInfo(TargetFrameInfo::StackGrowsUp, 8, 0)*/ { 89 initAsmInfo(); 90 } 91 92 void NVPTXTargetMachine32::anchor() {} 93 94 NVPTXTargetMachine32::NVPTXTargetMachine32( 95 const Target &T, StringRef TT, StringRef CPU, StringRef FS, 96 const TargetOptions &Options, Reloc::Model RM, CodeModel::Model CM, 97 CodeGenOpt::Level OL) 98 : NVPTXTargetMachine(T, TT, CPU, FS, Options, RM, CM, OL, false) {} 99 100 void NVPTXTargetMachine64::anchor() {} 101 102 NVPTXTargetMachine64::NVPTXTargetMachine64( 103 const Target &T, StringRef TT, StringRef CPU, StringRef FS, 104 const TargetOptions &Options, Reloc::Model RM, CodeModel::Model CM, 105 CodeGenOpt::Level OL) 106 : NVPTXTargetMachine(T, TT, CPU, FS, Options, RM, CM, OL, true) {} 107 108 namespace { 109 class NVPTXPassConfig : public TargetPassConfig { 110 public: 111 NVPTXPassConfig(NVPTXTargetMachine *TM, PassManagerBase &PM) 112 : TargetPassConfig(TM, PM) {} 113 114 NVPTXTargetMachine &getNVPTXTargetMachine() const { 115 return getTM<NVPTXTargetMachine>(); 116 } 117 118 virtual void addIRPasses(); 119 virtual bool addInstSelector(); 120 virtual bool addPreRegAlloc(); 121 virtual bool addPostRegAlloc(); 122 123 virtual FunctionPass *createTargetRegisterAllocator(bool) override; 124 virtual void addFastRegAlloc(FunctionPass *RegAllocPass); 125 virtual void addOptimizedRegAlloc(FunctionPass *RegAllocPass); 126 }; 127 } // end anonymous namespace 128 129 TargetPassConfig *NVPTXTargetMachine::createPassConfig(PassManagerBase &PM) { 130 NVPTXPassConfig *PassConfig = new NVPTXPassConfig(this, PM); 131 return PassConfig; 132 } 133 134 void NVPTXPassConfig::addIRPasses() { 135 // The following passes are known to not play well with virtual regs hanging 136 // around after register allocation (which in our case, is *all* registers). 137 // We explicitly disable them here. We do, however, need some functionality 138 // of the PrologEpilogCodeInserter pass, so we emulate that behavior in the 139 // NVPTXPrologEpilog pass (see NVPTXPrologEpilogPass.cpp). 140 disablePass(&PrologEpilogCodeInserterID); 141 disablePass(&MachineCopyPropagationID); 142 disablePass(&BranchFolderPassID); 143 disablePass(&TailDuplicateID); 144 145 addPass(createNVPTXImageOptimizerPass()); 146 TargetPassConfig::addIRPasses(); 147 addPass(createNVPTXAssignValidGlobalNamesPass()); 148 addPass(createGenericToNVVMPass()); 149 addPass(createNVPTXFavorNonGenericAddrSpacesPass()); 150 // The FavorNonGenericAddrSpaces pass may remove instructions and leave some 151 // values unused. Therefore, we run a DCE pass right afterwards. We could 152 // remove unused values in an ad-hoc manner, but it requires manual work and 153 // might be error-prone. 154 addPass(createDeadCodeEliminationPass()); 155 } 156 157 bool NVPTXPassConfig::addInstSelector() { 158 const NVPTXSubtarget &ST = 159 getTM<NVPTXTargetMachine>().getSubtarget<NVPTXSubtarget>(); 160 161 addPass(createLowerAggrCopies()); 162 addPass(createAllocaHoisting()); 163 addPass(createNVPTXISelDag(getNVPTXTargetMachine(), getOptLevel())); 164 165 if (!ST.hasImageHandles()) 166 addPass(createNVPTXReplaceImageHandlesPass()); 167 168 return false; 169 } 170 171 bool NVPTXPassConfig::addPreRegAlloc() { return false; } 172 bool NVPTXPassConfig::addPostRegAlloc() { 173 addPass(createNVPTXPrologEpilogPass()); 174 return false; 175 } 176 177 FunctionPass *NVPTXPassConfig::createTargetRegisterAllocator(bool) { 178 return 0; // No reg alloc 179 } 180 181 void NVPTXPassConfig::addFastRegAlloc(FunctionPass *RegAllocPass) { 182 assert(!RegAllocPass && "NVPTX uses no regalloc!"); 183 addPass(&PHIEliminationID); 184 addPass(&TwoAddressInstructionPassID); 185 } 186 187 void NVPTXPassConfig::addOptimizedRegAlloc(FunctionPass *RegAllocPass) { 188 assert(!RegAllocPass && "NVPTX uses no regalloc!"); 189 190 addPass(&ProcessImplicitDefsID); 191 addPass(&LiveVariablesID); 192 addPass(&MachineLoopInfoID); 193 addPass(&PHIEliminationID); 194 195 addPass(&TwoAddressInstructionPassID); 196 addPass(&RegisterCoalescerID); 197 198 // PreRA instruction scheduling. 199 if (addPass(&MachineSchedulerID)) 200 printAndVerify("After Machine Scheduling"); 201 202 203 addPass(&StackSlotColoringID); 204 205 // FIXME: Needs physical registers 206 //addPass(&PostRAMachineLICMID); 207 208 printAndVerify("After StackSlotColoring"); 209 } 210