1 //===-- NVPTXTargetMachine.cpp - Define TargetMachine for NVPTX -----------===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // Top-level implementation for the NVPTX target.
11 //
12 //===----------------------------------------------------------------------===//
13 
14 #include "NVPTXTargetMachine.h"
15 #include "MCTargetDesc/NVPTXMCAsmInfo.h"
16 #include "NVPTX.h"
17 #include "NVPTXAllocaHoisting.h"
18 #include "NVPTXLowerAggrCopies.h"
19 #include "NVPTXSplitBBatBar.h"
20 #include "llvm/ADT/OwningPtr.h"
21 #include "llvm/Analysis/Passes.h"
22 #include "llvm/Analysis/Verifier.h"
23 #include "llvm/Assembly/PrintModulePass.h"
24 #include "llvm/CodeGen/AsmPrinter.h"
25 #include "llvm/CodeGen/MachineFunctionAnalysis.h"
26 #include "llvm/CodeGen/MachineModuleInfo.h"
27 #include "llvm/CodeGen/Passes.h"
28 #include "llvm/IR/DataLayout.h"
29 #include "llvm/MC/MCAsmInfo.h"
30 #include "llvm/MC/MCInstrInfo.h"
31 #include "llvm/MC/MCStreamer.h"
32 #include "llvm/MC/MCSubtargetInfo.h"
33 #include "llvm/PassManager.h"
34 #include "llvm/Support/CommandLine.h"
35 #include "llvm/Support/Debug.h"
36 #include "llvm/Support/FormattedStream.h"
37 #include "llvm/Support/TargetRegistry.h"
38 #include "llvm/Support/raw_ostream.h"
39 #include "llvm/Target/TargetInstrInfo.h"
40 #include "llvm/Target/TargetLowering.h"
41 #include "llvm/Target/TargetLoweringObjectFile.h"
42 #include "llvm/Target/TargetMachine.h"
43 #include "llvm/Target/TargetOptions.h"
44 #include "llvm/Target/TargetRegisterInfo.h"
45 #include "llvm/Target/TargetSubtargetInfo.h"
46 #include "llvm/Transforms/Scalar.h"
47 
48 using namespace llvm;
49 
50 namespace llvm {
51 void initializeNVVMReflectPass(PassRegistry&);
52 void initializeGenericToNVVMPass(PassRegistry&);
53 }
54 
55 extern "C" void LLVMInitializeNVPTXTarget() {
56   // Register the target.
57   RegisterTargetMachine<NVPTXTargetMachine32> X(TheNVPTXTarget32);
58   RegisterTargetMachine<NVPTXTargetMachine64> Y(TheNVPTXTarget64);
59 
60   // FIXME: This pass is really intended to be invoked during IR optimization,
61   // but it's very NVPTX-specific.
62   initializeNVVMReflectPass(*PassRegistry::getPassRegistry());
63   initializeGenericToNVVMPass(*PassRegistry::getPassRegistry());
64 }
65 
66 NVPTXTargetMachine::NVPTXTargetMachine(
67     const Target &T, StringRef TT, StringRef CPU, StringRef FS,
68     const TargetOptions &Options, Reloc::Model RM, CodeModel::Model CM,
69     CodeGenOpt::Level OL, bool is64bit)
70     : LLVMTargetMachine(T, TT, CPU, FS, Options, RM, CM, OL),
71       Subtarget(TT, CPU, FS, is64bit), DL(Subtarget.getDataLayout()),
72       InstrInfo(*this), TLInfo(*this), TSInfo(*this),
73       FrameLowering(
74           *this, is64bit) /*FrameInfo(TargetFrameInfo::StackGrowsUp, 8, 0)*/ {
75   initAsmInfo();
76 }
77 
78 void NVPTXTargetMachine32::anchor() {}
79 
80 NVPTXTargetMachine32::NVPTXTargetMachine32(
81     const Target &T, StringRef TT, StringRef CPU, StringRef FS,
82     const TargetOptions &Options, Reloc::Model RM, CodeModel::Model CM,
83     CodeGenOpt::Level OL)
84     : NVPTXTargetMachine(T, TT, CPU, FS, Options, RM, CM, OL, false) {}
85 
86 void NVPTXTargetMachine64::anchor() {}
87 
88 NVPTXTargetMachine64::NVPTXTargetMachine64(
89     const Target &T, StringRef TT, StringRef CPU, StringRef FS,
90     const TargetOptions &Options, Reloc::Model RM, CodeModel::Model CM,
91     CodeGenOpt::Level OL)
92     : NVPTXTargetMachine(T, TT, CPU, FS, Options, RM, CM, OL, true) {}
93 
94 namespace {
95 class NVPTXPassConfig : public TargetPassConfig {
96 public:
97   NVPTXPassConfig(NVPTXTargetMachine *TM, PassManagerBase &PM)
98       : TargetPassConfig(TM, PM) {}
99 
100   NVPTXTargetMachine &getNVPTXTargetMachine() const {
101     return getTM<NVPTXTargetMachine>();
102   }
103 
104   virtual void addIRPasses();
105   virtual bool addInstSelector();
106   virtual bool addPreRegAlloc();
107   virtual bool addPostRegAlloc();
108 
109   virtual FunctionPass *createTargetRegisterAllocator(bool) LLVM_OVERRIDE;
110   virtual void addFastRegAlloc(FunctionPass *RegAllocPass);
111   virtual void addOptimizedRegAlloc(FunctionPass *RegAllocPass);
112 };
113 } // end anonymous namespace
114 
115 TargetPassConfig *NVPTXTargetMachine::createPassConfig(PassManagerBase &PM) {
116   NVPTXPassConfig *PassConfig = new NVPTXPassConfig(this, PM);
117   return PassConfig;
118 }
119 
120 void NVPTXPassConfig::addIRPasses() {
121   // The following passes are known to not play well with virtual regs hanging
122   // around after register allocation (which in our case, is *all* registers).
123   // We explicitly disable them here.  We do, however, need some functionality
124   // of the PrologEpilogCodeInserter pass, so we emulate that behavior in the
125   // NVPTXPrologEpilog pass (see NVPTXPrologEpilogPass.cpp).
126   disablePass(&PrologEpilogCodeInserterID);
127   disablePass(&MachineCopyPropagationID);
128   disablePass(&BranchFolderPassID);
129 
130   TargetPassConfig::addIRPasses();
131   addPass(createGenericToNVVMPass());
132 }
133 
134 bool NVPTXPassConfig::addInstSelector() {
135   addPass(createLowerAggrCopies());
136   addPass(createSplitBBatBarPass());
137   addPass(createAllocaHoisting());
138   addPass(createNVPTXISelDag(getNVPTXTargetMachine(), getOptLevel()));
139   return false;
140 }
141 
142 bool NVPTXPassConfig::addPreRegAlloc() { return false; }
143 bool NVPTXPassConfig::addPostRegAlloc() {
144   addPass(createNVPTXPrologEpilogPass());
145   return false;
146 }
147 
148 FunctionPass *NVPTXPassConfig::createTargetRegisterAllocator(bool) {
149   return 0; // No reg alloc
150 }
151 
152 void NVPTXPassConfig::addFastRegAlloc(FunctionPass *RegAllocPass) {
153   assert(!RegAllocPass && "NVPTX uses no regalloc!");
154   addPass(&PHIEliminationID);
155   addPass(&TwoAddressInstructionPassID);
156 }
157 
158 void NVPTXPassConfig::addOptimizedRegAlloc(FunctionPass *RegAllocPass) {
159   assert(!RegAllocPass && "NVPTX uses no regalloc!");
160 
161   addPass(&ProcessImplicitDefsID);
162   addPass(&LiveVariablesID);
163   addPass(&MachineLoopInfoID);
164   addPass(&PHIEliminationID);
165 
166   addPass(&TwoAddressInstructionPassID);
167   addPass(&RegisterCoalescerID);
168 
169   // PreRA instruction scheduling.
170   if (addPass(&MachineSchedulerID))
171     printAndVerify("After Machine Scheduling");
172 
173 
174   addPass(&StackSlotColoringID);
175 
176   // FIXME: Needs physical registers
177   //addPass(&PostRAMachineLICMID);
178 
179   printAndVerify("After StackSlotColoring");
180 }
181