1 //===- AMDGPUMCInstLower.cpp - Lower AMDGPU MachineInstr to an MCInst -----===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 /// \file
11 /// \brief Code to lower AMDGPU MachineInstrs to their corresponding MCInst.
12 //
13 //===----------------------------------------------------------------------===//
14 //
15 
16 #include "AMDGPUMCInstLower.h"
17 #include "AMDGPUAsmPrinter.h"
18 #include "AMDGPUSubtarget.h"
19 #include "AMDGPUTargetMachine.h"
20 #include "InstPrinter/AMDGPUInstPrinter.h"
21 #include "SIInstrInfo.h"
22 #include "llvm/CodeGen/MachineBasicBlock.h"
23 #include "llvm/CodeGen/MachineInstr.h"
24 #include "llvm/IR/Constants.h"
25 #include "llvm/IR/Function.h"
26 #include "llvm/IR/GlobalVariable.h"
27 #include "llvm/MC/MCCodeEmitter.h"
28 #include "llvm/MC/MCContext.h"
29 #include "llvm/MC/MCExpr.h"
30 #include "llvm/MC/MCInst.h"
31 #include "llvm/MC/MCObjectStreamer.h"
32 #include "llvm/MC/MCStreamer.h"
33 #include "llvm/Support/ErrorHandling.h"
34 #include "llvm/Support/Format.h"
35 #include <algorithm>
36 
37 using namespace llvm;
38 
39 #include "AMDGPUGenMCPseudoLowering.inc"
40 
41 
42 AMDGPUMCInstLower::AMDGPUMCInstLower(MCContext &ctx, const AMDGPUSubtarget &st,
43                                      const AsmPrinter &ap):
44   Ctx(ctx), ST(st), AP(ap) { }
45 
46 static MCSymbolRefExpr::VariantKind getVariantKind(unsigned MOFlags) {
47   switch (MOFlags) {
48   default:
49     return MCSymbolRefExpr::VK_None;
50   case SIInstrInfo::MO_GOTPCREL:
51     return MCSymbolRefExpr::VK_GOTPCREL;
52   case SIInstrInfo::MO_GOTPCREL32_LO:
53     return MCSymbolRefExpr::VK_AMDGPU_GOTPCREL32_LO;
54   case SIInstrInfo::MO_GOTPCREL32_HI:
55     return MCSymbolRefExpr::VK_AMDGPU_GOTPCREL32_HI;
56   case SIInstrInfo::MO_REL32_LO:
57     return MCSymbolRefExpr::VK_AMDGPU_REL32_LO;
58   case SIInstrInfo::MO_REL32_HI:
59     return MCSymbolRefExpr::VK_AMDGPU_REL32_HI;
60   }
61 }
62 
63 const MCExpr *AMDGPUMCInstLower::getLongBranchBlockExpr(
64   const MachineBasicBlock &SrcBB,
65   const MachineOperand &MO) const {
66   const MCExpr *DestBBSym
67     = MCSymbolRefExpr::create(MO.getMBB()->getSymbol(), Ctx);
68   const MCExpr *SrcBBSym = MCSymbolRefExpr::create(SrcBB.getSymbol(), Ctx);
69 
70   assert(SrcBB.front().getOpcode() == AMDGPU::S_GETPC_B64 &&
71          ST.getInstrInfo()->get(AMDGPU::S_GETPC_B64).Size == 4);
72 
73   // s_getpc_b64 returns the address of next instruction.
74   const MCConstantExpr *One = MCConstantExpr::create(4, Ctx);
75   SrcBBSym = MCBinaryExpr::createAdd(SrcBBSym, One, Ctx);
76 
77   if (MO.getTargetFlags() == AMDGPU::TF_LONG_BRANCH_FORWARD)
78     return MCBinaryExpr::createSub(DestBBSym, SrcBBSym, Ctx);
79 
80   assert(MO.getTargetFlags() == AMDGPU::TF_LONG_BRANCH_BACKWARD);
81   return MCBinaryExpr::createSub(SrcBBSym, DestBBSym, Ctx);
82 }
83 
84 bool AMDGPUMCInstLower::lowerOperand(const MachineOperand &MO,
85                                      MCOperand &MCOp) const {
86   switch (MO.getType()) {
87   default:
88     llvm_unreachable("unknown operand type");
89   case MachineOperand::MO_Immediate:
90     MCOp = MCOperand::createImm(MO.getImm());
91     return true;
92   case MachineOperand::MO_Register:
93     MCOp = MCOperand::createReg(AMDGPU::getMCReg(MO.getReg(), ST));
94     return true;
95   case MachineOperand::MO_MachineBasicBlock: {
96     if (MO.getTargetFlags() != 0) {
97       MCOp = MCOperand::createExpr(
98         getLongBranchBlockExpr(*MO.getParent()->getParent(), MO));
99     } else {
100       MCOp = MCOperand::createExpr(
101         MCSymbolRefExpr::create(MO.getMBB()->getSymbol(), Ctx));
102     }
103 
104     return true;
105   }
106   case MachineOperand::MO_GlobalAddress: {
107     const GlobalValue *GV = MO.getGlobal();
108     SmallString<128> SymbolName;
109     AP.getNameWithPrefix(SymbolName, GV);
110     MCSymbol *Sym = Ctx.getOrCreateSymbol(SymbolName);
111     const MCExpr *SymExpr =
112       MCSymbolRefExpr::create(Sym, getVariantKind(MO.getTargetFlags()),Ctx);
113     const MCExpr *Expr = MCBinaryExpr::createAdd(SymExpr,
114       MCConstantExpr::create(MO.getOffset(), Ctx), Ctx);
115     MCOp = MCOperand::createExpr(Expr);
116     return true;
117   }
118   case MachineOperand::MO_ExternalSymbol: {
119     MCSymbol *Sym = Ctx.getOrCreateSymbol(StringRef(MO.getSymbolName()));
120     Sym->setExternal(true);
121     const MCSymbolRefExpr *Expr = MCSymbolRefExpr::create(Sym, Ctx);
122     MCOp = MCOperand::createExpr(Expr);
123     return true;
124   }
125   }
126 }
127 
128 void AMDGPUMCInstLower::lower(const MachineInstr *MI, MCInst &OutMI) const {
129 
130   int MCOpcode = ST.getInstrInfo()->pseudoToMCOpcode(MI->getOpcode());
131 
132   if (MCOpcode == -1) {
133     LLVMContext &C = MI->getParent()->getParent()->getFunction()->getContext();
134     C.emitError("AMDGPUMCInstLower::lower - Pseudo instruction doesn't have "
135                 "a target-specific version: " + Twine(MI->getOpcode()));
136   }
137 
138   OutMI.setOpcode(MCOpcode);
139 
140   for (const MachineOperand &MO : MI->explicit_operands()) {
141     MCOperand MCOp;
142     lowerOperand(MO, MCOp);
143     OutMI.addOperand(MCOp);
144   }
145 }
146 
147 bool AMDGPUAsmPrinter::lowerOperand(const MachineOperand &MO,
148                                     MCOperand &MCOp) const {
149   const AMDGPUSubtarget &STI = MF->getSubtarget<AMDGPUSubtarget>();
150   AMDGPUMCInstLower MCInstLowering(OutContext, STI, *this);
151   return MCInstLowering.lowerOperand(MO, MCOp);
152 }
153 
154 const MCExpr *AMDGPUAsmPrinter::lowerConstant(const Constant *CV) {
155   // TargetMachine does not support llvm-style cast. Use C++-style cast.
156   // This is safe since TM is always of type AMDGPUTargetMachine or its
157   // derived class.
158   auto *AT = static_cast<AMDGPUTargetMachine*>(&TM);
159   auto *CE = dyn_cast<ConstantExpr>(CV);
160 
161   // Lower null pointers in private and local address space.
162   // Clang generates addrspacecast for null pointers in private and local
163   // address space, which needs to be lowered.
164   if (CE && CE->getOpcode() == Instruction::AddrSpaceCast) {
165     auto Op = CE->getOperand(0);
166     auto SrcAddr = Op->getType()->getPointerAddressSpace();
167     if (Op->isNullValue() && AT->getNullPointerValue(SrcAddr) == 0) {
168       auto DstAddr = CE->getType()->getPointerAddressSpace();
169       return MCConstantExpr::create(AT->getNullPointerValue(DstAddr),
170         OutContext);
171     }
172   }
173   return AsmPrinter::lowerConstant(CV);
174 }
175 
176 void AMDGPUAsmPrinter::EmitInstruction(const MachineInstr *MI) {
177   if (emitPseudoExpansionLowering(*OutStreamer, MI))
178     return;
179 
180   const AMDGPUSubtarget &STI = MF->getSubtarget<AMDGPUSubtarget>();
181   AMDGPUMCInstLower MCInstLowering(OutContext, STI, *this);
182 
183   StringRef Err;
184   if (!STI.getInstrInfo()->verifyInstruction(*MI, Err)) {
185     LLVMContext &C = MI->getParent()->getParent()->getFunction()->getContext();
186     C.emitError("Illegal instruction detected: " + Err);
187     MI->print(errs());
188   }
189 
190   if (MI->isBundle()) {
191     const MachineBasicBlock *MBB = MI->getParent();
192     MachineBasicBlock::const_instr_iterator I = ++MI->getIterator();
193     while (I != MBB->instr_end() && I->isInsideBundle()) {
194       EmitInstruction(&*I);
195       ++I;
196     }
197   } else {
198     // We don't want SI_MASK_BRANCH/SI_RETURN encoded. They are placeholder
199     // terminator instructions and should only be printed as comments.
200     if (MI->getOpcode() == AMDGPU::SI_MASK_BRANCH) {
201       if (isVerbose()) {
202         SmallVector<char, 16> BBStr;
203         raw_svector_ostream Str(BBStr);
204 
205         const MachineBasicBlock *MBB = MI->getOperand(0).getMBB();
206         const MCSymbolRefExpr *Expr
207           = MCSymbolRefExpr::create(MBB->getSymbol(), OutContext);
208         Expr->print(Str, MAI);
209         OutStreamer->emitRawComment(" mask branch " + BBStr);
210       }
211 
212       return;
213     }
214 
215     if (MI->getOpcode() == AMDGPU::SI_RETURN) {
216       if (isVerbose())
217         OutStreamer->emitRawComment(" return");
218       return;
219     }
220 
221     if (MI->getOpcode() == AMDGPU::WAVE_BARRIER) {
222       if (isVerbose())
223         OutStreamer->emitRawComment(" wave barrier");
224       return;
225     }
226 
227     MCInst TmpInst;
228     MCInstLowering.lower(MI, TmpInst);
229     EmitToStreamer(*OutStreamer, TmpInst);
230 
231     if (STI.dumpCode()) {
232       // Disassemble instruction/operands to text.
233       DisasmLines.resize(DisasmLines.size() + 1);
234       std::string &DisasmLine = DisasmLines.back();
235       raw_string_ostream DisasmStream(DisasmLine);
236 
237       AMDGPUInstPrinter InstPrinter(*TM.getMCAsmInfo(),
238                                     *STI.getInstrInfo(),
239                                     *STI.getRegisterInfo());
240       InstPrinter.printInst(&TmpInst, DisasmStream, StringRef(), STI);
241 
242       // Disassemble instruction/operands to hex representation.
243       SmallVector<MCFixup, 4> Fixups;
244       SmallVector<char, 16> CodeBytes;
245       raw_svector_ostream CodeStream(CodeBytes);
246 
247       auto &ObjStreamer = static_cast<MCObjectStreamer&>(*OutStreamer);
248       MCCodeEmitter &InstEmitter = ObjStreamer.getAssembler().getEmitter();
249       InstEmitter.encodeInstruction(TmpInst, CodeStream, Fixups,
250                                     MF->getSubtarget<MCSubtargetInfo>());
251       HexLines.resize(HexLines.size() + 1);
252       std::string &HexLine = HexLines.back();
253       raw_string_ostream HexStream(HexLine);
254 
255       for (size_t i = 0; i < CodeBytes.size(); i += 4) {
256         unsigned int CodeDWord = *(unsigned int *)&CodeBytes[i];
257         HexStream << format("%s%08X", (i > 0 ? " " : ""), CodeDWord);
258       }
259 
260       DisasmStream.flush();
261       DisasmLineMaxLen = std::max(DisasmLineMaxLen, DisasmLine.size());
262     }
263   }
264 }
265