1 //===-- AMDGPUInstPrinter.cpp - AMDGPU MC Inst -> ASM ---------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 // \file
8 //===----------------------------------------------------------------------===//
9 
10 #include "AMDGPUInstPrinter.h"
11 #include "MCTargetDesc/AMDGPUMCTargetDesc.h"
12 #include "SIDefines.h"
13 #include "Utils/AMDGPUAsmUtils.h"
14 #include "Utils/AMDGPUBaseInfo.h"
15 #include "llvm/MC/MCExpr.h"
16 #include "llvm/MC/MCInst.h"
17 #include "llvm/MC/MCInstrDesc.h"
18 #include "llvm/MC/MCInstrInfo.h"
19 #include "llvm/MC/MCRegisterInfo.h"
20 #include "llvm/MC/MCSubtargetInfo.h"
21 #include "llvm/Support/ErrorHandling.h"
22 #include "llvm/Support/MathExtras.h"
23 #include "llvm/Support/raw_ostream.h"
24 #include <cassert>
25 
26 using namespace llvm;
27 using namespace llvm::AMDGPU;
28 
29 void AMDGPUInstPrinter::printRegName(raw_ostream &OS, unsigned RegNo) const {
30   // FIXME: The current implementation of
31   // AsmParser::parseRegisterOrRegisterNumber in MC implies we either emit this
32   // as an integer or we provide a name which represents a physical register.
33   // For CFI instructions we really want to emit a name for the DWARF register
34   // instead, because there may be multiple DWARF registers corresponding to a
35   // single physical register. One case where this problem manifests is with
36   // wave32/wave64 where using the physical register name is ambiguous: if we
37   // write e.g. `.cfi_undefined v0` we lose information about the wavefront
38   // size which we need to encode the register in the final DWARF. Ideally we
39   // would extend MC to support parsing DWARF register names so we could do
40   // something like `.cfi_undefined dwarf_wave32_v0`. For now we just live with
41   // non-pretty DWARF register names in assembly text.
42   OS << RegNo;
43 }
44 
45 void AMDGPUInstPrinter::printInst(const MCInst *MI, uint64_t Address,
46                                   StringRef Annot, const MCSubtargetInfo &STI,
47                                   raw_ostream &OS) {
48   OS.flush();
49   printInstruction(MI, Address, STI, OS);
50   printAnnotation(OS, Annot);
51 }
52 
53 void AMDGPUInstPrinter::printU4ImmOperand(const MCInst *MI, unsigned OpNo,
54                                           const MCSubtargetInfo &STI,
55                                           raw_ostream &O) {
56   O << formatHex(MI->getOperand(OpNo).getImm() & 0xf);
57 }
58 
59 void AMDGPUInstPrinter::printU8ImmOperand(const MCInst *MI, unsigned OpNo,
60                                           raw_ostream &O) {
61   O << formatHex(MI->getOperand(OpNo).getImm() & 0xff);
62 }
63 
64 void AMDGPUInstPrinter::printU16ImmOperand(const MCInst *MI, unsigned OpNo,
65                                            const MCSubtargetInfo &STI,
66                                            raw_ostream &O) {
67   // It's possible to end up with a 32-bit literal used with a 16-bit operand
68   // with ignored high bits. Print as 32-bit anyway in that case.
69   int64_t Imm = MI->getOperand(OpNo).getImm();
70   if (isInt<16>(Imm) || isUInt<16>(Imm))
71     O << formatHex(static_cast<uint64_t>(Imm & 0xffff));
72   else
73     printU32ImmOperand(MI, OpNo, STI, O);
74 }
75 
76 void AMDGPUInstPrinter::printU4ImmDecOperand(const MCInst *MI, unsigned OpNo,
77                                              raw_ostream &O) {
78   O << formatDec(MI->getOperand(OpNo).getImm() & 0xf);
79 }
80 
81 void AMDGPUInstPrinter::printU8ImmDecOperand(const MCInst *MI, unsigned OpNo,
82                                              raw_ostream &O) {
83   O << formatDec(MI->getOperand(OpNo).getImm() & 0xff);
84 }
85 
86 void AMDGPUInstPrinter::printU16ImmDecOperand(const MCInst *MI, unsigned OpNo,
87                                               raw_ostream &O) {
88   O << formatDec(MI->getOperand(OpNo).getImm() & 0xffff);
89 }
90 
91 void AMDGPUInstPrinter::printU32ImmOperand(const MCInst *MI, unsigned OpNo,
92                                            const MCSubtargetInfo &STI,
93                                            raw_ostream &O) {
94   O << formatHex(MI->getOperand(OpNo).getImm() & 0xffffffff);
95 }
96 
97 void AMDGPUInstPrinter::printNamedBit(const MCInst *MI, unsigned OpNo,
98                                       raw_ostream &O, StringRef BitName) {
99   if (MI->getOperand(OpNo).getImm()) {
100     O << ' ' << BitName;
101   }
102 }
103 
104 void AMDGPUInstPrinter::printOffen(const MCInst *MI, unsigned OpNo,
105                                    raw_ostream &O) {
106   printNamedBit(MI, OpNo, O, "offen");
107 }
108 
109 void AMDGPUInstPrinter::printIdxen(const MCInst *MI, unsigned OpNo,
110                                    raw_ostream &O) {
111   printNamedBit(MI, OpNo, O, "idxen");
112 }
113 
114 void AMDGPUInstPrinter::printAddr64(const MCInst *MI, unsigned OpNo,
115                                     raw_ostream &O) {
116   printNamedBit(MI, OpNo, O, "addr64");
117 }
118 
119 void AMDGPUInstPrinter::printMBUFOffset(const MCInst *MI, unsigned OpNo,
120                                         raw_ostream &O) {
121   if (MI->getOperand(OpNo).getImm()) {
122     O << " offset:";
123     printU16ImmDecOperand(MI, OpNo, O);
124   }
125 }
126 
127 void AMDGPUInstPrinter::printOffset(const MCInst *MI, unsigned OpNo,
128                                     const MCSubtargetInfo &STI,
129                                     raw_ostream &O) {
130   uint16_t Imm = MI->getOperand(OpNo).getImm();
131   if (Imm != 0) {
132     O << ((OpNo == 0)? "offset:" : " offset:");
133     printU16ImmDecOperand(MI, OpNo, O);
134   }
135 }
136 
137 void AMDGPUInstPrinter::printFlatOffset(const MCInst *MI, unsigned OpNo,
138                                         const MCSubtargetInfo &STI,
139                                         raw_ostream &O) {
140   uint16_t Imm = MI->getOperand(OpNo).getImm();
141   if (Imm != 0) {
142     O << ((OpNo == 0)? "offset:" : " offset:");
143 
144     const MCInstrDesc &Desc = MII.get(MI->getOpcode());
145     bool IsFlatSeg = !(Desc.TSFlags & SIInstrFlags::IsNonFlatSeg);
146 
147     if (IsFlatSeg) { // Unsigned offset
148       printU16ImmDecOperand(MI, OpNo, O);
149     } else {         // Signed offset
150       if (AMDGPU::isGFX10(STI)) {
151         O << formatDec(SignExtend32<12>(MI->getOperand(OpNo).getImm()));
152       } else {
153         O << formatDec(SignExtend32<13>(MI->getOperand(OpNo).getImm()));
154       }
155     }
156   }
157 }
158 
159 void AMDGPUInstPrinter::printOffset0(const MCInst *MI, unsigned OpNo,
160                                      const MCSubtargetInfo &STI,
161                                      raw_ostream &O) {
162   if (MI->getOperand(OpNo).getImm()) {
163     O << " offset0:";
164     printU8ImmDecOperand(MI, OpNo, O);
165   }
166 }
167 
168 void AMDGPUInstPrinter::printOffset1(const MCInst *MI, unsigned OpNo,
169                                      const MCSubtargetInfo &STI,
170                                      raw_ostream &O) {
171   if (MI->getOperand(OpNo).getImm()) {
172     O << " offset1:";
173     printU8ImmDecOperand(MI, OpNo, O);
174   }
175 }
176 
177 void AMDGPUInstPrinter::printSMRDOffset8(const MCInst *MI, unsigned OpNo,
178                                         const MCSubtargetInfo &STI,
179                                         raw_ostream &O) {
180   printU32ImmOperand(MI, OpNo, STI, O);
181 }
182 
183 void AMDGPUInstPrinter::printSMRDOffset20(const MCInst *MI, unsigned OpNo,
184                                         const MCSubtargetInfo &STI,
185                                         raw_ostream &O) {
186   printU32ImmOperand(MI, OpNo, STI, O);
187 }
188 
189 void AMDGPUInstPrinter::printSMRDLiteralOffset(const MCInst *MI, unsigned OpNo,
190                                                const MCSubtargetInfo &STI,
191                                                raw_ostream &O) {
192   printU32ImmOperand(MI, OpNo, STI, O);
193 }
194 
195 void AMDGPUInstPrinter::printGDS(const MCInst *MI, unsigned OpNo,
196                                  const MCSubtargetInfo &STI, raw_ostream &O) {
197   printNamedBit(MI, OpNo, O, "gds");
198 }
199 
200 void AMDGPUInstPrinter::printDLC(const MCInst *MI, unsigned OpNo,
201                                  const MCSubtargetInfo &STI, raw_ostream &O) {
202   if (AMDGPU::isGFX10(STI))
203     printNamedBit(MI, OpNo, O, "dlc");
204 }
205 
206 void AMDGPUInstPrinter::printGLC(const MCInst *MI, unsigned OpNo,
207                                  const MCSubtargetInfo &STI, raw_ostream &O) {
208   printNamedBit(MI, OpNo, O, "glc");
209 }
210 
211 void AMDGPUInstPrinter::printSLC(const MCInst *MI, unsigned OpNo,
212                                  const MCSubtargetInfo &STI, raw_ostream &O) {
213   printNamedBit(MI, OpNo, O, "slc");
214 }
215 
216 void AMDGPUInstPrinter::printSWZ(const MCInst *MI, unsigned OpNo,
217                                  const MCSubtargetInfo &STI, raw_ostream &O) {
218 }
219 
220 void AMDGPUInstPrinter::printTFE(const MCInst *MI, unsigned OpNo,
221                                  const MCSubtargetInfo &STI, raw_ostream &O) {
222   printNamedBit(MI, OpNo, O, "tfe");
223 }
224 
225 void AMDGPUInstPrinter::printDMask(const MCInst *MI, unsigned OpNo,
226                                    const MCSubtargetInfo &STI, raw_ostream &O) {
227   if (MI->getOperand(OpNo).getImm()) {
228     O << " dmask:";
229     printU16ImmOperand(MI, OpNo, STI, O);
230   }
231 }
232 
233 void AMDGPUInstPrinter::printDim(const MCInst *MI, unsigned OpNo,
234                                  const MCSubtargetInfo &STI, raw_ostream &O) {
235   unsigned Dim = MI->getOperand(OpNo).getImm();
236   O << " dim:SQ_RSRC_IMG_";
237 
238   const AMDGPU::MIMGDimInfo *DimInfo = AMDGPU::getMIMGDimInfoByEncoding(Dim);
239   if (DimInfo)
240     O << DimInfo->AsmSuffix;
241   else
242     O << Dim;
243 }
244 
245 void AMDGPUInstPrinter::printUNorm(const MCInst *MI, unsigned OpNo,
246                                    const MCSubtargetInfo &STI, raw_ostream &O) {
247   printNamedBit(MI, OpNo, O, "unorm");
248 }
249 
250 void AMDGPUInstPrinter::printDA(const MCInst *MI, unsigned OpNo,
251                                 const MCSubtargetInfo &STI, raw_ostream &O) {
252   printNamedBit(MI, OpNo, O, "da");
253 }
254 
255 void AMDGPUInstPrinter::printR128A16(const MCInst *MI, unsigned OpNo,
256                                   const MCSubtargetInfo &STI, raw_ostream &O) {
257   if (STI.hasFeature(AMDGPU::FeatureR128A16))
258     printNamedBit(MI, OpNo, O, "a16");
259   else
260     printNamedBit(MI, OpNo, O, "r128");
261 }
262 
263 void AMDGPUInstPrinter::printGFX10A16(const MCInst *MI, unsigned OpNo,
264                                   const MCSubtargetInfo &STI, raw_ostream &O) {
265   printNamedBit(MI, OpNo, O, "a16");
266 }
267 
268 void AMDGPUInstPrinter::printLWE(const MCInst *MI, unsigned OpNo,
269                                  const MCSubtargetInfo &STI, raw_ostream &O) {
270   printNamedBit(MI, OpNo, O, "lwe");
271 }
272 
273 void AMDGPUInstPrinter::printD16(const MCInst *MI, unsigned OpNo,
274                                  const MCSubtargetInfo &STI, raw_ostream &O) {
275   printNamedBit(MI, OpNo, O, "d16");
276 }
277 
278 void AMDGPUInstPrinter::printExpCompr(const MCInst *MI, unsigned OpNo,
279                                       const MCSubtargetInfo &STI,
280                                       raw_ostream &O) {
281   if (MI->getOperand(OpNo).getImm())
282     O << " compr";
283 }
284 
285 void AMDGPUInstPrinter::printExpVM(const MCInst *MI, unsigned OpNo,
286                                    const MCSubtargetInfo &STI,
287                                    raw_ostream &O) {
288   if (MI->getOperand(OpNo).getImm())
289     O << " vm";
290 }
291 
292 void AMDGPUInstPrinter::printFORMAT(const MCInst *MI, unsigned OpNo,
293                                     const MCSubtargetInfo &STI,
294                                     raw_ostream &O) {
295   if (unsigned Val = MI->getOperand(OpNo).getImm()) {
296     if (AMDGPU::isGFX10(STI))
297       O << " format:" << Val;
298     else {
299       O << " dfmt:" << (Val & 15);
300       O << ", nfmt:" << (Val >> 4);
301     }
302   }
303 }
304 
305 void AMDGPUInstPrinter::printRegOperand(unsigned RegNo, raw_ostream &O,
306                                         const MCRegisterInfo &MRI) {
307 #if !defined(NDEBUG)
308   switch (RegNo) {
309   case AMDGPU::FP_REG:
310   case AMDGPU::SP_REG:
311   case AMDGPU::PRIVATE_RSRC_REG:
312     llvm_unreachable("pseudo-register should not ever be emitted");
313   case AMDGPU::SCC:
314     llvm_unreachable("pseudo scc should not ever be emitted");
315   default:
316     break;
317   }
318 #endif
319 
320   O << getRegisterName(RegNo);
321 }
322 
323 void AMDGPUInstPrinter::printVOPDst(const MCInst *MI, unsigned OpNo,
324                                     const MCSubtargetInfo &STI, raw_ostream &O) {
325   if (OpNo == 0) {
326     if (MII.get(MI->getOpcode()).TSFlags & SIInstrFlags::VOP3)
327       O << "_e64 ";
328     else if (MII.get(MI->getOpcode()).TSFlags & SIInstrFlags::DPP)
329       O << "_dpp ";
330     else if (MII.get(MI->getOpcode()).TSFlags & SIInstrFlags::SDWA)
331       O << "_sdwa ";
332     else
333       O << "_e32 ";
334   }
335 
336   printOperand(MI, OpNo, STI, O);
337 
338   // Print default vcc/vcc_lo operand.
339   switch (MI->getOpcode()) {
340   default: break;
341 
342   case AMDGPU::V_ADD_CO_CI_U32_e32_gfx10:
343   case AMDGPU::V_SUB_CO_CI_U32_e32_gfx10:
344   case AMDGPU::V_SUBREV_CO_CI_U32_e32_gfx10:
345   case AMDGPU::V_ADD_CO_CI_U32_sdwa_gfx10:
346   case AMDGPU::V_SUB_CO_CI_U32_sdwa_gfx10:
347   case AMDGPU::V_SUBREV_CO_CI_U32_sdwa_gfx10:
348   case AMDGPU::V_ADD_CO_CI_U32_dpp_gfx10:
349   case AMDGPU::V_SUB_CO_CI_U32_dpp_gfx10:
350   case AMDGPU::V_SUBREV_CO_CI_U32_dpp_gfx10:
351   case AMDGPU::V_ADD_CO_CI_U32_dpp8_gfx10:
352   case AMDGPU::V_SUB_CO_CI_U32_dpp8_gfx10:
353   case AMDGPU::V_SUBREV_CO_CI_U32_dpp8_gfx10:
354     printDefaultVccOperand(1, STI, O);
355     break;
356   }
357 }
358 
359 void AMDGPUInstPrinter::printVINTRPDst(const MCInst *MI, unsigned OpNo,
360                                        const MCSubtargetInfo &STI, raw_ostream &O) {
361   if (AMDGPU::isSI(STI) || AMDGPU::isCI(STI))
362     O << " ";
363   else
364     O << "_e32 ";
365 
366   printOperand(MI, OpNo, STI, O);
367 }
368 
369 void AMDGPUInstPrinter::printImmediate16(uint32_t Imm,
370                                          const MCSubtargetInfo &STI,
371                                          raw_ostream &O) {
372   int16_t SImm = static_cast<int16_t>(Imm);
373   if (SImm >= -16 && SImm <= 64) {
374     O << SImm;
375     return;
376   }
377 
378   if (Imm == 0x3C00)
379     O<< "1.0";
380   else if (Imm == 0xBC00)
381     O<< "-1.0";
382   else if (Imm == 0x3800)
383     O<< "0.5";
384   else if (Imm == 0xB800)
385     O<< "-0.5";
386   else if (Imm == 0x4000)
387     O<< "2.0";
388   else if (Imm == 0xC000)
389     O<< "-2.0";
390   else if (Imm == 0x4400)
391     O<< "4.0";
392   else if (Imm == 0xC400)
393     O<< "-4.0";
394   else if (Imm == 0x3118) {
395     assert(STI.getFeatureBits()[AMDGPU::FeatureInv2PiInlineImm]);
396     O << "0.15915494";
397   } else
398     O << formatHex(static_cast<uint64_t>(Imm));
399 }
400 
401 void AMDGPUInstPrinter::printImmediateV216(uint32_t Imm,
402                                            const MCSubtargetInfo &STI,
403                                            raw_ostream &O) {
404   uint16_t Lo16 = static_cast<uint16_t>(Imm);
405   printImmediate16(Lo16, STI, O);
406 }
407 
408 void AMDGPUInstPrinter::printImmediate32(uint32_t Imm,
409                                          const MCSubtargetInfo &STI,
410                                          raw_ostream &O) {
411   int32_t SImm = static_cast<int32_t>(Imm);
412   if (SImm >= -16 && SImm <= 64) {
413     O << SImm;
414     return;
415   }
416 
417   if (Imm == FloatToBits(0.0f))
418     O << "0.0";
419   else if (Imm == FloatToBits(1.0f))
420     O << "1.0";
421   else if (Imm == FloatToBits(-1.0f))
422     O << "-1.0";
423   else if (Imm == FloatToBits(0.5f))
424     O << "0.5";
425   else if (Imm == FloatToBits(-0.5f))
426     O << "-0.5";
427   else if (Imm == FloatToBits(2.0f))
428     O << "2.0";
429   else if (Imm == FloatToBits(-2.0f))
430     O << "-2.0";
431   else if (Imm == FloatToBits(4.0f))
432     O << "4.0";
433   else if (Imm == FloatToBits(-4.0f))
434     O << "-4.0";
435   else if (Imm == 0x3e22f983 &&
436            STI.getFeatureBits()[AMDGPU::FeatureInv2PiInlineImm])
437     O << "0.15915494";
438   else
439     O << formatHex(static_cast<uint64_t>(Imm));
440 }
441 
442 void AMDGPUInstPrinter::printImmediate64(uint64_t Imm,
443                                          const MCSubtargetInfo &STI,
444                                          raw_ostream &O) {
445   int64_t SImm = static_cast<int64_t>(Imm);
446   if (SImm >= -16 && SImm <= 64) {
447     O << SImm;
448     return;
449   }
450 
451   if (Imm == DoubleToBits(0.0))
452     O << "0.0";
453   else if (Imm == DoubleToBits(1.0))
454     O << "1.0";
455   else if (Imm == DoubleToBits(-1.0))
456     O << "-1.0";
457   else if (Imm == DoubleToBits(0.5))
458     O << "0.5";
459   else if (Imm == DoubleToBits(-0.5))
460     O << "-0.5";
461   else if (Imm == DoubleToBits(2.0))
462     O << "2.0";
463   else if (Imm == DoubleToBits(-2.0))
464     O << "-2.0";
465   else if (Imm == DoubleToBits(4.0))
466     O << "4.0";
467   else if (Imm == DoubleToBits(-4.0))
468     O << "-4.0";
469   else if (Imm == 0x3fc45f306dc9c882 &&
470            STI.getFeatureBits()[AMDGPU::FeatureInv2PiInlineImm])
471     O << "0.15915494309189532";
472   else {
473     assert(isUInt<32>(Imm) || Imm == 0x3fc45f306dc9c882);
474 
475     // In rare situations, we will have a 32-bit literal in a 64-bit
476     // operand. This is technically allowed for the encoding of s_mov_b64.
477     O << formatHex(static_cast<uint64_t>(Imm));
478   }
479 }
480 
481 void AMDGPUInstPrinter::printBLGP(const MCInst *MI, unsigned OpNo,
482                                   const MCSubtargetInfo &STI,
483                                   raw_ostream &O) {
484   unsigned Imm = MI->getOperand(OpNo).getImm();
485   if (!Imm)
486     return;
487 
488   O << " blgp:" << Imm;
489 }
490 
491 void AMDGPUInstPrinter::printCBSZ(const MCInst *MI, unsigned OpNo,
492                                   const MCSubtargetInfo &STI,
493                                   raw_ostream &O) {
494   unsigned Imm = MI->getOperand(OpNo).getImm();
495   if (!Imm)
496     return;
497 
498   O << " cbsz:" << Imm;
499 }
500 
501 void AMDGPUInstPrinter::printABID(const MCInst *MI, unsigned OpNo,
502                                   const MCSubtargetInfo &STI,
503                                   raw_ostream &O) {
504   unsigned Imm = MI->getOperand(OpNo).getImm();
505   if (!Imm)
506     return;
507 
508   O << " abid:" << Imm;
509 }
510 
511 void AMDGPUInstPrinter::printDefaultVccOperand(unsigned OpNo,
512                                                const MCSubtargetInfo &STI,
513                                                raw_ostream &O) {
514   if (OpNo > 0)
515     O << ", ";
516   printRegOperand(STI.getFeatureBits()[AMDGPU::FeatureWavefrontSize64] ?
517                   AMDGPU::VCC : AMDGPU::VCC_LO, O, MRI);
518   if (OpNo == 0)
519     O << ", ";
520 }
521 
522 void AMDGPUInstPrinter::printOperand(const MCInst *MI, unsigned OpNo,
523                                      const MCSubtargetInfo &STI,
524                                      raw_ostream &O) {
525   // Print default vcc/vcc_lo operand of VOPC.
526   const MCInstrDesc &Desc = MII.get(MI->getOpcode());
527   if (OpNo == 0 && (Desc.TSFlags & SIInstrFlags::VOPC) &&
528       (Desc.hasImplicitDefOfPhysReg(AMDGPU::VCC) ||
529        Desc.hasImplicitDefOfPhysReg(AMDGPU::VCC_LO)))
530     printDefaultVccOperand(OpNo, STI, O);
531 
532   if (OpNo >= MI->getNumOperands()) {
533     O << "/*Missing OP" << OpNo << "*/";
534     return;
535   }
536 
537   const MCOperand &Op = MI->getOperand(OpNo);
538   if (Op.isReg()) {
539     printRegOperand(Op.getReg(), O, MRI);
540   } else if (Op.isImm()) {
541     switch (Desc.OpInfo[OpNo].OperandType) {
542     case AMDGPU::OPERAND_REG_IMM_INT32:
543     case AMDGPU::OPERAND_REG_IMM_FP32:
544     case AMDGPU::OPERAND_REG_INLINE_C_INT32:
545     case AMDGPU::OPERAND_REG_INLINE_C_FP32:
546     case AMDGPU::OPERAND_REG_INLINE_AC_INT32:
547     case AMDGPU::OPERAND_REG_INLINE_AC_FP32:
548     case MCOI::OPERAND_IMMEDIATE:
549       printImmediate32(Op.getImm(), STI, O);
550       break;
551     case AMDGPU::OPERAND_REG_IMM_INT64:
552     case AMDGPU::OPERAND_REG_IMM_FP64:
553     case AMDGPU::OPERAND_REG_INLINE_C_INT64:
554     case AMDGPU::OPERAND_REG_INLINE_C_FP64:
555       printImmediate64(Op.getImm(), STI, O);
556       break;
557     case AMDGPU::OPERAND_REG_INLINE_C_INT16:
558     case AMDGPU::OPERAND_REG_INLINE_C_FP16:
559     case AMDGPU::OPERAND_REG_INLINE_AC_INT16:
560     case AMDGPU::OPERAND_REG_INLINE_AC_FP16:
561     case AMDGPU::OPERAND_REG_IMM_INT16:
562     case AMDGPU::OPERAND_REG_IMM_FP16:
563       printImmediate16(Op.getImm(), STI, O);
564       break;
565     case AMDGPU::OPERAND_REG_IMM_V2INT16:
566     case AMDGPU::OPERAND_REG_IMM_V2FP16:
567       if (!isUInt<16>(Op.getImm()) &&
568           STI.getFeatureBits()[AMDGPU::FeatureVOP3Literal]) {
569         printImmediate32(Op.getImm(), STI, O);
570         break;
571       }
572       LLVM_FALLTHROUGH;
573     case AMDGPU::OPERAND_REG_INLINE_C_V2FP16:
574     case AMDGPU::OPERAND_REG_INLINE_C_V2INT16:
575     case AMDGPU::OPERAND_REG_INLINE_AC_V2FP16:
576     case AMDGPU::OPERAND_REG_INLINE_AC_V2INT16:
577       printImmediateV216(Op.getImm(), STI, O);
578       break;
579     case MCOI::OPERAND_UNKNOWN:
580     case MCOI::OPERAND_PCREL:
581       O << formatDec(Op.getImm());
582       break;
583     case MCOI::OPERAND_REGISTER:
584       // FIXME: This should be removed and handled somewhere else. Seems to come
585       // from a disassembler bug.
586       O << "/*invalid immediate*/";
587       break;
588     default:
589       // We hit this for the immediate instruction bits that don't yet have a
590       // custom printer.
591       llvm_unreachable("unexpected immediate operand type");
592     }
593   } else if (Op.isFPImm()) {
594     // We special case 0.0 because otherwise it will be printed as an integer.
595     if (Op.getFPImm() == 0.0)
596       O << "0.0";
597     else {
598       const MCInstrDesc &Desc = MII.get(MI->getOpcode());
599       int RCID = Desc.OpInfo[OpNo].RegClass;
600       unsigned RCBits = AMDGPU::getRegBitWidth(MRI.getRegClass(RCID));
601       if (RCBits == 32)
602         printImmediate32(FloatToBits(Op.getFPImm()), STI, O);
603       else if (RCBits == 64)
604         printImmediate64(DoubleToBits(Op.getFPImm()), STI, O);
605       else
606         llvm_unreachable("Invalid register class size");
607     }
608   } else if (Op.isExpr()) {
609     const MCExpr *Exp = Op.getExpr();
610     Exp->print(O, &MAI);
611   } else {
612     O << "/*INV_OP*/";
613   }
614 
615   // Print default vcc/vcc_lo operand of v_cndmask_b32_e32.
616   switch (MI->getOpcode()) {
617   default: break;
618 
619   case AMDGPU::V_CNDMASK_B32_e32_gfx10:
620   case AMDGPU::V_ADD_CO_CI_U32_e32_gfx10:
621   case AMDGPU::V_SUB_CO_CI_U32_e32_gfx10:
622   case AMDGPU::V_SUBREV_CO_CI_U32_e32_gfx10:
623   case AMDGPU::V_CNDMASK_B32_dpp_gfx10:
624   case AMDGPU::V_ADD_CO_CI_U32_dpp_gfx10:
625   case AMDGPU::V_SUB_CO_CI_U32_dpp_gfx10:
626   case AMDGPU::V_SUBREV_CO_CI_U32_dpp_gfx10:
627   case AMDGPU::V_CNDMASK_B32_dpp8_gfx10:
628   case AMDGPU::V_ADD_CO_CI_U32_dpp8_gfx10:
629   case AMDGPU::V_SUB_CO_CI_U32_dpp8_gfx10:
630   case AMDGPU::V_SUBREV_CO_CI_U32_dpp8_gfx10:
631 
632   case AMDGPU::V_CNDMASK_B32_e32_gfx6_gfx7:
633   case AMDGPU::V_CNDMASK_B32_e32_vi:
634     if ((int)OpNo == AMDGPU::getNamedOperandIdx(MI->getOpcode(),
635                                                 AMDGPU::OpName::src1))
636       printDefaultVccOperand(OpNo, STI, O);
637     break;
638   }
639 }
640 
641 void AMDGPUInstPrinter::printOperandAndFPInputMods(const MCInst *MI,
642                                                    unsigned OpNo,
643                                                    const MCSubtargetInfo &STI,
644                                                    raw_ostream &O) {
645   unsigned InputModifiers = MI->getOperand(OpNo).getImm();
646 
647   // Use 'neg(...)' instead of '-' to avoid ambiguity.
648   // This is important for integer literals because
649   // -1 is not the same value as neg(1).
650   bool NegMnemo = false;
651 
652   if (InputModifiers & SISrcMods::NEG) {
653     if (OpNo + 1 < MI->getNumOperands() &&
654         (InputModifiers & SISrcMods::ABS) == 0) {
655       const MCOperand &Op = MI->getOperand(OpNo + 1);
656       NegMnemo = Op.isImm() || Op.isFPImm();
657     }
658     if (NegMnemo) {
659       O << "neg(";
660     } else {
661       O << '-';
662     }
663   }
664 
665   if (InputModifiers & SISrcMods::ABS)
666     O << '|';
667   printOperand(MI, OpNo + 1, STI, O);
668   if (InputModifiers & SISrcMods::ABS)
669     O << '|';
670 
671   if (NegMnemo) {
672     O << ')';
673   }
674 }
675 
676 void AMDGPUInstPrinter::printOperandAndIntInputMods(const MCInst *MI,
677                                                     unsigned OpNo,
678                                                     const MCSubtargetInfo &STI,
679                                                     raw_ostream &O) {
680   unsigned InputModifiers = MI->getOperand(OpNo).getImm();
681   if (InputModifiers & SISrcMods::SEXT)
682     O << "sext(";
683   printOperand(MI, OpNo + 1, STI, O);
684   if (InputModifiers & SISrcMods::SEXT)
685     O << ')';
686 
687   // Print default vcc/vcc_lo operand of VOP2b.
688   switch (MI->getOpcode()) {
689   default: break;
690 
691   case AMDGPU::V_CNDMASK_B32_sdwa_gfx10:
692   case AMDGPU::V_ADD_CO_CI_U32_sdwa_gfx10:
693   case AMDGPU::V_SUB_CO_CI_U32_sdwa_gfx10:
694   case AMDGPU::V_SUBREV_CO_CI_U32_sdwa_gfx10:
695     if ((int)OpNo + 1 == AMDGPU::getNamedOperandIdx(MI->getOpcode(),
696                                                     AMDGPU::OpName::src1))
697       printDefaultVccOperand(OpNo, STI, O);
698     break;
699   }
700 }
701 
702 void AMDGPUInstPrinter::printDPP8(const MCInst *MI, unsigned OpNo,
703                                   const MCSubtargetInfo &STI,
704                                   raw_ostream &O) {
705   if (!AMDGPU::isGFX10(STI))
706     llvm_unreachable("dpp8 is not supported on ASICs earlier than GFX10");
707 
708   unsigned Imm = MI->getOperand(OpNo).getImm();
709   O << " dpp8:[" << formatDec(Imm & 0x7);
710   for (size_t i = 1; i < 8; ++i) {
711     O << ',' << formatDec((Imm >> (3 * i)) & 0x7);
712   }
713   O << ']';
714 }
715 
716 void AMDGPUInstPrinter::printDPPCtrl(const MCInst *MI, unsigned OpNo,
717                                      const MCSubtargetInfo &STI,
718                                      raw_ostream &O) {
719   using namespace AMDGPU::DPP;
720 
721   unsigned Imm = MI->getOperand(OpNo).getImm();
722   if (Imm <= DppCtrl::QUAD_PERM_LAST) {
723     O << " quad_perm:[";
724     O << formatDec(Imm & 0x3)         << ',';
725     O << formatDec((Imm & 0xc)  >> 2) << ',';
726     O << formatDec((Imm & 0x30) >> 4) << ',';
727     O << formatDec((Imm & 0xc0) >> 6) << ']';
728   } else if ((Imm >= DppCtrl::ROW_SHL_FIRST) &&
729              (Imm <= DppCtrl::ROW_SHL_LAST)) {
730     O << " row_shl:";
731     printU4ImmDecOperand(MI, OpNo, O);
732   } else if ((Imm >= DppCtrl::ROW_SHR_FIRST) &&
733              (Imm <= DppCtrl::ROW_SHR_LAST)) {
734     O << " row_shr:";
735     printU4ImmDecOperand(MI, OpNo, O);
736   } else if ((Imm >= DppCtrl::ROW_ROR_FIRST) &&
737              (Imm <= DppCtrl::ROW_ROR_LAST)) {
738     O << " row_ror:";
739     printU4ImmDecOperand(MI, OpNo, O);
740   } else if (Imm == DppCtrl::WAVE_SHL1) {
741     if (!AMDGPU::isVI(STI) && !AMDGPU::isGFX9(STI)) {
742       O << " /* wave_shl is not supported starting from GFX10 */";
743       return;
744     }
745     O << " wave_shl:1";
746   } else if (Imm == DppCtrl::WAVE_ROL1) {
747     if (!AMDGPU::isVI(STI) && !AMDGPU::isGFX9(STI)) {
748       O << " /* wave_rol is not supported starting from GFX10 */";
749       return;
750     }
751     O << " wave_rol:1";
752   } else if (Imm == DppCtrl::WAVE_SHR1) {
753     if (!AMDGPU::isVI(STI) && !AMDGPU::isGFX9(STI)) {
754       O << " /* wave_shr is not supported starting from GFX10 */";
755       return;
756     }
757     O << " wave_shr:1";
758   } else if (Imm == DppCtrl::WAVE_ROR1) {
759     if (!AMDGPU::isVI(STI) && !AMDGPU::isGFX9(STI)) {
760       O << " /* wave_ror is not supported starting from GFX10 */";
761       return;
762     }
763     O << " wave_ror:1";
764   } else if (Imm == DppCtrl::ROW_MIRROR) {
765     O << " row_mirror";
766   } else if (Imm == DppCtrl::ROW_HALF_MIRROR) {
767     O << " row_half_mirror";
768   } else if (Imm == DppCtrl::BCAST15) {
769     if (!AMDGPU::isVI(STI) && !AMDGPU::isGFX9(STI)) {
770       O << " /* row_bcast is not supported starting from GFX10 */";
771       return;
772     }
773     O << " row_bcast:15";
774   } else if (Imm == DppCtrl::BCAST31) {
775     if (!AMDGPU::isVI(STI) && !AMDGPU::isGFX9(STI)) {
776       O << " /* row_bcast is not supported starting from GFX10 */";
777       return;
778     }
779     O << " row_bcast:31";
780   } else if ((Imm >= DppCtrl::ROW_SHARE_FIRST) &&
781              (Imm <= DppCtrl::ROW_SHARE_LAST)) {
782     if (!AMDGPU::isGFX10(STI)) {
783       O << " /* row_share is not supported on ASICs earlier than GFX10 */";
784       return;
785     }
786     O << " row_share:";
787     printU4ImmDecOperand(MI, OpNo, O);
788   } else if ((Imm >= DppCtrl::ROW_XMASK_FIRST) &&
789              (Imm <= DppCtrl::ROW_XMASK_LAST)) {
790     if (!AMDGPU::isGFX10(STI)) {
791       O << " /* row_xmask is not supported on ASICs earlier than GFX10 */";
792       return;
793     }
794     O << "row_xmask:";
795     printU4ImmDecOperand(MI, OpNo, O);
796   } else {
797     O << " /* Invalid dpp_ctrl value */";
798   }
799 }
800 
801 void AMDGPUInstPrinter::printRowMask(const MCInst *MI, unsigned OpNo,
802                                      const MCSubtargetInfo &STI,
803                                      raw_ostream &O) {
804   O << " row_mask:";
805   printU4ImmOperand(MI, OpNo, STI, O);
806 }
807 
808 void AMDGPUInstPrinter::printBankMask(const MCInst *MI, unsigned OpNo,
809                                       const MCSubtargetInfo &STI,
810                                       raw_ostream &O) {
811   O << " bank_mask:";
812   printU4ImmOperand(MI, OpNo, STI, O);
813 }
814 
815 void AMDGPUInstPrinter::printBoundCtrl(const MCInst *MI, unsigned OpNo,
816                                        const MCSubtargetInfo &STI,
817                                        raw_ostream &O) {
818   unsigned Imm = MI->getOperand(OpNo).getImm();
819   if (Imm) {
820     O << " bound_ctrl:0"; // XXX - this syntax is used in sp3
821   }
822 }
823 
824 void AMDGPUInstPrinter::printFI(const MCInst *MI, unsigned OpNo,
825                                 const MCSubtargetInfo &STI,
826                                 raw_ostream &O) {
827   using namespace llvm::AMDGPU::DPP;
828   unsigned Imm = MI->getOperand(OpNo).getImm();
829   if (Imm == DPP_FI_1 || Imm == DPP8_FI_1) {
830     O << " fi:1";
831   }
832 }
833 
834 void AMDGPUInstPrinter::printSDWASel(const MCInst *MI, unsigned OpNo,
835                                      raw_ostream &O) {
836   using namespace llvm::AMDGPU::SDWA;
837 
838   unsigned Imm = MI->getOperand(OpNo).getImm();
839   switch (Imm) {
840   case SdwaSel::BYTE_0: O << "BYTE_0"; break;
841   case SdwaSel::BYTE_1: O << "BYTE_1"; break;
842   case SdwaSel::BYTE_2: O << "BYTE_2"; break;
843   case SdwaSel::BYTE_3: O << "BYTE_3"; break;
844   case SdwaSel::WORD_0: O << "WORD_0"; break;
845   case SdwaSel::WORD_1: O << "WORD_1"; break;
846   case SdwaSel::DWORD: O << "DWORD"; break;
847   default: llvm_unreachable("Invalid SDWA data select operand");
848   }
849 }
850 
851 void AMDGPUInstPrinter::printSDWADstSel(const MCInst *MI, unsigned OpNo,
852                                         const MCSubtargetInfo &STI,
853                                         raw_ostream &O) {
854   O << "dst_sel:";
855   printSDWASel(MI, OpNo, O);
856 }
857 
858 void AMDGPUInstPrinter::printSDWASrc0Sel(const MCInst *MI, unsigned OpNo,
859                                          const MCSubtargetInfo &STI,
860                                          raw_ostream &O) {
861   O << "src0_sel:";
862   printSDWASel(MI, OpNo, O);
863 }
864 
865 void AMDGPUInstPrinter::printSDWASrc1Sel(const MCInst *MI, unsigned OpNo,
866                                          const MCSubtargetInfo &STI,
867                                          raw_ostream &O) {
868   O << "src1_sel:";
869   printSDWASel(MI, OpNo, O);
870 }
871 
872 void AMDGPUInstPrinter::printSDWADstUnused(const MCInst *MI, unsigned OpNo,
873                                            const MCSubtargetInfo &STI,
874                                            raw_ostream &O) {
875   using namespace llvm::AMDGPU::SDWA;
876 
877   O << "dst_unused:";
878   unsigned Imm = MI->getOperand(OpNo).getImm();
879   switch (Imm) {
880   case DstUnused::UNUSED_PAD: O << "UNUSED_PAD"; break;
881   case DstUnused::UNUSED_SEXT: O << "UNUSED_SEXT"; break;
882   case DstUnused::UNUSED_PRESERVE: O << "UNUSED_PRESERVE"; break;
883   default: llvm_unreachable("Invalid SDWA dest_unused operand");
884   }
885 }
886 
887 template <unsigned N>
888 void AMDGPUInstPrinter::printExpSrcN(const MCInst *MI, unsigned OpNo,
889                                      const MCSubtargetInfo &STI,
890                                      raw_ostream &O) {
891   unsigned Opc = MI->getOpcode();
892   int EnIdx = AMDGPU::getNamedOperandIdx(Opc, AMDGPU::OpName::en);
893   unsigned En = MI->getOperand(EnIdx).getImm();
894 
895   int ComprIdx = AMDGPU::getNamedOperandIdx(Opc, AMDGPU::OpName::compr);
896 
897   // If compr is set, print as src0, src0, src1, src1
898   if (MI->getOperand(ComprIdx).getImm()) {
899     if (N == 1 || N == 2)
900       --OpNo;
901     else if (N == 3)
902       OpNo -= 2;
903   }
904 
905   if (En & (1 << N))
906     printRegOperand(MI->getOperand(OpNo).getReg(), O, MRI);
907   else
908     O << "off";
909 }
910 
911 void AMDGPUInstPrinter::printExpSrc0(const MCInst *MI, unsigned OpNo,
912                                      const MCSubtargetInfo &STI,
913                                      raw_ostream &O) {
914   printExpSrcN<0>(MI, OpNo, STI, O);
915 }
916 
917 void AMDGPUInstPrinter::printExpSrc1(const MCInst *MI, unsigned OpNo,
918                                      const MCSubtargetInfo &STI,
919                                      raw_ostream &O) {
920   printExpSrcN<1>(MI, OpNo, STI, O);
921 }
922 
923 void AMDGPUInstPrinter::printExpSrc2(const MCInst *MI, unsigned OpNo,
924                                      const MCSubtargetInfo &STI,
925                                      raw_ostream &O) {
926   printExpSrcN<2>(MI, OpNo, STI, O);
927 }
928 
929 void AMDGPUInstPrinter::printExpSrc3(const MCInst *MI, unsigned OpNo,
930                                      const MCSubtargetInfo &STI,
931                                      raw_ostream &O) {
932   printExpSrcN<3>(MI, OpNo, STI, O);
933 }
934 
935 void AMDGPUInstPrinter::printExpTgt(const MCInst *MI, unsigned OpNo,
936                                     const MCSubtargetInfo &STI,
937                                     raw_ostream &O) {
938   // This is really a 6 bit field.
939   uint32_t Tgt = MI->getOperand(OpNo).getImm() & ((1 << 6) - 1);
940 
941   if (Tgt <= 7)
942     O << " mrt" << Tgt;
943   else if (Tgt == 8)
944     O << " mrtz";
945   else if (Tgt == 9)
946     O << " null";
947   else if ((Tgt >= 12 && Tgt <= 15) || (Tgt == 16 && AMDGPU::isGFX10(STI)))
948     O << " pos" << Tgt - 12;
949   else if (AMDGPU::isGFX10(STI) && Tgt == 20)
950     O << " prim";
951   else if (Tgt >= 32 && Tgt <= 63)
952     O << " param" << Tgt - 32;
953   else {
954     // Reserved values 10, 11
955     O << " invalid_target_" << Tgt;
956   }
957 }
958 
959 static bool allOpsDefaultValue(const int* Ops, int NumOps, int Mod,
960                                bool IsPacked, bool HasDstSel) {
961   int DefaultValue = IsPacked && (Mod == SISrcMods::OP_SEL_1);
962 
963   for (int I = 0; I < NumOps; ++I) {
964     if (!!(Ops[I] & Mod) != DefaultValue)
965       return false;
966   }
967 
968   if (HasDstSel && (Ops[0] & SISrcMods::DST_OP_SEL) != 0)
969     return false;
970 
971   return true;
972 }
973 
974 void AMDGPUInstPrinter::printPackedModifier(const MCInst *MI,
975                                             StringRef Name,
976                                             unsigned Mod,
977                                             raw_ostream &O) {
978   unsigned Opc = MI->getOpcode();
979   int NumOps = 0;
980   int Ops[3];
981 
982   for (int OpName : { AMDGPU::OpName::src0_modifiers,
983                       AMDGPU::OpName::src1_modifiers,
984                       AMDGPU::OpName::src2_modifiers }) {
985     int Idx = AMDGPU::getNamedOperandIdx(Opc, OpName);
986     if (Idx == -1)
987       break;
988 
989     Ops[NumOps++] = MI->getOperand(Idx).getImm();
990   }
991 
992   const bool HasDstSel =
993     NumOps > 0 &&
994     Mod == SISrcMods::OP_SEL_0 &&
995     MII.get(MI->getOpcode()).TSFlags & SIInstrFlags::VOP3_OPSEL;
996 
997   const bool IsPacked =
998     MII.get(MI->getOpcode()).TSFlags & SIInstrFlags::IsPacked;
999 
1000   if (allOpsDefaultValue(Ops, NumOps, Mod, IsPacked, HasDstSel))
1001     return;
1002 
1003   O << Name;
1004   for (int I = 0; I < NumOps; ++I) {
1005     if (I != 0)
1006       O << ',';
1007 
1008     O << !!(Ops[I] & Mod);
1009   }
1010 
1011   if (HasDstSel) {
1012     O << ',' << !!(Ops[0] & SISrcMods::DST_OP_SEL);
1013   }
1014 
1015   O << ']';
1016 }
1017 
1018 void AMDGPUInstPrinter::printOpSel(const MCInst *MI, unsigned,
1019                                    const MCSubtargetInfo &STI,
1020                                    raw_ostream &O) {
1021   unsigned Opc = MI->getOpcode();
1022   if (Opc == AMDGPU::V_PERMLANE16_B32_gfx10 ||
1023       Opc == AMDGPU::V_PERMLANEX16_B32_gfx10) {
1024     auto FIN = AMDGPU::getNamedOperandIdx(Opc, AMDGPU::OpName::src0_modifiers);
1025     auto BCN = AMDGPU::getNamedOperandIdx(Opc, AMDGPU::OpName::src1_modifiers);
1026     unsigned FI = !!(MI->getOperand(FIN).getImm() & SISrcMods::OP_SEL_0);
1027     unsigned BC = !!(MI->getOperand(BCN).getImm() & SISrcMods::OP_SEL_0);
1028     if (FI || BC)
1029       O << " op_sel:[" << FI << ',' << BC << ']';
1030     return;
1031   }
1032 
1033   printPackedModifier(MI, " op_sel:[", SISrcMods::OP_SEL_0, O);
1034 }
1035 
1036 void AMDGPUInstPrinter::printOpSelHi(const MCInst *MI, unsigned OpNo,
1037                                      const MCSubtargetInfo &STI,
1038                                      raw_ostream &O) {
1039   printPackedModifier(MI, " op_sel_hi:[", SISrcMods::OP_SEL_1, O);
1040 }
1041 
1042 void AMDGPUInstPrinter::printNegLo(const MCInst *MI, unsigned OpNo,
1043                                    const MCSubtargetInfo &STI,
1044                                    raw_ostream &O) {
1045   printPackedModifier(MI, " neg_lo:[", SISrcMods::NEG, O);
1046 }
1047 
1048 void AMDGPUInstPrinter::printNegHi(const MCInst *MI, unsigned OpNo,
1049                                    const MCSubtargetInfo &STI,
1050                                    raw_ostream &O) {
1051   printPackedModifier(MI, " neg_hi:[", SISrcMods::NEG_HI, O);
1052 }
1053 
1054 void AMDGPUInstPrinter::printInterpSlot(const MCInst *MI, unsigned OpNum,
1055                                         const MCSubtargetInfo &STI,
1056                                         raw_ostream &O) {
1057   unsigned Imm = MI->getOperand(OpNum).getImm();
1058   switch (Imm) {
1059   case 0:
1060     O << "p10";
1061     break;
1062   case 1:
1063     O << "p20";
1064     break;
1065   case 2:
1066     O << "p0";
1067     break;
1068   default:
1069     O << "invalid_param_" << Imm;
1070   }
1071 }
1072 
1073 void AMDGPUInstPrinter::printInterpAttr(const MCInst *MI, unsigned OpNum,
1074                                         const MCSubtargetInfo &STI,
1075                                         raw_ostream &O) {
1076   unsigned Attr = MI->getOperand(OpNum).getImm();
1077   O << "attr" << Attr;
1078 }
1079 
1080 void AMDGPUInstPrinter::printInterpAttrChan(const MCInst *MI, unsigned OpNum,
1081                                         const MCSubtargetInfo &STI,
1082                                         raw_ostream &O) {
1083   unsigned Chan = MI->getOperand(OpNum).getImm();
1084   O << '.' << "xyzw"[Chan & 0x3];
1085 }
1086 
1087 void AMDGPUInstPrinter::printVGPRIndexMode(const MCInst *MI, unsigned OpNo,
1088                                            const MCSubtargetInfo &STI,
1089                                            raw_ostream &O) {
1090   using namespace llvm::AMDGPU::VGPRIndexMode;
1091   unsigned Val = MI->getOperand(OpNo).getImm();
1092 
1093   if ((Val & ~ENABLE_MASK) != 0) {
1094     O << " " << formatHex(static_cast<uint64_t>(Val));
1095   } else {
1096     O << " gpr_idx(";
1097     bool NeedComma = false;
1098     for (unsigned ModeId = ID_MIN; ModeId <= ID_MAX; ++ModeId) {
1099       if (Val & (1 << ModeId)) {
1100         if (NeedComma)
1101           O << ',';
1102         O << IdSymbolic[ModeId];
1103         NeedComma = true;
1104       }
1105     }
1106     O << ')';
1107   }
1108 }
1109 
1110 void AMDGPUInstPrinter::printMemOperand(const MCInst *MI, unsigned OpNo,
1111                                         const MCSubtargetInfo &STI,
1112                                         raw_ostream &O) {
1113   printOperand(MI, OpNo, STI, O);
1114   O  << ", ";
1115   printOperand(MI, OpNo + 1, STI, O);
1116 }
1117 
1118 void AMDGPUInstPrinter::printIfSet(const MCInst *MI, unsigned OpNo,
1119                                    raw_ostream &O, StringRef Asm,
1120                                    StringRef Default) {
1121   const MCOperand &Op = MI->getOperand(OpNo);
1122   assert(Op.isImm());
1123   if (Op.getImm() == 1) {
1124     O << Asm;
1125   } else {
1126     O << Default;
1127   }
1128 }
1129 
1130 void AMDGPUInstPrinter::printIfSet(const MCInst *MI, unsigned OpNo,
1131                                    raw_ostream &O, char Asm) {
1132   const MCOperand &Op = MI->getOperand(OpNo);
1133   assert(Op.isImm());
1134   if (Op.getImm() == 1)
1135     O << Asm;
1136 }
1137 
1138 void AMDGPUInstPrinter::printHigh(const MCInst *MI, unsigned OpNo,
1139                                   const MCSubtargetInfo &STI,
1140                                   raw_ostream &O) {
1141   if (MI->getOperand(OpNo).getImm())
1142     O << " high";
1143 }
1144 
1145 void AMDGPUInstPrinter::printClampSI(const MCInst *MI, unsigned OpNo,
1146                                      const MCSubtargetInfo &STI,
1147                                      raw_ostream &O) {
1148   if (MI->getOperand(OpNo).getImm())
1149     O << " clamp";
1150 }
1151 
1152 void AMDGPUInstPrinter::printOModSI(const MCInst *MI, unsigned OpNo,
1153                                     const MCSubtargetInfo &STI,
1154                                     raw_ostream &O) {
1155   int Imm = MI->getOperand(OpNo).getImm();
1156   if (Imm == SIOutMods::MUL2)
1157     O << " mul:2";
1158   else if (Imm == SIOutMods::MUL4)
1159     O << " mul:4";
1160   else if (Imm == SIOutMods::DIV2)
1161     O << " div:2";
1162 }
1163 
1164 void AMDGPUInstPrinter::printSendMsg(const MCInst *MI, unsigned OpNo,
1165                                      const MCSubtargetInfo &STI,
1166                                      raw_ostream &O) {
1167   using namespace llvm::AMDGPU::SendMsg;
1168 
1169   const unsigned Imm16 = MI->getOperand(OpNo).getImm();
1170 
1171   uint16_t MsgId;
1172   uint16_t OpId;
1173   uint16_t StreamId;
1174   decodeMsg(Imm16, MsgId, OpId, StreamId);
1175 
1176   if (isValidMsgId(MsgId, STI) &&
1177       isValidMsgOp(MsgId, OpId) &&
1178       isValidMsgStream(MsgId, OpId, StreamId)) {
1179     O << "sendmsg(" << getMsgName(MsgId);
1180     if (msgRequiresOp(MsgId)) {
1181       O << ", " << getMsgOpName(MsgId, OpId);
1182       if (msgSupportsStream(MsgId, OpId)) {
1183         O << ", " << StreamId;
1184       }
1185     }
1186     O << ')';
1187   } else if (encodeMsg(MsgId, OpId, StreamId) == Imm16) {
1188     O << "sendmsg(" << MsgId << ", " << OpId << ", " << StreamId << ')';
1189   } else {
1190     O << Imm16; // Unknown imm16 code.
1191   }
1192 }
1193 
1194 static void printSwizzleBitmask(const uint16_t AndMask,
1195                                 const uint16_t OrMask,
1196                                 const uint16_t XorMask,
1197                                 raw_ostream &O) {
1198   using namespace llvm::AMDGPU::Swizzle;
1199 
1200   uint16_t Probe0 = ((0            & AndMask) | OrMask) ^ XorMask;
1201   uint16_t Probe1 = ((BITMASK_MASK & AndMask) | OrMask) ^ XorMask;
1202 
1203   O << "\"";
1204 
1205   for (unsigned Mask = 1 << (BITMASK_WIDTH - 1); Mask > 0; Mask >>= 1) {
1206     uint16_t p0 = Probe0 & Mask;
1207     uint16_t p1 = Probe1 & Mask;
1208 
1209     if (p0 == p1) {
1210       if (p0 == 0) {
1211         O << "0";
1212       } else {
1213         O << "1";
1214       }
1215     } else {
1216       if (p0 == 0) {
1217         O << "p";
1218       } else {
1219         O << "i";
1220       }
1221     }
1222   }
1223 
1224   O << "\"";
1225 }
1226 
1227 void AMDGPUInstPrinter::printSwizzle(const MCInst *MI, unsigned OpNo,
1228                                      const MCSubtargetInfo &STI,
1229                                      raw_ostream &O) {
1230   using namespace llvm::AMDGPU::Swizzle;
1231 
1232   uint16_t Imm = MI->getOperand(OpNo).getImm();
1233   if (Imm == 0) {
1234     return;
1235   }
1236 
1237   O << " offset:";
1238 
1239   if ((Imm & QUAD_PERM_ENC_MASK) == QUAD_PERM_ENC) {
1240 
1241     O << "swizzle(" << IdSymbolic[ID_QUAD_PERM];
1242     for (unsigned I = 0; I < LANE_NUM; ++I) {
1243       O << ",";
1244       O << formatDec(Imm & LANE_MASK);
1245       Imm >>= LANE_SHIFT;
1246     }
1247     O << ")";
1248 
1249   } else if ((Imm & BITMASK_PERM_ENC_MASK) == BITMASK_PERM_ENC) {
1250 
1251     uint16_t AndMask = (Imm >> BITMASK_AND_SHIFT) & BITMASK_MASK;
1252     uint16_t OrMask  = (Imm >> BITMASK_OR_SHIFT)  & BITMASK_MASK;
1253     uint16_t XorMask = (Imm >> BITMASK_XOR_SHIFT) & BITMASK_MASK;
1254 
1255     if (AndMask == BITMASK_MAX &&
1256         OrMask == 0 &&
1257         countPopulation(XorMask) == 1) {
1258 
1259       O << "swizzle(" << IdSymbolic[ID_SWAP];
1260       O << ",";
1261       O << formatDec(XorMask);
1262       O << ")";
1263 
1264     } else if (AndMask == BITMASK_MAX &&
1265                OrMask == 0 && XorMask > 0 &&
1266                isPowerOf2_64(XorMask + 1)) {
1267 
1268       O << "swizzle(" << IdSymbolic[ID_REVERSE];
1269       O << ",";
1270       O << formatDec(XorMask + 1);
1271       O << ")";
1272 
1273     } else {
1274 
1275       uint16_t GroupSize = BITMASK_MAX - AndMask + 1;
1276       if (GroupSize > 1 &&
1277           isPowerOf2_64(GroupSize) &&
1278           OrMask < GroupSize &&
1279           XorMask == 0) {
1280 
1281         O << "swizzle(" << IdSymbolic[ID_BROADCAST];
1282         O << ",";
1283         O << formatDec(GroupSize);
1284         O << ",";
1285         O << formatDec(OrMask);
1286         O << ")";
1287 
1288       } else {
1289         O << "swizzle(" << IdSymbolic[ID_BITMASK_PERM];
1290         O << ",";
1291         printSwizzleBitmask(AndMask, OrMask, XorMask, O);
1292         O << ")";
1293       }
1294     }
1295   } else {
1296     printU16ImmDecOperand(MI, OpNo, O);
1297   }
1298 }
1299 
1300 void AMDGPUInstPrinter::printWaitFlag(const MCInst *MI, unsigned OpNo,
1301                                       const MCSubtargetInfo &STI,
1302                                       raw_ostream &O) {
1303   AMDGPU::IsaVersion ISA = AMDGPU::getIsaVersion(STI.getCPU());
1304 
1305   unsigned SImm16 = MI->getOperand(OpNo).getImm();
1306   unsigned Vmcnt, Expcnt, Lgkmcnt;
1307   decodeWaitcnt(ISA, SImm16, Vmcnt, Expcnt, Lgkmcnt);
1308 
1309   bool NeedSpace = false;
1310 
1311   if (Vmcnt != getVmcntBitMask(ISA)) {
1312     O << "vmcnt(" << Vmcnt << ')';
1313     NeedSpace = true;
1314   }
1315 
1316   if (Expcnt != getExpcntBitMask(ISA)) {
1317     if (NeedSpace)
1318       O << ' ';
1319     O << "expcnt(" << Expcnt << ')';
1320     NeedSpace = true;
1321   }
1322 
1323   if (Lgkmcnt != getLgkmcntBitMask(ISA)) {
1324     if (NeedSpace)
1325       O << ' ';
1326     O << "lgkmcnt(" << Lgkmcnt << ')';
1327   }
1328 }
1329 
1330 void AMDGPUInstPrinter::printHwreg(const MCInst *MI, unsigned OpNo,
1331                                    const MCSubtargetInfo &STI, raw_ostream &O) {
1332   unsigned Id;
1333   unsigned Offset;
1334   unsigned Width;
1335 
1336   using namespace llvm::AMDGPU::Hwreg;
1337   unsigned Val = MI->getOperand(OpNo).getImm();
1338   decodeHwreg(Val, Id, Offset, Width);
1339   StringRef HwRegName = getHwreg(Id, STI);
1340 
1341   O << "hwreg(";
1342   if (!HwRegName.empty()) {
1343     O << HwRegName;
1344   } else {
1345     O << Id;
1346   }
1347   if (Width != WIDTH_DEFAULT_ || Offset != OFFSET_DEFAULT_) {
1348     O << ", " << Offset << ", " << Width;
1349   }
1350   O << ')';
1351 }
1352 
1353 void AMDGPUInstPrinter::printEndpgm(const MCInst *MI, unsigned OpNo,
1354                                     const MCSubtargetInfo &STI,
1355                                     raw_ostream &O) {
1356   uint16_t Imm = MI->getOperand(OpNo).getImm();
1357   if (Imm == 0) {
1358     return;
1359   }
1360 
1361   O << ' ' << formatDec(Imm);
1362 }
1363 
1364 #include "AMDGPUGenAsmWriter.inc"
1365 
1366 void R600InstPrinter::printInst(const MCInst *MI, uint64_t Address,
1367                                 StringRef Annot, const MCSubtargetInfo &STI,
1368                                 raw_ostream &O) {
1369   O.flush();
1370   printInstruction(MI, Address, O);
1371   printAnnotation(O, Annot);
1372 }
1373 
1374 void R600InstPrinter::printAbs(const MCInst *MI, unsigned OpNo,
1375                                raw_ostream &O) {
1376   AMDGPUInstPrinter::printIfSet(MI, OpNo, O, '|');
1377 }
1378 
1379 void R600InstPrinter::printBankSwizzle(const MCInst *MI, unsigned OpNo,
1380                                        raw_ostream &O) {
1381   int BankSwizzle = MI->getOperand(OpNo).getImm();
1382   switch (BankSwizzle) {
1383   case 1:
1384     O << "BS:VEC_021/SCL_122";
1385     break;
1386   case 2:
1387     O << "BS:VEC_120/SCL_212";
1388     break;
1389   case 3:
1390     O << "BS:VEC_102/SCL_221";
1391     break;
1392   case 4:
1393     O << "BS:VEC_201";
1394     break;
1395   case 5:
1396     O << "BS:VEC_210";
1397     break;
1398   default:
1399     break;
1400   }
1401 }
1402 
1403 void R600InstPrinter::printClamp(const MCInst *MI, unsigned OpNo,
1404                                  raw_ostream &O) {
1405   AMDGPUInstPrinter::printIfSet(MI, OpNo, O, "_SAT");
1406 }
1407 
1408 void R600InstPrinter::printCT(const MCInst *MI, unsigned OpNo,
1409                                 raw_ostream &O) {
1410   unsigned CT = MI->getOperand(OpNo).getImm();
1411   switch (CT) {
1412   case 0:
1413     O << 'U';
1414     break;
1415   case 1:
1416     O << 'N';
1417     break;
1418   default:
1419     break;
1420   }
1421 }
1422 
1423 void R600InstPrinter::printKCache(const MCInst *MI, unsigned OpNo,
1424                                   raw_ostream &O) {
1425   int KCacheMode = MI->getOperand(OpNo).getImm();
1426   if (KCacheMode > 0) {
1427     int KCacheBank = MI->getOperand(OpNo - 2).getImm();
1428     O << "CB" << KCacheBank << ':';
1429     int KCacheAddr = MI->getOperand(OpNo + 2).getImm();
1430     int LineSize = (KCacheMode == 1) ? 16 : 32;
1431     O << KCacheAddr * 16 << '-' << KCacheAddr * 16 + LineSize;
1432   }
1433 }
1434 
1435 void R600InstPrinter::printLast(const MCInst *MI, unsigned OpNo,
1436                                 raw_ostream &O) {
1437   AMDGPUInstPrinter::printIfSet(MI, OpNo, O, "*", " ");
1438 }
1439 
1440 void R600InstPrinter::printLiteral(const MCInst *MI, unsigned OpNo,
1441                                    raw_ostream &O) {
1442   const MCOperand &Op = MI->getOperand(OpNo);
1443   assert(Op.isImm() || Op.isExpr());
1444   if (Op.isImm()) {
1445     int64_t Imm = Op.getImm();
1446     O << Imm << '(' << BitsToFloat(Imm) << ')';
1447   }
1448   if (Op.isExpr()) {
1449     Op.getExpr()->print(O << '@', &MAI);
1450   }
1451 }
1452 
1453 void R600InstPrinter::printNeg(const MCInst *MI, unsigned OpNo,
1454                                raw_ostream &O) {
1455   AMDGPUInstPrinter::printIfSet(MI, OpNo, O, '-');
1456 }
1457 
1458 void R600InstPrinter::printOMOD(const MCInst *MI, unsigned OpNo,
1459                                 raw_ostream &O) {
1460   switch (MI->getOperand(OpNo).getImm()) {
1461   default: break;
1462   case 1:
1463     O << " * 2.0";
1464     break;
1465   case 2:
1466     O << " * 4.0";
1467     break;
1468   case 3:
1469     O << " / 2.0";
1470     break;
1471   }
1472 }
1473 
1474 void R600InstPrinter::printMemOperand(const MCInst *MI, unsigned OpNo,
1475                                       raw_ostream &O) {
1476   printOperand(MI, OpNo, O);
1477   O  << ", ";
1478   printOperand(MI, OpNo + 1, O);
1479 }
1480 
1481 void R600InstPrinter::printOperand(const MCInst *MI, unsigned OpNo,
1482                                    raw_ostream &O) {
1483   if (OpNo >= MI->getNumOperands()) {
1484     O << "/*Missing OP" << OpNo << "*/";
1485     return;
1486   }
1487 
1488   const MCOperand &Op = MI->getOperand(OpNo);
1489   if (Op.isReg()) {
1490     switch (Op.getReg()) {
1491     // This is the default predicate state, so we don't need to print it.
1492     case R600::PRED_SEL_OFF:
1493       break;
1494 
1495     default:
1496       O << getRegisterName(Op.getReg());
1497       break;
1498     }
1499   } else if (Op.isImm()) {
1500       O << Op.getImm();
1501   } else if (Op.isFPImm()) {
1502     // We special case 0.0 because otherwise it will be printed as an integer.
1503     if (Op.getFPImm() == 0.0)
1504       O << "0.0";
1505     else {
1506       O << Op.getFPImm();
1507     }
1508   } else if (Op.isExpr()) {
1509     const MCExpr *Exp = Op.getExpr();
1510     Exp->print(O, &MAI);
1511   } else {
1512     O << "/*INV_OP*/";
1513   }
1514 }
1515 
1516 void R600InstPrinter::printRel(const MCInst *MI, unsigned OpNo,
1517                                raw_ostream &O) {
1518   AMDGPUInstPrinter::printIfSet(MI, OpNo, O, '+');
1519 }
1520 
1521 void R600InstPrinter::printRSel(const MCInst *MI, unsigned OpNo,
1522                                   raw_ostream &O) {
1523   unsigned Sel = MI->getOperand(OpNo).getImm();
1524   switch (Sel) {
1525   case 0:
1526     O << 'X';
1527     break;
1528   case 1:
1529     O << 'Y';
1530     break;
1531   case 2:
1532     O << 'Z';
1533     break;
1534   case 3:
1535     O << 'W';
1536     break;
1537   case 4:
1538     O << '0';
1539     break;
1540   case 5:
1541     O << '1';
1542     break;
1543   case 7:
1544     O << '_';
1545     break;
1546   default:
1547     break;
1548   }
1549 }
1550 
1551 void R600InstPrinter::printUpdateExecMask(const MCInst *MI, unsigned OpNo,
1552                                           raw_ostream &O) {
1553   AMDGPUInstPrinter::printIfSet(MI, OpNo, O, "ExecMask,");
1554 }
1555 
1556 void R600InstPrinter::printUpdatePred(const MCInst *MI, unsigned OpNo,
1557                                       raw_ostream &O) {
1558   AMDGPUInstPrinter::printIfSet(MI, OpNo, O, "Pred,");
1559 }
1560 
1561 void R600InstPrinter::printWrite(const MCInst *MI, unsigned OpNo,
1562                                  raw_ostream &O) {
1563   const MCOperand &Op = MI->getOperand(OpNo);
1564   if (Op.getImm() == 0) {
1565     O << " (MASKED)";
1566   }
1567 }
1568 
1569 #include "R600GenAsmWriter.inc"
1570