1 //===-- AMDGPUInstPrinter.cpp - AMDGPU MC Inst -> ASM ---------------------===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 // \file 8 //===----------------------------------------------------------------------===// 9 10 #include "AMDGPUInstPrinter.h" 11 #include "MCTargetDesc/AMDGPUMCTargetDesc.h" 12 #include "SIDefines.h" 13 #include "Utils/AMDGPUAsmUtils.h" 14 #include "Utils/AMDGPUBaseInfo.h" 15 #include "llvm/MC/MCExpr.h" 16 #include "llvm/MC/MCInst.h" 17 #include "llvm/MC/MCInstrDesc.h" 18 #include "llvm/MC/MCInstrInfo.h" 19 #include "llvm/MC/MCRegisterInfo.h" 20 #include "llvm/MC/MCSubtargetInfo.h" 21 #include "llvm/Support/ErrorHandling.h" 22 #include "llvm/Support/MathExtras.h" 23 #include "llvm/Support/raw_ostream.h" 24 #include <cassert> 25 26 using namespace llvm; 27 using namespace llvm::AMDGPU; 28 29 void AMDGPUInstPrinter::printRegName(raw_ostream &OS, unsigned RegNo) const { 30 // FIXME: The current implementation of 31 // AsmParser::parseRegisterOrRegisterNumber in MC implies we either emit this 32 // as an integer or we provide a name which represents a physical register. 33 // For CFI instructions we really want to emit a name for the DWARF register 34 // instead, because there may be multiple DWARF registers corresponding to a 35 // single physical register. One case where this problem manifests is with 36 // wave32/wave64 where using the physical register name is ambiguous: if we 37 // write e.g. `.cfi_undefined v0` we lose information about the wavefront 38 // size which we need to encode the register in the final DWARF. Ideally we 39 // would extend MC to support parsing DWARF register names so we could do 40 // something like `.cfi_undefined dwarf_wave32_v0`. For now we just live with 41 // non-pretty DWARF register names in assembly text. 42 OS << RegNo; 43 } 44 45 void AMDGPUInstPrinter::printInst(const MCInst *MI, uint64_t Address, 46 StringRef Annot, const MCSubtargetInfo &STI, 47 raw_ostream &OS) { 48 OS.flush(); 49 printInstruction(MI, Address, STI, OS); 50 printAnnotation(OS, Annot); 51 } 52 53 void AMDGPUInstPrinter::printU4ImmOperand(const MCInst *MI, unsigned OpNo, 54 const MCSubtargetInfo &STI, 55 raw_ostream &O) { 56 O << formatHex(MI->getOperand(OpNo).getImm() & 0xf); 57 } 58 59 void AMDGPUInstPrinter::printU8ImmOperand(const MCInst *MI, unsigned OpNo, 60 raw_ostream &O) { 61 O << formatHex(MI->getOperand(OpNo).getImm() & 0xff); 62 } 63 64 void AMDGPUInstPrinter::printU16ImmOperand(const MCInst *MI, unsigned OpNo, 65 const MCSubtargetInfo &STI, 66 raw_ostream &O) { 67 // It's possible to end up with a 32-bit literal used with a 16-bit operand 68 // with ignored high bits. Print as 32-bit anyway in that case. 69 int64_t Imm = MI->getOperand(OpNo).getImm(); 70 if (isInt<16>(Imm) || isUInt<16>(Imm)) 71 O << formatHex(static_cast<uint64_t>(Imm & 0xffff)); 72 else 73 printU32ImmOperand(MI, OpNo, STI, O); 74 } 75 76 void AMDGPUInstPrinter::printU4ImmDecOperand(const MCInst *MI, unsigned OpNo, 77 raw_ostream &O) { 78 O << formatDec(MI->getOperand(OpNo).getImm() & 0xf); 79 } 80 81 void AMDGPUInstPrinter::printU8ImmDecOperand(const MCInst *MI, unsigned OpNo, 82 raw_ostream &O) { 83 O << formatDec(MI->getOperand(OpNo).getImm() & 0xff); 84 } 85 86 void AMDGPUInstPrinter::printU16ImmDecOperand(const MCInst *MI, unsigned OpNo, 87 raw_ostream &O) { 88 O << formatDec(MI->getOperand(OpNo).getImm() & 0xffff); 89 } 90 91 void AMDGPUInstPrinter::printU32ImmOperand(const MCInst *MI, unsigned OpNo, 92 const MCSubtargetInfo &STI, 93 raw_ostream &O) { 94 O << formatHex(MI->getOperand(OpNo).getImm() & 0xffffffff); 95 } 96 97 void AMDGPUInstPrinter::printNamedBit(const MCInst *MI, unsigned OpNo, 98 raw_ostream &O, StringRef BitName) { 99 if (MI->getOperand(OpNo).getImm()) { 100 O << ' ' << BitName; 101 } 102 } 103 104 void AMDGPUInstPrinter::printOffen(const MCInst *MI, unsigned OpNo, 105 raw_ostream &O) { 106 printNamedBit(MI, OpNo, O, "offen"); 107 } 108 109 void AMDGPUInstPrinter::printIdxen(const MCInst *MI, unsigned OpNo, 110 raw_ostream &O) { 111 printNamedBit(MI, OpNo, O, "idxen"); 112 } 113 114 void AMDGPUInstPrinter::printAddr64(const MCInst *MI, unsigned OpNo, 115 raw_ostream &O) { 116 printNamedBit(MI, OpNo, O, "addr64"); 117 } 118 119 void AMDGPUInstPrinter::printMBUFOffset(const MCInst *MI, unsigned OpNo, 120 raw_ostream &O) { 121 if (MI->getOperand(OpNo).getImm()) { 122 O << " offset:"; 123 printU16ImmDecOperand(MI, OpNo, O); 124 } 125 } 126 127 void AMDGPUInstPrinter::printOffset(const MCInst *MI, unsigned OpNo, 128 const MCSubtargetInfo &STI, 129 raw_ostream &O) { 130 uint16_t Imm = MI->getOperand(OpNo).getImm(); 131 if (Imm != 0) { 132 O << ((OpNo == 0)? "offset:" : " offset:"); 133 printU16ImmDecOperand(MI, OpNo, O); 134 } 135 } 136 137 void AMDGPUInstPrinter::printFlatOffset(const MCInst *MI, unsigned OpNo, 138 const MCSubtargetInfo &STI, 139 raw_ostream &O) { 140 uint16_t Imm = MI->getOperand(OpNo).getImm(); 141 if (Imm != 0) { 142 O << ((OpNo == 0)? "offset:" : " offset:"); 143 144 const MCInstrDesc &Desc = MII.get(MI->getOpcode()); 145 bool IsFlatSeg = !(Desc.TSFlags & SIInstrFlags::IsNonFlatSeg); 146 147 if (IsFlatSeg) { // Unsigned offset 148 printU16ImmDecOperand(MI, OpNo, O); 149 } else { // Signed offset 150 if (AMDGPU::isGFX10(STI)) { 151 O << formatDec(SignExtend32<12>(MI->getOperand(OpNo).getImm())); 152 } else { 153 O << formatDec(SignExtend32<13>(MI->getOperand(OpNo).getImm())); 154 } 155 } 156 } 157 } 158 159 void AMDGPUInstPrinter::printOffset0(const MCInst *MI, unsigned OpNo, 160 const MCSubtargetInfo &STI, 161 raw_ostream &O) { 162 if (MI->getOperand(OpNo).getImm()) { 163 O << " offset0:"; 164 printU8ImmDecOperand(MI, OpNo, O); 165 } 166 } 167 168 void AMDGPUInstPrinter::printOffset1(const MCInst *MI, unsigned OpNo, 169 const MCSubtargetInfo &STI, 170 raw_ostream &O) { 171 if (MI->getOperand(OpNo).getImm()) { 172 O << " offset1:"; 173 printU8ImmDecOperand(MI, OpNo, O); 174 } 175 } 176 177 void AMDGPUInstPrinter::printSMRDOffset8(const MCInst *MI, unsigned OpNo, 178 const MCSubtargetInfo &STI, 179 raw_ostream &O) { 180 printU32ImmOperand(MI, OpNo, STI, O); 181 } 182 183 void AMDGPUInstPrinter::printSMRDOffset20(const MCInst *MI, unsigned OpNo, 184 const MCSubtargetInfo &STI, 185 raw_ostream &O) { 186 printU32ImmOperand(MI, OpNo, STI, O); 187 } 188 189 void AMDGPUInstPrinter::printSMRDLiteralOffset(const MCInst *MI, unsigned OpNo, 190 const MCSubtargetInfo &STI, 191 raw_ostream &O) { 192 printU32ImmOperand(MI, OpNo, STI, O); 193 } 194 195 void AMDGPUInstPrinter::printGDS(const MCInst *MI, unsigned OpNo, 196 const MCSubtargetInfo &STI, raw_ostream &O) { 197 printNamedBit(MI, OpNo, O, "gds"); 198 } 199 200 void AMDGPUInstPrinter::printDLC(const MCInst *MI, unsigned OpNo, 201 const MCSubtargetInfo &STI, raw_ostream &O) { 202 if (AMDGPU::isGFX10(STI)) 203 printNamedBit(MI, OpNo, O, "dlc"); 204 } 205 206 void AMDGPUInstPrinter::printGLC(const MCInst *MI, unsigned OpNo, 207 const MCSubtargetInfo &STI, raw_ostream &O) { 208 printNamedBit(MI, OpNo, O, "glc"); 209 } 210 211 void AMDGPUInstPrinter::printSLC(const MCInst *MI, unsigned OpNo, 212 const MCSubtargetInfo &STI, raw_ostream &O) { 213 printNamedBit(MI, OpNo, O, "slc"); 214 } 215 216 void AMDGPUInstPrinter::printSWZ(const MCInst *MI, unsigned OpNo, 217 const MCSubtargetInfo &STI, raw_ostream &O) { 218 } 219 220 void AMDGPUInstPrinter::printTFE(const MCInst *MI, unsigned OpNo, 221 const MCSubtargetInfo &STI, raw_ostream &O) { 222 printNamedBit(MI, OpNo, O, "tfe"); 223 } 224 225 void AMDGPUInstPrinter::printDMask(const MCInst *MI, unsigned OpNo, 226 const MCSubtargetInfo &STI, raw_ostream &O) { 227 if (MI->getOperand(OpNo).getImm()) { 228 O << " dmask:"; 229 printU16ImmOperand(MI, OpNo, STI, O); 230 } 231 } 232 233 void AMDGPUInstPrinter::printDim(const MCInst *MI, unsigned OpNo, 234 const MCSubtargetInfo &STI, raw_ostream &O) { 235 unsigned Dim = MI->getOperand(OpNo).getImm(); 236 O << " dim:SQ_RSRC_IMG_"; 237 238 const AMDGPU::MIMGDimInfo *DimInfo = AMDGPU::getMIMGDimInfoByEncoding(Dim); 239 if (DimInfo) 240 O << DimInfo->AsmSuffix; 241 else 242 O << Dim; 243 } 244 245 void AMDGPUInstPrinter::printUNorm(const MCInst *MI, unsigned OpNo, 246 const MCSubtargetInfo &STI, raw_ostream &O) { 247 printNamedBit(MI, OpNo, O, "unorm"); 248 } 249 250 void AMDGPUInstPrinter::printDA(const MCInst *MI, unsigned OpNo, 251 const MCSubtargetInfo &STI, raw_ostream &O) { 252 printNamedBit(MI, OpNo, O, "da"); 253 } 254 255 void AMDGPUInstPrinter::printR128A16(const MCInst *MI, unsigned OpNo, 256 const MCSubtargetInfo &STI, raw_ostream &O) { 257 if (STI.hasFeature(AMDGPU::FeatureR128A16)) 258 printNamedBit(MI, OpNo, O, "a16"); 259 else 260 printNamedBit(MI, OpNo, O, "r128"); 261 } 262 263 void AMDGPUInstPrinter::printGFX10A16(const MCInst *MI, unsigned OpNo, 264 const MCSubtargetInfo &STI, raw_ostream &O) { 265 printNamedBit(MI, OpNo, O, "a16"); 266 } 267 268 void AMDGPUInstPrinter::printLWE(const MCInst *MI, unsigned OpNo, 269 const MCSubtargetInfo &STI, raw_ostream &O) { 270 printNamedBit(MI, OpNo, O, "lwe"); 271 } 272 273 void AMDGPUInstPrinter::printD16(const MCInst *MI, unsigned OpNo, 274 const MCSubtargetInfo &STI, raw_ostream &O) { 275 printNamedBit(MI, OpNo, O, "d16"); 276 } 277 278 void AMDGPUInstPrinter::printExpCompr(const MCInst *MI, unsigned OpNo, 279 const MCSubtargetInfo &STI, 280 raw_ostream &O) { 281 if (MI->getOperand(OpNo).getImm()) 282 O << " compr"; 283 } 284 285 void AMDGPUInstPrinter::printExpVM(const MCInst *MI, unsigned OpNo, 286 const MCSubtargetInfo &STI, 287 raw_ostream &O) { 288 if (MI->getOperand(OpNo).getImm()) 289 O << " vm"; 290 } 291 292 void AMDGPUInstPrinter::printFORMAT(const MCInst *MI, unsigned OpNo, 293 const MCSubtargetInfo &STI, 294 raw_ostream &O) { 295 if (unsigned Val = MI->getOperand(OpNo).getImm()) { 296 if (AMDGPU::isGFX10(STI)) 297 O << " format:" << Val; 298 else { 299 O << " dfmt:" << (Val & 15); 300 O << ", nfmt:" << (Val >> 4); 301 } 302 } 303 } 304 305 void AMDGPUInstPrinter::printRegOperand(unsigned RegNo, raw_ostream &O, 306 const MCRegisterInfo &MRI) { 307 #if !defined(NDEBUG) 308 switch (RegNo) { 309 case AMDGPU::FP_REG: 310 case AMDGPU::SP_REG: 311 case AMDGPU::PRIVATE_RSRC_REG: 312 llvm_unreachable("pseudo-register should not ever be emitted"); 313 case AMDGPU::SCC: 314 llvm_unreachable("pseudo scc should not ever be emitted"); 315 default: 316 break; 317 } 318 #endif 319 320 O << getRegisterName(RegNo); 321 } 322 323 void AMDGPUInstPrinter::printVOPDst(const MCInst *MI, unsigned OpNo, 324 const MCSubtargetInfo &STI, raw_ostream &O) { 325 if (OpNo == 0) { 326 if (MII.get(MI->getOpcode()).TSFlags & SIInstrFlags::VOP3) 327 O << "_e64 "; 328 else if (MII.get(MI->getOpcode()).TSFlags & SIInstrFlags::DPP) 329 O << "_dpp "; 330 else if (MII.get(MI->getOpcode()).TSFlags & SIInstrFlags::SDWA) 331 O << "_sdwa "; 332 else 333 O << "_e32 "; 334 } 335 336 printOperand(MI, OpNo, STI, O); 337 338 // Print default vcc/vcc_lo operand. 339 switch (MI->getOpcode()) { 340 default: break; 341 342 case AMDGPU::V_ADD_CO_CI_U32_e32_gfx10: 343 case AMDGPU::V_SUB_CO_CI_U32_e32_gfx10: 344 case AMDGPU::V_SUBREV_CO_CI_U32_e32_gfx10: 345 case AMDGPU::V_ADD_CO_CI_U32_sdwa_gfx10: 346 case AMDGPU::V_SUB_CO_CI_U32_sdwa_gfx10: 347 case AMDGPU::V_SUBREV_CO_CI_U32_sdwa_gfx10: 348 case AMDGPU::V_ADD_CO_CI_U32_dpp_gfx10: 349 case AMDGPU::V_SUB_CO_CI_U32_dpp_gfx10: 350 case AMDGPU::V_SUBREV_CO_CI_U32_dpp_gfx10: 351 case AMDGPU::V_ADD_CO_CI_U32_dpp8_gfx10: 352 case AMDGPU::V_SUB_CO_CI_U32_dpp8_gfx10: 353 case AMDGPU::V_SUBREV_CO_CI_U32_dpp8_gfx10: 354 printDefaultVccOperand(1, STI, O); 355 break; 356 } 357 } 358 359 void AMDGPUInstPrinter::printVINTRPDst(const MCInst *MI, unsigned OpNo, 360 const MCSubtargetInfo &STI, raw_ostream &O) { 361 if (AMDGPU::isSI(STI) || AMDGPU::isCI(STI)) 362 O << " "; 363 else 364 O << "_e32 "; 365 366 printOperand(MI, OpNo, STI, O); 367 } 368 369 void AMDGPUInstPrinter::printImmediate16(uint32_t Imm, 370 const MCSubtargetInfo &STI, 371 raw_ostream &O) { 372 int16_t SImm = static_cast<int16_t>(Imm); 373 if (SImm >= -16 && SImm <= 64) { 374 O << SImm; 375 return; 376 } 377 378 if (Imm == 0x3C00) 379 O<< "1.0"; 380 else if (Imm == 0xBC00) 381 O<< "-1.0"; 382 else if (Imm == 0x3800) 383 O<< "0.5"; 384 else if (Imm == 0xB800) 385 O<< "-0.5"; 386 else if (Imm == 0x4000) 387 O<< "2.0"; 388 else if (Imm == 0xC000) 389 O<< "-2.0"; 390 else if (Imm == 0x4400) 391 O<< "4.0"; 392 else if (Imm == 0xC400) 393 O<< "-4.0"; 394 else if (Imm == 0x3118) { 395 assert(STI.getFeatureBits()[AMDGPU::FeatureInv2PiInlineImm]); 396 O << "0.15915494"; 397 } else 398 O << formatHex(static_cast<uint64_t>(Imm)); 399 } 400 401 void AMDGPUInstPrinter::printImmediateV216(uint32_t Imm, 402 const MCSubtargetInfo &STI, 403 raw_ostream &O) { 404 uint16_t Lo16 = static_cast<uint16_t>(Imm); 405 printImmediate16(Lo16, STI, O); 406 } 407 408 void AMDGPUInstPrinter::printImmediate32(uint32_t Imm, 409 const MCSubtargetInfo &STI, 410 raw_ostream &O) { 411 int32_t SImm = static_cast<int32_t>(Imm); 412 if (SImm >= -16 && SImm <= 64) { 413 O << SImm; 414 return; 415 } 416 417 if (Imm == FloatToBits(0.0f)) 418 O << "0.0"; 419 else if (Imm == FloatToBits(1.0f)) 420 O << "1.0"; 421 else if (Imm == FloatToBits(-1.0f)) 422 O << "-1.0"; 423 else if (Imm == FloatToBits(0.5f)) 424 O << "0.5"; 425 else if (Imm == FloatToBits(-0.5f)) 426 O << "-0.5"; 427 else if (Imm == FloatToBits(2.0f)) 428 O << "2.0"; 429 else if (Imm == FloatToBits(-2.0f)) 430 O << "-2.0"; 431 else if (Imm == FloatToBits(4.0f)) 432 O << "4.0"; 433 else if (Imm == FloatToBits(-4.0f)) 434 O << "-4.0"; 435 else if (Imm == 0x3e22f983 && 436 STI.getFeatureBits()[AMDGPU::FeatureInv2PiInlineImm]) 437 O << "0.15915494"; 438 else 439 O << formatHex(static_cast<uint64_t>(Imm)); 440 } 441 442 void AMDGPUInstPrinter::printImmediate64(uint64_t Imm, 443 const MCSubtargetInfo &STI, 444 raw_ostream &O) { 445 int64_t SImm = static_cast<int64_t>(Imm); 446 if (SImm >= -16 && SImm <= 64) { 447 O << SImm; 448 return; 449 } 450 451 if (Imm == DoubleToBits(0.0)) 452 O << "0.0"; 453 else if (Imm == DoubleToBits(1.0)) 454 O << "1.0"; 455 else if (Imm == DoubleToBits(-1.0)) 456 O << "-1.0"; 457 else if (Imm == DoubleToBits(0.5)) 458 O << "0.5"; 459 else if (Imm == DoubleToBits(-0.5)) 460 O << "-0.5"; 461 else if (Imm == DoubleToBits(2.0)) 462 O << "2.0"; 463 else if (Imm == DoubleToBits(-2.0)) 464 O << "-2.0"; 465 else if (Imm == DoubleToBits(4.0)) 466 O << "4.0"; 467 else if (Imm == DoubleToBits(-4.0)) 468 O << "-4.0"; 469 else if (Imm == 0x3fc45f306dc9c882 && 470 STI.getFeatureBits()[AMDGPU::FeatureInv2PiInlineImm]) 471 O << "0.15915494309189532"; 472 else { 473 assert(isUInt<32>(Imm) || Imm == 0x3fc45f306dc9c882); 474 475 // In rare situations, we will have a 32-bit literal in a 64-bit 476 // operand. This is technically allowed for the encoding of s_mov_b64. 477 O << formatHex(static_cast<uint64_t>(Imm)); 478 } 479 } 480 481 void AMDGPUInstPrinter::printBLGP(const MCInst *MI, unsigned OpNo, 482 const MCSubtargetInfo &STI, 483 raw_ostream &O) { 484 unsigned Imm = MI->getOperand(OpNo).getImm(); 485 if (!Imm) 486 return; 487 488 O << " blgp:" << Imm; 489 } 490 491 void AMDGPUInstPrinter::printCBSZ(const MCInst *MI, unsigned OpNo, 492 const MCSubtargetInfo &STI, 493 raw_ostream &O) { 494 unsigned Imm = MI->getOperand(OpNo).getImm(); 495 if (!Imm) 496 return; 497 498 O << " cbsz:" << Imm; 499 } 500 501 void AMDGPUInstPrinter::printABID(const MCInst *MI, unsigned OpNo, 502 const MCSubtargetInfo &STI, 503 raw_ostream &O) { 504 unsigned Imm = MI->getOperand(OpNo).getImm(); 505 if (!Imm) 506 return; 507 508 O << " abid:" << Imm; 509 } 510 511 void AMDGPUInstPrinter::printDefaultVccOperand(unsigned OpNo, 512 const MCSubtargetInfo &STI, 513 raw_ostream &O) { 514 if (OpNo > 0) 515 O << ", "; 516 printRegOperand(STI.getFeatureBits()[AMDGPU::FeatureWavefrontSize64] ? 517 AMDGPU::VCC : AMDGPU::VCC_LO, O, MRI); 518 if (OpNo == 0) 519 O << ", "; 520 } 521 522 void AMDGPUInstPrinter::printOperand(const MCInst *MI, unsigned OpNo, 523 const MCSubtargetInfo &STI, 524 raw_ostream &O) { 525 // Print default vcc/vcc_lo operand of VOPC. 526 const MCInstrDesc &Desc = MII.get(MI->getOpcode()); 527 if (OpNo == 0 && (Desc.TSFlags & SIInstrFlags::VOPC) && 528 (Desc.hasImplicitDefOfPhysReg(AMDGPU::VCC) || 529 Desc.hasImplicitDefOfPhysReg(AMDGPU::VCC_LO))) 530 printDefaultVccOperand(OpNo, STI, O); 531 532 if (OpNo >= MI->getNumOperands()) { 533 O << "/*Missing OP" << OpNo << "*/"; 534 return; 535 } 536 537 const MCOperand &Op = MI->getOperand(OpNo); 538 if (Op.isReg()) { 539 printRegOperand(Op.getReg(), O, MRI); 540 } else if (Op.isImm()) { 541 switch (Desc.OpInfo[OpNo].OperandType) { 542 case AMDGPU::OPERAND_REG_IMM_INT32: 543 case AMDGPU::OPERAND_REG_IMM_FP32: 544 case AMDGPU::OPERAND_REG_INLINE_C_INT32: 545 case AMDGPU::OPERAND_REG_INLINE_C_FP32: 546 case AMDGPU::OPERAND_REG_INLINE_AC_INT32: 547 case AMDGPU::OPERAND_REG_INLINE_AC_FP32: 548 case MCOI::OPERAND_IMMEDIATE: 549 printImmediate32(Op.getImm(), STI, O); 550 break; 551 case AMDGPU::OPERAND_REG_IMM_INT64: 552 case AMDGPU::OPERAND_REG_IMM_FP64: 553 case AMDGPU::OPERAND_REG_INLINE_C_INT64: 554 case AMDGPU::OPERAND_REG_INLINE_C_FP64: 555 printImmediate64(Op.getImm(), STI, O); 556 break; 557 case AMDGPU::OPERAND_REG_INLINE_C_INT16: 558 case AMDGPU::OPERAND_REG_INLINE_C_FP16: 559 case AMDGPU::OPERAND_REG_INLINE_AC_INT16: 560 case AMDGPU::OPERAND_REG_INLINE_AC_FP16: 561 case AMDGPU::OPERAND_REG_IMM_INT16: 562 case AMDGPU::OPERAND_REG_IMM_FP16: 563 printImmediate16(Op.getImm(), STI, O); 564 break; 565 case AMDGPU::OPERAND_REG_IMM_V2INT16: 566 case AMDGPU::OPERAND_REG_IMM_V2FP16: 567 if (!isUInt<16>(Op.getImm()) && 568 STI.getFeatureBits()[AMDGPU::FeatureVOP3Literal]) { 569 printImmediate32(Op.getImm(), STI, O); 570 break; 571 } 572 LLVM_FALLTHROUGH; 573 case AMDGPU::OPERAND_REG_INLINE_C_V2FP16: 574 case AMDGPU::OPERAND_REG_INLINE_C_V2INT16: 575 case AMDGPU::OPERAND_REG_INLINE_AC_V2FP16: 576 case AMDGPU::OPERAND_REG_INLINE_AC_V2INT16: 577 printImmediateV216(Op.getImm(), STI, O); 578 break; 579 case MCOI::OPERAND_UNKNOWN: 580 case MCOI::OPERAND_PCREL: 581 O << formatDec(Op.getImm()); 582 break; 583 case MCOI::OPERAND_REGISTER: 584 // FIXME: This should be removed and handled somewhere else. Seems to come 585 // from a disassembler bug. 586 O << "/*invalid immediate*/"; 587 break; 588 default: 589 // We hit this for the immediate instruction bits that don't yet have a 590 // custom printer. 591 llvm_unreachable("unexpected immediate operand type"); 592 } 593 } else if (Op.isFPImm()) { 594 // We special case 0.0 because otherwise it will be printed as an integer. 595 if (Op.getFPImm() == 0.0) 596 O << "0.0"; 597 else { 598 const MCInstrDesc &Desc = MII.get(MI->getOpcode()); 599 int RCID = Desc.OpInfo[OpNo].RegClass; 600 unsigned RCBits = AMDGPU::getRegBitWidth(MRI.getRegClass(RCID)); 601 if (RCBits == 32) 602 printImmediate32(FloatToBits(Op.getFPImm()), STI, O); 603 else if (RCBits == 64) 604 printImmediate64(DoubleToBits(Op.getFPImm()), STI, O); 605 else 606 llvm_unreachable("Invalid register class size"); 607 } 608 } else if (Op.isExpr()) { 609 const MCExpr *Exp = Op.getExpr(); 610 Exp->print(O, &MAI); 611 } else { 612 O << "/*INV_OP*/"; 613 } 614 615 // Print default vcc/vcc_lo operand of v_cndmask_b32_e32. 616 switch (MI->getOpcode()) { 617 default: break; 618 619 case AMDGPU::V_CNDMASK_B32_e32_gfx10: 620 case AMDGPU::V_ADD_CO_CI_U32_e32_gfx10: 621 case AMDGPU::V_SUB_CO_CI_U32_e32_gfx10: 622 case AMDGPU::V_SUBREV_CO_CI_U32_e32_gfx10: 623 case AMDGPU::V_CNDMASK_B32_dpp_gfx10: 624 case AMDGPU::V_ADD_CO_CI_U32_dpp_gfx10: 625 case AMDGPU::V_SUB_CO_CI_U32_dpp_gfx10: 626 case AMDGPU::V_SUBREV_CO_CI_U32_dpp_gfx10: 627 case AMDGPU::V_CNDMASK_B32_dpp8_gfx10: 628 case AMDGPU::V_ADD_CO_CI_U32_dpp8_gfx10: 629 case AMDGPU::V_SUB_CO_CI_U32_dpp8_gfx10: 630 case AMDGPU::V_SUBREV_CO_CI_U32_dpp8_gfx10: 631 632 case AMDGPU::V_CNDMASK_B32_e32_gfx6_gfx7: 633 case AMDGPU::V_CNDMASK_B32_e32_vi: 634 if ((int)OpNo == AMDGPU::getNamedOperandIdx(MI->getOpcode(), 635 AMDGPU::OpName::src1)) 636 printDefaultVccOperand(OpNo, STI, O); 637 break; 638 } 639 } 640 641 void AMDGPUInstPrinter::printOperandAndFPInputMods(const MCInst *MI, 642 unsigned OpNo, 643 const MCSubtargetInfo &STI, 644 raw_ostream &O) { 645 unsigned InputModifiers = MI->getOperand(OpNo).getImm(); 646 647 // Use 'neg(...)' instead of '-' to avoid ambiguity. 648 // This is important for integer literals because 649 // -1 is not the same value as neg(1). 650 bool NegMnemo = false; 651 652 if (InputModifiers & SISrcMods::NEG) { 653 if (OpNo + 1 < MI->getNumOperands() && 654 (InputModifiers & SISrcMods::ABS) == 0) { 655 const MCOperand &Op = MI->getOperand(OpNo + 1); 656 NegMnemo = Op.isImm() || Op.isFPImm(); 657 } 658 if (NegMnemo) { 659 O << "neg("; 660 } else { 661 O << '-'; 662 } 663 } 664 665 if (InputModifiers & SISrcMods::ABS) 666 O << '|'; 667 printOperand(MI, OpNo + 1, STI, O); 668 if (InputModifiers & SISrcMods::ABS) 669 O << '|'; 670 671 if (NegMnemo) { 672 O << ')'; 673 } 674 } 675 676 void AMDGPUInstPrinter::printOperandAndIntInputMods(const MCInst *MI, 677 unsigned OpNo, 678 const MCSubtargetInfo &STI, 679 raw_ostream &O) { 680 unsigned InputModifiers = MI->getOperand(OpNo).getImm(); 681 if (InputModifiers & SISrcMods::SEXT) 682 O << "sext("; 683 printOperand(MI, OpNo + 1, STI, O); 684 if (InputModifiers & SISrcMods::SEXT) 685 O << ')'; 686 687 // Print default vcc/vcc_lo operand of VOP2b. 688 switch (MI->getOpcode()) { 689 default: break; 690 691 case AMDGPU::V_CNDMASK_B32_sdwa_gfx10: 692 case AMDGPU::V_ADD_CO_CI_U32_sdwa_gfx10: 693 case AMDGPU::V_SUB_CO_CI_U32_sdwa_gfx10: 694 case AMDGPU::V_SUBREV_CO_CI_U32_sdwa_gfx10: 695 if ((int)OpNo + 1 == AMDGPU::getNamedOperandIdx(MI->getOpcode(), 696 AMDGPU::OpName::src1)) 697 printDefaultVccOperand(OpNo, STI, O); 698 break; 699 } 700 } 701 702 void AMDGPUInstPrinter::printDPP8(const MCInst *MI, unsigned OpNo, 703 const MCSubtargetInfo &STI, 704 raw_ostream &O) { 705 if (!AMDGPU::isGFX10(STI)) 706 llvm_unreachable("dpp8 is not supported on ASICs earlier than GFX10"); 707 708 unsigned Imm = MI->getOperand(OpNo).getImm(); 709 O << " dpp8:[" << formatDec(Imm & 0x7); 710 for (size_t i = 1; i < 8; ++i) { 711 O << ',' << formatDec((Imm >> (3 * i)) & 0x7); 712 } 713 O << ']'; 714 } 715 716 void AMDGPUInstPrinter::printDPPCtrl(const MCInst *MI, unsigned OpNo, 717 const MCSubtargetInfo &STI, 718 raw_ostream &O) { 719 using namespace AMDGPU::DPP; 720 721 unsigned Imm = MI->getOperand(OpNo).getImm(); 722 if (Imm <= DppCtrl::QUAD_PERM_LAST) { 723 O << " quad_perm:["; 724 O << formatDec(Imm & 0x3) << ','; 725 O << formatDec((Imm & 0xc) >> 2) << ','; 726 O << formatDec((Imm & 0x30) >> 4) << ','; 727 O << formatDec((Imm & 0xc0) >> 6) << ']'; 728 } else if ((Imm >= DppCtrl::ROW_SHL_FIRST) && 729 (Imm <= DppCtrl::ROW_SHL_LAST)) { 730 O << " row_shl:"; 731 printU4ImmDecOperand(MI, OpNo, O); 732 } else if ((Imm >= DppCtrl::ROW_SHR_FIRST) && 733 (Imm <= DppCtrl::ROW_SHR_LAST)) { 734 O << " row_shr:"; 735 printU4ImmDecOperand(MI, OpNo, O); 736 } else if ((Imm >= DppCtrl::ROW_ROR_FIRST) && 737 (Imm <= DppCtrl::ROW_ROR_LAST)) { 738 O << " row_ror:"; 739 printU4ImmDecOperand(MI, OpNo, O); 740 } else if (Imm == DppCtrl::WAVE_SHL1) { 741 if (!AMDGPU::isVI(STI) && !AMDGPU::isGFX9(STI)) { 742 O << " /* wave_shl is not supported starting from GFX10 */"; 743 return; 744 } 745 O << " wave_shl:1"; 746 } else if (Imm == DppCtrl::WAVE_ROL1) { 747 if (!AMDGPU::isVI(STI) && !AMDGPU::isGFX9(STI)) { 748 O << " /* wave_rol is not supported starting from GFX10 */"; 749 return; 750 } 751 O << " wave_rol:1"; 752 } else if (Imm == DppCtrl::WAVE_SHR1) { 753 if (!AMDGPU::isVI(STI) && !AMDGPU::isGFX9(STI)) { 754 O << " /* wave_shr is not supported starting from GFX10 */"; 755 return; 756 } 757 O << " wave_shr:1"; 758 } else if (Imm == DppCtrl::WAVE_ROR1) { 759 if (!AMDGPU::isVI(STI) && !AMDGPU::isGFX9(STI)) { 760 O << " /* wave_ror is not supported starting from GFX10 */"; 761 return; 762 } 763 O << " wave_ror:1"; 764 } else if (Imm == DppCtrl::ROW_MIRROR) { 765 O << " row_mirror"; 766 } else if (Imm == DppCtrl::ROW_HALF_MIRROR) { 767 O << " row_half_mirror"; 768 } else if (Imm == DppCtrl::BCAST15) { 769 if (!AMDGPU::isVI(STI) && !AMDGPU::isGFX9(STI)) { 770 O << " /* row_bcast is not supported starting from GFX10 */"; 771 return; 772 } 773 O << " row_bcast:15"; 774 } else if (Imm == DppCtrl::BCAST31) { 775 if (!AMDGPU::isVI(STI) && !AMDGPU::isGFX9(STI)) { 776 O << " /* row_bcast is not supported starting from GFX10 */"; 777 return; 778 } 779 O << " row_bcast:31"; 780 } else if ((Imm >= DppCtrl::ROW_SHARE_FIRST) && 781 (Imm <= DppCtrl::ROW_SHARE_LAST)) { 782 if (!AMDGPU::isGFX10(STI)) { 783 O << " /* row_share is not supported on ASICs earlier than GFX10 */"; 784 return; 785 } 786 O << " row_share:"; 787 printU4ImmDecOperand(MI, OpNo, O); 788 } else if ((Imm >= DppCtrl::ROW_XMASK_FIRST) && 789 (Imm <= DppCtrl::ROW_XMASK_LAST)) { 790 if (!AMDGPU::isGFX10(STI)) { 791 O << " /* row_xmask is not supported on ASICs earlier than GFX10 */"; 792 return; 793 } 794 O << "row_xmask:"; 795 printU4ImmDecOperand(MI, OpNo, O); 796 } else { 797 O << " /* Invalid dpp_ctrl value */"; 798 } 799 } 800 801 void AMDGPUInstPrinter::printRowMask(const MCInst *MI, unsigned OpNo, 802 const MCSubtargetInfo &STI, 803 raw_ostream &O) { 804 O << " row_mask:"; 805 printU4ImmOperand(MI, OpNo, STI, O); 806 } 807 808 void AMDGPUInstPrinter::printBankMask(const MCInst *MI, unsigned OpNo, 809 const MCSubtargetInfo &STI, 810 raw_ostream &O) { 811 O << " bank_mask:"; 812 printU4ImmOperand(MI, OpNo, STI, O); 813 } 814 815 void AMDGPUInstPrinter::printBoundCtrl(const MCInst *MI, unsigned OpNo, 816 const MCSubtargetInfo &STI, 817 raw_ostream &O) { 818 unsigned Imm = MI->getOperand(OpNo).getImm(); 819 if (Imm) { 820 O << " bound_ctrl:0"; // XXX - this syntax is used in sp3 821 } 822 } 823 824 void AMDGPUInstPrinter::printFI(const MCInst *MI, unsigned OpNo, 825 const MCSubtargetInfo &STI, 826 raw_ostream &O) { 827 using namespace llvm::AMDGPU::DPP; 828 unsigned Imm = MI->getOperand(OpNo).getImm(); 829 if (Imm == DPP_FI_1 || Imm == DPP8_FI_1) { 830 O << " fi:1"; 831 } 832 } 833 834 void AMDGPUInstPrinter::printSDWASel(const MCInst *MI, unsigned OpNo, 835 raw_ostream &O) { 836 using namespace llvm::AMDGPU::SDWA; 837 838 unsigned Imm = MI->getOperand(OpNo).getImm(); 839 switch (Imm) { 840 case SdwaSel::BYTE_0: O << "BYTE_0"; break; 841 case SdwaSel::BYTE_1: O << "BYTE_1"; break; 842 case SdwaSel::BYTE_2: O << "BYTE_2"; break; 843 case SdwaSel::BYTE_3: O << "BYTE_3"; break; 844 case SdwaSel::WORD_0: O << "WORD_0"; break; 845 case SdwaSel::WORD_1: O << "WORD_1"; break; 846 case SdwaSel::DWORD: O << "DWORD"; break; 847 default: llvm_unreachable("Invalid SDWA data select operand"); 848 } 849 } 850 851 void AMDGPUInstPrinter::printSDWADstSel(const MCInst *MI, unsigned OpNo, 852 const MCSubtargetInfo &STI, 853 raw_ostream &O) { 854 O << "dst_sel:"; 855 printSDWASel(MI, OpNo, O); 856 } 857 858 void AMDGPUInstPrinter::printSDWASrc0Sel(const MCInst *MI, unsigned OpNo, 859 const MCSubtargetInfo &STI, 860 raw_ostream &O) { 861 O << "src0_sel:"; 862 printSDWASel(MI, OpNo, O); 863 } 864 865 void AMDGPUInstPrinter::printSDWASrc1Sel(const MCInst *MI, unsigned OpNo, 866 const MCSubtargetInfo &STI, 867 raw_ostream &O) { 868 O << "src1_sel:"; 869 printSDWASel(MI, OpNo, O); 870 } 871 872 void AMDGPUInstPrinter::printSDWADstUnused(const MCInst *MI, unsigned OpNo, 873 const MCSubtargetInfo &STI, 874 raw_ostream &O) { 875 using namespace llvm::AMDGPU::SDWA; 876 877 O << "dst_unused:"; 878 unsigned Imm = MI->getOperand(OpNo).getImm(); 879 switch (Imm) { 880 case DstUnused::UNUSED_PAD: O << "UNUSED_PAD"; break; 881 case DstUnused::UNUSED_SEXT: O << "UNUSED_SEXT"; break; 882 case DstUnused::UNUSED_PRESERVE: O << "UNUSED_PRESERVE"; break; 883 default: llvm_unreachable("Invalid SDWA dest_unused operand"); 884 } 885 } 886 887 template <unsigned N> 888 void AMDGPUInstPrinter::printExpSrcN(const MCInst *MI, unsigned OpNo, 889 const MCSubtargetInfo &STI, 890 raw_ostream &O) { 891 unsigned Opc = MI->getOpcode(); 892 int EnIdx = AMDGPU::getNamedOperandIdx(Opc, AMDGPU::OpName::en); 893 unsigned En = MI->getOperand(EnIdx).getImm(); 894 895 int ComprIdx = AMDGPU::getNamedOperandIdx(Opc, AMDGPU::OpName::compr); 896 897 // If compr is set, print as src0, src0, src1, src1 898 if (MI->getOperand(ComprIdx).getImm()) { 899 if (N == 1 || N == 2) 900 --OpNo; 901 else if (N == 3) 902 OpNo -= 2; 903 } 904 905 if (En & (1 << N)) 906 printRegOperand(MI->getOperand(OpNo).getReg(), O, MRI); 907 else 908 O << "off"; 909 } 910 911 void AMDGPUInstPrinter::printExpSrc0(const MCInst *MI, unsigned OpNo, 912 const MCSubtargetInfo &STI, 913 raw_ostream &O) { 914 printExpSrcN<0>(MI, OpNo, STI, O); 915 } 916 917 void AMDGPUInstPrinter::printExpSrc1(const MCInst *MI, unsigned OpNo, 918 const MCSubtargetInfo &STI, 919 raw_ostream &O) { 920 printExpSrcN<1>(MI, OpNo, STI, O); 921 } 922 923 void AMDGPUInstPrinter::printExpSrc2(const MCInst *MI, unsigned OpNo, 924 const MCSubtargetInfo &STI, 925 raw_ostream &O) { 926 printExpSrcN<2>(MI, OpNo, STI, O); 927 } 928 929 void AMDGPUInstPrinter::printExpSrc3(const MCInst *MI, unsigned OpNo, 930 const MCSubtargetInfo &STI, 931 raw_ostream &O) { 932 printExpSrcN<3>(MI, OpNo, STI, O); 933 } 934 935 void AMDGPUInstPrinter::printExpTgt(const MCInst *MI, unsigned OpNo, 936 const MCSubtargetInfo &STI, 937 raw_ostream &O) { 938 // This is really a 6 bit field. 939 uint32_t Tgt = MI->getOperand(OpNo).getImm() & ((1 << 6) - 1); 940 941 if (Tgt <= 7) 942 O << " mrt" << Tgt; 943 else if (Tgt == 8) 944 O << " mrtz"; 945 else if (Tgt == 9) 946 O << " null"; 947 else if ((Tgt >= 12 && Tgt <= 15) || (Tgt == 16 && AMDGPU::isGFX10(STI))) 948 O << " pos" << Tgt - 12; 949 else if (AMDGPU::isGFX10(STI) && Tgt == 20) 950 O << " prim"; 951 else if (Tgt >= 32 && Tgt <= 63) 952 O << " param" << Tgt - 32; 953 else { 954 // Reserved values 10, 11 955 O << " invalid_target_" << Tgt; 956 } 957 } 958 959 static bool allOpsDefaultValue(const int* Ops, int NumOps, int Mod, 960 bool IsPacked, bool HasDstSel) { 961 int DefaultValue = IsPacked && (Mod == SISrcMods::OP_SEL_1); 962 963 for (int I = 0; I < NumOps; ++I) { 964 if (!!(Ops[I] & Mod) != DefaultValue) 965 return false; 966 } 967 968 if (HasDstSel && (Ops[0] & SISrcMods::DST_OP_SEL) != 0) 969 return false; 970 971 return true; 972 } 973 974 void AMDGPUInstPrinter::printPackedModifier(const MCInst *MI, 975 StringRef Name, 976 unsigned Mod, 977 raw_ostream &O) { 978 unsigned Opc = MI->getOpcode(); 979 int NumOps = 0; 980 int Ops[3]; 981 982 for (int OpName : { AMDGPU::OpName::src0_modifiers, 983 AMDGPU::OpName::src1_modifiers, 984 AMDGPU::OpName::src2_modifiers }) { 985 int Idx = AMDGPU::getNamedOperandIdx(Opc, OpName); 986 if (Idx == -1) 987 break; 988 989 Ops[NumOps++] = MI->getOperand(Idx).getImm(); 990 } 991 992 const bool HasDstSel = 993 NumOps > 0 && 994 Mod == SISrcMods::OP_SEL_0 && 995 MII.get(MI->getOpcode()).TSFlags & SIInstrFlags::VOP3_OPSEL; 996 997 const bool IsPacked = 998 MII.get(MI->getOpcode()).TSFlags & SIInstrFlags::IsPacked; 999 1000 if (allOpsDefaultValue(Ops, NumOps, Mod, IsPacked, HasDstSel)) 1001 return; 1002 1003 O << Name; 1004 for (int I = 0; I < NumOps; ++I) { 1005 if (I != 0) 1006 O << ','; 1007 1008 O << !!(Ops[I] & Mod); 1009 } 1010 1011 if (HasDstSel) { 1012 O << ',' << !!(Ops[0] & SISrcMods::DST_OP_SEL); 1013 } 1014 1015 O << ']'; 1016 } 1017 1018 void AMDGPUInstPrinter::printOpSel(const MCInst *MI, unsigned, 1019 const MCSubtargetInfo &STI, 1020 raw_ostream &O) { 1021 unsigned Opc = MI->getOpcode(); 1022 if (Opc == AMDGPU::V_PERMLANE16_B32_gfx10 || 1023 Opc == AMDGPU::V_PERMLANEX16_B32_gfx10) { 1024 auto FIN = AMDGPU::getNamedOperandIdx(Opc, AMDGPU::OpName::src0_modifiers); 1025 auto BCN = AMDGPU::getNamedOperandIdx(Opc, AMDGPU::OpName::src1_modifiers); 1026 unsigned FI = !!(MI->getOperand(FIN).getImm() & SISrcMods::OP_SEL_0); 1027 unsigned BC = !!(MI->getOperand(BCN).getImm() & SISrcMods::OP_SEL_0); 1028 if (FI || BC) 1029 O << " op_sel:[" << FI << ',' << BC << ']'; 1030 return; 1031 } 1032 1033 printPackedModifier(MI, " op_sel:[", SISrcMods::OP_SEL_0, O); 1034 } 1035 1036 void AMDGPUInstPrinter::printOpSelHi(const MCInst *MI, unsigned OpNo, 1037 const MCSubtargetInfo &STI, 1038 raw_ostream &O) { 1039 printPackedModifier(MI, " op_sel_hi:[", SISrcMods::OP_SEL_1, O); 1040 } 1041 1042 void AMDGPUInstPrinter::printNegLo(const MCInst *MI, unsigned OpNo, 1043 const MCSubtargetInfo &STI, 1044 raw_ostream &O) { 1045 printPackedModifier(MI, " neg_lo:[", SISrcMods::NEG, O); 1046 } 1047 1048 void AMDGPUInstPrinter::printNegHi(const MCInst *MI, unsigned OpNo, 1049 const MCSubtargetInfo &STI, 1050 raw_ostream &O) { 1051 printPackedModifier(MI, " neg_hi:[", SISrcMods::NEG_HI, O); 1052 } 1053 1054 void AMDGPUInstPrinter::printInterpSlot(const MCInst *MI, unsigned OpNum, 1055 const MCSubtargetInfo &STI, 1056 raw_ostream &O) { 1057 unsigned Imm = MI->getOperand(OpNum).getImm(); 1058 switch (Imm) { 1059 case 0: 1060 O << "p10"; 1061 break; 1062 case 1: 1063 O << "p20"; 1064 break; 1065 case 2: 1066 O << "p0"; 1067 break; 1068 default: 1069 O << "invalid_param_" << Imm; 1070 } 1071 } 1072 1073 void AMDGPUInstPrinter::printInterpAttr(const MCInst *MI, unsigned OpNum, 1074 const MCSubtargetInfo &STI, 1075 raw_ostream &O) { 1076 unsigned Attr = MI->getOperand(OpNum).getImm(); 1077 O << "attr" << Attr; 1078 } 1079 1080 void AMDGPUInstPrinter::printInterpAttrChan(const MCInst *MI, unsigned OpNum, 1081 const MCSubtargetInfo &STI, 1082 raw_ostream &O) { 1083 unsigned Chan = MI->getOperand(OpNum).getImm(); 1084 O << '.' << "xyzw"[Chan & 0x3]; 1085 } 1086 1087 void AMDGPUInstPrinter::printVGPRIndexMode(const MCInst *MI, unsigned OpNo, 1088 const MCSubtargetInfo &STI, 1089 raw_ostream &O) { 1090 using namespace llvm::AMDGPU::VGPRIndexMode; 1091 unsigned Val = MI->getOperand(OpNo).getImm(); 1092 1093 if ((Val & ~ENABLE_MASK) != 0) { 1094 O << " " << formatHex(static_cast<uint64_t>(Val)); 1095 } else { 1096 O << " gpr_idx("; 1097 bool NeedComma = false; 1098 for (unsigned ModeId = ID_MIN; ModeId <= ID_MAX; ++ModeId) { 1099 if (Val & (1 << ModeId)) { 1100 if (NeedComma) 1101 O << ','; 1102 O << IdSymbolic[ModeId]; 1103 NeedComma = true; 1104 } 1105 } 1106 O << ')'; 1107 } 1108 } 1109 1110 void AMDGPUInstPrinter::printMemOperand(const MCInst *MI, unsigned OpNo, 1111 const MCSubtargetInfo &STI, 1112 raw_ostream &O) { 1113 printOperand(MI, OpNo, STI, O); 1114 O << ", "; 1115 printOperand(MI, OpNo + 1, STI, O); 1116 } 1117 1118 void AMDGPUInstPrinter::printIfSet(const MCInst *MI, unsigned OpNo, 1119 raw_ostream &O, StringRef Asm, 1120 StringRef Default) { 1121 const MCOperand &Op = MI->getOperand(OpNo); 1122 assert(Op.isImm()); 1123 if (Op.getImm() == 1) { 1124 O << Asm; 1125 } else { 1126 O << Default; 1127 } 1128 } 1129 1130 void AMDGPUInstPrinter::printIfSet(const MCInst *MI, unsigned OpNo, 1131 raw_ostream &O, char Asm) { 1132 const MCOperand &Op = MI->getOperand(OpNo); 1133 assert(Op.isImm()); 1134 if (Op.getImm() == 1) 1135 O << Asm; 1136 } 1137 1138 void AMDGPUInstPrinter::printHigh(const MCInst *MI, unsigned OpNo, 1139 const MCSubtargetInfo &STI, 1140 raw_ostream &O) { 1141 if (MI->getOperand(OpNo).getImm()) 1142 O << " high"; 1143 } 1144 1145 void AMDGPUInstPrinter::printClampSI(const MCInst *MI, unsigned OpNo, 1146 const MCSubtargetInfo &STI, 1147 raw_ostream &O) { 1148 if (MI->getOperand(OpNo).getImm()) 1149 O << " clamp"; 1150 } 1151 1152 void AMDGPUInstPrinter::printOModSI(const MCInst *MI, unsigned OpNo, 1153 const MCSubtargetInfo &STI, 1154 raw_ostream &O) { 1155 int Imm = MI->getOperand(OpNo).getImm(); 1156 if (Imm == SIOutMods::MUL2) 1157 O << " mul:2"; 1158 else if (Imm == SIOutMods::MUL4) 1159 O << " mul:4"; 1160 else if (Imm == SIOutMods::DIV2) 1161 O << " div:2"; 1162 } 1163 1164 void AMDGPUInstPrinter::printSendMsg(const MCInst *MI, unsigned OpNo, 1165 const MCSubtargetInfo &STI, 1166 raw_ostream &O) { 1167 using namespace llvm::AMDGPU::SendMsg; 1168 1169 const unsigned Imm16 = MI->getOperand(OpNo).getImm(); 1170 1171 uint16_t MsgId; 1172 uint16_t OpId; 1173 uint16_t StreamId; 1174 decodeMsg(Imm16, MsgId, OpId, StreamId); 1175 1176 if (isValidMsgId(MsgId, STI) && 1177 isValidMsgOp(MsgId, OpId) && 1178 isValidMsgStream(MsgId, OpId, StreamId)) { 1179 O << "sendmsg(" << getMsgName(MsgId); 1180 if (msgRequiresOp(MsgId)) { 1181 O << ", " << getMsgOpName(MsgId, OpId); 1182 if (msgSupportsStream(MsgId, OpId)) { 1183 O << ", " << StreamId; 1184 } 1185 } 1186 O << ')'; 1187 } else if (encodeMsg(MsgId, OpId, StreamId) == Imm16) { 1188 O << "sendmsg(" << MsgId << ", " << OpId << ", " << StreamId << ')'; 1189 } else { 1190 O << Imm16; // Unknown imm16 code. 1191 } 1192 } 1193 1194 static void printSwizzleBitmask(const uint16_t AndMask, 1195 const uint16_t OrMask, 1196 const uint16_t XorMask, 1197 raw_ostream &O) { 1198 using namespace llvm::AMDGPU::Swizzle; 1199 1200 uint16_t Probe0 = ((0 & AndMask) | OrMask) ^ XorMask; 1201 uint16_t Probe1 = ((BITMASK_MASK & AndMask) | OrMask) ^ XorMask; 1202 1203 O << "\""; 1204 1205 for (unsigned Mask = 1 << (BITMASK_WIDTH - 1); Mask > 0; Mask >>= 1) { 1206 uint16_t p0 = Probe0 & Mask; 1207 uint16_t p1 = Probe1 & Mask; 1208 1209 if (p0 == p1) { 1210 if (p0 == 0) { 1211 O << "0"; 1212 } else { 1213 O << "1"; 1214 } 1215 } else { 1216 if (p0 == 0) { 1217 O << "p"; 1218 } else { 1219 O << "i"; 1220 } 1221 } 1222 } 1223 1224 O << "\""; 1225 } 1226 1227 void AMDGPUInstPrinter::printSwizzle(const MCInst *MI, unsigned OpNo, 1228 const MCSubtargetInfo &STI, 1229 raw_ostream &O) { 1230 using namespace llvm::AMDGPU::Swizzle; 1231 1232 uint16_t Imm = MI->getOperand(OpNo).getImm(); 1233 if (Imm == 0) { 1234 return; 1235 } 1236 1237 O << " offset:"; 1238 1239 if ((Imm & QUAD_PERM_ENC_MASK) == QUAD_PERM_ENC) { 1240 1241 O << "swizzle(" << IdSymbolic[ID_QUAD_PERM]; 1242 for (unsigned I = 0; I < LANE_NUM; ++I) { 1243 O << ","; 1244 O << formatDec(Imm & LANE_MASK); 1245 Imm >>= LANE_SHIFT; 1246 } 1247 O << ")"; 1248 1249 } else if ((Imm & BITMASK_PERM_ENC_MASK) == BITMASK_PERM_ENC) { 1250 1251 uint16_t AndMask = (Imm >> BITMASK_AND_SHIFT) & BITMASK_MASK; 1252 uint16_t OrMask = (Imm >> BITMASK_OR_SHIFT) & BITMASK_MASK; 1253 uint16_t XorMask = (Imm >> BITMASK_XOR_SHIFT) & BITMASK_MASK; 1254 1255 if (AndMask == BITMASK_MAX && 1256 OrMask == 0 && 1257 countPopulation(XorMask) == 1) { 1258 1259 O << "swizzle(" << IdSymbolic[ID_SWAP]; 1260 O << ","; 1261 O << formatDec(XorMask); 1262 O << ")"; 1263 1264 } else if (AndMask == BITMASK_MAX && 1265 OrMask == 0 && XorMask > 0 && 1266 isPowerOf2_64(XorMask + 1)) { 1267 1268 O << "swizzle(" << IdSymbolic[ID_REVERSE]; 1269 O << ","; 1270 O << formatDec(XorMask + 1); 1271 O << ")"; 1272 1273 } else { 1274 1275 uint16_t GroupSize = BITMASK_MAX - AndMask + 1; 1276 if (GroupSize > 1 && 1277 isPowerOf2_64(GroupSize) && 1278 OrMask < GroupSize && 1279 XorMask == 0) { 1280 1281 O << "swizzle(" << IdSymbolic[ID_BROADCAST]; 1282 O << ","; 1283 O << formatDec(GroupSize); 1284 O << ","; 1285 O << formatDec(OrMask); 1286 O << ")"; 1287 1288 } else { 1289 O << "swizzle(" << IdSymbolic[ID_BITMASK_PERM]; 1290 O << ","; 1291 printSwizzleBitmask(AndMask, OrMask, XorMask, O); 1292 O << ")"; 1293 } 1294 } 1295 } else { 1296 printU16ImmDecOperand(MI, OpNo, O); 1297 } 1298 } 1299 1300 void AMDGPUInstPrinter::printWaitFlag(const MCInst *MI, unsigned OpNo, 1301 const MCSubtargetInfo &STI, 1302 raw_ostream &O) { 1303 AMDGPU::IsaVersion ISA = AMDGPU::getIsaVersion(STI.getCPU()); 1304 1305 unsigned SImm16 = MI->getOperand(OpNo).getImm(); 1306 unsigned Vmcnt, Expcnt, Lgkmcnt; 1307 decodeWaitcnt(ISA, SImm16, Vmcnt, Expcnt, Lgkmcnt); 1308 1309 bool NeedSpace = false; 1310 1311 if (Vmcnt != getVmcntBitMask(ISA)) { 1312 O << "vmcnt(" << Vmcnt << ')'; 1313 NeedSpace = true; 1314 } 1315 1316 if (Expcnt != getExpcntBitMask(ISA)) { 1317 if (NeedSpace) 1318 O << ' '; 1319 O << "expcnt(" << Expcnt << ')'; 1320 NeedSpace = true; 1321 } 1322 1323 if (Lgkmcnt != getLgkmcntBitMask(ISA)) { 1324 if (NeedSpace) 1325 O << ' '; 1326 O << "lgkmcnt(" << Lgkmcnt << ')'; 1327 } 1328 } 1329 1330 void AMDGPUInstPrinter::printHwreg(const MCInst *MI, unsigned OpNo, 1331 const MCSubtargetInfo &STI, raw_ostream &O) { 1332 unsigned Id; 1333 unsigned Offset; 1334 unsigned Width; 1335 1336 using namespace llvm::AMDGPU::Hwreg; 1337 unsigned Val = MI->getOperand(OpNo).getImm(); 1338 decodeHwreg(Val, Id, Offset, Width); 1339 StringRef HwRegName = getHwreg(Id, STI); 1340 1341 O << "hwreg("; 1342 if (!HwRegName.empty()) { 1343 O << HwRegName; 1344 } else { 1345 O << Id; 1346 } 1347 if (Width != WIDTH_DEFAULT_ || Offset != OFFSET_DEFAULT_) { 1348 O << ", " << Offset << ", " << Width; 1349 } 1350 O << ')'; 1351 } 1352 1353 void AMDGPUInstPrinter::printEndpgm(const MCInst *MI, unsigned OpNo, 1354 const MCSubtargetInfo &STI, 1355 raw_ostream &O) { 1356 uint16_t Imm = MI->getOperand(OpNo).getImm(); 1357 if (Imm == 0) { 1358 return; 1359 } 1360 1361 O << ' ' << formatDec(Imm); 1362 } 1363 1364 #include "AMDGPUGenAsmWriter.inc" 1365 1366 void R600InstPrinter::printInst(const MCInst *MI, uint64_t Address, 1367 StringRef Annot, const MCSubtargetInfo &STI, 1368 raw_ostream &O) { 1369 O.flush(); 1370 printInstruction(MI, Address, O); 1371 printAnnotation(O, Annot); 1372 } 1373 1374 void R600InstPrinter::printAbs(const MCInst *MI, unsigned OpNo, 1375 raw_ostream &O) { 1376 AMDGPUInstPrinter::printIfSet(MI, OpNo, O, '|'); 1377 } 1378 1379 void R600InstPrinter::printBankSwizzle(const MCInst *MI, unsigned OpNo, 1380 raw_ostream &O) { 1381 int BankSwizzle = MI->getOperand(OpNo).getImm(); 1382 switch (BankSwizzle) { 1383 case 1: 1384 O << "BS:VEC_021/SCL_122"; 1385 break; 1386 case 2: 1387 O << "BS:VEC_120/SCL_212"; 1388 break; 1389 case 3: 1390 O << "BS:VEC_102/SCL_221"; 1391 break; 1392 case 4: 1393 O << "BS:VEC_201"; 1394 break; 1395 case 5: 1396 O << "BS:VEC_210"; 1397 break; 1398 default: 1399 break; 1400 } 1401 } 1402 1403 void R600InstPrinter::printClamp(const MCInst *MI, unsigned OpNo, 1404 raw_ostream &O) { 1405 AMDGPUInstPrinter::printIfSet(MI, OpNo, O, "_SAT"); 1406 } 1407 1408 void R600InstPrinter::printCT(const MCInst *MI, unsigned OpNo, 1409 raw_ostream &O) { 1410 unsigned CT = MI->getOperand(OpNo).getImm(); 1411 switch (CT) { 1412 case 0: 1413 O << 'U'; 1414 break; 1415 case 1: 1416 O << 'N'; 1417 break; 1418 default: 1419 break; 1420 } 1421 } 1422 1423 void R600InstPrinter::printKCache(const MCInst *MI, unsigned OpNo, 1424 raw_ostream &O) { 1425 int KCacheMode = MI->getOperand(OpNo).getImm(); 1426 if (KCacheMode > 0) { 1427 int KCacheBank = MI->getOperand(OpNo - 2).getImm(); 1428 O << "CB" << KCacheBank << ':'; 1429 int KCacheAddr = MI->getOperand(OpNo + 2).getImm(); 1430 int LineSize = (KCacheMode == 1) ? 16 : 32; 1431 O << KCacheAddr * 16 << '-' << KCacheAddr * 16 + LineSize; 1432 } 1433 } 1434 1435 void R600InstPrinter::printLast(const MCInst *MI, unsigned OpNo, 1436 raw_ostream &O) { 1437 AMDGPUInstPrinter::printIfSet(MI, OpNo, O, "*", " "); 1438 } 1439 1440 void R600InstPrinter::printLiteral(const MCInst *MI, unsigned OpNo, 1441 raw_ostream &O) { 1442 const MCOperand &Op = MI->getOperand(OpNo); 1443 assert(Op.isImm() || Op.isExpr()); 1444 if (Op.isImm()) { 1445 int64_t Imm = Op.getImm(); 1446 O << Imm << '(' << BitsToFloat(Imm) << ')'; 1447 } 1448 if (Op.isExpr()) { 1449 Op.getExpr()->print(O << '@', &MAI); 1450 } 1451 } 1452 1453 void R600InstPrinter::printNeg(const MCInst *MI, unsigned OpNo, 1454 raw_ostream &O) { 1455 AMDGPUInstPrinter::printIfSet(MI, OpNo, O, '-'); 1456 } 1457 1458 void R600InstPrinter::printOMOD(const MCInst *MI, unsigned OpNo, 1459 raw_ostream &O) { 1460 switch (MI->getOperand(OpNo).getImm()) { 1461 default: break; 1462 case 1: 1463 O << " * 2.0"; 1464 break; 1465 case 2: 1466 O << " * 4.0"; 1467 break; 1468 case 3: 1469 O << " / 2.0"; 1470 break; 1471 } 1472 } 1473 1474 void R600InstPrinter::printMemOperand(const MCInst *MI, unsigned OpNo, 1475 raw_ostream &O) { 1476 printOperand(MI, OpNo, O); 1477 O << ", "; 1478 printOperand(MI, OpNo + 1, O); 1479 } 1480 1481 void R600InstPrinter::printOperand(const MCInst *MI, unsigned OpNo, 1482 raw_ostream &O) { 1483 if (OpNo >= MI->getNumOperands()) { 1484 O << "/*Missing OP" << OpNo << "*/"; 1485 return; 1486 } 1487 1488 const MCOperand &Op = MI->getOperand(OpNo); 1489 if (Op.isReg()) { 1490 switch (Op.getReg()) { 1491 // This is the default predicate state, so we don't need to print it. 1492 case R600::PRED_SEL_OFF: 1493 break; 1494 1495 default: 1496 O << getRegisterName(Op.getReg()); 1497 break; 1498 } 1499 } else if (Op.isImm()) { 1500 O << Op.getImm(); 1501 } else if (Op.isFPImm()) { 1502 // We special case 0.0 because otherwise it will be printed as an integer. 1503 if (Op.getFPImm() == 0.0) 1504 O << "0.0"; 1505 else { 1506 O << Op.getFPImm(); 1507 } 1508 } else if (Op.isExpr()) { 1509 const MCExpr *Exp = Op.getExpr(); 1510 Exp->print(O, &MAI); 1511 } else { 1512 O << "/*INV_OP*/"; 1513 } 1514 } 1515 1516 void R600InstPrinter::printRel(const MCInst *MI, unsigned OpNo, 1517 raw_ostream &O) { 1518 AMDGPUInstPrinter::printIfSet(MI, OpNo, O, '+'); 1519 } 1520 1521 void R600InstPrinter::printRSel(const MCInst *MI, unsigned OpNo, 1522 raw_ostream &O) { 1523 unsigned Sel = MI->getOperand(OpNo).getImm(); 1524 switch (Sel) { 1525 case 0: 1526 O << 'X'; 1527 break; 1528 case 1: 1529 O << 'Y'; 1530 break; 1531 case 2: 1532 O << 'Z'; 1533 break; 1534 case 3: 1535 O << 'W'; 1536 break; 1537 case 4: 1538 O << '0'; 1539 break; 1540 case 5: 1541 O << '1'; 1542 break; 1543 case 7: 1544 O << '_'; 1545 break; 1546 default: 1547 break; 1548 } 1549 } 1550 1551 void R600InstPrinter::printUpdateExecMask(const MCInst *MI, unsigned OpNo, 1552 raw_ostream &O) { 1553 AMDGPUInstPrinter::printIfSet(MI, OpNo, O, "ExecMask,"); 1554 } 1555 1556 void R600InstPrinter::printUpdatePred(const MCInst *MI, unsigned OpNo, 1557 raw_ostream &O) { 1558 AMDGPUInstPrinter::printIfSet(MI, OpNo, O, "Pred,"); 1559 } 1560 1561 void R600InstPrinter::printWrite(const MCInst *MI, unsigned OpNo, 1562 raw_ostream &O) { 1563 const MCOperand &Op = MI->getOperand(OpNo); 1564 if (Op.getImm() == 0) { 1565 O << " (MASKED)"; 1566 } 1567 } 1568 1569 #include "R600GenAsmWriter.inc" 1570