1 //===-- MipsFastISel.cpp - Mips FastISel implementation --------------------===// 2 // 3 // The LLVM Compiler Infrastructure 4 // 5 // This file is distributed under the University of Illinois Open Source 6 // License. See LICENSE.TXT for details. 7 // 8 //===----------------------------------------------------------------------===// 9 /// 10 /// \file 11 /// \brief This file defines the MIPS-specific support for the FastISel class. 12 /// Some of the target-specific code is generated by tablegen in the file 13 /// MipsGenFastISel.inc, which is #included here. 14 /// 15 //===----------------------------------------------------------------------===// 16 17 #include "MipsCCState.h" 18 #include "MipsInstrInfo.h" 19 #include "MipsISelLowering.h" 20 #include "MipsMachineFunction.h" 21 #include "MipsRegisterInfo.h" 22 #include "MipsSubtarget.h" 23 #include "MipsTargetMachine.h" 24 #include "llvm/Analysis/TargetLibraryInfo.h" 25 #include "llvm/CodeGen/FastISel.h" 26 #include "llvm/CodeGen/FunctionLoweringInfo.h" 27 #include "llvm/CodeGen/MachineInstrBuilder.h" 28 #include "llvm/CodeGen/MachineRegisterInfo.h" 29 #include "llvm/IR/GetElementPtrTypeIterator.h" 30 #include "llvm/IR/GlobalAlias.h" 31 #include "llvm/IR/GlobalVariable.h" 32 #include "llvm/MC/MCSymbol.h" 33 #include "llvm/Target/TargetInstrInfo.h" 34 #include "llvm/Support/Debug.h" 35 36 #define DEBUG_TYPE "mips-fastisel" 37 38 using namespace llvm; 39 40 namespace { 41 42 class MipsFastISel final : public FastISel { 43 44 // All possible address modes. 45 class Address { 46 public: 47 typedef enum { RegBase, FrameIndexBase } BaseKind; 48 49 private: 50 BaseKind Kind; 51 union { 52 unsigned Reg; 53 int FI; 54 } Base; 55 56 int64_t Offset; 57 58 const GlobalValue *GV; 59 60 public: 61 // Innocuous defaults for our address. 62 Address() : Kind(RegBase), Offset(0), GV(0) { Base.Reg = 0; } 63 void setKind(BaseKind K) { Kind = K; } 64 BaseKind getKind() const { return Kind; } 65 bool isRegBase() const { return Kind == RegBase; } 66 bool isFIBase() const { return Kind == FrameIndexBase; } 67 void setReg(unsigned Reg) { 68 assert(isRegBase() && "Invalid base register access!"); 69 Base.Reg = Reg; 70 } 71 unsigned getReg() const { 72 assert(isRegBase() && "Invalid base register access!"); 73 return Base.Reg; 74 } 75 void setFI(unsigned FI) { 76 assert(isFIBase() && "Invalid base frame index access!"); 77 Base.FI = FI; 78 } 79 unsigned getFI() const { 80 assert(isFIBase() && "Invalid base frame index access!"); 81 return Base.FI; 82 } 83 84 void setOffset(int64_t Offset_) { Offset = Offset_; } 85 int64_t getOffset() const { return Offset; } 86 void setGlobalValue(const GlobalValue *G) { GV = G; } 87 const GlobalValue *getGlobalValue() { return GV; } 88 }; 89 90 /// Subtarget - Keep a pointer to the MipsSubtarget around so that we can 91 /// make the right decision when generating code for different targets. 92 const TargetMachine &TM; 93 const MipsSubtarget *Subtarget; 94 const TargetInstrInfo &TII; 95 const TargetLowering &TLI; 96 MipsFunctionInfo *MFI; 97 98 // Convenience variables to avoid some queries. 99 LLVMContext *Context; 100 101 bool fastLowerArguments() override; 102 bool fastLowerCall(CallLoweringInfo &CLI) override; 103 bool fastLowerIntrinsicCall(const IntrinsicInst *II) override; 104 105 bool TargetSupported; 106 bool UnsupportedFPMode; // To allow fast-isel to proceed and just not handle 107 // floating point but not reject doing fast-isel in other 108 // situations 109 110 private: 111 // Selection routines. 112 bool selectLogicalOp(const Instruction *I); 113 bool selectLoad(const Instruction *I); 114 bool selectStore(const Instruction *I); 115 bool selectBranch(const Instruction *I); 116 bool selectSelect(const Instruction *I); 117 bool selectCmp(const Instruction *I); 118 bool selectFPExt(const Instruction *I); 119 bool selectFPTrunc(const Instruction *I); 120 bool selectFPToInt(const Instruction *I, bool IsSigned); 121 bool selectRet(const Instruction *I); 122 bool selectTrunc(const Instruction *I); 123 bool selectIntExt(const Instruction *I); 124 bool selectShift(const Instruction *I); 125 bool selectDivRem(const Instruction *I, unsigned ISDOpcode); 126 127 // Utility helper routines. 128 bool isTypeLegal(Type *Ty, MVT &VT); 129 bool isTypeSupported(Type *Ty, MVT &VT); 130 bool isLoadTypeLegal(Type *Ty, MVT &VT); 131 bool computeAddress(const Value *Obj, Address &Addr); 132 bool computeCallAddress(const Value *V, Address &Addr); 133 void simplifyAddress(Address &Addr); 134 135 // Emit helper routines. 136 bool emitCmp(unsigned DestReg, const CmpInst *CI); 137 bool emitLoad(MVT VT, unsigned &ResultReg, Address &Addr, 138 unsigned Alignment = 0); 139 bool emitStore(MVT VT, unsigned SrcReg, Address Addr, 140 MachineMemOperand *MMO = nullptr); 141 bool emitStore(MVT VT, unsigned SrcReg, Address &Addr, 142 unsigned Alignment = 0); 143 unsigned emitIntExt(MVT SrcVT, unsigned SrcReg, MVT DestVT, bool isZExt); 144 bool emitIntExt(MVT SrcVT, unsigned SrcReg, MVT DestVT, unsigned DestReg, 145 146 bool IsZExt); 147 bool emitIntZExt(MVT SrcVT, unsigned SrcReg, MVT DestVT, unsigned DestReg); 148 149 bool emitIntSExt(MVT SrcVT, unsigned SrcReg, MVT DestVT, unsigned DestReg); 150 bool emitIntSExt32r1(MVT SrcVT, unsigned SrcReg, MVT DestVT, 151 unsigned DestReg); 152 bool emitIntSExt32r2(MVT SrcVT, unsigned SrcReg, MVT DestVT, 153 unsigned DestReg); 154 155 unsigned getRegEnsuringSimpleIntegerWidening(const Value *, bool IsUnsigned); 156 157 unsigned emitLogicalOp(unsigned ISDOpc, MVT RetVT, const Value *LHS, 158 const Value *RHS); 159 160 unsigned materializeFP(const ConstantFP *CFP, MVT VT); 161 unsigned materializeGV(const GlobalValue *GV, MVT VT); 162 unsigned materializeInt(const Constant *C, MVT VT); 163 unsigned materialize32BitInt(int64_t Imm, const TargetRegisterClass *RC); 164 unsigned materializeExternalCallSym(MCSymbol *Syn); 165 166 MachineInstrBuilder emitInst(unsigned Opc) { 167 return BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DbgLoc, TII.get(Opc)); 168 } 169 MachineInstrBuilder emitInst(unsigned Opc, unsigned DstReg) { 170 return BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DbgLoc, TII.get(Opc), 171 DstReg); 172 } 173 MachineInstrBuilder emitInstStore(unsigned Opc, unsigned SrcReg, 174 unsigned MemReg, int64_t MemOffset) { 175 return emitInst(Opc).addReg(SrcReg).addReg(MemReg).addImm(MemOffset); 176 } 177 MachineInstrBuilder emitInstLoad(unsigned Opc, unsigned DstReg, 178 unsigned MemReg, int64_t MemOffset) { 179 return emitInst(Opc, DstReg).addReg(MemReg).addImm(MemOffset); 180 } 181 182 unsigned fastEmitInst_rr(unsigned MachineInstOpcode, 183 const TargetRegisterClass *RC, 184 unsigned Op0, bool Op0IsKill, 185 unsigned Op1, bool Op1IsKill); 186 187 // for some reason, this default is not generated by tablegen 188 // so we explicitly generate it here. 189 // 190 unsigned fastEmitInst_riir(uint64_t inst, const TargetRegisterClass *RC, 191 unsigned Op0, bool Op0IsKill, uint64_t imm1, 192 uint64_t imm2, unsigned Op3, bool Op3IsKill) { 193 return 0; 194 } 195 196 // Call handling routines. 197 private: 198 CCAssignFn *CCAssignFnForCall(CallingConv::ID CC) const; 199 bool processCallArgs(CallLoweringInfo &CLI, SmallVectorImpl<MVT> &ArgVTs, 200 unsigned &NumBytes); 201 bool finishCall(CallLoweringInfo &CLI, MVT RetVT, unsigned NumBytes); 202 const MipsABIInfo &getABI() const { 203 return static_cast<const MipsTargetMachine &>(TM).getABI(); 204 } 205 206 public: 207 // Backend specific FastISel code. 208 explicit MipsFastISel(FunctionLoweringInfo &funcInfo, 209 const TargetLibraryInfo *libInfo) 210 : FastISel(funcInfo, libInfo), TM(funcInfo.MF->getTarget()), 211 Subtarget(&funcInfo.MF->getSubtarget<MipsSubtarget>()), 212 TII(*Subtarget->getInstrInfo()), TLI(*Subtarget->getTargetLowering()) { 213 MFI = funcInfo.MF->getInfo<MipsFunctionInfo>(); 214 Context = &funcInfo.Fn->getContext(); 215 bool ISASupported = !Subtarget->hasMips32r6() && 216 !Subtarget->inMicroMipsMode() && Subtarget->hasMips32(); 217 TargetSupported = 218 ISASupported && TM.isPositionIndependent() && getABI().IsO32(); 219 UnsupportedFPMode = Subtarget->isFP64bit(); 220 } 221 222 unsigned fastMaterializeAlloca(const AllocaInst *AI) override; 223 unsigned fastMaterializeConstant(const Constant *C) override; 224 bool fastSelectInstruction(const Instruction *I) override; 225 226 #include "MipsGenFastISel.inc" 227 }; 228 } // end anonymous namespace. 229 230 static bool CC_Mips(unsigned ValNo, MVT ValVT, MVT LocVT, 231 CCValAssign::LocInfo LocInfo, ISD::ArgFlagsTy ArgFlags, 232 CCState &State) LLVM_ATTRIBUTE_UNUSED; 233 234 static bool CC_MipsO32_FP32(unsigned ValNo, MVT ValVT, MVT LocVT, 235 CCValAssign::LocInfo LocInfo, 236 ISD::ArgFlagsTy ArgFlags, CCState &State) { 237 llvm_unreachable("should not be called"); 238 } 239 240 static bool CC_MipsO32_FP64(unsigned ValNo, MVT ValVT, MVT LocVT, 241 CCValAssign::LocInfo LocInfo, 242 ISD::ArgFlagsTy ArgFlags, CCState &State) { 243 llvm_unreachable("should not be called"); 244 } 245 246 #include "MipsGenCallingConv.inc" 247 248 CCAssignFn *MipsFastISel::CCAssignFnForCall(CallingConv::ID CC) const { 249 return CC_MipsO32; 250 } 251 252 unsigned MipsFastISel::emitLogicalOp(unsigned ISDOpc, MVT RetVT, 253 const Value *LHS, const Value *RHS) { 254 // Canonicalize immediates to the RHS first. 255 if (isa<ConstantInt>(LHS) && !isa<ConstantInt>(RHS)) 256 std::swap(LHS, RHS); 257 258 unsigned Opc; 259 switch (ISDOpc) { 260 case ISD::AND: 261 Opc = Mips::AND; 262 break; 263 case ISD::OR: 264 Opc = Mips::OR; 265 break; 266 case ISD::XOR: 267 Opc = Mips::XOR; 268 break; 269 default: 270 llvm_unreachable("unexpected opcode"); 271 } 272 273 unsigned LHSReg = getRegForValue(LHS); 274 if (!LHSReg) 275 return 0; 276 277 unsigned RHSReg; 278 if (const auto *C = dyn_cast<ConstantInt>(RHS)) 279 RHSReg = materializeInt(C, MVT::i32); 280 else 281 RHSReg = getRegForValue(RHS); 282 if (!RHSReg) 283 return 0; 284 285 unsigned ResultReg = createResultReg(&Mips::GPR32RegClass); 286 if (!ResultReg) 287 return 0; 288 289 emitInst(Opc, ResultReg).addReg(LHSReg).addReg(RHSReg); 290 return ResultReg; 291 } 292 293 unsigned MipsFastISel::fastMaterializeAlloca(const AllocaInst *AI) { 294 if (!TargetSupported) 295 return 0; 296 297 assert(TLI.getValueType(DL, AI->getType(), true) == MVT::i32 && 298 "Alloca should always return a pointer."); 299 300 DenseMap<const AllocaInst *, int>::iterator SI = 301 FuncInfo.StaticAllocaMap.find(AI); 302 303 if (SI != FuncInfo.StaticAllocaMap.end()) { 304 unsigned ResultReg = createResultReg(&Mips::GPR32RegClass); 305 BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DbgLoc, TII.get(Mips::LEA_ADDiu), 306 ResultReg) 307 .addFrameIndex(SI->second) 308 .addImm(0); 309 return ResultReg; 310 } 311 312 return 0; 313 } 314 315 unsigned MipsFastISel::materializeInt(const Constant *C, MVT VT) { 316 if (VT != MVT::i32 && VT != MVT::i16 && VT != MVT::i8 && VT != MVT::i1) 317 return 0; 318 const TargetRegisterClass *RC = &Mips::GPR32RegClass; 319 const ConstantInt *CI = cast<ConstantInt>(C); 320 return materialize32BitInt(CI->getZExtValue(), RC); 321 } 322 323 unsigned MipsFastISel::materialize32BitInt(int64_t Imm, 324 const TargetRegisterClass *RC) { 325 unsigned ResultReg = createResultReg(RC); 326 327 if (isInt<16>(Imm)) { 328 unsigned Opc = Mips::ADDiu; 329 emitInst(Opc, ResultReg).addReg(Mips::ZERO).addImm(Imm); 330 return ResultReg; 331 } else if (isUInt<16>(Imm)) { 332 emitInst(Mips::ORi, ResultReg).addReg(Mips::ZERO).addImm(Imm); 333 return ResultReg; 334 } 335 unsigned Lo = Imm & 0xFFFF; 336 unsigned Hi = (Imm >> 16) & 0xFFFF; 337 if (Lo) { 338 // Both Lo and Hi have nonzero bits. 339 unsigned TmpReg = createResultReg(RC); 340 emitInst(Mips::LUi, TmpReg).addImm(Hi); 341 emitInst(Mips::ORi, ResultReg).addReg(TmpReg).addImm(Lo); 342 } else { 343 emitInst(Mips::LUi, ResultReg).addImm(Hi); 344 } 345 return ResultReg; 346 } 347 348 unsigned MipsFastISel::materializeFP(const ConstantFP *CFP, MVT VT) { 349 if (UnsupportedFPMode) 350 return 0; 351 int64_t Imm = CFP->getValueAPF().bitcastToAPInt().getZExtValue(); 352 if (VT == MVT::f32) { 353 const TargetRegisterClass *RC = &Mips::FGR32RegClass; 354 unsigned DestReg = createResultReg(RC); 355 unsigned TempReg = materialize32BitInt(Imm, &Mips::GPR32RegClass); 356 emitInst(Mips::MTC1, DestReg).addReg(TempReg); 357 return DestReg; 358 } else if (VT == MVT::f64) { 359 const TargetRegisterClass *RC = &Mips::AFGR64RegClass; 360 unsigned DestReg = createResultReg(RC); 361 unsigned TempReg1 = materialize32BitInt(Imm >> 32, &Mips::GPR32RegClass); 362 unsigned TempReg2 = 363 materialize32BitInt(Imm & 0xFFFFFFFF, &Mips::GPR32RegClass); 364 emitInst(Mips::BuildPairF64, DestReg).addReg(TempReg2).addReg(TempReg1); 365 return DestReg; 366 } 367 return 0; 368 } 369 370 unsigned MipsFastISel::materializeGV(const GlobalValue *GV, MVT VT) { 371 // For now 32-bit only. 372 if (VT != MVT::i32) 373 return 0; 374 const TargetRegisterClass *RC = &Mips::GPR32RegClass; 375 unsigned DestReg = createResultReg(RC); 376 const GlobalVariable *GVar = dyn_cast<GlobalVariable>(GV); 377 bool IsThreadLocal = GVar && GVar->isThreadLocal(); 378 // TLS not supported at this time. 379 if (IsThreadLocal) 380 return 0; 381 emitInst(Mips::LW, DestReg) 382 .addReg(MFI->getGlobalBaseReg()) 383 .addGlobalAddress(GV, 0, MipsII::MO_GOT); 384 if ((GV->hasInternalLinkage() || 385 (GV->hasLocalLinkage() && !isa<Function>(GV)))) { 386 unsigned TempReg = createResultReg(RC); 387 emitInst(Mips::ADDiu, TempReg) 388 .addReg(DestReg) 389 .addGlobalAddress(GV, 0, MipsII::MO_ABS_LO); 390 DestReg = TempReg; 391 } 392 return DestReg; 393 } 394 395 unsigned MipsFastISel::materializeExternalCallSym(MCSymbol *Sym) { 396 const TargetRegisterClass *RC = &Mips::GPR32RegClass; 397 unsigned DestReg = createResultReg(RC); 398 emitInst(Mips::LW, DestReg) 399 .addReg(MFI->getGlobalBaseReg()) 400 .addSym(Sym, MipsII::MO_GOT); 401 return DestReg; 402 } 403 404 // Materialize a constant into a register, and return the register 405 // number (or zero if we failed to handle it). 406 unsigned MipsFastISel::fastMaterializeConstant(const Constant *C) { 407 if (!TargetSupported) 408 return 0; 409 410 EVT CEVT = TLI.getValueType(DL, C->getType(), true); 411 412 // Only handle simple types. 413 if (!CEVT.isSimple()) 414 return 0; 415 MVT VT = CEVT.getSimpleVT(); 416 417 if (const ConstantFP *CFP = dyn_cast<ConstantFP>(C)) 418 return (UnsupportedFPMode) ? 0 : materializeFP(CFP, VT); 419 else if (const GlobalValue *GV = dyn_cast<GlobalValue>(C)) 420 return materializeGV(GV, VT); 421 else if (isa<ConstantInt>(C)) 422 return materializeInt(C, VT); 423 424 return 0; 425 } 426 427 bool MipsFastISel::computeAddress(const Value *Obj, Address &Addr) { 428 429 const User *U = nullptr; 430 unsigned Opcode = Instruction::UserOp1; 431 if (const Instruction *I = dyn_cast<Instruction>(Obj)) { 432 // Don't walk into other basic blocks unless the object is an alloca from 433 // another block, otherwise it may not have a virtual register assigned. 434 if (FuncInfo.StaticAllocaMap.count(static_cast<const AllocaInst *>(Obj)) || 435 FuncInfo.MBBMap[I->getParent()] == FuncInfo.MBB) { 436 Opcode = I->getOpcode(); 437 U = I; 438 } 439 } else if (const ConstantExpr *C = dyn_cast<ConstantExpr>(Obj)) { 440 Opcode = C->getOpcode(); 441 U = C; 442 } 443 switch (Opcode) { 444 default: 445 break; 446 case Instruction::BitCast: { 447 // Look through bitcasts. 448 return computeAddress(U->getOperand(0), Addr); 449 } 450 case Instruction::GetElementPtr: { 451 Address SavedAddr = Addr; 452 uint64_t TmpOffset = Addr.getOffset(); 453 // Iterate through the GEP folding the constants into offsets where 454 // we can. 455 gep_type_iterator GTI = gep_type_begin(U); 456 for (User::const_op_iterator i = U->op_begin() + 1, e = U->op_end(); i != e; 457 ++i, ++GTI) { 458 const Value *Op = *i; 459 if (StructType *STy = dyn_cast<StructType>(*GTI)) { 460 const StructLayout *SL = DL.getStructLayout(STy); 461 unsigned Idx = cast<ConstantInt>(Op)->getZExtValue(); 462 TmpOffset += SL->getElementOffset(Idx); 463 } else { 464 uint64_t S = DL.getTypeAllocSize(GTI.getIndexedType()); 465 for (;;) { 466 if (const ConstantInt *CI = dyn_cast<ConstantInt>(Op)) { 467 // Constant-offset addressing. 468 TmpOffset += CI->getSExtValue() * S; 469 break; 470 } 471 if (canFoldAddIntoGEP(U, Op)) { 472 // A compatible add with a constant operand. Fold the constant. 473 ConstantInt *CI = 474 cast<ConstantInt>(cast<AddOperator>(Op)->getOperand(1)); 475 TmpOffset += CI->getSExtValue() * S; 476 // Iterate on the other operand. 477 Op = cast<AddOperator>(Op)->getOperand(0); 478 continue; 479 } 480 // Unsupported 481 goto unsupported_gep; 482 } 483 } 484 } 485 // Try to grab the base operand now. 486 Addr.setOffset(TmpOffset); 487 if (computeAddress(U->getOperand(0), Addr)) 488 return true; 489 // We failed, restore everything and try the other options. 490 Addr = SavedAddr; 491 unsupported_gep: 492 break; 493 } 494 case Instruction::Alloca: { 495 const AllocaInst *AI = cast<AllocaInst>(Obj); 496 DenseMap<const AllocaInst *, int>::iterator SI = 497 FuncInfo.StaticAllocaMap.find(AI); 498 if (SI != FuncInfo.StaticAllocaMap.end()) { 499 Addr.setKind(Address::FrameIndexBase); 500 Addr.setFI(SI->second); 501 return true; 502 } 503 break; 504 } 505 } 506 Addr.setReg(getRegForValue(Obj)); 507 return Addr.getReg() != 0; 508 } 509 510 bool MipsFastISel::computeCallAddress(const Value *V, Address &Addr) { 511 const User *U = nullptr; 512 unsigned Opcode = Instruction::UserOp1; 513 514 if (const auto *I = dyn_cast<Instruction>(V)) { 515 // Check if the value is defined in the same basic block. This information 516 // is crucial to know whether or not folding an operand is valid. 517 if (I->getParent() == FuncInfo.MBB->getBasicBlock()) { 518 Opcode = I->getOpcode(); 519 U = I; 520 } 521 } else if (const auto *C = dyn_cast<ConstantExpr>(V)) { 522 Opcode = C->getOpcode(); 523 U = C; 524 } 525 526 switch (Opcode) { 527 default: 528 break; 529 case Instruction::BitCast: 530 // Look past bitcasts if its operand is in the same BB. 531 return computeCallAddress(U->getOperand(0), Addr); 532 break; 533 case Instruction::IntToPtr: 534 // Look past no-op inttoptrs if its operand is in the same BB. 535 if (TLI.getValueType(DL, U->getOperand(0)->getType()) == 536 TLI.getPointerTy(DL)) 537 return computeCallAddress(U->getOperand(0), Addr); 538 break; 539 case Instruction::PtrToInt: 540 // Look past no-op ptrtoints if its operand is in the same BB. 541 if (TLI.getValueType(DL, U->getType()) == TLI.getPointerTy(DL)) 542 return computeCallAddress(U->getOperand(0), Addr); 543 break; 544 } 545 546 if (const GlobalValue *GV = dyn_cast<GlobalValue>(V)) { 547 Addr.setGlobalValue(GV); 548 return true; 549 } 550 551 // If all else fails, try to materialize the value in a register. 552 if (!Addr.getGlobalValue()) { 553 Addr.setReg(getRegForValue(V)); 554 return Addr.getReg() != 0; 555 } 556 557 return false; 558 } 559 560 bool MipsFastISel::isTypeLegal(Type *Ty, MVT &VT) { 561 EVT evt = TLI.getValueType(DL, Ty, true); 562 // Only handle simple types. 563 if (evt == MVT::Other || !evt.isSimple()) 564 return false; 565 VT = evt.getSimpleVT(); 566 567 // Handle all legal types, i.e. a register that will directly hold this 568 // value. 569 return TLI.isTypeLegal(VT); 570 } 571 572 bool MipsFastISel::isTypeSupported(Type *Ty, MVT &VT) { 573 if (Ty->isVectorTy()) 574 return false; 575 576 if (isTypeLegal(Ty, VT)) 577 return true; 578 579 // If this is a type than can be sign or zero-extended to a basic operation 580 // go ahead and accept it now. 581 if (VT == MVT::i1 || VT == MVT::i8 || VT == MVT::i16) 582 return true; 583 584 return false; 585 } 586 587 bool MipsFastISel::isLoadTypeLegal(Type *Ty, MVT &VT) { 588 if (isTypeLegal(Ty, VT)) 589 return true; 590 // We will extend this in a later patch: 591 // If this is a type than can be sign or zero-extended to a basic operation 592 // go ahead and accept it now. 593 if (VT == MVT::i8 || VT == MVT::i16) 594 return true; 595 return false; 596 } 597 // Because of how EmitCmp is called with fast-isel, you can 598 // end up with redundant "andi" instructions after the sequences emitted below. 599 // We should try and solve this issue in the future. 600 // 601 bool MipsFastISel::emitCmp(unsigned ResultReg, const CmpInst *CI) { 602 const Value *Left = CI->getOperand(0), *Right = CI->getOperand(1); 603 bool IsUnsigned = CI->isUnsigned(); 604 unsigned LeftReg = getRegEnsuringSimpleIntegerWidening(Left, IsUnsigned); 605 if (LeftReg == 0) 606 return false; 607 unsigned RightReg = getRegEnsuringSimpleIntegerWidening(Right, IsUnsigned); 608 if (RightReg == 0) 609 return false; 610 CmpInst::Predicate P = CI->getPredicate(); 611 612 switch (P) { 613 default: 614 return false; 615 case CmpInst::ICMP_EQ: { 616 unsigned TempReg = createResultReg(&Mips::GPR32RegClass); 617 emitInst(Mips::XOR, TempReg).addReg(LeftReg).addReg(RightReg); 618 emitInst(Mips::SLTiu, ResultReg).addReg(TempReg).addImm(1); 619 break; 620 } 621 case CmpInst::ICMP_NE: { 622 unsigned TempReg = createResultReg(&Mips::GPR32RegClass); 623 emitInst(Mips::XOR, TempReg).addReg(LeftReg).addReg(RightReg); 624 emitInst(Mips::SLTu, ResultReg).addReg(Mips::ZERO).addReg(TempReg); 625 break; 626 } 627 case CmpInst::ICMP_UGT: { 628 emitInst(Mips::SLTu, ResultReg).addReg(RightReg).addReg(LeftReg); 629 break; 630 } 631 case CmpInst::ICMP_ULT: { 632 emitInst(Mips::SLTu, ResultReg).addReg(LeftReg).addReg(RightReg); 633 break; 634 } 635 case CmpInst::ICMP_UGE: { 636 unsigned TempReg = createResultReg(&Mips::GPR32RegClass); 637 emitInst(Mips::SLTu, TempReg).addReg(LeftReg).addReg(RightReg); 638 emitInst(Mips::XORi, ResultReg).addReg(TempReg).addImm(1); 639 break; 640 } 641 case CmpInst::ICMP_ULE: { 642 unsigned TempReg = createResultReg(&Mips::GPR32RegClass); 643 emitInst(Mips::SLTu, TempReg).addReg(RightReg).addReg(LeftReg); 644 emitInst(Mips::XORi, ResultReg).addReg(TempReg).addImm(1); 645 break; 646 } 647 case CmpInst::ICMP_SGT: { 648 emitInst(Mips::SLT, ResultReg).addReg(RightReg).addReg(LeftReg); 649 break; 650 } 651 case CmpInst::ICMP_SLT: { 652 emitInst(Mips::SLT, ResultReg).addReg(LeftReg).addReg(RightReg); 653 break; 654 } 655 case CmpInst::ICMP_SGE: { 656 unsigned TempReg = createResultReg(&Mips::GPR32RegClass); 657 emitInst(Mips::SLT, TempReg).addReg(LeftReg).addReg(RightReg); 658 emitInst(Mips::XORi, ResultReg).addReg(TempReg).addImm(1); 659 break; 660 } 661 case CmpInst::ICMP_SLE: { 662 unsigned TempReg = createResultReg(&Mips::GPR32RegClass); 663 emitInst(Mips::SLT, TempReg).addReg(RightReg).addReg(LeftReg); 664 emitInst(Mips::XORi, ResultReg).addReg(TempReg).addImm(1); 665 break; 666 } 667 case CmpInst::FCMP_OEQ: 668 case CmpInst::FCMP_UNE: 669 case CmpInst::FCMP_OLT: 670 case CmpInst::FCMP_OLE: 671 case CmpInst::FCMP_OGT: 672 case CmpInst::FCMP_OGE: { 673 if (UnsupportedFPMode) 674 return false; 675 bool IsFloat = Left->getType()->isFloatTy(); 676 bool IsDouble = Left->getType()->isDoubleTy(); 677 if (!IsFloat && !IsDouble) 678 return false; 679 unsigned Opc, CondMovOpc; 680 switch (P) { 681 case CmpInst::FCMP_OEQ: 682 Opc = IsFloat ? Mips::C_EQ_S : Mips::C_EQ_D32; 683 CondMovOpc = Mips::MOVT_I; 684 break; 685 case CmpInst::FCMP_UNE: 686 Opc = IsFloat ? Mips::C_EQ_S : Mips::C_EQ_D32; 687 CondMovOpc = Mips::MOVF_I; 688 break; 689 case CmpInst::FCMP_OLT: 690 Opc = IsFloat ? Mips::C_OLT_S : Mips::C_OLT_D32; 691 CondMovOpc = Mips::MOVT_I; 692 break; 693 case CmpInst::FCMP_OLE: 694 Opc = IsFloat ? Mips::C_OLE_S : Mips::C_OLE_D32; 695 CondMovOpc = Mips::MOVT_I; 696 break; 697 case CmpInst::FCMP_OGT: 698 Opc = IsFloat ? Mips::C_ULE_S : Mips::C_ULE_D32; 699 CondMovOpc = Mips::MOVF_I; 700 break; 701 case CmpInst::FCMP_OGE: 702 Opc = IsFloat ? Mips::C_ULT_S : Mips::C_ULT_D32; 703 CondMovOpc = Mips::MOVF_I; 704 break; 705 default: 706 llvm_unreachable("Only switching of a subset of CCs."); 707 } 708 unsigned RegWithZero = createResultReg(&Mips::GPR32RegClass); 709 unsigned RegWithOne = createResultReg(&Mips::GPR32RegClass); 710 emitInst(Mips::ADDiu, RegWithZero).addReg(Mips::ZERO).addImm(0); 711 emitInst(Mips::ADDiu, RegWithOne).addReg(Mips::ZERO).addImm(1); 712 emitInst(Opc).addReg(LeftReg).addReg(RightReg).addReg( 713 Mips::FCC0, RegState::ImplicitDefine); 714 emitInst(CondMovOpc, ResultReg) 715 .addReg(RegWithOne) 716 .addReg(Mips::FCC0) 717 .addReg(RegWithZero); 718 break; 719 } 720 } 721 return true; 722 } 723 bool MipsFastISel::emitLoad(MVT VT, unsigned &ResultReg, Address &Addr, 724 unsigned Alignment) { 725 // 726 // more cases will be handled here in following patches. 727 // 728 unsigned Opc; 729 switch (VT.SimpleTy) { 730 case MVT::i32: { 731 ResultReg = createResultReg(&Mips::GPR32RegClass); 732 Opc = Mips::LW; 733 break; 734 } 735 case MVT::i16: { 736 ResultReg = createResultReg(&Mips::GPR32RegClass); 737 Opc = Mips::LHu; 738 break; 739 } 740 case MVT::i8: { 741 ResultReg = createResultReg(&Mips::GPR32RegClass); 742 Opc = Mips::LBu; 743 break; 744 } 745 case MVT::f32: { 746 if (UnsupportedFPMode) 747 return false; 748 ResultReg = createResultReg(&Mips::FGR32RegClass); 749 Opc = Mips::LWC1; 750 break; 751 } 752 case MVT::f64: { 753 if (UnsupportedFPMode) 754 return false; 755 ResultReg = createResultReg(&Mips::AFGR64RegClass); 756 Opc = Mips::LDC1; 757 break; 758 } 759 default: 760 return false; 761 } 762 if (Addr.isRegBase()) { 763 simplifyAddress(Addr); 764 emitInstLoad(Opc, ResultReg, Addr.getReg(), Addr.getOffset()); 765 return true; 766 } 767 if (Addr.isFIBase()) { 768 unsigned FI = Addr.getFI(); 769 unsigned Align = 4; 770 unsigned Offset = Addr.getOffset(); 771 MachineFrameInfo &MFI = MF->getFrameInfo(); 772 MachineMemOperand *MMO = MF->getMachineMemOperand( 773 MachinePointerInfo::getFixedStack(*MF, FI), MachineMemOperand::MOLoad, 774 MFI.getObjectSize(FI), Align); 775 BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DbgLoc, TII.get(Opc), ResultReg) 776 .addFrameIndex(FI) 777 .addImm(Offset) 778 .addMemOperand(MMO); 779 return true; 780 } 781 return false; 782 } 783 784 bool MipsFastISel::emitStore(MVT VT, unsigned SrcReg, Address &Addr, 785 unsigned Alignment) { 786 // 787 // more cases will be handled here in following patches. 788 // 789 unsigned Opc; 790 switch (VT.SimpleTy) { 791 case MVT::i8: 792 Opc = Mips::SB; 793 break; 794 case MVT::i16: 795 Opc = Mips::SH; 796 break; 797 case MVT::i32: 798 Opc = Mips::SW; 799 break; 800 case MVT::f32: 801 if (UnsupportedFPMode) 802 return false; 803 Opc = Mips::SWC1; 804 break; 805 case MVT::f64: 806 if (UnsupportedFPMode) 807 return false; 808 Opc = Mips::SDC1; 809 break; 810 default: 811 return false; 812 } 813 if (Addr.isRegBase()) { 814 simplifyAddress(Addr); 815 emitInstStore(Opc, SrcReg, Addr.getReg(), Addr.getOffset()); 816 return true; 817 } 818 if (Addr.isFIBase()) { 819 unsigned FI = Addr.getFI(); 820 unsigned Align = 4; 821 unsigned Offset = Addr.getOffset(); 822 MachineFrameInfo &MFI = MF->getFrameInfo(); 823 MachineMemOperand *MMO = MF->getMachineMemOperand( 824 MachinePointerInfo::getFixedStack(*MF, FI), MachineMemOperand::MOStore, 825 MFI.getObjectSize(FI), Align); 826 BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DbgLoc, TII.get(Opc)) 827 .addReg(SrcReg) 828 .addFrameIndex(FI) 829 .addImm(Offset) 830 .addMemOperand(MMO); 831 return true; 832 } 833 return false; 834 } 835 836 bool MipsFastISel::selectLogicalOp(const Instruction *I) { 837 MVT VT; 838 if (!isTypeSupported(I->getType(), VT)) 839 return false; 840 841 unsigned ResultReg; 842 switch (I->getOpcode()) { 843 default: 844 llvm_unreachable("Unexpected instruction."); 845 case Instruction::And: 846 ResultReg = emitLogicalOp(ISD::AND, VT, I->getOperand(0), I->getOperand(1)); 847 break; 848 case Instruction::Or: 849 ResultReg = emitLogicalOp(ISD::OR, VT, I->getOperand(0), I->getOperand(1)); 850 break; 851 case Instruction::Xor: 852 ResultReg = emitLogicalOp(ISD::XOR, VT, I->getOperand(0), I->getOperand(1)); 853 break; 854 } 855 856 if (!ResultReg) 857 return false; 858 859 updateValueMap(I, ResultReg); 860 return true; 861 } 862 863 bool MipsFastISel::selectLoad(const Instruction *I) { 864 // Atomic loads need special handling. 865 if (cast<LoadInst>(I)->isAtomic()) 866 return false; 867 868 // Verify we have a legal type before going any further. 869 MVT VT; 870 if (!isLoadTypeLegal(I->getType(), VT)) 871 return false; 872 873 // See if we can handle this address. 874 Address Addr; 875 if (!computeAddress(I->getOperand(0), Addr)) 876 return false; 877 878 unsigned ResultReg; 879 if (!emitLoad(VT, ResultReg, Addr, cast<LoadInst>(I)->getAlignment())) 880 return false; 881 updateValueMap(I, ResultReg); 882 return true; 883 } 884 885 bool MipsFastISel::selectStore(const Instruction *I) { 886 Value *Op0 = I->getOperand(0); 887 unsigned SrcReg = 0; 888 889 // Atomic stores need special handling. 890 if (cast<StoreInst>(I)->isAtomic()) 891 return false; 892 893 // Verify we have a legal type before going any further. 894 MVT VT; 895 if (!isLoadTypeLegal(I->getOperand(0)->getType(), VT)) 896 return false; 897 898 // Get the value to be stored into a register. 899 SrcReg = getRegForValue(Op0); 900 if (SrcReg == 0) 901 return false; 902 903 // See if we can handle this address. 904 Address Addr; 905 if (!computeAddress(I->getOperand(1), Addr)) 906 return false; 907 908 if (!emitStore(VT, SrcReg, Addr, cast<StoreInst>(I)->getAlignment())) 909 return false; 910 return true; 911 } 912 913 // 914 // This can cause a redundant sltiu to be generated. 915 // FIXME: try and eliminate this in a future patch. 916 // 917 bool MipsFastISel::selectBranch(const Instruction *I) { 918 const BranchInst *BI = cast<BranchInst>(I); 919 MachineBasicBlock *BrBB = FuncInfo.MBB; 920 // 921 // TBB is the basic block for the case where the comparison is true. 922 // FBB is the basic block for the case where the comparison is false. 923 // if (cond) goto TBB 924 // goto FBB 925 // TBB: 926 // 927 MachineBasicBlock *TBB = FuncInfo.MBBMap[BI->getSuccessor(0)]; 928 MachineBasicBlock *FBB = FuncInfo.MBBMap[BI->getSuccessor(1)]; 929 BI->getCondition(); 930 // For now, just try the simplest case where it's fed by a compare. 931 if (const CmpInst *CI = dyn_cast<CmpInst>(BI->getCondition())) { 932 unsigned CondReg = createResultReg(&Mips::GPR32RegClass); 933 if (!emitCmp(CondReg, CI)) 934 return false; 935 BuildMI(*BrBB, FuncInfo.InsertPt, DbgLoc, TII.get(Mips::BGTZ)) 936 .addReg(CondReg) 937 .addMBB(TBB); 938 finishCondBranch(BI->getParent(), TBB, FBB); 939 return true; 940 } 941 return false; 942 } 943 944 bool MipsFastISel::selectCmp(const Instruction *I) { 945 const CmpInst *CI = cast<CmpInst>(I); 946 unsigned ResultReg = createResultReg(&Mips::GPR32RegClass); 947 if (!emitCmp(ResultReg, CI)) 948 return false; 949 updateValueMap(I, ResultReg); 950 return true; 951 } 952 953 // Attempt to fast-select a floating-point extend instruction. 954 bool MipsFastISel::selectFPExt(const Instruction *I) { 955 if (UnsupportedFPMode) 956 return false; 957 Value *Src = I->getOperand(0); 958 EVT SrcVT = TLI.getValueType(DL, Src->getType(), true); 959 EVT DestVT = TLI.getValueType(DL, I->getType(), true); 960 961 if (SrcVT != MVT::f32 || DestVT != MVT::f64) 962 return false; 963 964 unsigned SrcReg = 965 getRegForValue(Src); // this must be a 32bit floating point register class 966 // maybe we should handle this differently 967 if (!SrcReg) 968 return false; 969 970 unsigned DestReg = createResultReg(&Mips::AFGR64RegClass); 971 emitInst(Mips::CVT_D32_S, DestReg).addReg(SrcReg); 972 updateValueMap(I, DestReg); 973 return true; 974 } 975 976 bool MipsFastISel::selectSelect(const Instruction *I) { 977 assert(isa<SelectInst>(I) && "Expected a select instruction."); 978 979 MVT VT; 980 if (!isTypeSupported(I->getType(), VT)) 981 return false; 982 983 unsigned CondMovOpc; 984 const TargetRegisterClass *RC; 985 986 if (VT.isInteger() && !VT.isVector() && VT.getSizeInBits() <= 32) { 987 CondMovOpc = Mips::MOVN_I_I; 988 RC = &Mips::GPR32RegClass; 989 } else if (VT == MVT::f32) { 990 CondMovOpc = Mips::MOVN_I_S; 991 RC = &Mips::FGR32RegClass; 992 } else if (VT == MVT::f64) { 993 CondMovOpc = Mips::MOVN_I_D32; 994 RC = &Mips::AFGR64RegClass; 995 } else 996 return false; 997 998 const SelectInst *SI = cast<SelectInst>(I); 999 const Value *Cond = SI->getCondition(); 1000 unsigned Src1Reg = getRegForValue(SI->getTrueValue()); 1001 unsigned Src2Reg = getRegForValue(SI->getFalseValue()); 1002 unsigned CondReg = getRegForValue(Cond); 1003 1004 if (!Src1Reg || !Src2Reg || !CondReg) 1005 return false; 1006 1007 unsigned ZExtCondReg = createResultReg(&Mips::GPR32RegClass); 1008 if (!ZExtCondReg) 1009 return false; 1010 1011 if (!emitIntExt(MVT::i1, CondReg, MVT::i32, ZExtCondReg, true)) 1012 return false; 1013 1014 unsigned ResultReg = createResultReg(RC); 1015 unsigned TempReg = createResultReg(RC); 1016 1017 if (!ResultReg || !TempReg) 1018 return false; 1019 1020 emitInst(TargetOpcode::COPY, TempReg).addReg(Src2Reg); 1021 emitInst(CondMovOpc, ResultReg) 1022 .addReg(Src1Reg).addReg(ZExtCondReg).addReg(TempReg); 1023 updateValueMap(I, ResultReg); 1024 return true; 1025 } 1026 1027 // Attempt to fast-select a floating-point truncate instruction. 1028 bool MipsFastISel::selectFPTrunc(const Instruction *I) { 1029 if (UnsupportedFPMode) 1030 return false; 1031 Value *Src = I->getOperand(0); 1032 EVT SrcVT = TLI.getValueType(DL, Src->getType(), true); 1033 EVT DestVT = TLI.getValueType(DL, I->getType(), true); 1034 1035 if (SrcVT != MVT::f64 || DestVT != MVT::f32) 1036 return false; 1037 1038 unsigned SrcReg = getRegForValue(Src); 1039 if (!SrcReg) 1040 return false; 1041 1042 unsigned DestReg = createResultReg(&Mips::FGR32RegClass); 1043 if (!DestReg) 1044 return false; 1045 1046 emitInst(Mips::CVT_S_D32, DestReg).addReg(SrcReg); 1047 updateValueMap(I, DestReg); 1048 return true; 1049 } 1050 1051 // Attempt to fast-select a floating-point-to-integer conversion. 1052 bool MipsFastISel::selectFPToInt(const Instruction *I, bool IsSigned) { 1053 if (UnsupportedFPMode) 1054 return false; 1055 MVT DstVT, SrcVT; 1056 if (!IsSigned) 1057 return false; // We don't handle this case yet. There is no native 1058 // instruction for this but it can be synthesized. 1059 Type *DstTy = I->getType(); 1060 if (!isTypeLegal(DstTy, DstVT)) 1061 return false; 1062 1063 if (DstVT != MVT::i32) 1064 return false; 1065 1066 Value *Src = I->getOperand(0); 1067 Type *SrcTy = Src->getType(); 1068 if (!isTypeLegal(SrcTy, SrcVT)) 1069 return false; 1070 1071 if (SrcVT != MVT::f32 && SrcVT != MVT::f64) 1072 return false; 1073 1074 unsigned SrcReg = getRegForValue(Src); 1075 if (SrcReg == 0) 1076 return false; 1077 1078 // Determine the opcode for the conversion, which takes place 1079 // entirely within FPRs. 1080 unsigned DestReg = createResultReg(&Mips::GPR32RegClass); 1081 unsigned TempReg = createResultReg(&Mips::FGR32RegClass); 1082 unsigned Opc = (SrcVT == MVT::f32) ? Mips::TRUNC_W_S : Mips::TRUNC_W_D32; 1083 1084 // Generate the convert. 1085 emitInst(Opc, TempReg).addReg(SrcReg); 1086 emitInst(Mips::MFC1, DestReg).addReg(TempReg); 1087 1088 updateValueMap(I, DestReg); 1089 return true; 1090 } 1091 1092 bool MipsFastISel::processCallArgs(CallLoweringInfo &CLI, 1093 SmallVectorImpl<MVT> &OutVTs, 1094 unsigned &NumBytes) { 1095 CallingConv::ID CC = CLI.CallConv; 1096 SmallVector<CCValAssign, 16> ArgLocs; 1097 CCState CCInfo(CC, false, *FuncInfo.MF, ArgLocs, *Context); 1098 CCInfo.AnalyzeCallOperands(OutVTs, CLI.OutFlags, CCAssignFnForCall(CC)); 1099 // Get a count of how many bytes are to be pushed on the stack. 1100 NumBytes = CCInfo.getNextStackOffset(); 1101 // This is the minimum argument area used for A0-A3. 1102 if (NumBytes < 16) 1103 NumBytes = 16; 1104 1105 emitInst(Mips::ADJCALLSTACKDOWN).addImm(16); 1106 // Process the args. 1107 MVT firstMVT; 1108 for (unsigned i = 0, e = ArgLocs.size(); i != e; ++i) { 1109 CCValAssign &VA = ArgLocs[i]; 1110 const Value *ArgVal = CLI.OutVals[VA.getValNo()]; 1111 MVT ArgVT = OutVTs[VA.getValNo()]; 1112 1113 if (i == 0) { 1114 firstMVT = ArgVT; 1115 if (ArgVT == MVT::f32) { 1116 VA.convertToReg(Mips::F12); 1117 } else if (ArgVT == MVT::f64) { 1118 VA.convertToReg(Mips::D6); 1119 } 1120 } else if (i == 1) { 1121 if ((firstMVT == MVT::f32) || (firstMVT == MVT::f64)) { 1122 if (ArgVT == MVT::f32) { 1123 VA.convertToReg(Mips::F14); 1124 } else if (ArgVT == MVT::f64) { 1125 VA.convertToReg(Mips::D7); 1126 } 1127 } 1128 } 1129 if (((ArgVT == MVT::i32) || (ArgVT == MVT::f32) || (ArgVT == MVT::i16) || 1130 (ArgVT == MVT::i8)) && 1131 VA.isMemLoc()) { 1132 switch (VA.getLocMemOffset()) { 1133 case 0: 1134 VA.convertToReg(Mips::A0); 1135 break; 1136 case 4: 1137 VA.convertToReg(Mips::A1); 1138 break; 1139 case 8: 1140 VA.convertToReg(Mips::A2); 1141 break; 1142 case 12: 1143 VA.convertToReg(Mips::A3); 1144 break; 1145 default: 1146 break; 1147 } 1148 } 1149 unsigned ArgReg = getRegForValue(ArgVal); 1150 if (!ArgReg) 1151 return false; 1152 1153 // Handle arg promotion: SExt, ZExt, AExt. 1154 switch (VA.getLocInfo()) { 1155 case CCValAssign::Full: 1156 break; 1157 case CCValAssign::AExt: 1158 case CCValAssign::SExt: { 1159 MVT DestVT = VA.getLocVT(); 1160 MVT SrcVT = ArgVT; 1161 ArgReg = emitIntExt(SrcVT, ArgReg, DestVT, /*isZExt=*/false); 1162 if (!ArgReg) 1163 return false; 1164 break; 1165 } 1166 case CCValAssign::ZExt: { 1167 MVT DestVT = VA.getLocVT(); 1168 MVT SrcVT = ArgVT; 1169 ArgReg = emitIntExt(SrcVT, ArgReg, DestVT, /*isZExt=*/true); 1170 if (!ArgReg) 1171 return false; 1172 break; 1173 } 1174 default: 1175 llvm_unreachable("Unknown arg promotion!"); 1176 } 1177 1178 // Now copy/store arg to correct locations. 1179 if (VA.isRegLoc() && !VA.needsCustom()) { 1180 BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DbgLoc, 1181 TII.get(TargetOpcode::COPY), VA.getLocReg()).addReg(ArgReg); 1182 CLI.OutRegs.push_back(VA.getLocReg()); 1183 } else if (VA.needsCustom()) { 1184 llvm_unreachable("Mips does not use custom args."); 1185 return false; 1186 } else { 1187 // 1188 // FIXME: This path will currently return false. It was copied 1189 // from the AArch64 port and should be essentially fine for Mips too. 1190 // The work to finish up this path will be done in a follow-on patch. 1191 // 1192 assert(VA.isMemLoc() && "Assuming store on stack."); 1193 // Don't emit stores for undef values. 1194 if (isa<UndefValue>(ArgVal)) 1195 continue; 1196 1197 // Need to store on the stack. 1198 // FIXME: This alignment is incorrect but this path is disabled 1199 // for now (will return false). We need to determine the right alignment 1200 // based on the normal alignment for the underlying machine type. 1201 // 1202 unsigned ArgSize = alignTo(ArgVT.getSizeInBits(), 4); 1203 1204 unsigned BEAlign = 0; 1205 if (ArgSize < 8 && !Subtarget->isLittle()) 1206 BEAlign = 8 - ArgSize; 1207 1208 Address Addr; 1209 Addr.setKind(Address::RegBase); 1210 Addr.setReg(Mips::SP); 1211 Addr.setOffset(VA.getLocMemOffset() + BEAlign); 1212 1213 unsigned Alignment = DL.getABITypeAlignment(ArgVal->getType()); 1214 MachineMemOperand *MMO = FuncInfo.MF->getMachineMemOperand( 1215 MachinePointerInfo::getStack(*FuncInfo.MF, Addr.getOffset()), 1216 MachineMemOperand::MOStore, ArgVT.getStoreSize(), Alignment); 1217 (void)(MMO); 1218 // if (!emitStore(ArgVT, ArgReg, Addr, MMO)) 1219 return false; // can't store on the stack yet. 1220 } 1221 } 1222 1223 return true; 1224 } 1225 1226 bool MipsFastISel::finishCall(CallLoweringInfo &CLI, MVT RetVT, 1227 unsigned NumBytes) { 1228 CallingConv::ID CC = CLI.CallConv; 1229 emitInst(Mips::ADJCALLSTACKUP).addImm(16).addImm(0); 1230 if (RetVT != MVT::isVoid) { 1231 SmallVector<CCValAssign, 16> RVLocs; 1232 CCState CCInfo(CC, false, *FuncInfo.MF, RVLocs, *Context); 1233 CCInfo.AnalyzeCallResult(RetVT, RetCC_Mips); 1234 1235 // Only handle a single return value. 1236 if (RVLocs.size() != 1) 1237 return false; 1238 // Copy all of the result registers out of their specified physreg. 1239 MVT CopyVT = RVLocs[0].getValVT(); 1240 // Special handling for extended integers. 1241 if (RetVT == MVT::i1 || RetVT == MVT::i8 || RetVT == MVT::i16) 1242 CopyVT = MVT::i32; 1243 1244 unsigned ResultReg = createResultReg(TLI.getRegClassFor(CopyVT)); 1245 if (!ResultReg) 1246 return false; 1247 BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DbgLoc, 1248 TII.get(TargetOpcode::COPY), 1249 ResultReg).addReg(RVLocs[0].getLocReg()); 1250 CLI.InRegs.push_back(RVLocs[0].getLocReg()); 1251 1252 CLI.ResultReg = ResultReg; 1253 CLI.NumResultRegs = 1; 1254 } 1255 return true; 1256 } 1257 1258 bool MipsFastISel::fastLowerArguments() { 1259 DEBUG(dbgs() << "fastLowerArguments\n"); 1260 1261 if (!FuncInfo.CanLowerReturn) { 1262 DEBUG(dbgs() << ".. gave up (!CanLowerReturn)\n"); 1263 return false; 1264 } 1265 1266 const Function *F = FuncInfo.Fn; 1267 if (F->isVarArg()) { 1268 DEBUG(dbgs() << ".. gave up (varargs)\n"); 1269 return false; 1270 } 1271 1272 CallingConv::ID CC = F->getCallingConv(); 1273 if (CC != CallingConv::C) { 1274 DEBUG(dbgs() << ".. gave up (calling convention is not C)\n"); 1275 return false; 1276 } 1277 1278 const ArrayRef<MCPhysReg> GPR32ArgRegs = {Mips::A0, Mips::A1, Mips::A2, 1279 Mips::A3}; 1280 const ArrayRef<MCPhysReg> FGR32ArgRegs = {Mips::F12, Mips::F14}; 1281 const ArrayRef<MCPhysReg> AFGR64ArgRegs = {Mips::D6, Mips::D7}; 1282 ArrayRef<MCPhysReg>::iterator NextGPR32 = GPR32ArgRegs.begin(); 1283 ArrayRef<MCPhysReg>::iterator NextFGR32 = FGR32ArgRegs.begin(); 1284 ArrayRef<MCPhysReg>::iterator NextAFGR64 = AFGR64ArgRegs.begin(); 1285 1286 struct AllocatedReg { 1287 const TargetRegisterClass *RC; 1288 unsigned Reg; 1289 AllocatedReg(const TargetRegisterClass *RC, unsigned Reg) 1290 : RC(RC), Reg(Reg) {} 1291 }; 1292 1293 // Only handle simple cases. i.e. All arguments are directly mapped to 1294 // registers of the appropriate type. 1295 SmallVector<AllocatedReg, 4> Allocation; 1296 unsigned Idx = 1; 1297 for (const auto &FormalArg : F->args()) { 1298 if (F->getAttributes().hasAttribute(Idx, Attribute::InReg) || 1299 F->getAttributes().hasAttribute(Idx, Attribute::StructRet) || 1300 F->getAttributes().hasAttribute(Idx, Attribute::ByVal)) { 1301 DEBUG(dbgs() << ".. gave up (inreg, structret, byval)\n"); 1302 return false; 1303 } 1304 1305 Type *ArgTy = FormalArg.getType(); 1306 if (ArgTy->isStructTy() || ArgTy->isArrayTy() || ArgTy->isVectorTy()) { 1307 DEBUG(dbgs() << ".. gave up (struct, array, or vector)\n"); 1308 return false; 1309 } 1310 1311 EVT ArgVT = TLI.getValueType(DL, ArgTy); 1312 DEBUG(dbgs() << ".. " << (Idx - 1) << ": " << ArgVT.getEVTString() << "\n"); 1313 if (!ArgVT.isSimple()) { 1314 DEBUG(dbgs() << ".. .. gave up (not a simple type)\n"); 1315 return false; 1316 } 1317 1318 switch (ArgVT.getSimpleVT().SimpleTy) { 1319 case MVT::i1: 1320 case MVT::i8: 1321 case MVT::i16: 1322 if (!F->getAttributes().hasAttribute(Idx, Attribute::SExt) && 1323 !F->getAttributes().hasAttribute(Idx, Attribute::ZExt)) { 1324 // It must be any extend, this shouldn't happen for clang-generated IR 1325 // so just fall back on SelectionDAG. 1326 DEBUG(dbgs() << ".. .. gave up (i8/i16 arg is not extended)\n"); 1327 return false; 1328 } 1329 1330 if (NextGPR32 == GPR32ArgRegs.end()) { 1331 DEBUG(dbgs() << ".. .. gave up (ran out of GPR32 arguments)\n"); 1332 return false; 1333 } 1334 1335 DEBUG(dbgs() << ".. .. GPR32(" << *NextGPR32 << ")\n"); 1336 Allocation.emplace_back(&Mips::GPR32RegClass, *NextGPR32++); 1337 1338 // Allocating any GPR32 prohibits further use of floating point arguments. 1339 NextFGR32 = FGR32ArgRegs.end(); 1340 NextAFGR64 = AFGR64ArgRegs.end(); 1341 break; 1342 1343 case MVT::i32: 1344 if (F->getAttributes().hasAttribute(Idx, Attribute::ZExt)) { 1345 // The O32 ABI does not permit a zero-extended i32. 1346 DEBUG(dbgs() << ".. .. gave up (i32 arg is zero extended)\n"); 1347 return false; 1348 } 1349 1350 if (NextGPR32 == GPR32ArgRegs.end()) { 1351 DEBUG(dbgs() << ".. .. gave up (ran out of GPR32 arguments)\n"); 1352 return false; 1353 } 1354 1355 DEBUG(dbgs() << ".. .. GPR32(" << *NextGPR32 << ")\n"); 1356 Allocation.emplace_back(&Mips::GPR32RegClass, *NextGPR32++); 1357 1358 // Allocating any GPR32 prohibits further use of floating point arguments. 1359 NextFGR32 = FGR32ArgRegs.end(); 1360 NextAFGR64 = AFGR64ArgRegs.end(); 1361 break; 1362 1363 case MVT::f32: 1364 if (NextFGR32 == FGR32ArgRegs.end()) { 1365 DEBUG(dbgs() << ".. .. gave up (ran out of FGR32 arguments)\n"); 1366 return false; 1367 } 1368 DEBUG(dbgs() << ".. .. FGR32(" << *NextFGR32 << ")\n"); 1369 Allocation.emplace_back(&Mips::FGR32RegClass, *NextFGR32++); 1370 // Allocating an FGR32 also allocates the super-register AFGR64, and 1371 // ABI rules require us to skip the corresponding GPR32. 1372 if (NextGPR32 != GPR32ArgRegs.end()) 1373 NextGPR32++; 1374 if (NextAFGR64 != AFGR64ArgRegs.end()) 1375 NextAFGR64++; 1376 break; 1377 1378 case MVT::f64: 1379 if (NextAFGR64 == AFGR64ArgRegs.end()) { 1380 DEBUG(dbgs() << ".. .. gave up (ran out of AFGR64 arguments)\n"); 1381 return false; 1382 } 1383 DEBUG(dbgs() << ".. .. AFGR64(" << *NextAFGR64 << ")\n"); 1384 Allocation.emplace_back(&Mips::AFGR64RegClass, *NextAFGR64++); 1385 // Allocating an FGR32 also allocates the super-register AFGR64, and 1386 // ABI rules require us to skip the corresponding GPR32 pair. 1387 if (NextGPR32 != GPR32ArgRegs.end()) 1388 NextGPR32++; 1389 if (NextGPR32 != GPR32ArgRegs.end()) 1390 NextGPR32++; 1391 if (NextFGR32 != FGR32ArgRegs.end()) 1392 NextFGR32++; 1393 break; 1394 1395 default: 1396 DEBUG(dbgs() << ".. .. gave up (unknown type)\n"); 1397 return false; 1398 } 1399 1400 ++Idx; 1401 } 1402 1403 Idx = 0; 1404 for (const auto &FormalArg : F->args()) { 1405 unsigned SrcReg = Allocation[Idx].Reg; 1406 unsigned DstReg = FuncInfo.MF->addLiveIn(SrcReg, Allocation[Idx].RC); 1407 // FIXME: Unfortunately it's necessary to emit a copy from the livein copy. 1408 // Without this, EmitLiveInCopies may eliminate the livein if its only 1409 // use is a bitcast (which isn't turned into an instruction). 1410 unsigned ResultReg = createResultReg(Allocation[Idx].RC); 1411 BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DbgLoc, 1412 TII.get(TargetOpcode::COPY), ResultReg) 1413 .addReg(DstReg, getKillRegState(true)); 1414 updateValueMap(&FormalArg, ResultReg); 1415 ++Idx; 1416 } 1417 1418 // Calculate the size of the incoming arguments area. 1419 // We currently reject all the cases where this would be non-zero. 1420 unsigned IncomingArgSizeInBytes = 0; 1421 1422 // Account for the reserved argument area on ABI's that have one (O32). 1423 // It seems strange to do this on the caller side but it's necessary in 1424 // SelectionDAG's implementation. 1425 IncomingArgSizeInBytes = std::min(getABI().GetCalleeAllocdArgSizeInBytes(CC), 1426 IncomingArgSizeInBytes); 1427 1428 MF->getInfo<MipsFunctionInfo>()->setFormalArgInfo(IncomingArgSizeInBytes, 1429 false); 1430 1431 return true; 1432 } 1433 1434 bool MipsFastISel::fastLowerCall(CallLoweringInfo &CLI) { 1435 if (!TargetSupported) 1436 return false; 1437 1438 CallingConv::ID CC = CLI.CallConv; 1439 bool IsTailCall = CLI.IsTailCall; 1440 bool IsVarArg = CLI.IsVarArg; 1441 const Value *Callee = CLI.Callee; 1442 MCSymbol *Symbol = CLI.Symbol; 1443 1444 // Do not handle FastCC. 1445 if (CC == CallingConv::Fast) 1446 return false; 1447 1448 // Allow SelectionDAG isel to handle tail calls. 1449 if (IsTailCall) 1450 return false; 1451 1452 // Let SDISel handle vararg functions. 1453 if (IsVarArg) 1454 return false; 1455 1456 // FIXME: Only handle *simple* calls for now. 1457 MVT RetVT; 1458 if (CLI.RetTy->isVoidTy()) 1459 RetVT = MVT::isVoid; 1460 else if (!isTypeSupported(CLI.RetTy, RetVT)) 1461 return false; 1462 1463 for (auto Flag : CLI.OutFlags) 1464 if (Flag.isInReg() || Flag.isSRet() || Flag.isNest() || Flag.isByVal()) 1465 return false; 1466 1467 // Set up the argument vectors. 1468 SmallVector<MVT, 16> OutVTs; 1469 OutVTs.reserve(CLI.OutVals.size()); 1470 1471 for (auto *Val : CLI.OutVals) { 1472 MVT VT; 1473 if (!isTypeLegal(Val->getType(), VT) && 1474 !(VT == MVT::i1 || VT == MVT::i8 || VT == MVT::i16)) 1475 return false; 1476 1477 // We don't handle vector parameters yet. 1478 if (VT.isVector() || VT.getSizeInBits() > 64) 1479 return false; 1480 1481 OutVTs.push_back(VT); 1482 } 1483 1484 Address Addr; 1485 if (!computeCallAddress(Callee, Addr)) 1486 return false; 1487 1488 // Handle the arguments now that we've gotten them. 1489 unsigned NumBytes; 1490 if (!processCallArgs(CLI, OutVTs, NumBytes)) 1491 return false; 1492 1493 if (!Addr.getGlobalValue()) 1494 return false; 1495 1496 // Issue the call. 1497 unsigned DestAddress; 1498 if (Symbol) 1499 DestAddress = materializeExternalCallSym(Symbol); 1500 else 1501 DestAddress = materializeGV(Addr.getGlobalValue(), MVT::i32); 1502 emitInst(TargetOpcode::COPY, Mips::T9).addReg(DestAddress); 1503 MachineInstrBuilder MIB = 1504 BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DbgLoc, TII.get(Mips::JALR), 1505 Mips::RA).addReg(Mips::T9); 1506 1507 // Add implicit physical register uses to the call. 1508 for (auto Reg : CLI.OutRegs) 1509 MIB.addReg(Reg, RegState::Implicit); 1510 1511 // Add a register mask with the call-preserved registers. 1512 // Proper defs for return values will be added by setPhysRegsDeadExcept(). 1513 MIB.addRegMask(TRI.getCallPreservedMask(*FuncInfo.MF, CC)); 1514 1515 CLI.Call = MIB; 1516 1517 // Finish off the call including any return values. 1518 return finishCall(CLI, RetVT, NumBytes); 1519 } 1520 1521 bool MipsFastISel::fastLowerIntrinsicCall(const IntrinsicInst *II) { 1522 if (!TargetSupported) 1523 return false; 1524 1525 switch (II->getIntrinsicID()) { 1526 default: 1527 return false; 1528 case Intrinsic::bswap: { 1529 Type *RetTy = II->getCalledFunction()->getReturnType(); 1530 1531 MVT VT; 1532 if (!isTypeSupported(RetTy, VT)) 1533 return false; 1534 1535 unsigned SrcReg = getRegForValue(II->getOperand(0)); 1536 if (SrcReg == 0) 1537 return false; 1538 unsigned DestReg = createResultReg(&Mips::GPR32RegClass); 1539 if (DestReg == 0) 1540 return false; 1541 if (VT == MVT::i16) { 1542 if (Subtarget->hasMips32r2()) { 1543 emitInst(Mips::WSBH, DestReg).addReg(SrcReg); 1544 updateValueMap(II, DestReg); 1545 return true; 1546 } else { 1547 unsigned TempReg[3]; 1548 for (int i = 0; i < 3; i++) { 1549 TempReg[i] = createResultReg(&Mips::GPR32RegClass); 1550 if (TempReg[i] == 0) 1551 return false; 1552 } 1553 emitInst(Mips::SLL, TempReg[0]).addReg(SrcReg).addImm(8); 1554 emitInst(Mips::SRL, TempReg[1]).addReg(SrcReg).addImm(8); 1555 emitInst(Mips::OR, TempReg[2]).addReg(TempReg[0]).addReg(TempReg[1]); 1556 emitInst(Mips::ANDi, DestReg).addReg(TempReg[2]).addImm(0xFFFF); 1557 updateValueMap(II, DestReg); 1558 return true; 1559 } 1560 } else if (VT == MVT::i32) { 1561 if (Subtarget->hasMips32r2()) { 1562 unsigned TempReg = createResultReg(&Mips::GPR32RegClass); 1563 emitInst(Mips::WSBH, TempReg).addReg(SrcReg); 1564 emitInst(Mips::ROTR, DestReg).addReg(TempReg).addImm(16); 1565 updateValueMap(II, DestReg); 1566 return true; 1567 } else { 1568 unsigned TempReg[8]; 1569 for (int i = 0; i < 8; i++) { 1570 TempReg[i] = createResultReg(&Mips::GPR32RegClass); 1571 if (TempReg[i] == 0) 1572 return false; 1573 } 1574 1575 emitInst(Mips::SRL, TempReg[0]).addReg(SrcReg).addImm(8); 1576 emitInst(Mips::SRL, TempReg[1]).addReg(SrcReg).addImm(24); 1577 emitInst(Mips::ANDi, TempReg[2]).addReg(TempReg[0]).addImm(0xFF00); 1578 emitInst(Mips::OR, TempReg[3]).addReg(TempReg[1]).addReg(TempReg[2]); 1579 1580 emitInst(Mips::ANDi, TempReg[4]).addReg(SrcReg).addImm(0xFF00); 1581 emitInst(Mips::SLL, TempReg[5]).addReg(TempReg[4]).addImm(8); 1582 1583 emitInst(Mips::SLL, TempReg[6]).addReg(SrcReg).addImm(24); 1584 emitInst(Mips::OR, TempReg[7]).addReg(TempReg[3]).addReg(TempReg[5]); 1585 emitInst(Mips::OR, DestReg).addReg(TempReg[6]).addReg(TempReg[7]); 1586 updateValueMap(II, DestReg); 1587 return true; 1588 } 1589 } 1590 return false; 1591 } 1592 case Intrinsic::memcpy: 1593 case Intrinsic::memmove: { 1594 const auto *MTI = cast<MemTransferInst>(II); 1595 // Don't handle volatile. 1596 if (MTI->isVolatile()) 1597 return false; 1598 if (!MTI->getLength()->getType()->isIntegerTy(32)) 1599 return false; 1600 const char *IntrMemName = isa<MemCpyInst>(II) ? "memcpy" : "memmove"; 1601 return lowerCallTo(II, IntrMemName, II->getNumArgOperands() - 2); 1602 } 1603 case Intrinsic::memset: { 1604 const MemSetInst *MSI = cast<MemSetInst>(II); 1605 // Don't handle volatile. 1606 if (MSI->isVolatile()) 1607 return false; 1608 if (!MSI->getLength()->getType()->isIntegerTy(32)) 1609 return false; 1610 return lowerCallTo(II, "memset", II->getNumArgOperands() - 2); 1611 } 1612 } 1613 return false; 1614 } 1615 1616 bool MipsFastISel::selectRet(const Instruction *I) { 1617 const Function &F = *I->getParent()->getParent(); 1618 const ReturnInst *Ret = cast<ReturnInst>(I); 1619 1620 if (!FuncInfo.CanLowerReturn) 1621 return false; 1622 1623 // Build a list of return value registers. 1624 SmallVector<unsigned, 4> RetRegs; 1625 1626 if (Ret->getNumOperands() > 0) { 1627 CallingConv::ID CC = F.getCallingConv(); 1628 1629 // Do not handle FastCC. 1630 if (CC == CallingConv::Fast) 1631 return false; 1632 1633 SmallVector<ISD::OutputArg, 4> Outs; 1634 GetReturnInfo(F.getReturnType(), F.getAttributes(), Outs, TLI, DL); 1635 1636 // Analyze operands of the call, assigning locations to each operand. 1637 SmallVector<CCValAssign, 16> ValLocs; 1638 MipsCCState CCInfo(CC, F.isVarArg(), *FuncInfo.MF, ValLocs, 1639 I->getContext()); 1640 CCAssignFn *RetCC = RetCC_Mips; 1641 CCInfo.AnalyzeReturn(Outs, RetCC); 1642 1643 // Only handle a single return value for now. 1644 if (ValLocs.size() != 1) 1645 return false; 1646 1647 CCValAssign &VA = ValLocs[0]; 1648 const Value *RV = Ret->getOperand(0); 1649 1650 // Don't bother handling odd stuff for now. 1651 if ((VA.getLocInfo() != CCValAssign::Full) && 1652 (VA.getLocInfo() != CCValAssign::BCvt)) 1653 return false; 1654 1655 // Only handle register returns for now. 1656 if (!VA.isRegLoc()) 1657 return false; 1658 1659 unsigned Reg = getRegForValue(RV); 1660 if (Reg == 0) 1661 return false; 1662 1663 unsigned SrcReg = Reg + VA.getValNo(); 1664 unsigned DestReg = VA.getLocReg(); 1665 // Avoid a cross-class copy. This is very unlikely. 1666 if (!MRI.getRegClass(SrcReg)->contains(DestReg)) 1667 return false; 1668 1669 EVT RVEVT = TLI.getValueType(DL, RV->getType()); 1670 if (!RVEVT.isSimple()) 1671 return false; 1672 1673 if (RVEVT.isVector()) 1674 return false; 1675 1676 MVT RVVT = RVEVT.getSimpleVT(); 1677 if (RVVT == MVT::f128) 1678 return false; 1679 1680 MVT DestVT = VA.getValVT(); 1681 // Special handling for extended integers. 1682 if (RVVT != DestVT) { 1683 if (RVVT != MVT::i1 && RVVT != MVT::i8 && RVVT != MVT::i16) 1684 return false; 1685 1686 if (Outs[0].Flags.isZExt() || Outs[0].Flags.isSExt()) { 1687 bool IsZExt = Outs[0].Flags.isZExt(); 1688 SrcReg = emitIntExt(RVVT, SrcReg, DestVT, IsZExt); 1689 if (SrcReg == 0) 1690 return false; 1691 } 1692 } 1693 1694 // Make the copy. 1695 BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DbgLoc, 1696 TII.get(TargetOpcode::COPY), DestReg).addReg(SrcReg); 1697 1698 // Add register to return instruction. 1699 RetRegs.push_back(VA.getLocReg()); 1700 } 1701 MachineInstrBuilder MIB = emitInst(Mips::RetRA); 1702 for (unsigned i = 0, e = RetRegs.size(); i != e; ++i) 1703 MIB.addReg(RetRegs[i], RegState::Implicit); 1704 return true; 1705 } 1706 1707 bool MipsFastISel::selectTrunc(const Instruction *I) { 1708 // The high bits for a type smaller than the register size are assumed to be 1709 // undefined. 1710 Value *Op = I->getOperand(0); 1711 1712 EVT SrcVT, DestVT; 1713 SrcVT = TLI.getValueType(DL, Op->getType(), true); 1714 DestVT = TLI.getValueType(DL, I->getType(), true); 1715 1716 if (SrcVT != MVT::i32 && SrcVT != MVT::i16 && SrcVT != MVT::i8) 1717 return false; 1718 if (DestVT != MVT::i16 && DestVT != MVT::i8 && DestVT != MVT::i1) 1719 return false; 1720 1721 unsigned SrcReg = getRegForValue(Op); 1722 if (!SrcReg) 1723 return false; 1724 1725 // Because the high bits are undefined, a truncate doesn't generate 1726 // any code. 1727 updateValueMap(I, SrcReg); 1728 return true; 1729 } 1730 bool MipsFastISel::selectIntExt(const Instruction *I) { 1731 Type *DestTy = I->getType(); 1732 Value *Src = I->getOperand(0); 1733 Type *SrcTy = Src->getType(); 1734 1735 bool isZExt = isa<ZExtInst>(I); 1736 unsigned SrcReg = getRegForValue(Src); 1737 if (!SrcReg) 1738 return false; 1739 1740 EVT SrcEVT, DestEVT; 1741 SrcEVT = TLI.getValueType(DL, SrcTy, true); 1742 DestEVT = TLI.getValueType(DL, DestTy, true); 1743 if (!SrcEVT.isSimple()) 1744 return false; 1745 if (!DestEVT.isSimple()) 1746 return false; 1747 1748 MVT SrcVT = SrcEVT.getSimpleVT(); 1749 MVT DestVT = DestEVT.getSimpleVT(); 1750 unsigned ResultReg = createResultReg(&Mips::GPR32RegClass); 1751 1752 if (!emitIntExt(SrcVT, SrcReg, DestVT, ResultReg, isZExt)) 1753 return false; 1754 updateValueMap(I, ResultReg); 1755 return true; 1756 } 1757 bool MipsFastISel::emitIntSExt32r1(MVT SrcVT, unsigned SrcReg, MVT DestVT, 1758 unsigned DestReg) { 1759 unsigned ShiftAmt; 1760 switch (SrcVT.SimpleTy) { 1761 default: 1762 return false; 1763 case MVT::i8: 1764 ShiftAmt = 24; 1765 break; 1766 case MVT::i16: 1767 ShiftAmt = 16; 1768 break; 1769 } 1770 unsigned TempReg = createResultReg(&Mips::GPR32RegClass); 1771 emitInst(Mips::SLL, TempReg).addReg(SrcReg).addImm(ShiftAmt); 1772 emitInst(Mips::SRA, DestReg).addReg(TempReg).addImm(ShiftAmt); 1773 return true; 1774 } 1775 1776 bool MipsFastISel::emitIntSExt32r2(MVT SrcVT, unsigned SrcReg, MVT DestVT, 1777 unsigned DestReg) { 1778 switch (SrcVT.SimpleTy) { 1779 default: 1780 return false; 1781 case MVT::i8: 1782 emitInst(Mips::SEB, DestReg).addReg(SrcReg); 1783 break; 1784 case MVT::i16: 1785 emitInst(Mips::SEH, DestReg).addReg(SrcReg); 1786 break; 1787 } 1788 return true; 1789 } 1790 1791 bool MipsFastISel::emitIntSExt(MVT SrcVT, unsigned SrcReg, MVT DestVT, 1792 unsigned DestReg) { 1793 if ((DestVT != MVT::i32) && (DestVT != MVT::i16)) 1794 return false; 1795 if (Subtarget->hasMips32r2()) 1796 return emitIntSExt32r2(SrcVT, SrcReg, DestVT, DestReg); 1797 return emitIntSExt32r1(SrcVT, SrcReg, DestVT, DestReg); 1798 } 1799 1800 bool MipsFastISel::emitIntZExt(MVT SrcVT, unsigned SrcReg, MVT DestVT, 1801 unsigned DestReg) { 1802 int64_t Imm; 1803 1804 switch (SrcVT.SimpleTy) { 1805 default: 1806 return false; 1807 case MVT::i1: 1808 Imm = 1; 1809 break; 1810 case MVT::i8: 1811 Imm = 0xff; 1812 break; 1813 case MVT::i16: 1814 Imm = 0xffff; 1815 break; 1816 } 1817 1818 emitInst(Mips::ANDi, DestReg).addReg(SrcReg).addImm(Imm); 1819 return true; 1820 } 1821 1822 bool MipsFastISel::emitIntExt(MVT SrcVT, unsigned SrcReg, MVT DestVT, 1823 unsigned DestReg, bool IsZExt) { 1824 // FastISel does not have plumbing to deal with extensions where the SrcVT or 1825 // DestVT are odd things, so test to make sure that they are both types we can 1826 // handle (i1/i8/i16/i32 for SrcVT and i8/i16/i32/i64 for DestVT), otherwise 1827 // bail out to SelectionDAG. 1828 if (((DestVT != MVT::i8) && (DestVT != MVT::i16) && (DestVT != MVT::i32)) || 1829 ((SrcVT != MVT::i1) && (SrcVT != MVT::i8) && (SrcVT != MVT::i16))) 1830 return false; 1831 if (IsZExt) 1832 return emitIntZExt(SrcVT, SrcReg, DestVT, DestReg); 1833 return emitIntSExt(SrcVT, SrcReg, DestVT, DestReg); 1834 } 1835 1836 unsigned MipsFastISel::emitIntExt(MVT SrcVT, unsigned SrcReg, MVT DestVT, 1837 bool isZExt) { 1838 unsigned DestReg = createResultReg(&Mips::GPR32RegClass); 1839 bool Success = emitIntExt(SrcVT, SrcReg, DestVT, DestReg, isZExt); 1840 return Success ? DestReg : 0; 1841 } 1842 1843 bool MipsFastISel::selectDivRem(const Instruction *I, unsigned ISDOpcode) { 1844 EVT DestEVT = TLI.getValueType(DL, I->getType(), true); 1845 if (!DestEVT.isSimple()) 1846 return false; 1847 1848 MVT DestVT = DestEVT.getSimpleVT(); 1849 if (DestVT != MVT::i32) 1850 return false; 1851 1852 unsigned DivOpc; 1853 switch (ISDOpcode) { 1854 default: 1855 return false; 1856 case ISD::SDIV: 1857 case ISD::SREM: 1858 DivOpc = Mips::SDIV; 1859 break; 1860 case ISD::UDIV: 1861 case ISD::UREM: 1862 DivOpc = Mips::UDIV; 1863 break; 1864 } 1865 1866 unsigned Src0Reg = getRegForValue(I->getOperand(0)); 1867 unsigned Src1Reg = getRegForValue(I->getOperand(1)); 1868 if (!Src0Reg || !Src1Reg) 1869 return false; 1870 1871 emitInst(DivOpc).addReg(Src0Reg).addReg(Src1Reg); 1872 emitInst(Mips::TEQ).addReg(Src1Reg).addReg(Mips::ZERO).addImm(7); 1873 1874 unsigned ResultReg = createResultReg(&Mips::GPR32RegClass); 1875 if (!ResultReg) 1876 return false; 1877 1878 unsigned MFOpc = (ISDOpcode == ISD::SREM || ISDOpcode == ISD::UREM) 1879 ? Mips::MFHI 1880 : Mips::MFLO; 1881 emitInst(MFOpc, ResultReg); 1882 1883 updateValueMap(I, ResultReg); 1884 return true; 1885 } 1886 1887 bool MipsFastISel::selectShift(const Instruction *I) { 1888 MVT RetVT; 1889 1890 if (!isTypeSupported(I->getType(), RetVT)) 1891 return false; 1892 1893 unsigned ResultReg = createResultReg(&Mips::GPR32RegClass); 1894 if (!ResultReg) 1895 return false; 1896 1897 unsigned Opcode = I->getOpcode(); 1898 const Value *Op0 = I->getOperand(0); 1899 unsigned Op0Reg = getRegForValue(Op0); 1900 if (!Op0Reg) 1901 return false; 1902 1903 // If AShr or LShr, then we need to make sure the operand0 is sign extended. 1904 if (Opcode == Instruction::AShr || Opcode == Instruction::LShr) { 1905 unsigned TempReg = createResultReg(&Mips::GPR32RegClass); 1906 if (!TempReg) 1907 return false; 1908 1909 MVT Op0MVT = TLI.getValueType(DL, Op0->getType(), true).getSimpleVT(); 1910 bool IsZExt = Opcode == Instruction::LShr; 1911 if (!emitIntExt(Op0MVT, Op0Reg, MVT::i32, TempReg, IsZExt)) 1912 return false; 1913 1914 Op0Reg = TempReg; 1915 } 1916 1917 if (const auto *C = dyn_cast<ConstantInt>(I->getOperand(1))) { 1918 uint64_t ShiftVal = C->getZExtValue(); 1919 1920 switch (Opcode) { 1921 default: 1922 llvm_unreachable("Unexpected instruction."); 1923 case Instruction::Shl: 1924 Opcode = Mips::SLL; 1925 break; 1926 case Instruction::AShr: 1927 Opcode = Mips::SRA; 1928 break; 1929 case Instruction::LShr: 1930 Opcode = Mips::SRL; 1931 break; 1932 } 1933 1934 emitInst(Opcode, ResultReg).addReg(Op0Reg).addImm(ShiftVal); 1935 updateValueMap(I, ResultReg); 1936 return true; 1937 } 1938 1939 unsigned Op1Reg = getRegForValue(I->getOperand(1)); 1940 if (!Op1Reg) 1941 return false; 1942 1943 switch (Opcode) { 1944 default: 1945 llvm_unreachable("Unexpected instruction."); 1946 case Instruction::Shl: 1947 Opcode = Mips::SLLV; 1948 break; 1949 case Instruction::AShr: 1950 Opcode = Mips::SRAV; 1951 break; 1952 case Instruction::LShr: 1953 Opcode = Mips::SRLV; 1954 break; 1955 } 1956 1957 emitInst(Opcode, ResultReg).addReg(Op0Reg).addReg(Op1Reg); 1958 updateValueMap(I, ResultReg); 1959 return true; 1960 } 1961 1962 bool MipsFastISel::fastSelectInstruction(const Instruction *I) { 1963 if (!TargetSupported) 1964 return false; 1965 switch (I->getOpcode()) { 1966 default: 1967 break; 1968 case Instruction::Load: 1969 return selectLoad(I); 1970 case Instruction::Store: 1971 return selectStore(I); 1972 case Instruction::SDiv: 1973 if (!selectBinaryOp(I, ISD::SDIV)) 1974 return selectDivRem(I, ISD::SDIV); 1975 return true; 1976 case Instruction::UDiv: 1977 if (!selectBinaryOp(I, ISD::UDIV)) 1978 return selectDivRem(I, ISD::UDIV); 1979 return true; 1980 case Instruction::SRem: 1981 if (!selectBinaryOp(I, ISD::SREM)) 1982 return selectDivRem(I, ISD::SREM); 1983 return true; 1984 case Instruction::URem: 1985 if (!selectBinaryOp(I, ISD::UREM)) 1986 return selectDivRem(I, ISD::UREM); 1987 return true; 1988 case Instruction::Shl: 1989 case Instruction::LShr: 1990 case Instruction::AShr: 1991 return selectShift(I); 1992 case Instruction::And: 1993 case Instruction::Or: 1994 case Instruction::Xor: 1995 return selectLogicalOp(I); 1996 case Instruction::Br: 1997 return selectBranch(I); 1998 case Instruction::Ret: 1999 return selectRet(I); 2000 case Instruction::Trunc: 2001 return selectTrunc(I); 2002 case Instruction::ZExt: 2003 case Instruction::SExt: 2004 return selectIntExt(I); 2005 case Instruction::FPTrunc: 2006 return selectFPTrunc(I); 2007 case Instruction::FPExt: 2008 return selectFPExt(I); 2009 case Instruction::FPToSI: 2010 return selectFPToInt(I, /*isSigned*/ true); 2011 case Instruction::FPToUI: 2012 return selectFPToInt(I, /*isSigned*/ false); 2013 case Instruction::ICmp: 2014 case Instruction::FCmp: 2015 return selectCmp(I); 2016 case Instruction::Select: 2017 return selectSelect(I); 2018 } 2019 return false; 2020 } 2021 2022 unsigned MipsFastISel::getRegEnsuringSimpleIntegerWidening(const Value *V, 2023 bool IsUnsigned) { 2024 unsigned VReg = getRegForValue(V); 2025 if (VReg == 0) 2026 return 0; 2027 MVT VMVT = TLI.getValueType(DL, V->getType(), true).getSimpleVT(); 2028 if ((VMVT == MVT::i8) || (VMVT == MVT::i16)) { 2029 unsigned TempReg = createResultReg(&Mips::GPR32RegClass); 2030 if (!emitIntExt(VMVT, VReg, MVT::i32, TempReg, IsUnsigned)) 2031 return 0; 2032 VReg = TempReg; 2033 } 2034 return VReg; 2035 } 2036 2037 void MipsFastISel::simplifyAddress(Address &Addr) { 2038 if (!isInt<16>(Addr.getOffset())) { 2039 unsigned TempReg = 2040 materialize32BitInt(Addr.getOffset(), &Mips::GPR32RegClass); 2041 unsigned DestReg = createResultReg(&Mips::GPR32RegClass); 2042 emitInst(Mips::ADDu, DestReg).addReg(TempReg).addReg(Addr.getReg()); 2043 Addr.setReg(DestReg); 2044 Addr.setOffset(0); 2045 } 2046 } 2047 2048 unsigned MipsFastISel::fastEmitInst_rr(unsigned MachineInstOpcode, 2049 const TargetRegisterClass *RC, 2050 unsigned Op0, bool Op0IsKill, 2051 unsigned Op1, bool Op1IsKill) { 2052 // We treat the MUL instruction in a special way because it clobbers 2053 // the HI0 & LO0 registers. The TableGen definition of this instruction can 2054 // mark these registers only as implicitly defined. As a result, the 2055 // register allocator runs out of registers when this instruction is 2056 // followed by another instruction that defines the same registers too. 2057 // We can fix this by explicitly marking those registers as dead. 2058 if (MachineInstOpcode == Mips::MUL) { 2059 unsigned ResultReg = createResultReg(RC); 2060 const MCInstrDesc &II = TII.get(MachineInstOpcode); 2061 Op0 = constrainOperandRegClass(II, Op0, II.getNumDefs()); 2062 Op1 = constrainOperandRegClass(II, Op1, II.getNumDefs() + 1); 2063 BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DbgLoc, II, ResultReg) 2064 .addReg(Op0, getKillRegState(Op0IsKill)) 2065 .addReg(Op1, getKillRegState(Op1IsKill)) 2066 .addReg(Mips::HI0, RegState::ImplicitDefine | RegState::Dead) 2067 .addReg(Mips::LO0, RegState::ImplicitDefine | RegState::Dead); 2068 return ResultReg; 2069 } 2070 2071 return FastISel::fastEmitInst_rr(MachineInstOpcode, RC, Op0, Op0IsKill, Op1, 2072 Op1IsKill); 2073 } 2074 2075 namespace llvm { 2076 FastISel *Mips::createFastISel(FunctionLoweringInfo &funcInfo, 2077 const TargetLibraryInfo *libInfo) { 2078 return new MipsFastISel(funcInfo, libInfo); 2079 } 2080 } 2081