//===- BasicTargetTransformInfo.cpp - Basic target-independent TTI impl ---===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
/// \file
/// This file provides the implementation of a basic TargetTransformInfo pass
/// predicated on the target abstractions present in the target independent
/// code generator. It uses these (primarily TargetLowering) to model as much
/// of the TTI query interface as possible. It is included by most targets so
/// that they can specialize only a small subset of the query space.
15664e354dSChandler Carruth /// 16664e354dSChandler Carruth //===----------------------------------------------------------------------===// 17664e354dSChandler Carruth 18664e354dSChandler Carruth #include "llvm/CodeGen/Passes.h" 19d3e73556SChandler Carruth #include "llvm/Analysis/TargetTransformInfo.h" 20664e354dSChandler Carruth #include "llvm/Target/TargetLowering.h" 21664e354dSChandler Carruth #include <utility> 22664e354dSChandler Carruth using namespace llvm; 23664e354dSChandler Carruth 241b9dde08SChandler Carruth #define DEBUG_TYPE "basictti" 251b9dde08SChandler Carruth 26664e354dSChandler Carruth namespace { 27664e354dSChandler Carruth 2877dfe45fSCraig Topper class BasicTTI final : public ImmutablePass, public TargetTransformInfo { 29afc1036fSBill Wendling const TargetMachine *TM; 30664e354dSChandler Carruth 31664e354dSChandler Carruth /// Estimate the overhead of scalarizing an instruction. Insert and Extract 32664e354dSChandler Carruth /// are set if the result needs to be inserted and/or extracted from vectors. 
33664e354dSChandler Carruth unsigned getScalarizationOverhead(Type *Ty, bool Insert, bool Extract) const; 34664e354dSChandler Carruth 35afc1036fSBill Wendling const TargetLoweringBase *getTLI() const { return TM->getTargetLowering(); } 36afc1036fSBill Wendling 37664e354dSChandler Carruth public: 38c0196b1bSCraig Topper BasicTTI() : ImmutablePass(ID), TM(nullptr) { 39664e354dSChandler Carruth llvm_unreachable("This pass cannot be directly constructed"); 40664e354dSChandler Carruth } 41664e354dSChandler Carruth 42afc1036fSBill Wendling BasicTTI(const TargetMachine *TM) : ImmutablePass(ID), TM(TM) { 43664e354dSChandler Carruth initializeBasicTTIPass(*PassRegistry::getPassRegistry()); 44664e354dSChandler Carruth } 45664e354dSChandler Carruth 4624e685fdSCraig Topper void initializePass() override { 47664e354dSChandler Carruth pushTTIStack(this); 48664e354dSChandler Carruth } 49664e354dSChandler Carruth 5024e685fdSCraig Topper void getAnalysisUsage(AnalysisUsage &AU) const override { 51664e354dSChandler Carruth TargetTransformInfo::getAnalysisUsage(AU); 52664e354dSChandler Carruth } 53664e354dSChandler Carruth 54664e354dSChandler Carruth /// Pass identification. 55664e354dSChandler Carruth static char ID; 56664e354dSChandler Carruth 57664e354dSChandler Carruth /// Provide necessary pointer adjustments for the two base classes. 
5824e685fdSCraig Topper void *getAdjustedAnalysisPointer(const void *ID) override { 59664e354dSChandler Carruth if (ID == &TargetTransformInfo::ID) 60664e354dSChandler Carruth return (TargetTransformInfo*)this; 61664e354dSChandler Carruth return this; 62664e354dSChandler Carruth } 63664e354dSChandler Carruth 6424e685fdSCraig Topper bool hasBranchDivergence() const override; 658b1e021eSTom Stellard 66664e354dSChandler Carruth /// \name Scalar TTI Implementations 67664e354dSChandler Carruth /// @{ 68664e354dSChandler Carruth 6924e685fdSCraig Topper bool isLegalAddImmediate(int64_t imm) const override; 7024e685fdSCraig Topper bool isLegalICmpImmediate(int64_t imm) const override; 7124e685fdSCraig Topper bool isLegalAddressingMode(Type *Ty, GlobalValue *BaseGV, 72664e354dSChandler Carruth int64_t BaseOffset, bool HasBaseReg, 7373156025SCraig Topper int64_t Scale) const override; 7424e685fdSCraig Topper int getScalingFactorCost(Type *Ty, GlobalValue *BaseGV, 75bf490d4aSQuentin Colombet int64_t BaseOffset, bool HasBaseReg, 7673156025SCraig Topper int64_t Scale) const override; 7724e685fdSCraig Topper bool isTruncateFree(Type *Ty1, Type *Ty2) const override; 7824e685fdSCraig Topper bool isTypeLegal(Type *Ty) const override; 7924e685fdSCraig Topper unsigned getJumpBufAlignment() const override; 8024e685fdSCraig Topper unsigned getJumpBufSize() const override; 8124e685fdSCraig Topper bool shouldBuildLookupTables() const override; 8224e685fdSCraig Topper bool haveFastSqrt(Type *Ty) const override; 8324e685fdSCraig Topper void getUnrollingPreferences(Loop *L, 8424e685fdSCraig Topper UnrollingPreferences &UP) const override; 85664e354dSChandler Carruth 86664e354dSChandler Carruth /// @} 87664e354dSChandler Carruth 88664e354dSChandler Carruth /// \name Vector TTI Implementations 89664e354dSChandler Carruth /// @{ 90664e354dSChandler Carruth 9124e685fdSCraig Topper unsigned getNumberOfRegisters(bool Vector) const override; 9224e685fdSCraig Topper unsigned 
getMaximumUnrollFactor() const override; 9324e685fdSCraig Topper unsigned getRegisterBitWidth(bool Vector) const override; 9424e685fdSCraig Topper unsigned getArithmeticInstrCost(unsigned Opcode, Type *Ty, OperandValueKind, 9573156025SCraig Topper OperandValueKind) const override; 9624e685fdSCraig Topper unsigned getShuffleCost(ShuffleKind Kind, Type *Tp, 9773156025SCraig Topper int Index, Type *SubTp) const override; 9824e685fdSCraig Topper unsigned getCastInstrCost(unsigned Opcode, Type *Dst, 9973156025SCraig Topper Type *Src) const override; 10024e685fdSCraig Topper unsigned getCFInstrCost(unsigned Opcode) const override; 10124e685fdSCraig Topper unsigned getCmpSelInstrCost(unsigned Opcode, Type *ValTy, 10273156025SCraig Topper Type *CondTy) const override; 10324e685fdSCraig Topper unsigned getVectorInstrCost(unsigned Opcode, Type *Val, 10473156025SCraig Topper unsigned Index) const override; 10524e685fdSCraig Topper unsigned getMemoryOpCost(unsigned Opcode, Type *Src, unsigned Alignment, 10673156025SCraig Topper unsigned AddressSpace) const override; 10724e685fdSCraig Topper unsigned getIntrinsicInstrCost(Intrinsic::ID, Type *RetTy, 10824e685fdSCraig Topper ArrayRef<Type*> Tys) const override; 10924e685fdSCraig Topper unsigned getNumberOfParts(Type *Tp) const override; 11024e685fdSCraig Topper unsigned getAddressComputationCost( Type *Ty, bool IsComplex) const override; 11124e685fdSCraig Topper unsigned getReductionCost(unsigned Opcode, Type *Ty, 11273156025SCraig Topper bool IsPairwise) const override; 113664e354dSChandler Carruth 114664e354dSChandler Carruth /// @} 115664e354dSChandler Carruth }; 116664e354dSChandler Carruth 117664e354dSChandler Carruth } 118664e354dSChandler Carruth 119664e354dSChandler Carruth INITIALIZE_AG_PASS(BasicTTI, TargetTransformInfo, "basictti", 120664e354dSChandler Carruth "Target independent code generator's TTI", true, true, false) 121664e354dSChandler Carruth char BasicTTI::ID = 0; 122664e354dSChandler Carruth 
123664e354dSChandler Carruth ImmutablePass * 124afc1036fSBill Wendling llvm::createBasicTargetTransformInfoPass(const TargetMachine *TM) { 125afc1036fSBill Wendling return new BasicTTI(TM); 126664e354dSChandler Carruth } 127664e354dSChandler Carruth 1288b1e021eSTom Stellard bool BasicTTI::hasBranchDivergence() const { return false; } 129664e354dSChandler Carruth 130664e354dSChandler Carruth bool BasicTTI::isLegalAddImmediate(int64_t imm) const { 131afc1036fSBill Wendling return getTLI()->isLegalAddImmediate(imm); 132664e354dSChandler Carruth } 133664e354dSChandler Carruth 134664e354dSChandler Carruth bool BasicTTI::isLegalICmpImmediate(int64_t imm) const { 135afc1036fSBill Wendling return getTLI()->isLegalICmpImmediate(imm); 136664e354dSChandler Carruth } 137664e354dSChandler Carruth 138664e354dSChandler Carruth bool BasicTTI::isLegalAddressingMode(Type *Ty, GlobalValue *BaseGV, 139664e354dSChandler Carruth int64_t BaseOffset, bool HasBaseReg, 140664e354dSChandler Carruth int64_t Scale) const { 14156b31bd9SBenjamin Kramer TargetLoweringBase::AddrMode AM; 142664e354dSChandler Carruth AM.BaseGV = BaseGV; 143664e354dSChandler Carruth AM.BaseOffs = BaseOffset; 144664e354dSChandler Carruth AM.HasBaseReg = HasBaseReg; 145664e354dSChandler Carruth AM.Scale = Scale; 146afc1036fSBill Wendling return getTLI()->isLegalAddressingMode(AM, Ty); 147664e354dSChandler Carruth } 148664e354dSChandler Carruth 149bf490d4aSQuentin Colombet int BasicTTI::getScalingFactorCost(Type *Ty, GlobalValue *BaseGV, 150bf490d4aSQuentin Colombet int64_t BaseOffset, bool HasBaseReg, 151bf490d4aSQuentin Colombet int64_t Scale) const { 152bf490d4aSQuentin Colombet TargetLoweringBase::AddrMode AM; 153bf490d4aSQuentin Colombet AM.BaseGV = BaseGV; 154bf490d4aSQuentin Colombet AM.BaseOffs = BaseOffset; 155bf490d4aSQuentin Colombet AM.HasBaseReg = HasBaseReg; 156bf490d4aSQuentin Colombet AM.Scale = Scale; 157afc1036fSBill Wendling return getTLI()->getScalingFactorCost(AM, Ty); 158bf490d4aSQuentin Colombet } 
159bf490d4aSQuentin Colombet 160664e354dSChandler Carruth bool BasicTTI::isTruncateFree(Type *Ty1, Type *Ty2) const { 161afc1036fSBill Wendling return getTLI()->isTruncateFree(Ty1, Ty2); 162664e354dSChandler Carruth } 163664e354dSChandler Carruth 164664e354dSChandler Carruth bool BasicTTI::isTypeLegal(Type *Ty) const { 165afc1036fSBill Wendling EVT T = getTLI()->getValueType(Ty); 166afc1036fSBill Wendling return getTLI()->isTypeLegal(T); 167664e354dSChandler Carruth } 168664e354dSChandler Carruth 169664e354dSChandler Carruth unsigned BasicTTI::getJumpBufAlignment() const { 170afc1036fSBill Wendling return getTLI()->getJumpBufAlignment(); 171664e354dSChandler Carruth } 172664e354dSChandler Carruth 173664e354dSChandler Carruth unsigned BasicTTI::getJumpBufSize() const { 174afc1036fSBill Wendling return getTLI()->getJumpBufSize(); 175664e354dSChandler Carruth } 176664e354dSChandler Carruth 177664e354dSChandler Carruth bool BasicTTI::shouldBuildLookupTables() const { 178afc1036fSBill Wendling const TargetLoweringBase *TLI = getTLI(); 179664e354dSChandler Carruth return TLI->supportJumpTables() && 180664e354dSChandler Carruth (TLI->isOperationLegalOrCustom(ISD::BR_JT, MVT::Other) || 181664e354dSChandler Carruth TLI->isOperationLegalOrCustom(ISD::BRIND, MVT::Other)); 182664e354dSChandler Carruth } 183664e354dSChandler Carruth 18437cd6cfbSRichard Sandiford bool BasicTTI::haveFastSqrt(Type *Ty) const { 18537cd6cfbSRichard Sandiford const TargetLoweringBase *TLI = getTLI(); 18637cd6cfbSRichard Sandiford EVT VT = TLI->getValueType(Ty); 18737cd6cfbSRichard Sandiford return TLI->isTypeLegal(VT) && TLI->isOperationLegalOrCustom(ISD::FSQRT, VT); 18837cd6cfbSRichard Sandiford } 18937cd6cfbSRichard Sandiford 1908f2e7005SHal Finkel void BasicTTI::getUnrollingPreferences(Loop *, UnrollingPreferences &) const { } 1918f2e7005SHal Finkel 192664e354dSChandler Carruth //===----------------------------------------------------------------------===// 193664e354dSChandler Carruth // 
194664e354dSChandler Carruth // Calls used by the vectorizers. 195664e354dSChandler Carruth // 196664e354dSChandler Carruth //===----------------------------------------------------------------------===// 197664e354dSChandler Carruth 198664e354dSChandler Carruth unsigned BasicTTI::getScalarizationOverhead(Type *Ty, bool Insert, 199664e354dSChandler Carruth bool Extract) const { 200664e354dSChandler Carruth assert (Ty->isVectorTy() && "Can only scalarize vectors"); 201664e354dSChandler Carruth unsigned Cost = 0; 202664e354dSChandler Carruth 203664e354dSChandler Carruth for (int i = 0, e = Ty->getVectorNumElements(); i < e; ++i) { 204664e354dSChandler Carruth if (Insert) 205664e354dSChandler Carruth Cost += TopTTI->getVectorInstrCost(Instruction::InsertElement, Ty, i); 206664e354dSChandler Carruth if (Extract) 207664e354dSChandler Carruth Cost += TopTTI->getVectorInstrCost(Instruction::ExtractElement, Ty, i); 208664e354dSChandler Carruth } 209664e354dSChandler Carruth 210664e354dSChandler Carruth return Cost; 211664e354dSChandler Carruth } 212664e354dSChandler Carruth 213664e354dSChandler Carruth unsigned BasicTTI::getNumberOfRegisters(bool Vector) const { 214664e354dSChandler Carruth return 1; 215664e354dSChandler Carruth } 216664e354dSChandler Carruth 217b1791a75SNadav Rotem unsigned BasicTTI::getRegisterBitWidth(bool Vector) const { 218b1791a75SNadav Rotem return 32; 219b1791a75SNadav Rotem } 220b1791a75SNadav Rotem 221b696c36fSNadav Rotem unsigned BasicTTI::getMaximumUnrollFactor() const { 222b696c36fSNadav Rotem return 1; 223b696c36fSNadav Rotem } 224b696c36fSNadav Rotem 225b9773871SArnold Schwaighofer unsigned BasicTTI::getArithmeticInstrCost(unsigned Opcode, Type *Ty, 226b9773871SArnold Schwaighofer OperandValueKind, 227b9773871SArnold Schwaighofer OperandValueKind) const { 228664e354dSChandler Carruth // Check if any of the operands are vector operands. 
229afc1036fSBill Wendling const TargetLoweringBase *TLI = getTLI(); 230664e354dSChandler Carruth int ISD = TLI->InstructionOpcodeToISD(Opcode); 231664e354dSChandler Carruth assert(ISD && "Invalid opcode"); 232664e354dSChandler Carruth 233664e354dSChandler Carruth std::pair<unsigned, MVT> LT = TLI->getTypeLegalizationCost(Ty); 234664e354dSChandler Carruth 23587a0af6eSNadav Rotem bool IsFloat = Ty->getScalarType()->isFloatingPointTy(); 2360db0690aSNadav Rotem // Assume that floating point arithmetic operations cost twice as much as 2370db0690aSNadav Rotem // integer operations. 23887a0af6eSNadav Rotem unsigned OpCost = (IsFloat ? 2 : 1); 23987a0af6eSNadav Rotem 240664e354dSChandler Carruth if (TLI->isOperationLegalOrPromote(ISD, LT.second)) { 241664e354dSChandler Carruth // The operation is legal. Assume it costs 1. 2420db0690aSNadav Rotem // If the type is split to multiple registers, assume that there is some 243664e354dSChandler Carruth // overhead to this. 244664e354dSChandler Carruth // TODO: Once we have extract/insert subvector cost we need to use them. 245664e354dSChandler Carruth if (LT.first > 1) 24687a0af6eSNadav Rotem return LT.first * 2 * OpCost; 24787a0af6eSNadav Rotem return LT.first * 1 * OpCost; 248664e354dSChandler Carruth } 249664e354dSChandler Carruth 250664e354dSChandler Carruth if (!TLI->isOperationExpand(ISD, LT.second)) { 251664e354dSChandler Carruth // If the operation is custom lowered then assume 252664e354dSChandler Carruth // thare the code is twice as expensive. 25387a0af6eSNadav Rotem return LT.first * 2 * OpCost; 254664e354dSChandler Carruth } 255664e354dSChandler Carruth 256664e354dSChandler Carruth // Else, assume that we need to scalarize this op. 
257664e354dSChandler Carruth if (Ty->isVectorTy()) { 258664e354dSChandler Carruth unsigned Num = Ty->getVectorNumElements(); 259664e354dSChandler Carruth unsigned Cost = TopTTI->getArithmeticInstrCost(Opcode, Ty->getScalarType()); 260664e354dSChandler Carruth // return the cost of multiple scalar invocation plus the cost of inserting 261664e354dSChandler Carruth // and extracting the values. 262664e354dSChandler Carruth return getScalarizationOverhead(Ty, true, true) + Num * Cost; 263664e354dSChandler Carruth } 264664e354dSChandler Carruth 265664e354dSChandler Carruth // We don't know anything about this scalar instruction. 26687a0af6eSNadav Rotem return OpCost; 267664e354dSChandler Carruth } 268664e354dSChandler Carruth 269664e354dSChandler Carruth unsigned BasicTTI::getShuffleCost(ShuffleKind Kind, Type *Tp, int Index, 270664e354dSChandler Carruth Type *SubTp) const { 271664e354dSChandler Carruth return 1; 272664e354dSChandler Carruth } 273664e354dSChandler Carruth 274664e354dSChandler Carruth unsigned BasicTTI::getCastInstrCost(unsigned Opcode, Type *Dst, 275664e354dSChandler Carruth Type *Src) const { 276afc1036fSBill Wendling const TargetLoweringBase *TLI = getTLI(); 277664e354dSChandler Carruth int ISD = TLI->InstructionOpcodeToISD(Opcode); 278664e354dSChandler Carruth assert(ISD && "Invalid opcode"); 279664e354dSChandler Carruth 280664e354dSChandler Carruth std::pair<unsigned, MVT> SrcLT = TLI->getTypeLegalizationCost(Src); 281664e354dSChandler Carruth std::pair<unsigned, MVT> DstLT = TLI->getTypeLegalizationCost(Dst); 282664e354dSChandler Carruth 283e55aa3c8SNadav Rotem // Check for NOOP conversions. 284e55aa3c8SNadav Rotem if (SrcLT.first == DstLT.first && 285e55aa3c8SNadav Rotem SrcLT.second.getSizeInBits() == DstLT.second.getSizeInBits()) { 286664e354dSChandler Carruth 287e55aa3c8SNadav Rotem // Bitcast between types that are legalized to the same type are free. 
288e55aa3c8SNadav Rotem if (Opcode == Instruction::BitCast || Opcode == Instruction::Trunc) 289664e354dSChandler Carruth return 0; 290e55aa3c8SNadav Rotem } 291664e354dSChandler Carruth 292664e354dSChandler Carruth if (Opcode == Instruction::Trunc && 293664e354dSChandler Carruth TLI->isTruncateFree(SrcLT.second, DstLT.second)) 294664e354dSChandler Carruth return 0; 295664e354dSChandler Carruth 296664e354dSChandler Carruth if (Opcode == Instruction::ZExt && 297664e354dSChandler Carruth TLI->isZExtFree(SrcLT.second, DstLT.second)) 298664e354dSChandler Carruth return 0; 299664e354dSChandler Carruth 300e55aa3c8SNadav Rotem // If the cast is marked as legal (or promote) then assume low cost. 30155312debSHal Finkel if (SrcLT.first == DstLT.first && 30255312debSHal Finkel TLI->isOperationLegalOrPromote(ISD, DstLT.second)) 303e55aa3c8SNadav Rotem return 1; 304e55aa3c8SNadav Rotem 305e55aa3c8SNadav Rotem // Handle scalar conversions. 306e55aa3c8SNadav Rotem if (!Src->isVectorTy() && !Dst->isVectorTy()) { 307e55aa3c8SNadav Rotem 308e55aa3c8SNadav Rotem // Scalar bitcasts are usually free. 309e55aa3c8SNadav Rotem if (Opcode == Instruction::BitCast) 310e55aa3c8SNadav Rotem return 0; 311e55aa3c8SNadav Rotem 312664e354dSChandler Carruth // Just check the op cost. If the operation is legal then assume it costs 1. 313664e354dSChandler Carruth if (!TLI->isOperationExpand(ISD, DstLT.second)) 314664e354dSChandler Carruth return 1; 315664e354dSChandler Carruth 316664e354dSChandler Carruth // Assume that illegal scalar instruction are expensive. 317664e354dSChandler Carruth return 4; 318664e354dSChandler Carruth } 319664e354dSChandler Carruth 320664e354dSChandler Carruth // Check vector-to-vector casts. 321664e354dSChandler Carruth if (Dst->isVectorTy() && Src->isVectorTy()) { 322664e354dSChandler Carruth 323664e354dSChandler Carruth // If the cast is between same-sized registers, then the check is simple. 
324664e354dSChandler Carruth if (SrcLT.first == DstLT.first && 325664e354dSChandler Carruth SrcLT.second.getSizeInBits() == DstLT.second.getSizeInBits()) { 326664e354dSChandler Carruth 327664e354dSChandler Carruth // Assume that Zext is done using AND. 328664e354dSChandler Carruth if (Opcode == Instruction::ZExt) 329664e354dSChandler Carruth return 1; 330664e354dSChandler Carruth 331664e354dSChandler Carruth // Assume that sext is done using SHL and SRA. 332664e354dSChandler Carruth if (Opcode == Instruction::SExt) 333664e354dSChandler Carruth return 2; 334664e354dSChandler Carruth 335664e354dSChandler Carruth // Just check the op cost. If the operation is legal then assume it costs 336664e354dSChandler Carruth // 1 and multiply by the type-legalization overhead. 337664e354dSChandler Carruth if (!TLI->isOperationExpand(ISD, DstLT.second)) 338664e354dSChandler Carruth return SrcLT.first * 1; 339664e354dSChandler Carruth } 340664e354dSChandler Carruth 341664e354dSChandler Carruth // If we are converting vectors and the operation is illegal, or 342664e354dSChandler Carruth // if the vectors are legalized to different types, estimate the 343664e354dSChandler Carruth // scalarization costs. 344664e354dSChandler Carruth unsigned Num = Dst->getVectorNumElements(); 345664e354dSChandler Carruth unsigned Cost = TopTTI->getCastInstrCost(Opcode, Dst->getScalarType(), 346664e354dSChandler Carruth Src->getScalarType()); 347664e354dSChandler Carruth 348664e354dSChandler Carruth // Return the cost of multiple scalar invocation plus the cost of 349664e354dSChandler Carruth // inserting and extracting the values. 350664e354dSChandler Carruth return getScalarizationOverhead(Dst, true, true) + Num * Cost; 351664e354dSChandler Carruth } 352664e354dSChandler Carruth 353664e354dSChandler Carruth // We already handled vector-to-vector and scalar-to-scalar conversions. This 354664e354dSChandler Carruth // is where we handle bitcast between vectors and scalars. 
We need to assume 355664e354dSChandler Carruth // that the conversion is scalarized in one way or another. 356664e354dSChandler Carruth if (Opcode == Instruction::BitCast) 357664e354dSChandler Carruth // Illegal bitcasts are done by storing and loading from a stack slot. 358664e354dSChandler Carruth return (Src->isVectorTy()? getScalarizationOverhead(Src, false, true):0) + 359664e354dSChandler Carruth (Dst->isVectorTy()? getScalarizationOverhead(Dst, true, false):0); 360664e354dSChandler Carruth 361664e354dSChandler Carruth llvm_unreachable("Unhandled cast"); 362664e354dSChandler Carruth } 363664e354dSChandler Carruth 364664e354dSChandler Carruth unsigned BasicTTI::getCFInstrCost(unsigned Opcode) const { 365664e354dSChandler Carruth // Branches are assumed to be predicted. 366664e354dSChandler Carruth return 0; 367664e354dSChandler Carruth } 368664e354dSChandler Carruth 369664e354dSChandler Carruth unsigned BasicTTI::getCmpSelInstrCost(unsigned Opcode, Type *ValTy, 370664e354dSChandler Carruth Type *CondTy) const { 371afc1036fSBill Wendling const TargetLoweringBase *TLI = getTLI(); 372664e354dSChandler Carruth int ISD = TLI->InstructionOpcodeToISD(Opcode); 373664e354dSChandler Carruth assert(ISD && "Invalid opcode"); 374664e354dSChandler Carruth 375664e354dSChandler Carruth // Selects on vectors are actually vector selects. 376664e354dSChandler Carruth if (ISD == ISD::SELECT) { 377664e354dSChandler Carruth assert(CondTy && "CondTy must exist"); 378664e354dSChandler Carruth if (CondTy->isVectorTy()) 379664e354dSChandler Carruth ISD = ISD::VSELECT; 380664e354dSChandler Carruth } 381664e354dSChandler Carruth 382664e354dSChandler Carruth std::pair<unsigned, MVT> LT = TLI->getTypeLegalizationCost(ValTy); 383664e354dSChandler Carruth 384664e354dSChandler Carruth if (!TLI->isOperationExpand(ISD, LT.second)) { 385664e354dSChandler Carruth // The operation is legal. Assume it costs 1. Multiply 386664e354dSChandler Carruth // by the type-legalization overhead. 
387664e354dSChandler Carruth return LT.first * 1; 388664e354dSChandler Carruth } 389664e354dSChandler Carruth 390664e354dSChandler Carruth // Otherwise, assume that the cast is scalarized. 391664e354dSChandler Carruth if (ValTy->isVectorTy()) { 392664e354dSChandler Carruth unsigned Num = ValTy->getVectorNumElements(); 393664e354dSChandler Carruth if (CondTy) 394664e354dSChandler Carruth CondTy = CondTy->getScalarType(); 395664e354dSChandler Carruth unsigned Cost = TopTTI->getCmpSelInstrCost(Opcode, ValTy->getScalarType(), 396664e354dSChandler Carruth CondTy); 397664e354dSChandler Carruth 398664e354dSChandler Carruth // Return the cost of multiple scalar invocation plus the cost of inserting 399664e354dSChandler Carruth // and extracting the values. 400664e354dSChandler Carruth return getScalarizationOverhead(ValTy, true, false) + Num * Cost; 401664e354dSChandler Carruth } 402664e354dSChandler Carruth 403664e354dSChandler Carruth // Unknown scalar opcode. 404664e354dSChandler Carruth return 1; 405664e354dSChandler Carruth } 406664e354dSChandler Carruth 407664e354dSChandler Carruth unsigned BasicTTI::getVectorInstrCost(unsigned Opcode, Type *Val, 408664e354dSChandler Carruth unsigned Index) const { 409ce376c0fSRaul E. Silvera std::pair<unsigned, MVT> LT = getTLI()->getTypeLegalizationCost(Val->getScalarType()); 410ce376c0fSRaul E. Silvera 411ce376c0fSRaul E. Silvera return LT.first; 412664e354dSChandler Carruth } 413664e354dSChandler Carruth 414664e354dSChandler Carruth unsigned BasicTTI::getMemoryOpCost(unsigned Opcode, Type *Src, 415664e354dSChandler Carruth unsigned Alignment, 416664e354dSChandler Carruth unsigned AddressSpace) const { 417664e354dSChandler Carruth assert(!Src->isVoidTy() && "Invalid type"); 418afc1036fSBill Wendling std::pair<unsigned, MVT> LT = getTLI()->getTypeLegalizationCost(Src); 419664e354dSChandler Carruth 4206fd19ab3SHal Finkel // Assuming that all loads of legal types cost 1. 
4216fd19ab3SHal Finkel unsigned Cost = LT.first; 4226fd19ab3SHal Finkel 4236fd19ab3SHal Finkel if (Src->isVectorTy() && 4246fd19ab3SHal Finkel Src->getPrimitiveSizeInBits() < LT.second.getSizeInBits()) { 4256fd19ab3SHal Finkel // This is a vector load that legalizes to a larger type than the vector 4266fd19ab3SHal Finkel // itself. Unless the corresponding extending load or truncating store is 4276fd19ab3SHal Finkel // legal, then this will scalarize. 42856bf297eSHal Finkel TargetLowering::LegalizeAction LA = TargetLowering::Expand; 42956bf297eSHal Finkel EVT MemVT = getTLI()->getValueType(Src, true); 43056bf297eSHal Finkel if (MemVT.isSimple() && MemVT != MVT::Other) { 4316fd19ab3SHal Finkel if (Opcode == Instruction::Store) 43256bf297eSHal Finkel LA = getTLI()->getTruncStoreAction(LT.second, MemVT.getSimpleVT()); 4336fd19ab3SHal Finkel else 43456bf297eSHal Finkel LA = getTLI()->getLoadExtAction(ISD::EXTLOAD, MemVT.getSimpleVT()); 43556bf297eSHal Finkel } 4366fd19ab3SHal Finkel 4376fd19ab3SHal Finkel if (LA != TargetLowering::Legal && LA != TargetLowering::Custom) { 4386fd19ab3SHal Finkel // This is a vector load/store for some illegal type that is scalarized. 4396fd19ab3SHal Finkel // We must account for the cost of building or decomposing the vector. 4406fd19ab3SHal Finkel Cost += getScalarizationOverhead(Src, Opcode != Instruction::Store, 4416fd19ab3SHal Finkel Opcode == Instruction::Store); 4426fd19ab3SHal Finkel } 4436fd19ab3SHal Finkel } 4446fd19ab3SHal Finkel 4456fd19ab3SHal Finkel return Cost; 446664e354dSChandler Carruth } 447664e354dSChandler Carruth 448f7cfac7aSBenjamin Kramer unsigned BasicTTI::getIntrinsicInstrCost(Intrinsic::ID IID, Type *RetTy, 449664e354dSChandler Carruth ArrayRef<Type *> Tys) const { 450f7cfac7aSBenjamin Kramer unsigned ISD = 0; 451f7cfac7aSBenjamin Kramer switch (IID) { 452f7cfac7aSBenjamin Kramer default: { 453f7cfac7aSBenjamin Kramer // Assume that we need to scalarize this intrinsic. 
454664e354dSChandler Carruth unsigned ScalarizationCost = 0; 455664e354dSChandler Carruth unsigned ScalarCalls = 1; 456664e354dSChandler Carruth if (RetTy->isVectorTy()) { 457664e354dSChandler Carruth ScalarizationCost = getScalarizationOverhead(RetTy, true, false); 458664e354dSChandler Carruth ScalarCalls = std::max(ScalarCalls, RetTy->getVectorNumElements()); 459664e354dSChandler Carruth } 460664e354dSChandler Carruth for (unsigned i = 0, ie = Tys.size(); i != ie; ++i) { 461664e354dSChandler Carruth if (Tys[i]->isVectorTy()) { 462664e354dSChandler Carruth ScalarizationCost += getScalarizationOverhead(Tys[i], false, true); 463664e354dSChandler Carruth ScalarCalls = std::max(ScalarCalls, RetTy->getVectorNumElements()); 464664e354dSChandler Carruth } 465664e354dSChandler Carruth } 466f7cfac7aSBenjamin Kramer 467664e354dSChandler Carruth return ScalarCalls + ScalarizationCost; 468664e354dSChandler Carruth } 469f7cfac7aSBenjamin Kramer // Look for intrinsics that can be lowered directly or turned into a scalar 470f7cfac7aSBenjamin Kramer // intrinsic call. 
471f7cfac7aSBenjamin Kramer case Intrinsic::sqrt: ISD = ISD::FSQRT; break; 472f7cfac7aSBenjamin Kramer case Intrinsic::sin: ISD = ISD::FSIN; break; 473f7cfac7aSBenjamin Kramer case Intrinsic::cos: ISD = ISD::FCOS; break; 474f7cfac7aSBenjamin Kramer case Intrinsic::exp: ISD = ISD::FEXP; break; 475f7cfac7aSBenjamin Kramer case Intrinsic::exp2: ISD = ISD::FEXP2; break; 476f7cfac7aSBenjamin Kramer case Intrinsic::log: ISD = ISD::FLOG; break; 477f7cfac7aSBenjamin Kramer case Intrinsic::log10: ISD = ISD::FLOG10; break; 478f7cfac7aSBenjamin Kramer case Intrinsic::log2: ISD = ISD::FLOG2; break; 479f7cfac7aSBenjamin Kramer case Intrinsic::fabs: ISD = ISD::FABS; break; 4800c5c01aaSHal Finkel case Intrinsic::copysign: ISD = ISD::FCOPYSIGN; break; 481f7cfac7aSBenjamin Kramer case Intrinsic::floor: ISD = ISD::FFLOOR; break; 482f7cfac7aSBenjamin Kramer case Intrinsic::ceil: ISD = ISD::FCEIL; break; 483f7cfac7aSBenjamin Kramer case Intrinsic::trunc: ISD = ISD::FTRUNC; break; 484ec474f28SHal Finkel case Intrinsic::nearbyint: 485ec474f28SHal Finkel ISD = ISD::FNEARBYINT; break; 486f7cfac7aSBenjamin Kramer case Intrinsic::rint: ISD = ISD::FRINT; break; 487171817eeSHal Finkel case Intrinsic::round: ISD = ISD::FROUND; break; 488f7cfac7aSBenjamin Kramer case Intrinsic::pow: ISD = ISD::FPOW; break; 489f7cfac7aSBenjamin Kramer case Intrinsic::fma: ISD = ISD::FMA; break; 490*1625bfccSBenjamin Kramer case Intrinsic::fmuladd: ISD = ISD::FMA; break; 491a7cd6bf3SArnold Schwaighofer case Intrinsic::lifetime_start: 492a7cd6bf3SArnold Schwaighofer case Intrinsic::lifetime_end: 493a7cd6bf3SArnold Schwaighofer return 0; 494f7cfac7aSBenjamin Kramer } 495f7cfac7aSBenjamin Kramer 496afc1036fSBill Wendling const TargetLoweringBase *TLI = getTLI(); 497f7cfac7aSBenjamin Kramer std::pair<unsigned, MVT> LT = TLI->getTypeLegalizationCost(RetTy); 498f7cfac7aSBenjamin Kramer 499f7cfac7aSBenjamin Kramer if (TLI->isOperationLegalOrPromote(ISD, LT.second)) { 500f7cfac7aSBenjamin Kramer // The operation is 
legal. Assume it costs 1. 501f7cfac7aSBenjamin Kramer // If the type is split to multiple registers, assume that thre is some 502f7cfac7aSBenjamin Kramer // overhead to this. 503f7cfac7aSBenjamin Kramer // TODO: Once we have extract/insert subvector cost we need to use them. 504f7cfac7aSBenjamin Kramer if (LT.first > 1) 505f7cfac7aSBenjamin Kramer return LT.first * 2; 506f7cfac7aSBenjamin Kramer return LT.first * 1; 507f7cfac7aSBenjamin Kramer } 508f7cfac7aSBenjamin Kramer 509f7cfac7aSBenjamin Kramer if (!TLI->isOperationExpand(ISD, LT.second)) { 510f7cfac7aSBenjamin Kramer // If the operation is custom lowered then assume 511f7cfac7aSBenjamin Kramer // thare the code is twice as expensive. 512f7cfac7aSBenjamin Kramer return LT.first * 2; 513f7cfac7aSBenjamin Kramer } 514f7cfac7aSBenjamin Kramer 515*1625bfccSBenjamin Kramer // If we can't lower fmuladd into an FMA estimate the cost as a floating 516*1625bfccSBenjamin Kramer // point mul followed by an add. 517*1625bfccSBenjamin Kramer if (IID == Intrinsic::fmuladd) 518*1625bfccSBenjamin Kramer return TopTTI->getArithmeticInstrCost(BinaryOperator::FMul, RetTy) + 519*1625bfccSBenjamin Kramer TopTTI->getArithmeticInstrCost(BinaryOperator::FAdd, RetTy); 520*1625bfccSBenjamin Kramer 521f7cfac7aSBenjamin Kramer // Else, assume that we need to scalarize this intrinsic. For math builtins 522f7cfac7aSBenjamin Kramer // this will emit a costly libcall, adding call overhead and spills. Make it 523f7cfac7aSBenjamin Kramer // very expensive. 524f7cfac7aSBenjamin Kramer if (RetTy->isVectorTy()) { 525f7cfac7aSBenjamin Kramer unsigned Num = RetTy->getVectorNumElements(); 526f7cfac7aSBenjamin Kramer unsigned Cost = TopTTI->getIntrinsicInstrCost(IID, RetTy->getScalarType(), 527f7cfac7aSBenjamin Kramer Tys); 528f7cfac7aSBenjamin Kramer return 10 * Cost * Num; 529f7cfac7aSBenjamin Kramer } 530f7cfac7aSBenjamin Kramer 531f7cfac7aSBenjamin Kramer // This is going to be turned into a library call, make it expensive. 
532f7cfac7aSBenjamin Kramer return 10; 533f7cfac7aSBenjamin Kramer } 534664e354dSChandler Carruth 535664e354dSChandler Carruth unsigned BasicTTI::getNumberOfParts(Type *Tp) const { 536afc1036fSBill Wendling std::pair<unsigned, MVT> LT = getTLI()->getTypeLegalizationCost(Tp); 537664e354dSChandler Carruth return LT.first; 538664e354dSChandler Carruth } 539594fa2dcSArnold Schwaighofer 5409da9a43aSArnold Schwaighofer unsigned BasicTTI::getAddressComputationCost(Type *Ty, bool IsComplex) const { 541594fa2dcSArnold Schwaighofer return 0; 542594fa2dcSArnold Schwaighofer } 543cae8735aSArnold Schwaighofer 544cae8735aSArnold Schwaighofer unsigned BasicTTI::getReductionCost(unsigned Opcode, Type *Ty, 545cae8735aSArnold Schwaighofer bool IsPairwise) const { 546cae8735aSArnold Schwaighofer assert(Ty->isVectorTy() && "Expect a vector type"); 547cae8735aSArnold Schwaighofer unsigned NumVecElts = Ty->getVectorNumElements(); 548cae8735aSArnold Schwaighofer unsigned NumReduxLevels = Log2_32(NumVecElts); 549cae8735aSArnold Schwaighofer unsigned ArithCost = NumReduxLevels * 550cae8735aSArnold Schwaighofer TopTTI->getArithmeticInstrCost(Opcode, Ty); 551cae8735aSArnold Schwaighofer // Assume the pairwise shuffles add a cost. 552cae8735aSArnold Schwaighofer unsigned ShuffleCost = 553cae8735aSArnold Schwaighofer NumReduxLevels * (IsPairwise + 1) * 554cae8735aSArnold Schwaighofer TopTTI->getShuffleCost(SK_ExtractSubvector, Ty, NumVecElts / 2, Ty); 555cae8735aSArnold Schwaighofer return ShuffleCost + ArithCost + getScalarizationOverhead(Ty, false, true); 556cae8735aSArnold Schwaighofer } 557