14d6fb72aSErik Eckstein //===- FunctionComparator.h - Function Comparator -------------------------===// 24d6fb72aSErik Eckstein // 34d6fb72aSErik Eckstein // The LLVM Compiler Infrastructure 44d6fb72aSErik Eckstein // 54d6fb72aSErik Eckstein // This file is distributed under the University of Illinois Open Source 64d6fb72aSErik Eckstein // License. See LICENSE.TXT for details. 74d6fb72aSErik Eckstein // 84d6fb72aSErik Eckstein //===----------------------------------------------------------------------===// 94d6fb72aSErik Eckstein // 104d6fb72aSErik Eckstein // This file implements the FunctionComparator and GlobalNumberState classes 114d6fb72aSErik Eckstein // which are used by the MergeFunctions pass for comparing functions. 124d6fb72aSErik Eckstein // 134d6fb72aSErik Eckstein //===----------------------------------------------------------------------===// 144d6fb72aSErik Eckstein 154d6fb72aSErik Eckstein #include "llvm/Transforms/Utils/FunctionComparator.h" 164d6fb72aSErik Eckstein #include "llvm/ADT/SmallSet.h" 174d6fb72aSErik Eckstein #include "llvm/IR/CallSite.h" 184d6fb72aSErik Eckstein #include "llvm/IR/InlineAsm.h" 196bda14b3SChandler Carruth #include "llvm/IR/Instructions.h" 204d6fb72aSErik Eckstein #include "llvm/IR/Module.h" 214d6fb72aSErik Eckstein #include "llvm/Support/Debug.h" 224d6fb72aSErik Eckstein #include "llvm/Support/raw_ostream.h" 234d6fb72aSErik Eckstein 244d6fb72aSErik Eckstein using namespace llvm; 254d6fb72aSErik Eckstein 264d6fb72aSErik Eckstein #define DEBUG_TYPE "functioncomparator" 274d6fb72aSErik Eckstein 284d6fb72aSErik Eckstein int FunctionComparator::cmpNumbers(uint64_t L, uint64_t R) const { 294d6fb72aSErik Eckstein if (L < R) return -1; 304d6fb72aSErik Eckstein if (L > R) return 1; 314d6fb72aSErik Eckstein return 0; 324d6fb72aSErik Eckstein } 334d6fb72aSErik Eckstein 344d6fb72aSErik Eckstein int FunctionComparator::cmpOrderings(AtomicOrdering L, AtomicOrdering R) const { 354d6fb72aSErik Eckstein if ((int)L < (int)R) return -1; 364d6fb72aSErik Eckstein if ((int)L > (int)R) return 1; 374d6fb72aSErik Eckstein return 0; 384d6fb72aSErik Eckstein } 394d6fb72aSErik Eckstein 404d6fb72aSErik Eckstein int FunctionComparator::cmpAPInts(const APInt &L, const APInt &R) const { 414d6fb72aSErik Eckstein if (int Res = cmpNumbers(L.getBitWidth(), R.getBitWidth())) 424d6fb72aSErik Eckstein return Res; 434d6fb72aSErik Eckstein if (L.ugt(R)) return 1; 444d6fb72aSErik Eckstein if (R.ugt(L)) return -1; 454d6fb72aSErik Eckstein return 0; 464d6fb72aSErik Eckstein } 474d6fb72aSErik Eckstein 484d6fb72aSErik Eckstein int FunctionComparator::cmpAPFloats(const APFloat &L, const APFloat &R) const { 494d6fb72aSErik Eckstein // Floats are ordered first by semantics (i.e. float, double, half, etc.), 504d6fb72aSErik Eckstein // then by value interpreted as a bitstring (aka APInt). 514d6fb72aSErik Eckstein const fltSemantics &SL = L.getSemantics(), &SR = R.getSemantics(); 524d6fb72aSErik Eckstein if (int Res = cmpNumbers(APFloat::semanticsPrecision(SL), 534d6fb72aSErik Eckstein APFloat::semanticsPrecision(SR))) 544d6fb72aSErik Eckstein return Res; 554d6fb72aSErik Eckstein if (int Res = cmpNumbers(APFloat::semanticsMaxExponent(SL), 564d6fb72aSErik Eckstein APFloat::semanticsMaxExponent(SR))) 574d6fb72aSErik Eckstein return Res; 584d6fb72aSErik Eckstein if (int Res = cmpNumbers(APFloat::semanticsMinExponent(SL), 594d6fb72aSErik Eckstein APFloat::semanticsMinExponent(SR))) 604d6fb72aSErik Eckstein return Res; 614d6fb72aSErik Eckstein if (int Res = cmpNumbers(APFloat::semanticsSizeInBits(SL), 624d6fb72aSErik Eckstein APFloat::semanticsSizeInBits(SR))) 634d6fb72aSErik Eckstein return Res; 644d6fb72aSErik Eckstein return cmpAPInts(L.bitcastToAPInt(), R.bitcastToAPInt()); 654d6fb72aSErik Eckstein } 664d6fb72aSErik Eckstein 674d6fb72aSErik Eckstein int FunctionComparator::cmpMem(StringRef L, StringRef R) const { 684d6fb72aSErik Eckstein // Prevent heavy comparison, compare sizes first. 694d6fb72aSErik Eckstein if (int Res = cmpNumbers(L.size(), R.size())) 704d6fb72aSErik Eckstein return Res; 714d6fb72aSErik Eckstein 724d6fb72aSErik Eckstein // Compare strings lexicographically only when it is necessary: only when 734d6fb72aSErik Eckstein // strings are equal in size. 744d6fb72aSErik Eckstein return L.compare(R); 754d6fb72aSErik Eckstein } 764d6fb72aSErik Eckstein 77b518054bSReid Kleckner int FunctionComparator::cmpAttrs(const AttributeList L, 78b518054bSReid Kleckner const AttributeList R) const { 798bf67fe9SReid Kleckner if (int Res = cmpNumbers(L.getNumAttrSets(), R.getNumAttrSets())) 804d6fb72aSErik Eckstein return Res; 814d6fb72aSErik Eckstein 828bf67fe9SReid Kleckner for (unsigned i = L.index_begin(), e = L.index_end(); i != e; ++i) { 838bf67fe9SReid Kleckner AttributeSet LAS = L.getAttributes(i); 848bf67fe9SReid Kleckner AttributeSet RAS = R.getAttributes(i); 858bf67fe9SReid Kleckner AttributeSet::iterator LI = LAS.begin(), LE = LAS.end(); 868bf67fe9SReid Kleckner AttributeSet::iterator RI = RAS.begin(), RE = RAS.end(); 874d6fb72aSErik Eckstein for (; LI != LE && RI != RE; ++LI, ++RI) { 884d6fb72aSErik Eckstein Attribute LA = *LI; 894d6fb72aSErik Eckstein Attribute RA = *RI; 904d6fb72aSErik Eckstein if (LA < RA) 914d6fb72aSErik Eckstein return -1; 924d6fb72aSErik Eckstein if (RA < LA) 934d6fb72aSErik Eckstein return 1; 944d6fb72aSErik Eckstein } 954d6fb72aSErik Eckstein if (LI != LE) 964d6fb72aSErik Eckstein return 1; 974d6fb72aSErik Eckstein if (RI != RE) 984d6fb72aSErik Eckstein return -1; 994d6fb72aSErik Eckstein } 1004d6fb72aSErik Eckstein return 0; 1014d6fb72aSErik Eckstein } 1024d6fb72aSErik Eckstein 1034d6fb72aSErik Eckstein int FunctionComparator::cmpRangeMetadata(const MDNode *L, 1044d6fb72aSErik Eckstein const MDNode *R) const { 1054d6fb72aSErik Eckstein if (L == R) 1064d6fb72aSErik Eckstein return 0; 1074d6fb72aSErik Eckstein if (!L) 1084d6fb72aSErik Eckstein return -1; 1094d6fb72aSErik Eckstein if (!R) 1104d6fb72aSErik Eckstein return 1; 1114d6fb72aSErik Eckstein // Range metadata is a sequence of numbers. Make sure they are the same 1124d6fb72aSErik Eckstein // sequence. 1134d6fb72aSErik Eckstein // TODO: Note that as this is metadata, it is possible to drop and/or merge 1144d6fb72aSErik Eckstein // this data when considering functions to merge. Thus this comparison would 1154d6fb72aSErik Eckstein // return 0 (i.e. equivalent), but merging would become more complicated 1164d6fb72aSErik Eckstein // because the ranges would need to be unioned. It is not likely that 1174d6fb72aSErik Eckstein // functions differ ONLY in this metadata if they are actually the same 1184d6fb72aSErik Eckstein // function semantically. 1194d6fb72aSErik Eckstein if (int Res = cmpNumbers(L->getNumOperands(), R->getNumOperands())) 1204d6fb72aSErik Eckstein return Res; 1214d6fb72aSErik Eckstein for (size_t I = 0; I < L->getNumOperands(); ++I) { 1224d6fb72aSErik Eckstein ConstantInt *LLow = mdconst::extract<ConstantInt>(L->getOperand(I)); 1234d6fb72aSErik Eckstein ConstantInt *RLow = mdconst::extract<ConstantInt>(R->getOperand(I)); 1244d6fb72aSErik Eckstein if (int Res = cmpAPInts(LLow->getValue(), RLow->getValue())) 1254d6fb72aSErik Eckstein return Res; 1264d6fb72aSErik Eckstein } 1274d6fb72aSErik Eckstein return 0; 1284d6fb72aSErik Eckstein } 1294d6fb72aSErik Eckstein 1304d6fb72aSErik Eckstein int FunctionComparator::cmpOperandBundlesSchema(const Instruction *L, 1314d6fb72aSErik Eckstein const Instruction *R) const { 1324d6fb72aSErik Eckstein ImmutableCallSite LCS(L); 1334d6fb72aSErik Eckstein ImmutableCallSite RCS(R); 1344d6fb72aSErik Eckstein 1354d6fb72aSErik Eckstein assert(LCS && RCS && "Must be calls or invokes!"); 1364d6fb72aSErik Eckstein assert(LCS.isCall() == RCS.isCall() && "Can't compare otherwise!"); 1374d6fb72aSErik Eckstein 1384d6fb72aSErik Eckstein if (int Res = 1394d6fb72aSErik Eckstein cmpNumbers(LCS.getNumOperandBundles(), RCS.getNumOperandBundles())) 1404d6fb72aSErik Eckstein return Res; 1414d6fb72aSErik Eckstein 1424d6fb72aSErik Eckstein for (unsigned i = 0, e = LCS.getNumOperandBundles(); i != e; ++i) { 1434d6fb72aSErik Eckstein auto OBL = LCS.getOperandBundleAt(i); 1444d6fb72aSErik Eckstein auto OBR = RCS.getOperandBundleAt(i); 1454d6fb72aSErik Eckstein 1464d6fb72aSErik Eckstein if (int Res = OBL.getTagName().compare(OBR.getTagName())) 1474d6fb72aSErik Eckstein return Res; 1484d6fb72aSErik Eckstein 1494d6fb72aSErik Eckstein if (int Res = cmpNumbers(OBL.Inputs.size(), OBR.Inputs.size())) 1504d6fb72aSErik Eckstein return Res; 1514d6fb72aSErik Eckstein } 1524d6fb72aSErik Eckstein 1534d6fb72aSErik Eckstein return 0; 1544d6fb72aSErik Eckstein } 1554d6fb72aSErik Eckstein 1564d6fb72aSErik Eckstein /// Constants comparison: 1574d6fb72aSErik Eckstein /// 1. Check whether type of L constant could be losslessly bitcasted to R 1584d6fb72aSErik Eckstein /// type. 1594d6fb72aSErik Eckstein /// 2. Compare constant contents. 1604d6fb72aSErik Eckstein /// For more details see declaration comments. 1614d6fb72aSErik Eckstein int FunctionComparator::cmpConstants(const Constant *L, 1624d6fb72aSErik Eckstein const Constant *R) const { 1634d6fb72aSErik Eckstein 1644d6fb72aSErik Eckstein Type *TyL = L->getType(); 1654d6fb72aSErik Eckstein Type *TyR = R->getType(); 1664d6fb72aSErik Eckstein 1674d6fb72aSErik Eckstein // Check whether types are bitcastable. This part is just re-factored 1684d6fb72aSErik Eckstein // Type::canLosslesslyBitCastTo method, but instead of returning true/false, 1694d6fb72aSErik Eckstein // we also pack into result which type is "less" for us. 1704d6fb72aSErik Eckstein int TypesRes = cmpTypes(TyL, TyR); 1714d6fb72aSErik Eckstein if (TypesRes != 0) { 1724d6fb72aSErik Eckstein // Types are different, but check whether we can bitcast them. 1734d6fb72aSErik Eckstein if (!TyL->isFirstClassType()) { 1744d6fb72aSErik Eckstein if (TyR->isFirstClassType()) 1754d6fb72aSErik Eckstein return -1; 1764d6fb72aSErik Eckstein // Neither TyL nor TyR are values of first class type. Return the result 1774d6fb72aSErik Eckstein // of comparing the types 1784d6fb72aSErik Eckstein return TypesRes; 1794d6fb72aSErik Eckstein } 1804d6fb72aSErik Eckstein if (!TyR->isFirstClassType()) { 1814d6fb72aSErik Eckstein if (TyL->isFirstClassType()) 1824d6fb72aSErik Eckstein return 1; 1834d6fb72aSErik Eckstein return TypesRes; 1844d6fb72aSErik Eckstein } 1854d6fb72aSErik Eckstein 1864d6fb72aSErik Eckstein // Vector -> Vector conversions are always lossless if the two vector types 1874d6fb72aSErik Eckstein // have the same size, otherwise not. 1884d6fb72aSErik Eckstein unsigned TyLWidth = 0; 1894d6fb72aSErik Eckstein unsigned TyRWidth = 0; 1904d6fb72aSErik Eckstein 1914d6fb72aSErik Eckstein if (auto *VecTyL = dyn_cast<VectorType>(TyL)) 1924d6fb72aSErik Eckstein TyLWidth = VecTyL->getBitWidth(); 1934d6fb72aSErik Eckstein if (auto *VecTyR = dyn_cast<VectorType>(TyR)) 1944d6fb72aSErik Eckstein TyRWidth = VecTyR->getBitWidth(); 1954d6fb72aSErik Eckstein 1964d6fb72aSErik Eckstein if (TyLWidth != TyRWidth) 1974d6fb72aSErik Eckstein return cmpNumbers(TyLWidth, TyRWidth); 1984d6fb72aSErik Eckstein 1994d6fb72aSErik Eckstein // Zero bit-width means neither TyL nor TyR are vectors. 2004d6fb72aSErik Eckstein if (!TyLWidth) { 2014d6fb72aSErik Eckstein PointerType *PTyL = dyn_cast<PointerType>(TyL); 2024d6fb72aSErik Eckstein PointerType *PTyR = dyn_cast<PointerType>(TyR); 2034d6fb72aSErik Eckstein if (PTyL && PTyR) { 2044d6fb72aSErik Eckstein unsigned AddrSpaceL = PTyL->getAddressSpace(); 2054d6fb72aSErik Eckstein unsigned AddrSpaceR = PTyR->getAddressSpace(); 2064d6fb72aSErik Eckstein if (int Res = cmpNumbers(AddrSpaceL, AddrSpaceR)) 2074d6fb72aSErik Eckstein return Res; 2084d6fb72aSErik Eckstein } 2094d6fb72aSErik Eckstein if (PTyL) 2104d6fb72aSErik Eckstein return 1; 2114d6fb72aSErik Eckstein if (PTyR) 2124d6fb72aSErik Eckstein return -1; 2134d6fb72aSErik Eckstein 2144d6fb72aSErik Eckstein // TyL and TyR aren't vectors, nor pointers. We don't know how to 2154d6fb72aSErik Eckstein // bitcast them. 2164d6fb72aSErik Eckstein return TypesRes; 2174d6fb72aSErik Eckstein } 2184d6fb72aSErik Eckstein } 2194d6fb72aSErik Eckstein 2204d6fb72aSErik Eckstein // OK, types are bitcastable, now check constant contents. 2214d6fb72aSErik Eckstein 2224d6fb72aSErik Eckstein if (L->isNullValue() && R->isNullValue()) 2234d6fb72aSErik Eckstein return TypesRes; 2244d6fb72aSErik Eckstein if (L->isNullValue() && !R->isNullValue()) 2254d6fb72aSErik Eckstein return 1; 2264d6fb72aSErik Eckstein if (!L->isNullValue() && R->isNullValue()) 2274d6fb72aSErik Eckstein return -1; 2284d6fb72aSErik Eckstein 2294d6fb72aSErik Eckstein auto GlobalValueL = const_cast<GlobalValue*>(dyn_cast<GlobalValue>(L)); 2304d6fb72aSErik Eckstein auto GlobalValueR = const_cast<GlobalValue*>(dyn_cast<GlobalValue>(R)); 2314d6fb72aSErik Eckstein if (GlobalValueL && GlobalValueR) { 2324d6fb72aSErik Eckstein return cmpGlobalValues(GlobalValueL, GlobalValueR); 2334d6fb72aSErik Eckstein } 2344d6fb72aSErik Eckstein 2354d6fb72aSErik Eckstein if (int Res = cmpNumbers(L->getValueID(), R->getValueID())) 2364d6fb72aSErik Eckstein return Res; 2374d6fb72aSErik Eckstein 2384d6fb72aSErik Eckstein if (const auto *SeqL = dyn_cast<ConstantDataSequential>(L)) { 2394d6fb72aSErik Eckstein const auto *SeqR = cast<ConstantDataSequential>(R); 2404d6fb72aSErik Eckstein // This handles ConstantDataArray and ConstantDataVector. Note that we 2414d6fb72aSErik Eckstein // compare the two raw data arrays, which might differ depending on the host 2424d6fb72aSErik Eckstein // endianness. This isn't a problem though, because the endiness of a module 2434d6fb72aSErik Eckstein // will affect the order of the constants, but this order is the same 2444d6fb72aSErik Eckstein // for a given input module and host platform. 2454d6fb72aSErik Eckstein return cmpMem(SeqL->getRawDataValues(), SeqR->getRawDataValues()); 2464d6fb72aSErik Eckstein } 2474d6fb72aSErik Eckstein 2484d6fb72aSErik Eckstein switch (L->getValueID()) { 2494d6fb72aSErik Eckstein case Value::UndefValueVal: 2504d6fb72aSErik Eckstein case Value::ConstantTokenNoneVal: 2514d6fb72aSErik Eckstein return TypesRes; 2524d6fb72aSErik Eckstein case Value::ConstantIntVal: { 2534d6fb72aSErik Eckstein const APInt &LInt = cast<ConstantInt>(L)->getValue(); 2544d6fb72aSErik Eckstein const APInt &RInt = cast<ConstantInt>(R)->getValue(); 2554d6fb72aSErik Eckstein return cmpAPInts(LInt, RInt); 2564d6fb72aSErik Eckstein } 2574d6fb72aSErik Eckstein case Value::ConstantFPVal: { 2584d6fb72aSErik Eckstein const APFloat &LAPF = cast<ConstantFP>(L)->getValueAPF(); 2594d6fb72aSErik Eckstein const APFloat &RAPF = cast<ConstantFP>(R)->getValueAPF(); 2604d6fb72aSErik Eckstein return cmpAPFloats(LAPF, RAPF); 2614d6fb72aSErik Eckstein } 2624d6fb72aSErik Eckstein case Value::ConstantArrayVal: { 2634d6fb72aSErik Eckstein const ConstantArray *LA = cast<ConstantArray>(L); 2644d6fb72aSErik Eckstein const ConstantArray *RA = cast<ConstantArray>(R); 2654d6fb72aSErik Eckstein uint64_t NumElementsL = cast<ArrayType>(TyL)->getNumElements(); 2664d6fb72aSErik Eckstein uint64_t NumElementsR = cast<ArrayType>(TyR)->getNumElements(); 2674d6fb72aSErik Eckstein if (int Res = cmpNumbers(NumElementsL, NumElementsR)) 2684d6fb72aSErik Eckstein return Res; 2694d6fb72aSErik Eckstein for (uint64_t i = 0; i < NumElementsL; ++i) { 2704d6fb72aSErik Eckstein if (int Res = cmpConstants(cast<Constant>(LA->getOperand(i)), 2714d6fb72aSErik Eckstein cast<Constant>(RA->getOperand(i)))) 2724d6fb72aSErik Eckstein return Res; 2734d6fb72aSErik Eckstein } 2744d6fb72aSErik Eckstein return 0; 2754d6fb72aSErik Eckstein } 2764d6fb72aSErik Eckstein case Value::ConstantStructVal: { 2774d6fb72aSErik Eckstein const ConstantStruct *LS = cast<ConstantStruct>(L); 2784d6fb72aSErik Eckstein const ConstantStruct *RS = cast<ConstantStruct>(R); 2794d6fb72aSErik Eckstein unsigned NumElementsL = cast<StructType>(TyL)->getNumElements(); 2804d6fb72aSErik Eckstein unsigned NumElementsR = cast<StructType>(TyR)->getNumElements(); 2814d6fb72aSErik Eckstein if (int Res = cmpNumbers(NumElementsL, NumElementsR)) 2824d6fb72aSErik Eckstein return Res; 2834d6fb72aSErik Eckstein for (unsigned i = 0; i != NumElementsL; ++i) { 2844d6fb72aSErik Eckstein if (int Res = cmpConstants(cast<Constant>(LS->getOperand(i)), 2854d6fb72aSErik Eckstein cast<Constant>(RS->getOperand(i)))) 2864d6fb72aSErik Eckstein return Res; 2874d6fb72aSErik Eckstein } 2884d6fb72aSErik Eckstein return 0; 2894d6fb72aSErik Eckstein } 2904d6fb72aSErik Eckstein case Value::ConstantVectorVal: { 2914d6fb72aSErik Eckstein const ConstantVector *LV = cast<ConstantVector>(L); 2924d6fb72aSErik Eckstein const ConstantVector *RV = cast<ConstantVector>(R); 2934d6fb72aSErik Eckstein unsigned NumElementsL = cast<VectorType>(TyL)->getNumElements(); 2944d6fb72aSErik Eckstein unsigned NumElementsR = cast<VectorType>(TyR)->getNumElements(); 2954d6fb72aSErik Eckstein if (int Res = cmpNumbers(NumElementsL, NumElementsR)) 2964d6fb72aSErik Eckstein return Res; 2974d6fb72aSErik Eckstein for (uint64_t i = 0; i < NumElementsL; ++i) { 2984d6fb72aSErik Eckstein if (int Res = cmpConstants(cast<Constant>(LV->getOperand(i)), 2994d6fb72aSErik Eckstein cast<Constant>(RV->getOperand(i)))) 3004d6fb72aSErik Eckstein return Res; 3014d6fb72aSErik Eckstein } 3024d6fb72aSErik Eckstein return 0; 3034d6fb72aSErik Eckstein } 3044d6fb72aSErik Eckstein case Value::ConstantExprVal: { 3054d6fb72aSErik Eckstein const ConstantExpr *LE = cast<ConstantExpr>(L); 3064d6fb72aSErik Eckstein const ConstantExpr *RE = cast<ConstantExpr>(R); 3074d6fb72aSErik Eckstein unsigned NumOperandsL = LE->getNumOperands(); 3084d6fb72aSErik Eckstein unsigned NumOperandsR = RE->getNumOperands(); 3094d6fb72aSErik Eckstein if (int Res = cmpNumbers(NumOperandsL, NumOperandsR)) 3104d6fb72aSErik Eckstein return Res; 3114d6fb72aSErik Eckstein for (unsigned i = 0; i < NumOperandsL; ++i) { 3124d6fb72aSErik Eckstein if (int Res = cmpConstants(cast<Constant>(LE->getOperand(i)), 3134d6fb72aSErik Eckstein cast<Constant>(RE->getOperand(i)))) 3144d6fb72aSErik Eckstein return Res; 3154d6fb72aSErik Eckstein } 3164d6fb72aSErik Eckstein return 0; 3174d6fb72aSErik Eckstein } 3184d6fb72aSErik Eckstein case Value::BlockAddressVal: { 3194d6fb72aSErik Eckstein const BlockAddress *LBA = cast<BlockAddress>(L); 3204d6fb72aSErik Eckstein const BlockAddress *RBA = cast<BlockAddress>(R); 3214d6fb72aSErik Eckstein if (int Res = cmpValues(LBA->getFunction(), RBA->getFunction())) 3224d6fb72aSErik Eckstein return Res; 3234d6fb72aSErik Eckstein if (LBA->getFunction() == RBA->getFunction()) { 3244d6fb72aSErik Eckstein // They are BBs in the same function. Order by which comes first in the 3254d6fb72aSErik Eckstein // BB order of the function. This order is deterministic. 3264d6fb72aSErik Eckstein Function* F = LBA->getFunction(); 3274d6fb72aSErik Eckstein BasicBlock *LBB = LBA->getBasicBlock(); 3284d6fb72aSErik Eckstein BasicBlock *RBB = RBA->getBasicBlock(); 3294d6fb72aSErik Eckstein if (LBB == RBB) 3304d6fb72aSErik Eckstein return 0; 3314d6fb72aSErik Eckstein for(BasicBlock &BB : F->getBasicBlockList()) { 3324d6fb72aSErik Eckstein if (&BB == LBB) { 3334d6fb72aSErik Eckstein assert(&BB != RBB); 3344d6fb72aSErik Eckstein return -1; 3354d6fb72aSErik Eckstein } 3364d6fb72aSErik Eckstein if (&BB == RBB) 3374d6fb72aSErik Eckstein return 1; 3384d6fb72aSErik Eckstein } 3394d6fb72aSErik Eckstein llvm_unreachable("Basic Block Address does not point to a basic block in " 3404d6fb72aSErik Eckstein "its function."); 3414d6fb72aSErik Eckstein return -1; 3424d6fb72aSErik Eckstein } else { 3434d6fb72aSErik Eckstein // cmpValues said the functions are the same. So because they aren't 3444d6fb72aSErik Eckstein // literally the same pointer, they must respectively be the left and 3454d6fb72aSErik Eckstein // right functions. 3464d6fb72aSErik Eckstein assert(LBA->getFunction() == FnL && RBA->getFunction() == FnR); 3474d6fb72aSErik Eckstein // cmpValues will tell us if these are equivalent BasicBlocks, in the 3484d6fb72aSErik Eckstein // context of their respective functions. 3494d6fb72aSErik Eckstein return cmpValues(LBA->getBasicBlock(), RBA->getBasicBlock()); 3504d6fb72aSErik Eckstein } 3514d6fb72aSErik Eckstein } 3524d6fb72aSErik Eckstein default: // Unknown constant, abort. 3534d6fb72aSErik Eckstein DEBUG(dbgs() << "Looking at valueID " << L->getValueID() << "\n"); 3544d6fb72aSErik Eckstein llvm_unreachable("Constant ValueID not recognized."); 3554d6fb72aSErik Eckstein return -1; 3564d6fb72aSErik Eckstein } 3574d6fb72aSErik Eckstein } 3584d6fb72aSErik Eckstein 3594d6fb72aSErik Eckstein int FunctionComparator::cmpGlobalValues(GlobalValue *L, GlobalValue *R) const { 360c1d52e5cSErik Eckstein uint64_t LNumber = GlobalNumbers->getNumber(L); 361c1d52e5cSErik Eckstein uint64_t RNumber = GlobalNumbers->getNumber(R); 362c1d52e5cSErik Eckstein return cmpNumbers(LNumber, RNumber); 3634d6fb72aSErik Eckstein } 3644d6fb72aSErik Eckstein 3654d6fb72aSErik Eckstein /// cmpType - compares two types, 3664d6fb72aSErik Eckstein /// defines total ordering among the types set. 3674d6fb72aSErik Eckstein /// See method declaration comments for more details. 3684d6fb72aSErik Eckstein int FunctionComparator::cmpTypes(Type *TyL, Type *TyR) const { 3694d6fb72aSErik Eckstein PointerType *PTyL = dyn_cast<PointerType>(TyL); 3704d6fb72aSErik Eckstein PointerType *PTyR = dyn_cast<PointerType>(TyR); 3714d6fb72aSErik Eckstein 3724d6fb72aSErik Eckstein const DataLayout &DL = FnL->getParent()->getDataLayout(); 3734d6fb72aSErik Eckstein if (PTyL && PTyL->getAddressSpace() == 0) 3744d6fb72aSErik Eckstein TyL = DL.getIntPtrType(TyL); 3754d6fb72aSErik Eckstein if (PTyR && PTyR->getAddressSpace() == 0) 3764d6fb72aSErik Eckstein TyR = DL.getIntPtrType(TyR); 3774d6fb72aSErik Eckstein 3784d6fb72aSErik Eckstein if (TyL == TyR) 3794d6fb72aSErik Eckstein return 0; 3804d6fb72aSErik Eckstein 3814d6fb72aSErik Eckstein if (int Res = cmpNumbers(TyL->getTypeID(), TyR->getTypeID())) 3824d6fb72aSErik Eckstein return Res; 3834d6fb72aSErik Eckstein 3844d6fb72aSErik Eckstein switch (TyL->getTypeID()) { 3854d6fb72aSErik Eckstein default: 3864d6fb72aSErik Eckstein llvm_unreachable("Unknown type!"); 3874d6fb72aSErik Eckstein // Fall through in Release mode. 3884d6fb72aSErik Eckstein LLVM_FALLTHROUGH; 3894d6fb72aSErik Eckstein case Type::IntegerTyID: 3904d6fb72aSErik Eckstein return cmpNumbers(cast<IntegerType>(TyL)->getBitWidth(), 3914d6fb72aSErik Eckstein cast<IntegerType>(TyR)->getBitWidth()); 3924d6fb72aSErik Eckstein // TyL == TyR would have returned true earlier, because types are uniqued. 3934d6fb72aSErik Eckstein case Type::VoidTyID: 3944d6fb72aSErik Eckstein case Type::FloatTyID: 3954d6fb72aSErik Eckstein case Type::DoubleTyID: 3964d6fb72aSErik Eckstein case Type::X86_FP80TyID: 3974d6fb72aSErik Eckstein case Type::FP128TyID: 3984d6fb72aSErik Eckstein case Type::PPC_FP128TyID: 3994d6fb72aSErik Eckstein case Type::LabelTyID: 4004d6fb72aSErik Eckstein case Type::MetadataTyID: 4014d6fb72aSErik Eckstein case Type::TokenTyID: 4024d6fb72aSErik Eckstein return 0; 4034d6fb72aSErik Eckstein 4044d6fb72aSErik Eckstein case Type::PointerTyID: { 4054d6fb72aSErik Eckstein assert(PTyL && PTyR && "Both types must be pointers here."); 4064d6fb72aSErik Eckstein return cmpNumbers(PTyL->getAddressSpace(), PTyR->getAddressSpace()); 4074d6fb72aSErik Eckstein } 4084d6fb72aSErik Eckstein 4094d6fb72aSErik Eckstein case Type::StructTyID: { 4104d6fb72aSErik Eckstein StructType *STyL = cast<StructType>(TyL); 4114d6fb72aSErik Eckstein StructType *STyR = cast<StructType>(TyR); 4124d6fb72aSErik Eckstein if (STyL->getNumElements() != STyR->getNumElements()) 4134d6fb72aSErik Eckstein return cmpNumbers(STyL->getNumElements(), STyR->getNumElements()); 4144d6fb72aSErik Eckstein 4154d6fb72aSErik Eckstein if (STyL->isPacked() != STyR->isPacked()) 4164d6fb72aSErik Eckstein return cmpNumbers(STyL->isPacked(), STyR->isPacked()); 4174d6fb72aSErik Eckstein 4184d6fb72aSErik Eckstein for (unsigned i = 0, e = STyL->getNumElements(); i != e; ++i) { 4194d6fb72aSErik Eckstein if (int Res = cmpTypes(STyL->getElementType(i), STyR->getElementType(i))) 4204d6fb72aSErik Eckstein return Res; 4214d6fb72aSErik Eckstein } 4224d6fb72aSErik Eckstein return 0; 4234d6fb72aSErik Eckstein } 4244d6fb72aSErik Eckstein 4254d6fb72aSErik Eckstein case Type::FunctionTyID: { 4264d6fb72aSErik Eckstein FunctionType *FTyL = cast<FunctionType>(TyL); 4274d6fb72aSErik Eckstein FunctionType *FTyR = cast<FunctionType>(TyR); 4284d6fb72aSErik Eckstein if (FTyL->getNumParams() != FTyR->getNumParams()) 4294d6fb72aSErik Eckstein return cmpNumbers(FTyL->getNumParams(), FTyR->getNumParams()); 4304d6fb72aSErik Eckstein 4314d6fb72aSErik Eckstein if (FTyL->isVarArg() != FTyR->isVarArg()) 4324d6fb72aSErik Eckstein return cmpNumbers(FTyL->isVarArg(), FTyR->isVarArg()); 4334d6fb72aSErik Eckstein 4344d6fb72aSErik Eckstein if (int Res = cmpTypes(FTyL->getReturnType(), FTyR->getReturnType())) 4354d6fb72aSErik Eckstein return Res; 4364d6fb72aSErik Eckstein 4374d6fb72aSErik Eckstein for (unsigned i = 0, e = FTyL->getNumParams(); i != e; ++i) { 4384d6fb72aSErik Eckstein if (int Res = cmpTypes(FTyL->getParamType(i), FTyR->getParamType(i))) 4394d6fb72aSErik Eckstein return Res; 4404d6fb72aSErik Eckstein } 4414d6fb72aSErik Eckstein return 0; 4424d6fb72aSErik Eckstein } 4434d6fb72aSErik Eckstein 444bc070524SPeter Collingbourne case Type::ArrayTyID: 445bc070524SPeter Collingbourne case Type::VectorTyID: { 446bc070524SPeter Collingbourne auto *STyL = cast<SequentialType>(TyL); 447bc070524SPeter Collingbourne auto *STyR = cast<SequentialType>(TyR); 448bc070524SPeter Collingbourne if (STyL->getNumElements() != STyR->getNumElements()) 449bc070524SPeter Collingbourne return cmpNumbers(STyL->getNumElements(), STyR->getNumElements()); 450bc070524SPeter Collingbourne return cmpTypes(STyL->getElementType(), STyR->getElementType()); 4514d6fb72aSErik Eckstein } 4524d6fb72aSErik Eckstein } 4534d6fb72aSErik Eckstein } 4544d6fb72aSErik Eckstein 4554d6fb72aSErik Eckstein // Determine whether the two operations are the same except that pointer-to-A 4564d6fb72aSErik Eckstein // and pointer-to-B are equivalent. This should be kept in sync with 4574d6fb72aSErik Eckstein // Instruction::isSameOperationAs. 4584d6fb72aSErik Eckstein // Read method declaration comments for more details. 4594d6fb72aSErik Eckstein int FunctionComparator::cmpOperations(const Instruction *L, 4604d6fb72aSErik Eckstein const Instruction *R, 4614d6fb72aSErik Eckstein bool &needToCmpOperands) const { 4624d6fb72aSErik Eckstein needToCmpOperands = true; 4634d6fb72aSErik Eckstein if (int Res = cmpValues(L, R)) 4644d6fb72aSErik Eckstein return Res; 4654d6fb72aSErik Eckstein 4664d6fb72aSErik Eckstein // Differences from Instruction::isSameOperationAs: 4674d6fb72aSErik Eckstein // * replace type comparison with calls to cmpTypes. 4684d6fb72aSErik Eckstein // * we test for I->getRawSubclassOptionalData (nuw/nsw/tail) at the top. 4694d6fb72aSErik Eckstein // * because of the above, we don't test for the tail bit on calls later on. 4704d6fb72aSErik Eckstein if (int Res = cmpNumbers(L->getOpcode(), R->getOpcode())) 4714d6fb72aSErik Eckstein return Res; 4724d6fb72aSErik Eckstein 4734d6fb72aSErik Eckstein if (const GetElementPtrInst *GEPL = dyn_cast<GetElementPtrInst>(L)) { 4744d6fb72aSErik Eckstein needToCmpOperands = false; 4754d6fb72aSErik Eckstein const GetElementPtrInst *GEPR = cast<GetElementPtrInst>(R); 4764d6fb72aSErik Eckstein if (int Res = 4774d6fb72aSErik Eckstein cmpValues(GEPL->getPointerOperand(), GEPR->getPointerOperand())) 4784d6fb72aSErik Eckstein return Res; 4794d6fb72aSErik Eckstein return cmpGEPs(GEPL, GEPR); 4804d6fb72aSErik Eckstein } 4814d6fb72aSErik Eckstein 4824d6fb72aSErik Eckstein if (int Res = cmpNumbers(L->getNumOperands(), R->getNumOperands())) 4834d6fb72aSErik Eckstein return Res; 4844d6fb72aSErik Eckstein 4854d6fb72aSErik Eckstein if (int Res = cmpTypes(L->getType(), R->getType())) 4864d6fb72aSErik Eckstein return Res; 4874d6fb72aSErik Eckstein 4884d6fb72aSErik Eckstein if (int Res = cmpNumbers(L->getRawSubclassOptionalData(), 4894d6fb72aSErik Eckstein R->getRawSubclassOptionalData())) 4904d6fb72aSErik Eckstein return Res; 4914d6fb72aSErik Eckstein 4924d6fb72aSErik Eckstein // We have two instructions of identical opcode and #operands. Check to see 4934d6fb72aSErik Eckstein // if all operands are the same type 4944d6fb72aSErik Eckstein for (unsigned i = 0, e = L->getNumOperands(); i != e; ++i) { 4954d6fb72aSErik Eckstein if (int Res = 4964d6fb72aSErik Eckstein cmpTypes(L->getOperand(i)->getType(), R->getOperand(i)->getType())) 4974d6fb72aSErik Eckstein return Res; 4984d6fb72aSErik Eckstein } 4994d6fb72aSErik Eckstein 5004d6fb72aSErik Eckstein // Check special state that is a part of some instructions. 5014d6fb72aSErik Eckstein if (const AllocaInst *AI = dyn_cast<AllocaInst>(L)) { 5024d6fb72aSErik Eckstein if (int Res = cmpTypes(AI->getAllocatedType(), 5034d6fb72aSErik Eckstein cast<AllocaInst>(R)->getAllocatedType())) 5044d6fb72aSErik Eckstein return Res; 5054d6fb72aSErik Eckstein return cmpNumbers(AI->getAlignment(), cast<AllocaInst>(R)->getAlignment()); 5064d6fb72aSErik Eckstein } 5074d6fb72aSErik Eckstein if (const LoadInst *LI = dyn_cast<LoadInst>(L)) { 5084d6fb72aSErik Eckstein if (int Res = cmpNumbers(LI->isVolatile(), cast<LoadInst>(R)->isVolatile())) 5094d6fb72aSErik Eckstein return Res; 5104d6fb72aSErik Eckstein if (int Res = 5114d6fb72aSErik Eckstein cmpNumbers(LI->getAlignment(), cast<LoadInst>(R)->getAlignment())) 5124d6fb72aSErik Eckstein return Res; 5134d6fb72aSErik Eckstein if (int Res = 5144d6fb72aSErik Eckstein cmpOrderings(LI->getOrdering(), cast<LoadInst>(R)->getOrdering())) 5154d6fb72aSErik Eckstein return Res; 516*bb80d3e1SKonstantin Zhuravlyov if (int Res = cmpNumbers(LI->getSyncScopeID(), 517*bb80d3e1SKonstantin Zhuravlyov cast<LoadInst>(R)->getSyncScopeID())) 5184d6fb72aSErik Eckstein return Res; 5194d6fb72aSErik Eckstein return cmpRangeMetadata(LI->getMetadata(LLVMContext::MD_range), 5204d6fb72aSErik Eckstein cast<LoadInst>(R)->getMetadata(LLVMContext::MD_range)); 5214d6fb72aSErik Eckstein } 5224d6fb72aSErik Eckstein if (const StoreInst *SI = dyn_cast<StoreInst>(L)) { 5234d6fb72aSErik Eckstein if (int Res = 5244d6fb72aSErik Eckstein cmpNumbers(SI->isVolatile(), cast<StoreInst>(R)->isVolatile())) 5254d6fb72aSErik Eckstein return Res; 5264d6fb72aSErik Eckstein if (int Res = 5274d6fb72aSErik Eckstein cmpNumbers(SI->getAlignment(), cast<StoreInst>(R)->getAlignment())) 5284d6fb72aSErik Eckstein return Res; 5294d6fb72aSErik Eckstein if (int Res = 5304d6fb72aSErik Eckstein cmpOrderings(SI->getOrdering(), cast<StoreInst>(R)->getOrdering())) 5314d6fb72aSErik Eckstein return Res; 532*bb80d3e1SKonstantin Zhuravlyov return cmpNumbers(SI->getSyncScopeID(), 533*bb80d3e1SKonstantin Zhuravlyov cast<StoreInst>(R)->getSyncScopeID()); 5344d6fb72aSErik Eckstein } 5354d6fb72aSErik Eckstein if (const CmpInst *CI = dyn_cast<CmpInst>(L)) 5364d6fb72aSErik Eckstein return cmpNumbers(CI->getPredicate(), cast<CmpInst>(R)->getPredicate()); 5374d6fb72aSErik Eckstein if (const CallInst *CI = dyn_cast<CallInst>(L)) { 5384d6fb72aSErik Eckstein if (int Res = cmpNumbers(CI->getCallingConv(), 5394d6fb72aSErik Eckstein cast<CallInst>(R)->getCallingConv())) 5404d6fb72aSErik Eckstein return Res; 5414d6fb72aSErik Eckstein if (int Res = 5424d6fb72aSErik Eckstein cmpAttrs(CI->getAttributes(), cast<CallInst>(R)->getAttributes())) 5434d6fb72aSErik Eckstein return Res; 5444d6fb72aSErik Eckstein if (int Res = cmpOperandBundlesSchema(CI, R)) 5454d6fb72aSErik Eckstein return Res; 5464d6fb72aSErik Eckstein return cmpRangeMetadata( 5474d6fb72aSErik Eckstein CI->getMetadata(LLVMContext::MD_range), 5484d6fb72aSErik Eckstein cast<CallInst>(R)->getMetadata(LLVMContext::MD_range)); 5494d6fb72aSErik Eckstein } 5504d6fb72aSErik Eckstein if (const InvokeInst *II = dyn_cast<InvokeInst>(L)) { 5514d6fb72aSErik Eckstein if (int Res = cmpNumbers(II->getCallingConv(), 5524d6fb72aSErik Eckstein cast<InvokeInst>(R)->getCallingConv())) 5534d6fb72aSErik Eckstein return Res; 5544d6fb72aSErik Eckstein if (int Res = 5554d6fb72aSErik Eckstein cmpAttrs(II->getAttributes(), cast<InvokeInst>(R)->getAttributes())) 5564d6fb72aSErik Eckstein return Res; 5574d6fb72aSErik Eckstein if (int Res = cmpOperandBundlesSchema(II, R)) 5584d6fb72aSErik Eckstein return Res; 5594d6fb72aSErik Eckstein return cmpRangeMetadata( 5604d6fb72aSErik Eckstein II->getMetadata(LLVMContext::MD_range), 5614d6fb72aSErik Eckstein cast<InvokeInst>(R)->getMetadata(LLVMContext::MD_range)); 5624d6fb72aSErik Eckstein } 5634d6fb72aSErik Eckstein if (const InsertValueInst *IVI = dyn_cast<InsertValueInst>(L)) { 5644d6fb72aSErik Eckstein ArrayRef<unsigned> LIndices = IVI->getIndices(); 5654d6fb72aSErik Eckstein ArrayRef<unsigned> RIndices = cast<InsertValueInst>(R)->getIndices(); 5664d6fb72aSErik Eckstein if (int Res = cmpNumbers(LIndices.size(), RIndices.size())) 5674d6fb72aSErik Eckstein return Res; 5684d6fb72aSErik Eckstein for (size_t i = 0, e = LIndices.size(); i != e; ++i) { 5694d6fb72aSErik Eckstein if (int Res = cmpNumbers(LIndices[i], RIndices[i])) 5704d6fb72aSErik Eckstein return Res; 5714d6fb72aSErik Eckstein } 5724d6fb72aSErik Eckstein return 0; 5734d6fb72aSErik Eckstein } 5744d6fb72aSErik Eckstein if (const ExtractValueInst *EVI = dyn_cast<ExtractValueInst>(L)) { 5754d6fb72aSErik Eckstein ArrayRef<unsigned> LIndices = EVI->getIndices(); 5764d6fb72aSErik Eckstein ArrayRef<unsigned> RIndices = cast<ExtractValueInst>(R)->getIndices(); 5774d6fb72aSErik Eckstein if (int Res = cmpNumbers(LIndices.size(), RIndices.size())) 5784d6fb72aSErik Eckstein return Res; 5794d6fb72aSErik Eckstein for (size_t i = 0, e = LIndices.size(); i != e; ++i) { 5804d6fb72aSErik Eckstein if (int Res = cmpNumbers(LIndices[i], RIndices[i])) 5814d6fb72aSErik Eckstein return Res; 5824d6fb72aSErik Eckstein } 5834d6fb72aSErik Eckstein } 5844d6fb72aSErik Eckstein if (const FenceInst *FI = dyn_cast<FenceInst>(L)) { 5854d6fb72aSErik Eckstein if (int Res = 5864d6fb72aSErik Eckstein cmpOrderings(FI->getOrdering(), cast<FenceInst>(R)->getOrdering())) 5874d6fb72aSErik Eckstein return Res; 588*bb80d3e1SKonstantin Zhuravlyov return cmpNumbers(FI->getSyncScopeID(), 589*bb80d3e1SKonstantin Zhuravlyov cast<FenceInst>(R)->getSyncScopeID()); 5904d6fb72aSErik Eckstein } 5914d6fb72aSErik Eckstein if (const AtomicCmpXchgInst *CXI = dyn_cast<AtomicCmpXchgInst>(L)) { 5924d6fb72aSErik Eckstein if (int Res = cmpNumbers(CXI->isVolatile(), 5934d6fb72aSErik Eckstein cast<AtomicCmpXchgInst>(R)->isVolatile())) 5944d6fb72aSErik Eckstein return Res; 5954d6fb72aSErik Eckstein if (int Res = cmpNumbers(CXI->isWeak(), 5964d6fb72aSErik Eckstein cast<AtomicCmpXchgInst>(R)->isWeak())) 5974d6fb72aSErik Eckstein return Res; 5984d6fb72aSErik Eckstein if (int Res = 5994d6fb72aSErik Eckstein cmpOrderings(CXI->getSuccessOrdering(), 6004d6fb72aSErik Eckstein cast<AtomicCmpXchgInst>(R)->getSuccessOrdering())) 6014d6fb72aSErik Eckstein return Res; 6024d6fb72aSErik Eckstein if (int Res = 6034d6fb72aSErik Eckstein cmpOrderings(CXI->getFailureOrdering(), 6044d6fb72aSErik Eckstein cast<AtomicCmpXchgInst>(R)->getFailureOrdering())) 6054d6fb72aSErik Eckstein return Res; 606*bb80d3e1SKonstantin Zhuravlyov return cmpNumbers(CXI->getSyncScopeID(), 607*bb80d3e1SKonstantin Zhuravlyov cast<AtomicCmpXchgInst>(R)->getSyncScopeID()); 6084d6fb72aSErik Eckstein } 6094d6fb72aSErik Eckstein if (const AtomicRMWInst *RMWI = dyn_cast<AtomicRMWInst>(L)) { 6104d6fb72aSErik Eckstein if (int Res = cmpNumbers(RMWI->getOperation(), 6114d6fb72aSErik Eckstein cast<AtomicRMWInst>(R)->getOperation())) 6124d6fb72aSErik Eckstein return Res; 6134d6fb72aSErik Eckstein if (int Res = cmpNumbers(RMWI->isVolatile(), 6144d6fb72aSErik Eckstein cast<AtomicRMWInst>(R)->isVolatile())) 6154d6fb72aSErik Eckstein return Res; 6164d6fb72aSErik Eckstein if (int Res = cmpOrderings(RMWI->getOrdering(), 6174d6fb72aSErik Eckstein cast<AtomicRMWInst>(R)->getOrdering())) 6184d6fb72aSErik Eckstein return Res; 619*bb80d3e1SKonstantin Zhuravlyov return cmpNumbers(RMWI->getSyncScopeID(), 620*bb80d3e1SKonstantin Zhuravlyov cast<AtomicRMWInst>(R)->getSyncScopeID()); 6214d6fb72aSErik Eckstein } 6224d6fb72aSErik Eckstein if (const PHINode *PNL = dyn_cast<PHINode>(L)) { 6234d6fb72aSErik Eckstein const PHINode *PNR = cast<PHINode>(R); 6244d6fb72aSErik Eckstein // Ensure that in addition to the incoming values being identical 6254d6fb72aSErik Eckstein // (checked by the caller of this function), the incoming blocks 6264d6fb72aSErik Eckstein // are also identical. 6274d6fb72aSErik Eckstein for (unsigned i = 0, e = PNL->getNumIncomingValues(); i != e; ++i) { 6284d6fb72aSErik Eckstein if (int Res = 6294d6fb72aSErik Eckstein cmpValues(PNL->getIncomingBlock(i), PNR->getIncomingBlock(i))) 6304d6fb72aSErik Eckstein return Res; 6314d6fb72aSErik Eckstein } 6324d6fb72aSErik Eckstein } 6334d6fb72aSErik Eckstein return 0; 6344d6fb72aSErik Eckstein } 6354d6fb72aSErik Eckstein 6364d6fb72aSErik Eckstein // Determine whether two GEP operations perform the same underlying arithmetic. 6374d6fb72aSErik Eckstein // Read method declaration comments for more details. 6384d6fb72aSErik Eckstein int FunctionComparator::cmpGEPs(const GEPOperator *GEPL, 6394d6fb72aSErik Eckstein const GEPOperator *GEPR) const { 6404d6fb72aSErik Eckstein 6414d6fb72aSErik Eckstein unsigned int ASL = GEPL->getPointerAddressSpace(); 6424d6fb72aSErik Eckstein unsigned int ASR = GEPR->getPointerAddressSpace(); 6434d6fb72aSErik Eckstein 6444d6fb72aSErik Eckstein if (int Res = cmpNumbers(ASL, ASR)) 6454d6fb72aSErik Eckstein return Res; 6464d6fb72aSErik Eckstein 6474d6fb72aSErik Eckstein // When we have target data, we can reduce the GEP down to the value in bytes 6484d6fb72aSErik Eckstein // added to the address. 6494d6fb72aSErik Eckstein const DataLayout &DL = FnL->getParent()->getDataLayout(); 6504d6fb72aSErik Eckstein unsigned BitWidth = DL.getPointerSizeInBits(ASL); 6514d6fb72aSErik Eckstein APInt OffsetL(BitWidth, 0), OffsetR(BitWidth, 0); 6524d6fb72aSErik Eckstein if (GEPL->accumulateConstantOffset(DL, OffsetL) && 6534d6fb72aSErik Eckstein GEPR->accumulateConstantOffset(DL, OffsetR)) 6544d6fb72aSErik Eckstein return cmpAPInts(OffsetL, OffsetR); 6554d6fb72aSErik Eckstein if (int Res = cmpTypes(GEPL->getSourceElementType(), 6564d6fb72aSErik Eckstein GEPR->getSourceElementType())) 6574d6fb72aSErik Eckstein return Res; 6584d6fb72aSErik Eckstein 6594d6fb72aSErik Eckstein if (int Res = cmpNumbers(GEPL->getNumOperands(), GEPR->getNumOperands())) 6604d6fb72aSErik Eckstein return Res; 6614d6fb72aSErik Eckstein 6624d6fb72aSErik Eckstein for (unsigned i = 0, e = GEPL->getNumOperands(); i != e; ++i) { 6634d6fb72aSErik Eckstein if (int Res = cmpValues(GEPL->getOperand(i), GEPR->getOperand(i))) 6644d6fb72aSErik Eckstein return Res; 6654d6fb72aSErik Eckstein } 6664d6fb72aSErik Eckstein 6674d6fb72aSErik Eckstein return 0; 6684d6fb72aSErik Eckstein } 6694d6fb72aSErik Eckstein 6704d6fb72aSErik Eckstein int FunctionComparator::cmpInlineAsm(const InlineAsm *L, 6714d6fb72aSErik Eckstein const InlineAsm *R) const { 6724d6fb72aSErik Eckstein // InlineAsm's are uniqued. If they are the same pointer, obviously they are 6734d6fb72aSErik Eckstein // the same, otherwise compare the fields. 6744d6fb72aSErik Eckstein if (L == R) 6754d6fb72aSErik Eckstein return 0; 6764d6fb72aSErik Eckstein if (int Res = cmpTypes(L->getFunctionType(), R->getFunctionType())) 6774d6fb72aSErik Eckstein return Res; 6784d6fb72aSErik Eckstein if (int Res = cmpMem(L->getAsmString(), R->getAsmString())) 6794d6fb72aSErik Eckstein return Res; 6804d6fb72aSErik Eckstein if (int Res = cmpMem(L->getConstraintString(), R->getConstraintString())) 6814d6fb72aSErik Eckstein return Res; 6824d6fb72aSErik Eckstein if (int Res = cmpNumbers(L->hasSideEffects(), R->hasSideEffects())) 6834d6fb72aSErik Eckstein return Res; 6844d6fb72aSErik Eckstein if (int Res = cmpNumbers(L->isAlignStack(), R->isAlignStack())) 6854d6fb72aSErik Eckstein return Res; 6864d6fb72aSErik Eckstein if (int Res = cmpNumbers(L->getDialect(), R->getDialect())) 6874d6fb72aSErik Eckstein return Res; 6884d6fb72aSErik Eckstein llvm_unreachable("InlineAsm blocks were not uniqued."); 6894d6fb72aSErik Eckstein return 0; 6904d6fb72aSErik Eckstein } 6914d6fb72aSErik Eckstein 6924d6fb72aSErik Eckstein /// Compare two values used by the two functions under pair-wise comparison. If 6934d6fb72aSErik Eckstein /// this is the first time the values are seen, they're added to the mapping so 6944d6fb72aSErik Eckstein /// that we will detect mismatches on next use. 6954d6fb72aSErik Eckstein /// See comments in declaration for more details. 6964d6fb72aSErik Eckstein int FunctionComparator::cmpValues(const Value *L, const Value *R) const { 6974d6fb72aSErik Eckstein // Catch self-reference case. 6984d6fb72aSErik Eckstein if (L == FnL) { 6994d6fb72aSErik Eckstein if (R == FnR) 7004d6fb72aSErik Eckstein return 0; 7014d6fb72aSErik Eckstein return -1; 7024d6fb72aSErik Eckstein } 7034d6fb72aSErik Eckstein if (R == FnR) { 7044d6fb72aSErik Eckstein if (L == FnL) 7054d6fb72aSErik Eckstein return 0; 7064d6fb72aSErik Eckstein return 1; 7074d6fb72aSErik Eckstein } 7084d6fb72aSErik Eckstein 7094d6fb72aSErik Eckstein const Constant *ConstL = dyn_cast<Constant>(L); 7104d6fb72aSErik Eckstein const Constant *ConstR = dyn_cast<Constant>(R); 7114d6fb72aSErik Eckstein if (ConstL && ConstR) { 7124d6fb72aSErik Eckstein if (L == R) 7134d6fb72aSErik Eckstein return 0; 7144d6fb72aSErik Eckstein return cmpConstants(ConstL, ConstR); 7154d6fb72aSErik Eckstein } 7164d6fb72aSErik Eckstein 7174d6fb72aSErik Eckstein if (ConstL) 7184d6fb72aSErik Eckstein return 1; 7194d6fb72aSErik Eckstein if (ConstR) 7204d6fb72aSErik Eckstein return -1; 7214d6fb72aSErik Eckstein 7224d6fb72aSErik Eckstein const InlineAsm *InlineAsmL = dyn_cast<InlineAsm>(L); 7234d6fb72aSErik Eckstein const InlineAsm *InlineAsmR = dyn_cast<InlineAsm>(R); 7244d6fb72aSErik Eckstein 7254d6fb72aSErik Eckstein if (InlineAsmL && InlineAsmR) 7264d6fb72aSErik Eckstein return cmpInlineAsm(InlineAsmL, InlineAsmR); 7274d6fb72aSErik Eckstein if (InlineAsmL) 7284d6fb72aSErik Eckstein return 1; 7294d6fb72aSErik Eckstein if (InlineAsmR) 7304d6fb72aSErik Eckstein return -1; 7314d6fb72aSErik Eckstein 7324d6fb72aSErik Eckstein auto LeftSN = sn_mapL.insert(std::make_pair(L, sn_mapL.size())), 7334d6fb72aSErik Eckstein RightSN = sn_mapR.insert(std::make_pair(R, sn_mapR.size())); 7344d6fb72aSErik Eckstein 7354d6fb72aSErik Eckstein return cmpNumbers(LeftSN.first->second, RightSN.first->second); 7364d6fb72aSErik Eckstein } 7374d6fb72aSErik Eckstein 7384d6fb72aSErik Eckstein // Test whether two basic blocks have equivalent behaviour. 7394d6fb72aSErik Eckstein int FunctionComparator::cmpBasicBlocks(const BasicBlock *BBL, 7404d6fb72aSErik Eckstein const BasicBlock *BBR) const { 7414d6fb72aSErik Eckstein BasicBlock::const_iterator InstL = BBL->begin(), InstLE = BBL->end(); 7424d6fb72aSErik Eckstein BasicBlock::const_iterator InstR = BBR->begin(), InstRE = BBR->end(); 7434d6fb72aSErik Eckstein 7444d6fb72aSErik Eckstein do { 7454d6fb72aSErik Eckstein bool needToCmpOperands = true; 7464d6fb72aSErik Eckstein if (int Res = cmpOperations(&*InstL, &*InstR, needToCmpOperands)) 7474d6fb72aSErik Eckstein return Res; 7484d6fb72aSErik Eckstein if (needToCmpOperands) { 7494d6fb72aSErik Eckstein assert(InstL->getNumOperands() == InstR->getNumOperands()); 7504d6fb72aSErik Eckstein 7514d6fb72aSErik Eckstein for (unsigned i = 0, e = InstL->getNumOperands(); i != e; ++i) { 7524d6fb72aSErik Eckstein Value *OpL = InstL->getOperand(i); 7534d6fb72aSErik Eckstein Value *OpR = InstR->getOperand(i); 7544d6fb72aSErik Eckstein if (int Res = cmpValues(OpL, OpR)) 7554d6fb72aSErik Eckstein return Res; 7564d6fb72aSErik Eckstein // cmpValues should ensure this is true. 7574d6fb72aSErik Eckstein assert(cmpTypes(OpL->getType(), OpR->getType()) == 0); 7584d6fb72aSErik Eckstein } 7594d6fb72aSErik Eckstein } 7604d6fb72aSErik Eckstein 7614d6fb72aSErik Eckstein ++InstL; 7624d6fb72aSErik Eckstein ++InstR; 7634d6fb72aSErik Eckstein } while (InstL != InstLE && InstR != InstRE); 7644d6fb72aSErik Eckstein 7654d6fb72aSErik Eckstein if (InstL != InstLE && InstR == InstRE) 7664d6fb72aSErik Eckstein return 1; 7674d6fb72aSErik Eckstein if (InstL == InstLE && InstR != InstRE) 7684d6fb72aSErik Eckstein return -1; 7694d6fb72aSErik Eckstein return 0; 7704d6fb72aSErik Eckstein } 7714d6fb72aSErik Eckstein 7724d6fb72aSErik Eckstein int FunctionComparator::compareSignature() const { 7734d6fb72aSErik Eckstein if (int Res = cmpAttrs(FnL->getAttributes(), FnR->getAttributes())) 7744d6fb72aSErik Eckstein return Res; 7754d6fb72aSErik Eckstein 7764d6fb72aSErik Eckstein if (int Res = cmpNumbers(FnL->hasGC(), FnR->hasGC())) 7774d6fb72aSErik Eckstein return Res; 7784d6fb72aSErik Eckstein 7794d6fb72aSErik Eckstein if (FnL->hasGC()) { 7804d6fb72aSErik Eckstein if (int Res = cmpMem(FnL->getGC(), FnR->getGC())) 7814d6fb72aSErik Eckstein return Res; 7824d6fb72aSErik Eckstein } 7834d6fb72aSErik Eckstein 7844d6fb72aSErik Eckstein if (int Res = cmpNumbers(FnL->hasSection(), FnR->hasSection())) 7854d6fb72aSErik Eckstein return Res; 7864d6fb72aSErik Eckstein 7874d6fb72aSErik Eckstein if (FnL->hasSection()) { 7884d6fb72aSErik Eckstein if (int Res = cmpMem(FnL->getSection(), FnR->getSection())) 7894d6fb72aSErik Eckstein return Res; 7904d6fb72aSErik Eckstein } 7914d6fb72aSErik Eckstein 7924d6fb72aSErik Eckstein if (int Res = cmpNumbers(FnL->isVarArg(), FnR->isVarArg())) 7934d6fb72aSErik Eckstein return Res; 7944d6fb72aSErik Eckstein 7954d6fb72aSErik Eckstein // TODO: if it's internal and only used in direct calls, we could handle this 7964d6fb72aSErik Eckstein // case too. 7974d6fb72aSErik Eckstein if (int Res = cmpNumbers(FnL->getCallingConv(), FnR->getCallingConv())) 7984d6fb72aSErik Eckstein return Res; 7994d6fb72aSErik Eckstein 8004d6fb72aSErik Eckstein if (int Res = cmpTypes(FnL->getFunctionType(), FnR->getFunctionType())) 8014d6fb72aSErik Eckstein return Res; 8024d6fb72aSErik Eckstein 8034d6fb72aSErik Eckstein assert(FnL->arg_size() == FnR->arg_size() && 8044d6fb72aSErik Eckstein "Identically typed functions have different numbers of args!"); 8054d6fb72aSErik Eckstein 8064d6fb72aSErik Eckstein // Visit the arguments so that they get enumerated in the order they're 8074d6fb72aSErik Eckstein // passed in. 8084d6fb72aSErik Eckstein for (Function::const_arg_iterator ArgLI = FnL->arg_begin(), 8094d6fb72aSErik Eckstein ArgRI = FnR->arg_begin(), 8104d6fb72aSErik Eckstein ArgLE = FnL->arg_end(); 8114d6fb72aSErik Eckstein ArgLI != ArgLE; ++ArgLI, ++ArgRI) { 8124d6fb72aSErik Eckstein if (cmpValues(&*ArgLI, &*ArgRI) != 0) 8134d6fb72aSErik Eckstein llvm_unreachable("Arguments repeat!"); 8144d6fb72aSErik Eckstein } 8154d6fb72aSErik Eckstein return 0; 8164d6fb72aSErik Eckstein } 8174d6fb72aSErik Eckstein 8184d6fb72aSErik Eckstein // Test whether the two functions have equivalent behaviour. 8194d6fb72aSErik Eckstein int FunctionComparator::compare() { 8204d6fb72aSErik Eckstein beginCompare(); 8214d6fb72aSErik Eckstein 8224d6fb72aSErik Eckstein if (int Res = compareSignature()) 8234d6fb72aSErik Eckstein return Res; 8244d6fb72aSErik Eckstein 8254d6fb72aSErik Eckstein // We do a CFG-ordered walk since the actual ordering of the blocks in the 8264d6fb72aSErik Eckstein // linked list is immaterial. Our walk starts at the entry block for both 8274d6fb72aSErik Eckstein // functions, then takes each block from each terminator in order. As an 8284d6fb72aSErik Eckstein // artifact, this also means that unreachable blocks are ignored. 8294d6fb72aSErik Eckstein SmallVector<const BasicBlock *, 8> FnLBBs, FnRBBs; 8304d6fb72aSErik Eckstein SmallPtrSet<const BasicBlock *, 32> VisitedBBs; // in terms of F1. 8314d6fb72aSErik Eckstein 8324d6fb72aSErik Eckstein FnLBBs.push_back(&FnL->getEntryBlock()); 8334d6fb72aSErik Eckstein FnRBBs.push_back(&FnR->getEntryBlock()); 8344d6fb72aSErik Eckstein 8354d6fb72aSErik Eckstein VisitedBBs.insert(FnLBBs[0]); 8364d6fb72aSErik Eckstein while (!FnLBBs.empty()) { 8374d6fb72aSErik Eckstein const BasicBlock *BBL = FnLBBs.pop_back_val(); 8384d6fb72aSErik Eckstein const BasicBlock *BBR = FnRBBs.pop_back_val(); 8394d6fb72aSErik Eckstein 8404d6fb72aSErik Eckstein if (int Res = cmpValues(BBL, BBR)) 8414d6fb72aSErik Eckstein return Res; 8424d6fb72aSErik Eckstein 8434d6fb72aSErik Eckstein if (int Res = cmpBasicBlocks(BBL, BBR)) 8444d6fb72aSErik Eckstein return Res; 8454d6fb72aSErik Eckstein 8464d6fb72aSErik Eckstein const TerminatorInst *TermL = BBL->getTerminator(); 8474d6fb72aSErik Eckstein const TerminatorInst *TermR = BBR->getTerminator(); 8484d6fb72aSErik Eckstein 8494d6fb72aSErik Eckstein assert(TermL->getNumSuccessors() == TermR->getNumSuccessors()); 8504d6fb72aSErik Eckstein for (unsigned i = 0, e = TermL->getNumSuccessors(); i != e; ++i) { 8514d6fb72aSErik Eckstein if (!VisitedBBs.insert(TermL->getSuccessor(i)).second) 8524d6fb72aSErik Eckstein continue; 8534d6fb72aSErik Eckstein 8544d6fb72aSErik Eckstein FnLBBs.push_back(TermL->getSuccessor(i)); 8554d6fb72aSErik Eckstein FnRBBs.push_back(TermR->getSuccessor(i)); 8564d6fb72aSErik Eckstein } 8574d6fb72aSErik Eckstein } 8584d6fb72aSErik Eckstein return 0; 8594d6fb72aSErik Eckstein } 8604d6fb72aSErik Eckstein 8614d6fb72aSErik Eckstein namespace { 8624d6fb72aSErik Eckstein 8634d6fb72aSErik Eckstein // Accumulate the hash of a sequence of 64-bit integers. This is similar to a 8644d6fb72aSErik Eckstein // hash of a sequence of 64bit ints, but the entire input does not need to be 8654d6fb72aSErik Eckstein // available at once. This interface is necessary for functionHash because it 8664d6fb72aSErik Eckstein // needs to accumulate the hash as the structure of the function is traversed 8674d6fb72aSErik Eckstein // without saving these values to an intermediate buffer. This form of hashing 8684d6fb72aSErik Eckstein // is not often needed, as usually the object to hash is just read from a 8694d6fb72aSErik Eckstein // buffer. 8704d6fb72aSErik Eckstein class HashAccumulator64 { 8714d6fb72aSErik Eckstein uint64_t Hash; 8724d6fb72aSErik Eckstein public: 8734d6fb72aSErik Eckstein // Initialize to random constant, so the state isn't zero. 8744d6fb72aSErik Eckstein HashAccumulator64() { Hash = 0x6acaa36bef8325c5ULL; } 8754d6fb72aSErik Eckstein void add(uint64_t V) { 8764d6fb72aSErik Eckstein Hash = llvm::hashing::detail::hash_16_bytes(Hash, V); 8774d6fb72aSErik Eckstein } 8784d6fb72aSErik Eckstein // No finishing is required, because the entire hash value is used. 8794d6fb72aSErik Eckstein uint64_t getHash() { return Hash; } 8804d6fb72aSErik Eckstein }; 8814d6fb72aSErik Eckstein } // end anonymous namespace 8824d6fb72aSErik Eckstein 8834d6fb72aSErik Eckstein // A function hash is calculated by considering only the number of arguments and 8844d6fb72aSErik Eckstein // whether a function is varargs, the order of basic blocks (given by the 8854d6fb72aSErik Eckstein // successors of each basic block in depth first order), and the order of 8864d6fb72aSErik Eckstein // opcodes of each instruction within each of these basic blocks. This mirrors 8874d6fb72aSErik Eckstein // the strategy compare() uses to compare functions by walking the BBs in depth 8884d6fb72aSErik Eckstein // first order and comparing each instruction in sequence. Because this hash 8894d6fb72aSErik Eckstein // does not look at the operands, it is insensitive to things such as the 8904d6fb72aSErik Eckstein // target of calls and the constants used in the function, which makes it useful 8914d6fb72aSErik Eckstein // when possibly merging functions which are the same modulo constants and call 8924d6fb72aSErik Eckstein // targets. 8934d6fb72aSErik Eckstein FunctionComparator::FunctionHash FunctionComparator::functionHash(Function &F) { 8944d6fb72aSErik Eckstein HashAccumulator64 H; 8954d6fb72aSErik Eckstein H.add(F.isVarArg()); 8964d6fb72aSErik Eckstein H.add(F.arg_size()); 8974d6fb72aSErik Eckstein 8984d6fb72aSErik Eckstein SmallVector<const BasicBlock *, 8> BBs; 8994d6fb72aSErik Eckstein SmallSet<const BasicBlock *, 16> VisitedBBs; 9004d6fb72aSErik Eckstein 9014d6fb72aSErik Eckstein // Walk the blocks in the same order as FunctionComparator::cmpBasicBlocks(), 9024d6fb72aSErik Eckstein // accumulating the hash of the function "structure." (BB and opcode sequence) 9034d6fb72aSErik Eckstein BBs.push_back(&F.getEntryBlock()); 9044d6fb72aSErik Eckstein VisitedBBs.insert(BBs[0]); 9054d6fb72aSErik Eckstein while (!BBs.empty()) { 9064d6fb72aSErik Eckstein const BasicBlock *BB = BBs.pop_back_val(); 9074d6fb72aSErik Eckstein // This random value acts as a block header, as otherwise the partition of 9084d6fb72aSErik Eckstein // opcodes into BBs wouldn't affect the hash, only the order of the opcodes 9094d6fb72aSErik Eckstein H.add(45798); 9104d6fb72aSErik Eckstein for (auto &Inst : *BB) { 9114d6fb72aSErik Eckstein H.add(Inst.getOpcode()); 9124d6fb72aSErik Eckstein } 9134d6fb72aSErik Eckstein const TerminatorInst *Term = BB->getTerminator(); 9144d6fb72aSErik Eckstein for (unsigned i = 0, e = Term->getNumSuccessors(); i != e; ++i) { 9154d6fb72aSErik Eckstein if (!VisitedBBs.insert(Term->getSuccessor(i)).second) 9164d6fb72aSErik Eckstein continue; 9174d6fb72aSErik Eckstein BBs.push_back(Term->getSuccessor(i)); 9184d6fb72aSErik Eckstein } 9194d6fb72aSErik Eckstein } 9204d6fb72aSErik Eckstein return H.getHash(); 9214d6fb72aSErik Eckstein } 9224d6fb72aSErik Eckstein 9234d6fb72aSErik Eckstein 924