14d6fb72aSErik Eckstein //===- FunctionComparator.h - Function Comparator -------------------------===// 24d6fb72aSErik Eckstein // 34d6fb72aSErik Eckstein // The LLVM Compiler Infrastructure 44d6fb72aSErik Eckstein // 54d6fb72aSErik Eckstein // This file is distributed under the University of Illinois Open Source 64d6fb72aSErik Eckstein // License. See LICENSE.TXT for details. 74d6fb72aSErik Eckstein // 84d6fb72aSErik Eckstein //===----------------------------------------------------------------------===// 94d6fb72aSErik Eckstein // 104d6fb72aSErik Eckstein // This file implements the FunctionComparator and GlobalNumberState classes 114d6fb72aSErik Eckstein // which are used by the MergeFunctions pass for comparing functions. 124d6fb72aSErik Eckstein // 134d6fb72aSErik Eckstein //===----------------------------------------------------------------------===// 144d6fb72aSErik Eckstein 154d6fb72aSErik Eckstein #include "llvm/Transforms/Utils/FunctionComparator.h" 16286d5897SEugene Zelenko #include "llvm/ADT/APFloat.h" 17286d5897SEugene Zelenko #include "llvm/ADT/APInt.h" 18286d5897SEugene Zelenko #include "llvm/ADT/ArrayRef.h" 19286d5897SEugene Zelenko #include "llvm/ADT/Hashing.h" 20286d5897SEugene Zelenko #include "llvm/ADT/SmallPtrSet.h" 214d6fb72aSErik Eckstein #include "llvm/ADT/SmallSet.h" 22286d5897SEugene Zelenko #include "llvm/ADT/SmallVector.h" 23286d5897SEugene Zelenko #include "llvm/IR/Attributes.h" 24286d5897SEugene Zelenko #include "llvm/IR/BasicBlock.h" 254d6fb72aSErik Eckstein #include "llvm/IR/CallSite.h" 26286d5897SEugene Zelenko #include "llvm/IR/Constant.h" 27286d5897SEugene Zelenko #include "llvm/IR/Constants.h" 28286d5897SEugene Zelenko #include "llvm/IR/DataLayout.h" 29286d5897SEugene Zelenko #include "llvm/IR/DerivedTypes.h" 30286d5897SEugene Zelenko #include "llvm/IR/Function.h" 31286d5897SEugene Zelenko #include "llvm/IR/GlobalValue.h" 324d6fb72aSErik Eckstein #include "llvm/IR/InlineAsm.h" 33286d5897SEugene Zelenko #include "llvm/IR/InstrTypes.h" 34286d5897SEugene Zelenko #include "llvm/IR/Instruction.h" 356bda14b3SChandler Carruth #include "llvm/IR/Instructions.h" 36286d5897SEugene Zelenko #include "llvm/IR/LLVMContext.h" 37286d5897SEugene Zelenko #include "llvm/IR/Metadata.h" 384d6fb72aSErik Eckstein #include "llvm/IR/Module.h" 39286d5897SEugene Zelenko #include "llvm/IR/Operator.h" 40286d5897SEugene Zelenko #include "llvm/IR/Type.h" 41286d5897SEugene Zelenko #include "llvm/IR/Value.h" 42286d5897SEugene Zelenko #include "llvm/Support/Casting.h" 43286d5897SEugene Zelenko #include "llvm/Support/Compiler.h" 444d6fb72aSErik Eckstein #include "llvm/Support/Debug.h" 45286d5897SEugene Zelenko #include "llvm/Support/ErrorHandling.h" 464d6fb72aSErik Eckstein #include "llvm/Support/raw_ostream.h" 47286d5897SEugene Zelenko #include <cassert> 48286d5897SEugene Zelenko #include <cstddef> 49286d5897SEugene Zelenko #include <cstdint> 50286d5897SEugene Zelenko #include <utility> 514d6fb72aSErik Eckstein 524d6fb72aSErik Eckstein using namespace llvm; 534d6fb72aSErik Eckstein 544d6fb72aSErik Eckstein #define DEBUG_TYPE "functioncomparator" 554d6fb72aSErik Eckstein 564d6fb72aSErik Eckstein int FunctionComparator::cmpNumbers(uint64_t L, uint64_t R) const { 574d6fb72aSErik Eckstein if (L < R) return -1; 584d6fb72aSErik Eckstein if (L > R) return 1; 594d6fb72aSErik Eckstein return 0; 604d6fb72aSErik Eckstein } 614d6fb72aSErik Eckstein 624d6fb72aSErik Eckstein int FunctionComparator::cmpOrderings(AtomicOrdering L, AtomicOrdering R) const { 634d6fb72aSErik Eckstein if ((int)L < (int)R) return -1; 644d6fb72aSErik Eckstein if ((int)L > (int)R) return 1; 654d6fb72aSErik Eckstein return 0; 664d6fb72aSErik Eckstein } 674d6fb72aSErik Eckstein 684d6fb72aSErik Eckstein int FunctionComparator::cmpAPInts(const APInt &L, const APInt &R) const { 694d6fb72aSErik Eckstein if (int Res = cmpNumbers(L.getBitWidth(), R.getBitWidth())) 704d6fb72aSErik Eckstein return Res; 714d6fb72aSErik Eckstein if (L.ugt(R)) return 1; 724d6fb72aSErik Eckstein if (R.ugt(L)) return -1; 734d6fb72aSErik Eckstein return 0; 744d6fb72aSErik Eckstein } 754d6fb72aSErik Eckstein 764d6fb72aSErik Eckstein int FunctionComparator::cmpAPFloats(const APFloat &L, const APFloat &R) const { 774d6fb72aSErik Eckstein // Floats are ordered first by semantics (i.e. float, double, half, etc.), 784d6fb72aSErik Eckstein // then by value interpreted as a bitstring (aka APInt). 794d6fb72aSErik Eckstein const fltSemantics &SL = L.getSemantics(), &SR = R.getSemantics(); 804d6fb72aSErik Eckstein if (int Res = cmpNumbers(APFloat::semanticsPrecision(SL), 814d6fb72aSErik Eckstein APFloat::semanticsPrecision(SR))) 824d6fb72aSErik Eckstein return Res; 834d6fb72aSErik Eckstein if (int Res = cmpNumbers(APFloat::semanticsMaxExponent(SL), 844d6fb72aSErik Eckstein APFloat::semanticsMaxExponent(SR))) 854d6fb72aSErik Eckstein return Res; 864d6fb72aSErik Eckstein if (int Res = cmpNumbers(APFloat::semanticsMinExponent(SL), 874d6fb72aSErik Eckstein APFloat::semanticsMinExponent(SR))) 884d6fb72aSErik Eckstein return Res; 894d6fb72aSErik Eckstein if (int Res = cmpNumbers(APFloat::semanticsSizeInBits(SL), 904d6fb72aSErik Eckstein APFloat::semanticsSizeInBits(SR))) 914d6fb72aSErik Eckstein return Res; 924d6fb72aSErik Eckstein return cmpAPInts(L.bitcastToAPInt(), R.bitcastToAPInt()); 934d6fb72aSErik Eckstein } 944d6fb72aSErik Eckstein 954d6fb72aSErik Eckstein int FunctionComparator::cmpMem(StringRef L, StringRef R) const { 964d6fb72aSErik Eckstein // Prevent heavy comparison, compare sizes first. 974d6fb72aSErik Eckstein if (int Res = cmpNumbers(L.size(), R.size())) 984d6fb72aSErik Eckstein return Res; 994d6fb72aSErik Eckstein 1004d6fb72aSErik Eckstein // Compare strings lexicographically only when it is necessary: only when 1014d6fb72aSErik Eckstein // strings are equal in size. 1024d6fb72aSErik Eckstein return L.compare(R); 1034d6fb72aSErik Eckstein } 1044d6fb72aSErik Eckstein 105b518054bSReid Kleckner int FunctionComparator::cmpAttrs(const AttributeList L, 106b518054bSReid Kleckner const AttributeList R) const { 1078bf67fe9SReid Kleckner if (int Res = cmpNumbers(L.getNumAttrSets(), R.getNumAttrSets())) 1084d6fb72aSErik Eckstein return Res; 1094d6fb72aSErik Eckstein 1108bf67fe9SReid Kleckner for (unsigned i = L.index_begin(), e = L.index_end(); i != e; ++i) { 1118bf67fe9SReid Kleckner AttributeSet LAS = L.getAttributes(i); 1128bf67fe9SReid Kleckner AttributeSet RAS = R.getAttributes(i); 1138bf67fe9SReid Kleckner AttributeSet::iterator LI = LAS.begin(), LE = LAS.end(); 1148bf67fe9SReid Kleckner AttributeSet::iterator RI = RAS.begin(), RE = RAS.end(); 1154d6fb72aSErik Eckstein for (; LI != LE && RI != RE; ++LI, ++RI) { 1164d6fb72aSErik Eckstein Attribute LA = *LI; 1174d6fb72aSErik Eckstein Attribute RA = *RI; 1184d6fb72aSErik Eckstein if (LA < RA) 1194d6fb72aSErik Eckstein return -1; 1204d6fb72aSErik Eckstein if (RA < LA) 1214d6fb72aSErik Eckstein return 1; 1224d6fb72aSErik Eckstein } 1234d6fb72aSErik Eckstein if (LI != LE) 1244d6fb72aSErik Eckstein return 1; 1254d6fb72aSErik Eckstein if (RI != RE) 1264d6fb72aSErik Eckstein return -1; 1274d6fb72aSErik Eckstein } 1284d6fb72aSErik Eckstein return 0; 1294d6fb72aSErik Eckstein } 1304d6fb72aSErik Eckstein 1314d6fb72aSErik Eckstein int FunctionComparator::cmpRangeMetadata(const MDNode *L, 1324d6fb72aSErik Eckstein const MDNode *R) const { 1334d6fb72aSErik Eckstein if (L == R) 1344d6fb72aSErik Eckstein return 0; 1354d6fb72aSErik Eckstein if (!L) 1364d6fb72aSErik Eckstein return -1; 1374d6fb72aSErik Eckstein if (!R) 1384d6fb72aSErik Eckstein return 1; 1394d6fb72aSErik Eckstein // Range metadata is a sequence of numbers. Make sure they are the same 1404d6fb72aSErik Eckstein // sequence. 1414d6fb72aSErik Eckstein // TODO: Note that as this is metadata, it is possible to drop and/or merge 1424d6fb72aSErik Eckstein // this data when considering functions to merge. Thus this comparison would 1434d6fb72aSErik Eckstein // return 0 (i.e. equivalent), but merging would become more complicated 1444d6fb72aSErik Eckstein // because the ranges would need to be unioned. It is not likely that 1454d6fb72aSErik Eckstein // functions differ ONLY in this metadata if they are actually the same 1464d6fb72aSErik Eckstein // function semantically. 1474d6fb72aSErik Eckstein if (int Res = cmpNumbers(L->getNumOperands(), R->getNumOperands())) 1484d6fb72aSErik Eckstein return Res; 1494d6fb72aSErik Eckstein for (size_t I = 0; I < L->getNumOperands(); ++I) { 1504d6fb72aSErik Eckstein ConstantInt *LLow = mdconst::extract<ConstantInt>(L->getOperand(I)); 1514d6fb72aSErik Eckstein ConstantInt *RLow = mdconst::extract<ConstantInt>(R->getOperand(I)); 1524d6fb72aSErik Eckstein if (int Res = cmpAPInts(LLow->getValue(), RLow->getValue())) 1534d6fb72aSErik Eckstein return Res; 1544d6fb72aSErik Eckstein } 1554d6fb72aSErik Eckstein return 0; 1564d6fb72aSErik Eckstein } 1574d6fb72aSErik Eckstein 1584d6fb72aSErik Eckstein int FunctionComparator::cmpOperandBundlesSchema(const Instruction *L, 1594d6fb72aSErik Eckstein const Instruction *R) const { 1604d6fb72aSErik Eckstein ImmutableCallSite LCS(L); 1614d6fb72aSErik Eckstein ImmutableCallSite RCS(R); 1624d6fb72aSErik Eckstein 1634d6fb72aSErik Eckstein assert(LCS && RCS && "Must be calls or invokes!"); 1644d6fb72aSErik Eckstein assert(LCS.isCall() == RCS.isCall() && "Can't compare otherwise!"); 1654d6fb72aSErik Eckstein 1664d6fb72aSErik Eckstein if (int Res = 1674d6fb72aSErik Eckstein cmpNumbers(LCS.getNumOperandBundles(), RCS.getNumOperandBundles())) 1684d6fb72aSErik Eckstein return Res; 1694d6fb72aSErik Eckstein 1704d6fb72aSErik Eckstein for (unsigned i = 0, e = LCS.getNumOperandBundles(); i != e; ++i) { 1714d6fb72aSErik Eckstein auto OBL = LCS.getOperandBundleAt(i); 1724d6fb72aSErik Eckstein auto OBR = RCS.getOperandBundleAt(i); 1734d6fb72aSErik Eckstein 1744d6fb72aSErik Eckstein if (int Res = OBL.getTagName().compare(OBR.getTagName())) 1754d6fb72aSErik Eckstein return Res; 1764d6fb72aSErik Eckstein 1774d6fb72aSErik Eckstein if (int Res = cmpNumbers(OBL.Inputs.size(), OBR.Inputs.size())) 1784d6fb72aSErik Eckstein return Res; 1794d6fb72aSErik Eckstein } 1804d6fb72aSErik Eckstein 1814d6fb72aSErik Eckstein return 0; 1824d6fb72aSErik Eckstein } 1834d6fb72aSErik Eckstein 1844d6fb72aSErik Eckstein /// Constants comparison: 1854d6fb72aSErik Eckstein /// 1. Check whether type of L constant could be losslessly bitcasted to R 1864d6fb72aSErik Eckstein /// type. 1874d6fb72aSErik Eckstein /// 2. Compare constant contents. 1884d6fb72aSErik Eckstein /// For more details see declaration comments. 1894d6fb72aSErik Eckstein int FunctionComparator::cmpConstants(const Constant *L, 1904d6fb72aSErik Eckstein const Constant *R) const { 1914d6fb72aSErik Eckstein Type *TyL = L->getType(); 1924d6fb72aSErik Eckstein Type *TyR = R->getType(); 1934d6fb72aSErik Eckstein 1944d6fb72aSErik Eckstein // Check whether types are bitcastable. This part is just re-factored 1954d6fb72aSErik Eckstein // Type::canLosslesslyBitCastTo method, but instead of returning true/false, 1964d6fb72aSErik Eckstein // we also pack into result which type is "less" for us. 1974d6fb72aSErik Eckstein int TypesRes = cmpTypes(TyL, TyR); 1984d6fb72aSErik Eckstein if (TypesRes != 0) { 1994d6fb72aSErik Eckstein // Types are different, but check whether we can bitcast them. 2004d6fb72aSErik Eckstein if (!TyL->isFirstClassType()) { 2014d6fb72aSErik Eckstein if (TyR->isFirstClassType()) 2024d6fb72aSErik Eckstein return -1; 2034d6fb72aSErik Eckstein // Neither TyL nor TyR are values of first class type. Return the result 2044d6fb72aSErik Eckstein // of comparing the types 2054d6fb72aSErik Eckstein return TypesRes; 2064d6fb72aSErik Eckstein } 2074d6fb72aSErik Eckstein if (!TyR->isFirstClassType()) { 2084d6fb72aSErik Eckstein if (TyL->isFirstClassType()) 2094d6fb72aSErik Eckstein return 1; 2104d6fb72aSErik Eckstein return TypesRes; 2114d6fb72aSErik Eckstein } 2124d6fb72aSErik Eckstein 2134d6fb72aSErik Eckstein // Vector -> Vector conversions are always lossless if the two vector types 2144d6fb72aSErik Eckstein // have the same size, otherwise not. 2154d6fb72aSErik Eckstein unsigned TyLWidth = 0; 2164d6fb72aSErik Eckstein unsigned TyRWidth = 0; 2174d6fb72aSErik Eckstein 2184d6fb72aSErik Eckstein if (auto *VecTyL = dyn_cast<VectorType>(TyL)) 2194d6fb72aSErik Eckstein TyLWidth = VecTyL->getBitWidth(); 2204d6fb72aSErik Eckstein if (auto *VecTyR = dyn_cast<VectorType>(TyR)) 2214d6fb72aSErik Eckstein TyRWidth = VecTyR->getBitWidth(); 2224d6fb72aSErik Eckstein 2234d6fb72aSErik Eckstein if (TyLWidth != TyRWidth) 2244d6fb72aSErik Eckstein return cmpNumbers(TyLWidth, TyRWidth); 2254d6fb72aSErik Eckstein 2264d6fb72aSErik Eckstein // Zero bit-width means neither TyL nor TyR are vectors. 2274d6fb72aSErik Eckstein if (!TyLWidth) { 2284d6fb72aSErik Eckstein PointerType *PTyL = dyn_cast<PointerType>(TyL); 2294d6fb72aSErik Eckstein PointerType *PTyR = dyn_cast<PointerType>(TyR); 2304d6fb72aSErik Eckstein if (PTyL && PTyR) { 2314d6fb72aSErik Eckstein unsigned AddrSpaceL = PTyL->getAddressSpace(); 2324d6fb72aSErik Eckstein unsigned AddrSpaceR = PTyR->getAddressSpace(); 2334d6fb72aSErik Eckstein if (int Res = cmpNumbers(AddrSpaceL, AddrSpaceR)) 2344d6fb72aSErik Eckstein return Res; 2354d6fb72aSErik Eckstein } 2364d6fb72aSErik Eckstein if (PTyL) 2374d6fb72aSErik Eckstein return 1; 2384d6fb72aSErik Eckstein if (PTyR) 2394d6fb72aSErik Eckstein return -1; 2404d6fb72aSErik Eckstein 2414d6fb72aSErik Eckstein // TyL and TyR aren't vectors, nor pointers. We don't know how to 2424d6fb72aSErik Eckstein // bitcast them. 2434d6fb72aSErik Eckstein return TypesRes; 2444d6fb72aSErik Eckstein } 2454d6fb72aSErik Eckstein } 2464d6fb72aSErik Eckstein 2474d6fb72aSErik Eckstein // OK, types are bitcastable, now check constant contents. 2484d6fb72aSErik Eckstein 2494d6fb72aSErik Eckstein if (L->isNullValue() && R->isNullValue()) 2504d6fb72aSErik Eckstein return TypesRes; 2514d6fb72aSErik Eckstein if (L->isNullValue() && !R->isNullValue()) 2524d6fb72aSErik Eckstein return 1; 2534d6fb72aSErik Eckstein if (!L->isNullValue() && R->isNullValue()) 2544d6fb72aSErik Eckstein return -1; 2554d6fb72aSErik Eckstein 2564d6fb72aSErik Eckstein auto GlobalValueL = const_cast<GlobalValue *>(dyn_cast<GlobalValue>(L)); 2574d6fb72aSErik Eckstein auto GlobalValueR = const_cast<GlobalValue *>(dyn_cast<GlobalValue>(R)); 2584d6fb72aSErik Eckstein if (GlobalValueL && GlobalValueR) { 2594d6fb72aSErik Eckstein return cmpGlobalValues(GlobalValueL, GlobalValueR); 2604d6fb72aSErik Eckstein } 2614d6fb72aSErik Eckstein 2624d6fb72aSErik Eckstein if (int Res = cmpNumbers(L->getValueID(), R->getValueID())) 2634d6fb72aSErik Eckstein return Res; 2644d6fb72aSErik Eckstein 2654d6fb72aSErik Eckstein if (const auto *SeqL = dyn_cast<ConstantDataSequential>(L)) { 2664d6fb72aSErik Eckstein const auto *SeqR = cast<ConstantDataSequential>(R); 2674d6fb72aSErik Eckstein // This handles ConstantDataArray and ConstantDataVector. Note that we 2684d6fb72aSErik Eckstein // compare the two raw data arrays, which might differ depending on the host 2694d6fb72aSErik Eckstein // endianness. This isn't a problem though, because the endiness of a module 2704d6fb72aSErik Eckstein // will affect the order of the constants, but this order is the same 2714d6fb72aSErik Eckstein // for a given input module and host platform. 2724d6fb72aSErik Eckstein return cmpMem(SeqL->getRawDataValues(), SeqR->getRawDataValues()); 2734d6fb72aSErik Eckstein } 2744d6fb72aSErik Eckstein 2754d6fb72aSErik Eckstein switch (L->getValueID()) { 2764d6fb72aSErik Eckstein case Value::UndefValueVal: 2774d6fb72aSErik Eckstein case Value::ConstantTokenNoneVal: 2784d6fb72aSErik Eckstein return TypesRes; 2794d6fb72aSErik Eckstein case Value::ConstantIntVal: { 2804d6fb72aSErik Eckstein const APInt &LInt = cast<ConstantInt>(L)->getValue(); 2814d6fb72aSErik Eckstein const APInt &RInt = cast<ConstantInt>(R)->getValue(); 2824d6fb72aSErik Eckstein return cmpAPInts(LInt, RInt); 2834d6fb72aSErik Eckstein } 2844d6fb72aSErik Eckstein case Value::ConstantFPVal: { 2854d6fb72aSErik Eckstein const APFloat &LAPF = cast<ConstantFP>(L)->getValueAPF(); 2864d6fb72aSErik Eckstein const APFloat &RAPF = cast<ConstantFP>(R)->getValueAPF(); 2874d6fb72aSErik Eckstein return cmpAPFloats(LAPF, RAPF); 2884d6fb72aSErik Eckstein } 2894d6fb72aSErik Eckstein case Value::ConstantArrayVal: { 2904d6fb72aSErik Eckstein const ConstantArray *LA = cast<ConstantArray>(L); 2914d6fb72aSErik Eckstein const ConstantArray *RA = cast<ConstantArray>(R); 2924d6fb72aSErik Eckstein uint64_t NumElementsL = cast<ArrayType>(TyL)->getNumElements(); 2934d6fb72aSErik Eckstein uint64_t NumElementsR = cast<ArrayType>(TyR)->getNumElements(); 2944d6fb72aSErik Eckstein if (int Res = cmpNumbers(NumElementsL, NumElementsR)) 2954d6fb72aSErik Eckstein return Res; 2964d6fb72aSErik Eckstein for (uint64_t i = 0; i < NumElementsL; ++i) { 2974d6fb72aSErik Eckstein if (int Res = cmpConstants(cast<Constant>(LA->getOperand(i)), 2984d6fb72aSErik Eckstein cast<Constant>(RA->getOperand(i)))) 2994d6fb72aSErik Eckstein return Res; 3004d6fb72aSErik Eckstein } 3014d6fb72aSErik Eckstein return 0; 3024d6fb72aSErik Eckstein } 3034d6fb72aSErik Eckstein case Value::ConstantStructVal: { 3044d6fb72aSErik Eckstein const ConstantStruct *LS = cast<ConstantStruct>(L); 3054d6fb72aSErik Eckstein const ConstantStruct *RS = cast<ConstantStruct>(R); 3064d6fb72aSErik Eckstein unsigned NumElementsL = cast<StructType>(TyL)->getNumElements(); 3074d6fb72aSErik Eckstein unsigned NumElementsR = cast<StructType>(TyR)->getNumElements(); 3084d6fb72aSErik Eckstein if (int Res = cmpNumbers(NumElementsL, NumElementsR)) 3094d6fb72aSErik Eckstein return Res; 3104d6fb72aSErik Eckstein for (unsigned i = 0; i != NumElementsL; ++i) { 3114d6fb72aSErik Eckstein if (int Res = cmpConstants(cast<Constant>(LS->getOperand(i)), 3124d6fb72aSErik Eckstein cast<Constant>(RS->getOperand(i)))) 3134d6fb72aSErik Eckstein return Res; 3144d6fb72aSErik Eckstein } 3154d6fb72aSErik Eckstein return 0; 3164d6fb72aSErik Eckstein } 3174d6fb72aSErik Eckstein case Value::ConstantVectorVal: { 3184d6fb72aSErik Eckstein const ConstantVector *LV = cast<ConstantVector>(L); 3194d6fb72aSErik Eckstein const ConstantVector *RV = cast<ConstantVector>(R); 3204d6fb72aSErik Eckstein unsigned NumElementsL = cast<VectorType>(TyL)->getNumElements(); 3214d6fb72aSErik Eckstein unsigned NumElementsR = cast<VectorType>(TyR)->getNumElements(); 3224d6fb72aSErik Eckstein if (int Res = cmpNumbers(NumElementsL, NumElementsR)) 3234d6fb72aSErik Eckstein return Res; 3244d6fb72aSErik Eckstein for (uint64_t i = 0; i < NumElementsL; ++i) { 3254d6fb72aSErik Eckstein if (int Res = cmpConstants(cast<Constant>(LV->getOperand(i)), 3264d6fb72aSErik Eckstein cast<Constant>(RV->getOperand(i)))) 3274d6fb72aSErik Eckstein return Res; 3284d6fb72aSErik Eckstein } 3294d6fb72aSErik Eckstein return 0; 3304d6fb72aSErik Eckstein } 3314d6fb72aSErik Eckstein case Value::ConstantExprVal: { 3324d6fb72aSErik Eckstein const ConstantExpr *LE = cast<ConstantExpr>(L); 3334d6fb72aSErik Eckstein const ConstantExpr *RE = cast<ConstantExpr>(R); 3344d6fb72aSErik Eckstein unsigned NumOperandsL = LE->getNumOperands(); 3354d6fb72aSErik Eckstein unsigned NumOperandsR = RE->getNumOperands(); 3364d6fb72aSErik Eckstein if (int Res = cmpNumbers(NumOperandsL, NumOperandsR)) 3374d6fb72aSErik Eckstein return Res; 3384d6fb72aSErik Eckstein for (unsigned i = 0; i < NumOperandsL; ++i) { 3394d6fb72aSErik Eckstein if (int Res = cmpConstants(cast<Constant>(LE->getOperand(i)), 3404d6fb72aSErik Eckstein cast<Constant>(RE->getOperand(i)))) 3414d6fb72aSErik Eckstein return Res; 3424d6fb72aSErik Eckstein } 3434d6fb72aSErik Eckstein return 0; 3444d6fb72aSErik Eckstein } 3454d6fb72aSErik Eckstein case Value::BlockAddressVal: { 3464d6fb72aSErik Eckstein const BlockAddress *LBA = cast<BlockAddress>(L); 3474d6fb72aSErik Eckstein const BlockAddress *RBA = cast<BlockAddress>(R); 3484d6fb72aSErik Eckstein if (int Res = cmpValues(LBA->getFunction(), RBA->getFunction())) 3494d6fb72aSErik Eckstein return Res; 3504d6fb72aSErik Eckstein if (LBA->getFunction() == RBA->getFunction()) { 3514d6fb72aSErik Eckstein // They are BBs in the same function. Order by which comes first in the 3524d6fb72aSErik Eckstein // BB order of the function. This order is deterministic. 3534d6fb72aSErik Eckstein Function* F = LBA->getFunction(); 3544d6fb72aSErik Eckstein BasicBlock *LBB = LBA->getBasicBlock(); 3554d6fb72aSErik Eckstein BasicBlock *RBB = RBA->getBasicBlock(); 3564d6fb72aSErik Eckstein if (LBB == RBB) 3574d6fb72aSErik Eckstein return 0; 3584d6fb72aSErik Eckstein for(BasicBlock &BB : F->getBasicBlockList()) { 3594d6fb72aSErik Eckstein if (&BB == LBB) { 3604d6fb72aSErik Eckstein assert(&BB != RBB); 3614d6fb72aSErik Eckstein return -1; 3624d6fb72aSErik Eckstein } 3634d6fb72aSErik Eckstein if (&BB == RBB) 3644d6fb72aSErik Eckstein return 1; 3654d6fb72aSErik Eckstein } 3664d6fb72aSErik Eckstein llvm_unreachable("Basic Block Address does not point to a basic block in " 3674d6fb72aSErik Eckstein "its function."); 3684d6fb72aSErik Eckstein return -1; 3694d6fb72aSErik Eckstein } else { 3704d6fb72aSErik Eckstein // cmpValues said the functions are the same. So because they aren't 3714d6fb72aSErik Eckstein // literally the same pointer, they must respectively be the left and 3724d6fb72aSErik Eckstein // right functions. 3734d6fb72aSErik Eckstein assert(LBA->getFunction() == FnL && RBA->getFunction() == FnR); 3744d6fb72aSErik Eckstein // cmpValues will tell us if these are equivalent BasicBlocks, in the 3754d6fb72aSErik Eckstein // context of their respective functions. 3764d6fb72aSErik Eckstein return cmpValues(LBA->getBasicBlock(), RBA->getBasicBlock()); 3774d6fb72aSErik Eckstein } 3784d6fb72aSErik Eckstein } 3794d6fb72aSErik Eckstein default: // Unknown constant, abort. 380*d34e60caSNicola Zaghen LLVM_DEBUG(dbgs() << "Looking at valueID " << L->getValueID() << "\n"); 3814d6fb72aSErik Eckstein llvm_unreachable("Constant ValueID not recognized."); 3824d6fb72aSErik Eckstein return -1; 3834d6fb72aSErik Eckstein } 3844d6fb72aSErik Eckstein } 3854d6fb72aSErik Eckstein 3864d6fb72aSErik Eckstein int FunctionComparator::cmpGlobalValues(GlobalValue *L, GlobalValue *R) const { 387c1d52e5cSErik Eckstein uint64_t LNumber = GlobalNumbers->getNumber(L); 388c1d52e5cSErik Eckstein uint64_t RNumber = GlobalNumbers->getNumber(R); 389c1d52e5cSErik Eckstein return cmpNumbers(LNumber, RNumber); 3904d6fb72aSErik Eckstein } 3914d6fb72aSErik Eckstein 3924d6fb72aSErik Eckstein /// cmpType - compares two types, 3934d6fb72aSErik Eckstein /// defines total ordering among the types set. 3944d6fb72aSErik Eckstein /// See method declaration comments for more details. 3954d6fb72aSErik Eckstein int FunctionComparator::cmpTypes(Type *TyL, Type *TyR) const { 3964d6fb72aSErik Eckstein PointerType *PTyL = dyn_cast<PointerType>(TyL); 3974d6fb72aSErik Eckstein PointerType *PTyR = dyn_cast<PointerType>(TyR); 3984d6fb72aSErik Eckstein 3994d6fb72aSErik Eckstein const DataLayout &DL = FnL->getParent()->getDataLayout(); 4004d6fb72aSErik Eckstein if (PTyL && PTyL->getAddressSpace() == 0) 4014d6fb72aSErik Eckstein TyL = DL.getIntPtrType(TyL); 4024d6fb72aSErik Eckstein if (PTyR && PTyR->getAddressSpace() == 0) 4034d6fb72aSErik Eckstein TyR = DL.getIntPtrType(TyR); 4044d6fb72aSErik Eckstein 4054d6fb72aSErik Eckstein if (TyL == TyR) 4064d6fb72aSErik Eckstein return 0; 4074d6fb72aSErik Eckstein 4084d6fb72aSErik Eckstein if (int Res = cmpNumbers(TyL->getTypeID(), TyR->getTypeID())) 4094d6fb72aSErik Eckstein return Res; 4104d6fb72aSErik Eckstein 4114d6fb72aSErik Eckstein switch (TyL->getTypeID()) { 4124d6fb72aSErik Eckstein default: 4134d6fb72aSErik Eckstein llvm_unreachable("Unknown type!"); 4144d6fb72aSErik Eckstein // Fall through in Release mode. 4154d6fb72aSErik Eckstein LLVM_FALLTHROUGH; 4164d6fb72aSErik Eckstein case Type::IntegerTyID: 4174d6fb72aSErik Eckstein return cmpNumbers(cast<IntegerType>(TyL)->getBitWidth(), 4184d6fb72aSErik Eckstein cast<IntegerType>(TyR)->getBitWidth()); 4194d6fb72aSErik Eckstein // TyL == TyR would have returned true earlier, because types are uniqued. 4204d6fb72aSErik Eckstein case Type::VoidTyID: 4214d6fb72aSErik Eckstein case Type::FloatTyID: 4224d6fb72aSErik Eckstein case Type::DoubleTyID: 4234d6fb72aSErik Eckstein case Type::X86_FP80TyID: 4244d6fb72aSErik Eckstein case Type::FP128TyID: 4254d6fb72aSErik Eckstein case Type::PPC_FP128TyID: 4264d6fb72aSErik Eckstein case Type::LabelTyID: 4274d6fb72aSErik Eckstein case Type::MetadataTyID: 4284d6fb72aSErik Eckstein case Type::TokenTyID: 4294d6fb72aSErik Eckstein return 0; 4304d6fb72aSErik Eckstein 431286d5897SEugene Zelenko case Type::PointerTyID: 4324d6fb72aSErik Eckstein assert(PTyL && PTyR && "Both types must be pointers here."); 4334d6fb72aSErik Eckstein return cmpNumbers(PTyL->getAddressSpace(), PTyR->getAddressSpace()); 4344d6fb72aSErik Eckstein 4354d6fb72aSErik Eckstein case Type::StructTyID: { 4364d6fb72aSErik Eckstein StructType *STyL = cast<StructType>(TyL); 4374d6fb72aSErik Eckstein StructType *STyR = cast<StructType>(TyR); 4384d6fb72aSErik Eckstein if (STyL->getNumElements() != STyR->getNumElements()) 4394d6fb72aSErik Eckstein return cmpNumbers(STyL->getNumElements(), STyR->getNumElements()); 4404d6fb72aSErik Eckstein 4414d6fb72aSErik Eckstein if (STyL->isPacked() != STyR->isPacked()) 4424d6fb72aSErik Eckstein return cmpNumbers(STyL->isPacked(), STyR->isPacked()); 4434d6fb72aSErik Eckstein 4444d6fb72aSErik Eckstein for (unsigned i = 0, e = STyL->getNumElements(); i != e; ++i) { 4454d6fb72aSErik Eckstein if (int Res = cmpTypes(STyL->getElementType(i), STyR->getElementType(i))) 4464d6fb72aSErik Eckstein return Res; 4474d6fb72aSErik Eckstein } 4484d6fb72aSErik Eckstein return 0; 4494d6fb72aSErik Eckstein } 4504d6fb72aSErik Eckstein 4514d6fb72aSErik Eckstein case Type::FunctionTyID: { 4524d6fb72aSErik Eckstein FunctionType *FTyL = cast<FunctionType>(TyL); 4534d6fb72aSErik Eckstein FunctionType *FTyR = cast<FunctionType>(TyR); 4544d6fb72aSErik Eckstein if (FTyL->getNumParams() != FTyR->getNumParams()) 4554d6fb72aSErik Eckstein return cmpNumbers(FTyL->getNumParams(), FTyR->getNumParams()); 4564d6fb72aSErik Eckstein 4574d6fb72aSErik Eckstein if (FTyL->isVarArg() != FTyR->isVarArg()) 4584d6fb72aSErik Eckstein return cmpNumbers(FTyL->isVarArg(), FTyR->isVarArg()); 4594d6fb72aSErik Eckstein 4604d6fb72aSErik Eckstein if (int Res = cmpTypes(FTyL->getReturnType(), FTyR->getReturnType())) 4614d6fb72aSErik Eckstein return Res; 4624d6fb72aSErik Eckstein 4634d6fb72aSErik Eckstein for (unsigned i = 0, e = FTyL->getNumParams(); i != e; ++i) { 4644d6fb72aSErik Eckstein if (int Res = cmpTypes(FTyL->getParamType(i), FTyR->getParamType(i))) 4654d6fb72aSErik Eckstein return Res; 4664d6fb72aSErik Eckstein } 4674d6fb72aSErik Eckstein return 0; 4684d6fb72aSErik Eckstein } 4694d6fb72aSErik Eckstein 470bc070524SPeter Collingbourne case Type::ArrayTyID: 471bc070524SPeter Collingbourne case Type::VectorTyID: { 472bc070524SPeter Collingbourne auto *STyL = cast<SequentialType>(TyL); 473bc070524SPeter Collingbourne auto *STyR = cast<SequentialType>(TyR); 474bc070524SPeter Collingbourne if (STyL->getNumElements() != STyR->getNumElements()) 475bc070524SPeter Collingbourne return cmpNumbers(STyL->getNumElements(), STyR->getNumElements()); 476bc070524SPeter Collingbourne return cmpTypes(STyL->getElementType(), STyR->getElementType()); 4774d6fb72aSErik Eckstein } 4784d6fb72aSErik Eckstein } 4794d6fb72aSErik Eckstein } 4804d6fb72aSErik Eckstein 4814d6fb72aSErik Eckstein // Determine whether the two operations are the same except that pointer-to-A 4824d6fb72aSErik Eckstein // and pointer-to-B are equivalent. This should be kept in sync with 4834d6fb72aSErik Eckstein // Instruction::isSameOperationAs. 4844d6fb72aSErik Eckstein // Read method declaration comments for more details. 4854d6fb72aSErik Eckstein int FunctionComparator::cmpOperations(const Instruction *L, 4864d6fb72aSErik Eckstein const Instruction *R, 4874d6fb72aSErik Eckstein bool &needToCmpOperands) const { 4884d6fb72aSErik Eckstein needToCmpOperands = true; 4894d6fb72aSErik Eckstein if (int Res = cmpValues(L, R)) 4904d6fb72aSErik Eckstein return Res; 4914d6fb72aSErik Eckstein 4924d6fb72aSErik Eckstein // Differences from Instruction::isSameOperationAs: 4934d6fb72aSErik Eckstein // * replace type comparison with calls to cmpTypes. 4944d6fb72aSErik Eckstein // * we test for I->getRawSubclassOptionalData (nuw/nsw/tail) at the top. 4954d6fb72aSErik Eckstein // * because of the above, we don't test for the tail bit on calls later on. 4964d6fb72aSErik Eckstein if (int Res = cmpNumbers(L->getOpcode(), R->getOpcode())) 4974d6fb72aSErik Eckstein return Res; 4984d6fb72aSErik Eckstein 4994d6fb72aSErik Eckstein if (const GetElementPtrInst *GEPL = dyn_cast<GetElementPtrInst>(L)) { 5004d6fb72aSErik Eckstein needToCmpOperands = false; 5014d6fb72aSErik Eckstein const GetElementPtrInst *GEPR = cast<GetElementPtrInst>(R); 5024d6fb72aSErik Eckstein if (int Res = 5034d6fb72aSErik Eckstein cmpValues(GEPL->getPointerOperand(), GEPR->getPointerOperand())) 5044d6fb72aSErik Eckstein return Res; 5054d6fb72aSErik Eckstein return cmpGEPs(GEPL, GEPR); 5064d6fb72aSErik Eckstein } 5074d6fb72aSErik Eckstein 5084d6fb72aSErik Eckstein if (int Res = cmpNumbers(L->getNumOperands(), R->getNumOperands())) 5094d6fb72aSErik Eckstein return Res; 5104d6fb72aSErik Eckstein 5114d6fb72aSErik Eckstein if (int Res = cmpTypes(L->getType(), R->getType())) 5124d6fb72aSErik Eckstein return Res; 5134d6fb72aSErik Eckstein 5144d6fb72aSErik Eckstein if (int Res = cmpNumbers(L->getRawSubclassOptionalData(), 5154d6fb72aSErik Eckstein R->getRawSubclassOptionalData())) 5164d6fb72aSErik Eckstein return Res; 5174d6fb72aSErik Eckstein 5184d6fb72aSErik Eckstein // We have two instructions of identical opcode and #operands. Check to see 5194d6fb72aSErik Eckstein // if all operands are the same type 5204d6fb72aSErik Eckstein for (unsigned i = 0, e = L->getNumOperands(); i != e; ++i) { 5214d6fb72aSErik Eckstein if (int Res = 5224d6fb72aSErik Eckstein cmpTypes(L->getOperand(i)->getType(), R->getOperand(i)->getType())) 5234d6fb72aSErik Eckstein return Res; 5244d6fb72aSErik Eckstein } 5254d6fb72aSErik Eckstein 5264d6fb72aSErik Eckstein // Check special state that is a part of some instructions. 5274d6fb72aSErik Eckstein if (const AllocaInst *AI = dyn_cast<AllocaInst>(L)) { 5284d6fb72aSErik Eckstein if (int Res = cmpTypes(AI->getAllocatedType(), 5294d6fb72aSErik Eckstein cast<AllocaInst>(R)->getAllocatedType())) 5304d6fb72aSErik Eckstein return Res; 5314d6fb72aSErik Eckstein return cmpNumbers(AI->getAlignment(), cast<AllocaInst>(R)->getAlignment()); 5324d6fb72aSErik Eckstein } 5334d6fb72aSErik Eckstein if (const LoadInst *LI = dyn_cast<LoadInst>(L)) { 5344d6fb72aSErik Eckstein if (int Res = cmpNumbers(LI->isVolatile(), cast<LoadInst>(R)->isVolatile())) 5354d6fb72aSErik Eckstein return Res; 5364d6fb72aSErik Eckstein if (int Res = 5374d6fb72aSErik Eckstein cmpNumbers(LI->getAlignment(), cast<LoadInst>(R)->getAlignment())) 5384d6fb72aSErik Eckstein return Res; 5394d6fb72aSErik Eckstein if (int Res = 5404d6fb72aSErik Eckstein cmpOrderings(LI->getOrdering(), cast<LoadInst>(R)->getOrdering())) 5414d6fb72aSErik Eckstein return Res; 542bb80d3e1SKonstantin Zhuravlyov if (int Res = cmpNumbers(LI->getSyncScopeID(), 543bb80d3e1SKonstantin Zhuravlyov cast<LoadInst>(R)->getSyncScopeID())) 5444d6fb72aSErik Eckstein return Res; 5454d6fb72aSErik Eckstein return cmpRangeMetadata(LI->getMetadata(LLVMContext::MD_range), 5464d6fb72aSErik Eckstein cast<LoadInst>(R)->getMetadata(LLVMContext::MD_range)); 5474d6fb72aSErik Eckstein } 5484d6fb72aSErik Eckstein if (const StoreInst *SI = dyn_cast<StoreInst>(L)) { 5494d6fb72aSErik Eckstein if (int Res = 5504d6fb72aSErik Eckstein cmpNumbers(SI->isVolatile(), cast<StoreInst>(R)->isVolatile())) 5514d6fb72aSErik Eckstein return Res; 5524d6fb72aSErik Eckstein if (int Res = 5534d6fb72aSErik Eckstein cmpNumbers(SI->getAlignment(), cast<StoreInst>(R)->getAlignment())) 5544d6fb72aSErik Eckstein return Res; 5554d6fb72aSErik Eckstein if (int Res = 5564d6fb72aSErik Eckstein cmpOrderings(SI->getOrdering(), cast<StoreInst>(R)->getOrdering())) 5574d6fb72aSErik Eckstein return Res; 558bb80d3e1SKonstantin Zhuravlyov return cmpNumbers(SI->getSyncScopeID(), 559bb80d3e1SKonstantin Zhuravlyov cast<StoreInst>(R)->getSyncScopeID()); 5604d6fb72aSErik Eckstein } 5614d6fb72aSErik Eckstein if (const CmpInst *CI = dyn_cast<CmpInst>(L)) 5624d6fb72aSErik Eckstein return cmpNumbers(CI->getPredicate(), cast<CmpInst>(R)->getPredicate()); 5634d6fb72aSErik Eckstein if (const CallInst *CI = dyn_cast<CallInst>(L)) { 5644d6fb72aSErik Eckstein if (int Res = cmpNumbers(CI->getCallingConv(), 5654d6fb72aSErik Eckstein cast<CallInst>(R)->getCallingConv())) 5664d6fb72aSErik Eckstein return Res; 5674d6fb72aSErik Eckstein if (int Res = 5684d6fb72aSErik Eckstein cmpAttrs(CI->getAttributes(), cast<CallInst>(R)->getAttributes())) 5694d6fb72aSErik Eckstein return Res; 5704d6fb72aSErik Eckstein if (int Res = cmpOperandBundlesSchema(CI, R)) 5714d6fb72aSErik Eckstein return Res; 5724d6fb72aSErik Eckstein return cmpRangeMetadata( 5734d6fb72aSErik Eckstein CI->getMetadata(LLVMContext::MD_range), 5744d6fb72aSErik Eckstein cast<CallInst>(R)->getMetadata(LLVMContext::MD_range)); 5754d6fb72aSErik Eckstein } 5764d6fb72aSErik Eckstein if (const InvokeInst *II = dyn_cast<InvokeInst>(L)) { 5774d6fb72aSErik Eckstein if (int Res = cmpNumbers(II->getCallingConv(), 5784d6fb72aSErik Eckstein cast<InvokeInst>(R)->getCallingConv())) 5794d6fb72aSErik Eckstein return Res; 5804d6fb72aSErik Eckstein if (int Res = 5814d6fb72aSErik Eckstein cmpAttrs(II->getAttributes(), cast<InvokeInst>(R)->getAttributes())) 5824d6fb72aSErik Eckstein return Res; 5834d6fb72aSErik Eckstein if (int Res = cmpOperandBundlesSchema(II, R)) 5844d6fb72aSErik Eckstein return Res; 5854d6fb72aSErik Eckstein return cmpRangeMetadata( 5864d6fb72aSErik Eckstein II->getMetadata(LLVMContext::MD_range), 5874d6fb72aSErik Eckstein cast<InvokeInst>(R)->getMetadata(LLVMContext::MD_range)); 5884d6fb72aSErik Eckstein } 5894d6fb72aSErik Eckstein if (const InsertValueInst *IVI = dyn_cast<InsertValueInst>(L)) { 5904d6fb72aSErik Eckstein ArrayRef<unsigned> LIndices = IVI->getIndices(); 5914d6fb72aSErik Eckstein ArrayRef<unsigned> RIndices = cast<InsertValueInst>(R)->getIndices(); 5924d6fb72aSErik Eckstein if (int Res = cmpNumbers(LIndices.size(), RIndices.size())) 5934d6fb72aSErik Eckstein return Res; 5944d6fb72aSErik Eckstein for (size_t i = 0, e = LIndices.size(); i != e; ++i) { 5954d6fb72aSErik Eckstein if (int Res = cmpNumbers(LIndices[i], RIndices[i])) 5964d6fb72aSErik Eckstein return Res; 5974d6fb72aSErik Eckstein } 5984d6fb72aSErik Eckstein return 0; 5994d6fb72aSErik Eckstein } 6004d6fb72aSErik Eckstein if (const ExtractValueInst *EVI = dyn_cast<ExtractValueInst>(L)) { 6014d6fb72aSErik Eckstein ArrayRef<unsigned> LIndices = EVI->getIndices(); 6024d6fb72aSErik Eckstein ArrayRef<unsigned> RIndices = cast<ExtractValueInst>(R)->getIndices(); 6034d6fb72aSErik Eckstein if (int Res = cmpNumbers(LIndices.size(), RIndices.size())) 6044d6fb72aSErik Eckstein return Res; 6054d6fb72aSErik Eckstein for (size_t i = 0, e = LIndices.size(); i != e; ++i) { 6064d6fb72aSErik Eckstein if (int Res = cmpNumbers(LIndices[i], RIndices[i])) 6074d6fb72aSErik Eckstein return Res; 6084d6fb72aSErik Eckstein } 6094d6fb72aSErik Eckstein } 6104d6fb72aSErik Eckstein if (const FenceInst *FI = dyn_cast<FenceInst>(L)) { 6114d6fb72aSErik Eckstein if (int Res = 6124d6fb72aSErik Eckstein cmpOrderings(FI->getOrdering(), cast<FenceInst>(R)->getOrdering())) 6134d6fb72aSErik Eckstein return Res; 614bb80d3e1SKonstantin Zhuravlyov return cmpNumbers(FI->getSyncScopeID(), 615bb80d3e1SKonstantin Zhuravlyov cast<FenceInst>(R)->getSyncScopeID()); 6164d6fb72aSErik Eckstein } 6174d6fb72aSErik Eckstein if (const AtomicCmpXchgInst *CXI = dyn_cast<AtomicCmpXchgInst>(L)) { 6184d6fb72aSErik Eckstein if (int Res = cmpNumbers(CXI->isVolatile(), 6194d6fb72aSErik Eckstein cast<AtomicCmpXchgInst>(R)->isVolatile())) 6204d6fb72aSErik Eckstein return Res; 6214d6fb72aSErik Eckstein if (int Res = cmpNumbers(CXI->isWeak(), 6224d6fb72aSErik Eckstein cast<AtomicCmpXchgInst>(R)->isWeak())) 6234d6fb72aSErik Eckstein return Res; 6244d6fb72aSErik Eckstein if (int Res = 6254d6fb72aSErik Eckstein cmpOrderings(CXI->getSuccessOrdering(), 6264d6fb72aSErik Eckstein cast<AtomicCmpXchgInst>(R)->getSuccessOrdering())) 6274d6fb72aSErik Eckstein return Res; 6284d6fb72aSErik Eckstein if (int Res = 6294d6fb72aSErik Eckstein cmpOrderings(CXI->getFailureOrdering(), 6304d6fb72aSErik Eckstein cast<AtomicCmpXchgInst>(R)->getFailureOrdering())) 6314d6fb72aSErik Eckstein return Res; 632bb80d3e1SKonstantin Zhuravlyov return cmpNumbers(CXI->getSyncScopeID(), 633bb80d3e1SKonstantin Zhuravlyov cast<AtomicCmpXchgInst>(R)->getSyncScopeID()); 6344d6fb72aSErik Eckstein } 6354d6fb72aSErik Eckstein if (const AtomicRMWInst *RMWI = dyn_cast<AtomicRMWInst>(L)) { 6364d6fb72aSErik Eckstein if (int Res = cmpNumbers(RMWI->getOperation(), 6374d6fb72aSErik Eckstein cast<AtomicRMWInst>(R)->getOperation())) 6384d6fb72aSErik Eckstein return Res; 6394d6fb72aSErik Eckstein if (int Res = cmpNumbers(RMWI->isVolatile(), 6404d6fb72aSErik Eckstein cast<AtomicRMWInst>(R)->isVolatile())) 6414d6fb72aSErik Eckstein return Res; 6424d6fb72aSErik Eckstein if (int Res = cmpOrderings(RMWI->getOrdering(), 6434d6fb72aSErik Eckstein cast<AtomicRMWInst>(R)->getOrdering())) 6444d6fb72aSErik Eckstein return Res; 645bb80d3e1SKonstantin Zhuravlyov return cmpNumbers(RMWI->getSyncScopeID(), 646bb80d3e1SKonstantin Zhuravlyov cast<AtomicRMWInst>(R)->getSyncScopeID()); 6474d6fb72aSErik Eckstein } 6484d6fb72aSErik Eckstein if (const PHINode *PNL = dyn_cast<PHINode>(L)) { 6494d6fb72aSErik Eckstein const PHINode *PNR = cast<PHINode>(R); 6504d6fb72aSErik Eckstein // Ensure that in addition to the incoming values being identical 6514d6fb72aSErik Eckstein // (checked by the caller of this function), the incoming blocks 6524d6fb72aSErik Eckstein // are also identical. 6534d6fb72aSErik Eckstein for (unsigned i = 0, e = PNL->getNumIncomingValues(); i != e; ++i) { 6544d6fb72aSErik Eckstein if (int Res = 6554d6fb72aSErik Eckstein cmpValues(PNL->getIncomingBlock(i), PNR->getIncomingBlock(i))) 6564d6fb72aSErik Eckstein return Res; 6574d6fb72aSErik Eckstein } 6584d6fb72aSErik Eckstein } 6594d6fb72aSErik Eckstein return 0; 6604d6fb72aSErik Eckstein } 6614d6fb72aSErik Eckstein 6624d6fb72aSErik Eckstein // Determine whether two GEP operations perform the same underlying arithmetic. 6634d6fb72aSErik Eckstein // Read method declaration comments for more details. 6644d6fb72aSErik Eckstein int FunctionComparator::cmpGEPs(const GEPOperator *GEPL, 6654d6fb72aSErik Eckstein const GEPOperator *GEPR) const { 6664d6fb72aSErik Eckstein unsigned int ASL = GEPL->getPointerAddressSpace(); 6674d6fb72aSErik Eckstein unsigned int ASR = GEPR->getPointerAddressSpace(); 6684d6fb72aSErik Eckstein 6694d6fb72aSErik Eckstein if (int Res = cmpNumbers(ASL, ASR)) 6704d6fb72aSErik Eckstein return Res; 6714d6fb72aSErik Eckstein 6724d6fb72aSErik Eckstein // When we have target data, we can reduce the GEP down to the value in bytes 6734d6fb72aSErik Eckstein // added to the address. 6744d6fb72aSErik Eckstein const DataLayout &DL = FnL->getParent()->getDataLayout(); 6754d6fb72aSErik Eckstein unsigned BitWidth = DL.getPointerSizeInBits(ASL); 6764d6fb72aSErik Eckstein APInt OffsetL(BitWidth, 0), OffsetR(BitWidth, 0); 6774d6fb72aSErik Eckstein if (GEPL->accumulateConstantOffset(DL, OffsetL) && 6784d6fb72aSErik Eckstein GEPR->accumulateConstantOffset(DL, OffsetR)) 6794d6fb72aSErik Eckstein return cmpAPInts(OffsetL, OffsetR); 6804d6fb72aSErik Eckstein if (int Res = cmpTypes(GEPL->getSourceElementType(), 6814d6fb72aSErik Eckstein GEPR->getSourceElementType())) 6824d6fb72aSErik Eckstein return Res; 6834d6fb72aSErik Eckstein 6844d6fb72aSErik Eckstein if (int Res = cmpNumbers(GEPL->getNumOperands(), GEPR->getNumOperands())) 6854d6fb72aSErik Eckstein return Res; 6864d6fb72aSErik Eckstein 6874d6fb72aSErik Eckstein for (unsigned i = 0, e = GEPL->getNumOperands(); i != e; ++i) { 6884d6fb72aSErik Eckstein if (int Res = cmpValues(GEPL->getOperand(i), GEPR->getOperand(i))) 6894d6fb72aSErik Eckstein return Res; 6904d6fb72aSErik Eckstein } 6914d6fb72aSErik Eckstein 6924d6fb72aSErik Eckstein return 0; 6934d6fb72aSErik Eckstein } 6944d6fb72aSErik Eckstein 6954d6fb72aSErik Eckstein int FunctionComparator::cmpInlineAsm(const InlineAsm *L, 6964d6fb72aSErik Eckstein const InlineAsm *R) const { 6974d6fb72aSErik Eckstein // InlineAsm's are uniqued. If they are the same pointer, obviously they are 6984d6fb72aSErik Eckstein // the same, otherwise compare the fields. 6994d6fb72aSErik Eckstein if (L == R) 7004d6fb72aSErik Eckstein return 0; 7014d6fb72aSErik Eckstein if (int Res = cmpTypes(L->getFunctionType(), R->getFunctionType())) 7024d6fb72aSErik Eckstein return Res; 7034d6fb72aSErik Eckstein if (int Res = cmpMem(L->getAsmString(), R->getAsmString())) 7044d6fb72aSErik Eckstein return Res; 7054d6fb72aSErik Eckstein if (int Res = cmpMem(L->getConstraintString(), R->getConstraintString())) 7064d6fb72aSErik Eckstein return Res; 7074d6fb72aSErik Eckstein if (int Res = cmpNumbers(L->hasSideEffects(), R->hasSideEffects())) 7084d6fb72aSErik Eckstein return Res; 7094d6fb72aSErik Eckstein if (int Res = cmpNumbers(L->isAlignStack(), R->isAlignStack())) 7104d6fb72aSErik Eckstein return Res; 7114d6fb72aSErik Eckstein if (int Res = cmpNumbers(L->getDialect(), R->getDialect())) 7124d6fb72aSErik Eckstein return Res; 71368403564Swhitequark assert(L->getFunctionType() != R->getFunctionType()); 7144d6fb72aSErik Eckstein return 0; 7154d6fb72aSErik Eckstein } 7164d6fb72aSErik Eckstein 7174d6fb72aSErik Eckstein /// Compare two values used by the two functions under pair-wise comparison. If 7184d6fb72aSErik Eckstein /// this is the first time the values are seen, they're added to the mapping so 7194d6fb72aSErik Eckstein /// that we will detect mismatches on next use. 7204d6fb72aSErik Eckstein /// See comments in declaration for more details. 7214d6fb72aSErik Eckstein int FunctionComparator::cmpValues(const Value *L, const Value *R) const { 7224d6fb72aSErik Eckstein // Catch self-reference case. 7234d6fb72aSErik Eckstein if (L == FnL) { 7244d6fb72aSErik Eckstein if (R == FnR) 7254d6fb72aSErik Eckstein return 0; 7264d6fb72aSErik Eckstein return -1; 7274d6fb72aSErik Eckstein } 7284d6fb72aSErik Eckstein if (R == FnR) { 7294d6fb72aSErik Eckstein if (L == FnL) 7304d6fb72aSErik Eckstein return 0; 7314d6fb72aSErik Eckstein return 1; 7324d6fb72aSErik Eckstein } 7334d6fb72aSErik Eckstein 7344d6fb72aSErik Eckstein const Constant *ConstL = dyn_cast<Constant>(L); 7354d6fb72aSErik Eckstein const Constant *ConstR = dyn_cast<Constant>(R); 7364d6fb72aSErik Eckstein if (ConstL && ConstR) { 7374d6fb72aSErik Eckstein if (L == R) 7384d6fb72aSErik Eckstein return 0; 7394d6fb72aSErik Eckstein return cmpConstants(ConstL, ConstR); 7404d6fb72aSErik Eckstein } 7414d6fb72aSErik Eckstein 7424d6fb72aSErik Eckstein if (ConstL) 7434d6fb72aSErik Eckstein return 1; 7444d6fb72aSErik Eckstein if (ConstR) 7454d6fb72aSErik Eckstein return -1; 7464d6fb72aSErik Eckstein 7474d6fb72aSErik Eckstein const InlineAsm *InlineAsmL = dyn_cast<InlineAsm>(L); 7484d6fb72aSErik Eckstein const InlineAsm *InlineAsmR = dyn_cast<InlineAsm>(R); 7494d6fb72aSErik Eckstein 7504d6fb72aSErik Eckstein if (InlineAsmL && InlineAsmR) 7514d6fb72aSErik Eckstein return cmpInlineAsm(InlineAsmL, InlineAsmR); 7524d6fb72aSErik Eckstein if (InlineAsmL) 7534d6fb72aSErik Eckstein return 1; 7544d6fb72aSErik Eckstein if (InlineAsmR) 7554d6fb72aSErik Eckstein return -1; 7564d6fb72aSErik Eckstein 7574d6fb72aSErik Eckstein auto LeftSN = sn_mapL.insert(std::make_pair(L, sn_mapL.size())), 7584d6fb72aSErik Eckstein RightSN = sn_mapR.insert(std::make_pair(R, sn_mapR.size())); 7594d6fb72aSErik Eckstein 7604d6fb72aSErik Eckstein return cmpNumbers(LeftSN.first->second, RightSN.first->second); 7614d6fb72aSErik Eckstein } 7624d6fb72aSErik Eckstein 7634d6fb72aSErik Eckstein // Test whether two basic blocks have equivalent behaviour. 7644d6fb72aSErik Eckstein int FunctionComparator::cmpBasicBlocks(const BasicBlock *BBL, 7654d6fb72aSErik Eckstein const BasicBlock *BBR) const { 7664d6fb72aSErik Eckstein BasicBlock::const_iterator InstL = BBL->begin(), InstLE = BBL->end(); 7674d6fb72aSErik Eckstein BasicBlock::const_iterator InstR = BBR->begin(), InstRE = BBR->end(); 7684d6fb72aSErik Eckstein 7694d6fb72aSErik Eckstein do { 7704d6fb72aSErik Eckstein bool needToCmpOperands = true; 7714d6fb72aSErik Eckstein if (int Res = cmpOperations(&*InstL, &*InstR, needToCmpOperands)) 7724d6fb72aSErik Eckstein return Res; 7734d6fb72aSErik Eckstein if (needToCmpOperands) { 7744d6fb72aSErik Eckstein assert(InstL->getNumOperands() == InstR->getNumOperands()); 7754d6fb72aSErik Eckstein 7764d6fb72aSErik Eckstein for (unsigned i = 0, e = InstL->getNumOperands(); i != e; ++i) { 7774d6fb72aSErik Eckstein Value *OpL = InstL->getOperand(i); 7784d6fb72aSErik Eckstein Value *OpR = InstR->getOperand(i); 7794d6fb72aSErik Eckstein if (int Res = cmpValues(OpL, OpR)) 7804d6fb72aSErik Eckstein return Res; 7814d6fb72aSErik Eckstein // cmpValues should ensure this is true. 7824d6fb72aSErik Eckstein assert(cmpTypes(OpL->getType(), OpR->getType()) == 0); 7834d6fb72aSErik Eckstein } 7844d6fb72aSErik Eckstein } 7854d6fb72aSErik Eckstein 7864d6fb72aSErik Eckstein ++InstL; 7874d6fb72aSErik Eckstein ++InstR; 7884d6fb72aSErik Eckstein } while (InstL != InstLE && InstR != InstRE); 7894d6fb72aSErik Eckstein 7904d6fb72aSErik Eckstein if (InstL != InstLE && InstR == InstRE) 7914d6fb72aSErik Eckstein return 1; 7924d6fb72aSErik Eckstein if (InstL == InstLE && InstR != InstRE) 7934d6fb72aSErik Eckstein return -1; 7944d6fb72aSErik Eckstein return 0; 7954d6fb72aSErik Eckstein } 7964d6fb72aSErik Eckstein 7974d6fb72aSErik Eckstein int FunctionComparator::compareSignature() const { 7984d6fb72aSErik Eckstein if (int Res = cmpAttrs(FnL->getAttributes(), FnR->getAttributes())) 7994d6fb72aSErik Eckstein return Res; 8004d6fb72aSErik Eckstein 8014d6fb72aSErik Eckstein if (int Res = cmpNumbers(FnL->hasGC(), FnR->hasGC())) 8024d6fb72aSErik Eckstein return Res; 8034d6fb72aSErik Eckstein 8044d6fb72aSErik Eckstein if (FnL->hasGC()) { 8054d6fb72aSErik Eckstein if (int Res = cmpMem(FnL->getGC(), FnR->getGC())) 8064d6fb72aSErik Eckstein return Res; 8074d6fb72aSErik Eckstein } 8084d6fb72aSErik Eckstein 8094d6fb72aSErik Eckstein if (int Res = cmpNumbers(FnL->hasSection(), FnR->hasSection())) 8104d6fb72aSErik Eckstein return Res; 8114d6fb72aSErik Eckstein 8124d6fb72aSErik Eckstein if (FnL->hasSection()) { 8134d6fb72aSErik Eckstein if (int Res = cmpMem(FnL->getSection(), FnR->getSection())) 8144d6fb72aSErik Eckstein return Res; 8154d6fb72aSErik Eckstein } 8164d6fb72aSErik Eckstein 8174d6fb72aSErik Eckstein if (int Res = cmpNumbers(FnL->isVarArg(), FnR->isVarArg())) 8184d6fb72aSErik Eckstein return Res; 8194d6fb72aSErik Eckstein 8204d6fb72aSErik Eckstein // TODO: if it's internal and only used in direct calls, we could handle this 8214d6fb72aSErik Eckstein // case too. 8224d6fb72aSErik Eckstein if (int Res = cmpNumbers(FnL->getCallingConv(), FnR->getCallingConv())) 8234d6fb72aSErik Eckstein return Res; 8244d6fb72aSErik Eckstein 8254d6fb72aSErik Eckstein if (int Res = cmpTypes(FnL->getFunctionType(), FnR->getFunctionType())) 8264d6fb72aSErik Eckstein return Res; 8274d6fb72aSErik Eckstein 8284d6fb72aSErik Eckstein assert(FnL->arg_size() == FnR->arg_size() && 8294d6fb72aSErik Eckstein "Identically typed functions have different numbers of args!"); 8304d6fb72aSErik Eckstein 8314d6fb72aSErik Eckstein // Visit the arguments so that they get enumerated in the order they're 8324d6fb72aSErik Eckstein // passed in. 8334d6fb72aSErik Eckstein for (Function::const_arg_iterator ArgLI = FnL->arg_begin(), 8344d6fb72aSErik Eckstein ArgRI = FnR->arg_begin(), 8354d6fb72aSErik Eckstein ArgLE = FnL->arg_end(); 8364d6fb72aSErik Eckstein ArgLI != ArgLE; ++ArgLI, ++ArgRI) { 8374d6fb72aSErik Eckstein if (cmpValues(&*ArgLI, &*ArgRI) != 0) 8384d6fb72aSErik Eckstein llvm_unreachable("Arguments repeat!"); 8394d6fb72aSErik Eckstein } 8404d6fb72aSErik Eckstein return 0; 8414d6fb72aSErik Eckstein } 8424d6fb72aSErik Eckstein 8434d6fb72aSErik Eckstein // Test whether the two functions have equivalent behaviour. 8444d6fb72aSErik Eckstein int FunctionComparator::compare() { 8454d6fb72aSErik Eckstein beginCompare(); 8464d6fb72aSErik Eckstein 8474d6fb72aSErik Eckstein if (int Res = compareSignature()) 8484d6fb72aSErik Eckstein return Res; 8494d6fb72aSErik Eckstein 8504d6fb72aSErik Eckstein // We do a CFG-ordered walk since the actual ordering of the blocks in the 8514d6fb72aSErik Eckstein // linked list is immaterial. Our walk starts at the entry block for both 8524d6fb72aSErik Eckstein // functions, then takes each block from each terminator in order. As an 8534d6fb72aSErik Eckstein // artifact, this also means that unreachable blocks are ignored. 8544d6fb72aSErik Eckstein SmallVector<const BasicBlock *, 8> FnLBBs, FnRBBs; 8554d6fb72aSErik Eckstein SmallPtrSet<const BasicBlock *, 32> VisitedBBs; // in terms of F1. 8564d6fb72aSErik Eckstein 8574d6fb72aSErik Eckstein FnLBBs.push_back(&FnL->getEntryBlock()); 8584d6fb72aSErik Eckstein FnRBBs.push_back(&FnR->getEntryBlock()); 8594d6fb72aSErik Eckstein 8604d6fb72aSErik Eckstein VisitedBBs.insert(FnLBBs[0]); 8614d6fb72aSErik Eckstein while (!FnLBBs.empty()) { 8624d6fb72aSErik Eckstein const BasicBlock *BBL = FnLBBs.pop_back_val(); 8634d6fb72aSErik Eckstein const BasicBlock *BBR = FnRBBs.pop_back_val(); 8644d6fb72aSErik Eckstein 8654d6fb72aSErik Eckstein if (int Res = cmpValues(BBL, BBR)) 8664d6fb72aSErik Eckstein return Res; 8674d6fb72aSErik Eckstein 8684d6fb72aSErik Eckstein if (int Res = cmpBasicBlocks(BBL, BBR)) 8694d6fb72aSErik Eckstein return Res; 8704d6fb72aSErik Eckstein 8714d6fb72aSErik Eckstein const TerminatorInst *TermL = BBL->getTerminator(); 8724d6fb72aSErik Eckstein const TerminatorInst *TermR = BBR->getTerminator(); 8734d6fb72aSErik Eckstein 8744d6fb72aSErik Eckstein assert(TermL->getNumSuccessors() == TermR->getNumSuccessors()); 8754d6fb72aSErik Eckstein for (unsigned i = 0, e = TermL->getNumSuccessors(); i != e; ++i) { 8764d6fb72aSErik Eckstein if (!VisitedBBs.insert(TermL->getSuccessor(i)).second) 8774d6fb72aSErik Eckstein continue; 8784d6fb72aSErik Eckstein 8794d6fb72aSErik Eckstein FnLBBs.push_back(TermL->getSuccessor(i)); 8804d6fb72aSErik Eckstein FnRBBs.push_back(TermR->getSuccessor(i)); 8814d6fb72aSErik Eckstein } 8824d6fb72aSErik Eckstein } 8834d6fb72aSErik Eckstein return 0; 8844d6fb72aSErik Eckstein } 8854d6fb72aSErik Eckstein 8864d6fb72aSErik Eckstein namespace { 8874d6fb72aSErik Eckstein 8884d6fb72aSErik Eckstein // Accumulate the hash of a sequence of 64-bit integers. This is similar to a 8894d6fb72aSErik Eckstein // hash of a sequence of 64bit ints, but the entire input does not need to be 8904d6fb72aSErik Eckstein // available at once. This interface is necessary for functionHash because it 8914d6fb72aSErik Eckstein // needs to accumulate the hash as the structure of the function is traversed 8924d6fb72aSErik Eckstein // without saving these values to an intermediate buffer. This form of hashing 8934d6fb72aSErik Eckstein // is not often needed, as usually the object to hash is just read from a 8944d6fb72aSErik Eckstein // buffer. 8954d6fb72aSErik Eckstein class HashAccumulator64 { 8964d6fb72aSErik Eckstein uint64_t Hash; 897286d5897SEugene Zelenko 8984d6fb72aSErik Eckstein public: 8994d6fb72aSErik Eckstein // Initialize to random constant, so the state isn't zero. 9004d6fb72aSErik Eckstein HashAccumulator64() { Hash = 0x6acaa36bef8325c5ULL; } 901286d5897SEugene Zelenko 9024d6fb72aSErik Eckstein void add(uint64_t V) { 903286d5897SEugene Zelenko Hash = hashing::detail::hash_16_bytes(Hash, V); 9044d6fb72aSErik Eckstein } 905286d5897SEugene Zelenko 9064d6fb72aSErik Eckstein // No finishing is required, because the entire hash value is used. 9074d6fb72aSErik Eckstein uint64_t getHash() { return Hash; } 9084d6fb72aSErik Eckstein }; 909286d5897SEugene Zelenko 9104d6fb72aSErik Eckstein } // end anonymous namespace 9114d6fb72aSErik Eckstein 9124d6fb72aSErik Eckstein // A function hash is calculated by considering only the number of arguments and 9134d6fb72aSErik Eckstein // whether a function is varargs, the order of basic blocks (given by the 9144d6fb72aSErik Eckstein // successors of each basic block in depth first order), and the order of 9154d6fb72aSErik Eckstein // opcodes of each instruction within each of these basic blocks. This mirrors 9164d6fb72aSErik Eckstein // the strategy compare() uses to compare functions by walking the BBs in depth 9174d6fb72aSErik Eckstein // first order and comparing each instruction in sequence. Because this hash 9184d6fb72aSErik Eckstein // does not look at the operands, it is insensitive to things such as the 9194d6fb72aSErik Eckstein // target of calls and the constants used in the function, which makes it useful 9204d6fb72aSErik Eckstein // when possibly merging functions which are the same modulo constants and call 9214d6fb72aSErik Eckstein // targets. 9224d6fb72aSErik Eckstein FunctionComparator::FunctionHash FunctionComparator::functionHash(Function &F) { 9234d6fb72aSErik Eckstein HashAccumulator64 H; 9244d6fb72aSErik Eckstein H.add(F.isVarArg()); 9254d6fb72aSErik Eckstein H.add(F.arg_size()); 9264d6fb72aSErik Eckstein 9274d6fb72aSErik Eckstein SmallVector<const BasicBlock *, 8> BBs; 9284d6fb72aSErik Eckstein SmallSet<const BasicBlock *, 16> VisitedBBs; 9294d6fb72aSErik Eckstein 9304d6fb72aSErik Eckstein // Walk the blocks in the same order as FunctionComparator::cmpBasicBlocks(), 9314d6fb72aSErik Eckstein // accumulating the hash of the function "structure." (BB and opcode sequence) 9324d6fb72aSErik Eckstein BBs.push_back(&F.getEntryBlock()); 9334d6fb72aSErik Eckstein VisitedBBs.insert(BBs[0]); 9344d6fb72aSErik Eckstein while (!BBs.empty()) { 9354d6fb72aSErik Eckstein const BasicBlock *BB = BBs.pop_back_val(); 9364d6fb72aSErik Eckstein // This random value acts as a block header, as otherwise the partition of 9374d6fb72aSErik Eckstein // opcodes into BBs wouldn't affect the hash, only the order of the opcodes 9384d6fb72aSErik Eckstein H.add(45798); 9394d6fb72aSErik Eckstein for (auto &Inst : *BB) { 9404d6fb72aSErik Eckstein H.add(Inst.getOpcode()); 9414d6fb72aSErik Eckstein } 9424d6fb72aSErik Eckstein const TerminatorInst *Term = BB->getTerminator(); 9434d6fb72aSErik Eckstein for (unsigned i = 0, e = Term->getNumSuccessors(); i != e; ++i) { 9444d6fb72aSErik Eckstein if (!VisitedBBs.insert(Term->getSuccessor(i)).second) 9454d6fb72aSErik Eckstein continue; 9464d6fb72aSErik Eckstein BBs.push_back(Term->getSuccessor(i)); 9474d6fb72aSErik Eckstein } 9484d6fb72aSErik Eckstein } 9494d6fb72aSErik Eckstein return H.getHash(); 9504d6fb72aSErik Eckstein } 951