//===- FileCheck.cpp - Check that File's Contents match what is expected --===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// FileCheck does a line-by-line check of a file that validates whether it
// contains the expected content. This is useful for regression tests etc.
//
// This program exits with an exit status of 2 on error, exit status of 0 if
// the file matched the expected contents, and exit status of 1 if it did not
// contain the expected contents.
16ee3c74fbSChris Lattner // 17ee3c74fbSChris Lattner //===----------------------------------------------------------------------===// 18ee3c74fbSChris Lattner 1991d19d8eSChandler Carruth #include "llvm/ADT/SmallString.h" 2091d19d8eSChandler Carruth #include "llvm/ADT/StringExtras.h" 2191d19d8eSChandler Carruth #include "llvm/ADT/StringMap.h" 2213df4626SMatt Arsenault #include "llvm/ADT/StringSet.h" 23ee3c74fbSChris Lattner #include "llvm/Support/CommandLine.h" 24ee3c74fbSChris Lattner #include "llvm/Support/MemoryBuffer.h" 25ee3c74fbSChris Lattner #include "llvm/Support/PrettyStackTrace.h" 26f08d2db9SChris Lattner #include "llvm/Support/Regex.h" 2791d19d8eSChandler Carruth #include "llvm/Support/Signals.h" 28ee3c74fbSChris Lattner #include "llvm/Support/SourceMgr.h" 29ee3c74fbSChris Lattner #include "llvm/Support/raw_ostream.h" 308879e06dSChris Lattner #include <algorithm> 31981af002SWill Dietz #include <cctype> 32e8b8f1bcSEli Bendersky #include <map> 33e8b8f1bcSEli Bendersky #include <string> 34a6e9c3e4SRafael Espindola #include <system_error> 35e8b8f1bcSEli Bendersky #include <vector> 36ee3c74fbSChris Lattner using namespace llvm; 37ee3c74fbSChris Lattner 38ee3c74fbSChris Lattner static cl::opt<std::string> 39ee3c74fbSChris Lattner CheckFilename(cl::Positional, cl::desc("<check-file>"), cl::Required); 40ee3c74fbSChris Lattner 41ee3c74fbSChris Lattner static cl::opt<std::string> 42ee3c74fbSChris Lattner InputFilename("input-file", cl::desc("File to check (defaults to stdin)"), 43ee3c74fbSChris Lattner cl::init("-"), cl::value_desc("filename")); 44ee3c74fbSChris Lattner 45e8f2fb20SChandler Carruth static cl::list<std::string> CheckPrefixes( 46e8f2fb20SChandler Carruth "check-prefix", 47ee3c74fbSChris Lattner cl::desc("Prefix to use from check file (defaults to 'CHECK')")); 48fd557cb0SDaniel Sanders static cl::alias CheckPrefixesAlias( 49fd557cb0SDaniel Sanders "check-prefixes", cl::aliasopt(CheckPrefixes), cl::CommaSeparated, 50fd557cb0SDaniel Sanders 
cl::NotHidden, 51fd557cb0SDaniel Sanders cl::desc( 52fd557cb0SDaniel Sanders "Alias for -check-prefix permitting multiple comma separated values")); 53ee3c74fbSChris Lattner 54e8f2fb20SChandler Carruth static cl::opt<bool> NoCanonicalizeWhiteSpace( 55e8f2fb20SChandler Carruth "strict-whitespace", 562c3e5cdfSChris Lattner cl::desc("Do not treat all horizontal whitespace as equivalent")); 572c3e5cdfSChris Lattner 5856ccdbbdSAlexander Kornienko static cl::list<std::string> ImplicitCheckNot( 5956ccdbbdSAlexander Kornienko "implicit-check-not", 6056ccdbbdSAlexander Kornienko cl::desc("Add an implicit negative check with this pattern to every\n" 6156ccdbbdSAlexander Kornienko "positive check. This can be used to ensure that no instances of\n" 6256ccdbbdSAlexander Kornienko "this pattern occur which are not matched by a positive pattern"), 6356ccdbbdSAlexander Kornienko cl::value_desc("pattern")); 6456ccdbbdSAlexander Kornienko 65*46e1fd61SAlexander Richardson static cl::list<std::string> GlobalDefines("D", cl::Prefix, 66*46e1fd61SAlexander Richardson cl::desc("Define a variable to be used in capture patterns."), 67*46e1fd61SAlexander Richardson cl::value_desc("VAR=VALUE")); 68*46e1fd61SAlexander Richardson 691b9f936fSJustin Bogner static cl::opt<bool> AllowEmptyInput( 701b9f936fSJustin Bogner "allow-empty", cl::init(false), 711b9f936fSJustin Bogner cl::desc("Allow the input file to be empty. 
This is useful when making\n" 721b9f936fSJustin Bogner "checks that some error message does not occur, for example.")); 731b9f936fSJustin Bogner 7485913ccaSJames Y Knight static cl::opt<bool> MatchFullLines( 7585913ccaSJames Y Knight "match-full-lines", cl::init(false), 7685913ccaSJames Y Knight cl::desc("Require all positive matches to cover an entire input line.\n" 7785913ccaSJames Y Knight "Allows leading and trailing whitespace if --strict-whitespace\n" 7885913ccaSJames Y Knight "is not also passed.")); 7985913ccaSJames Y Knight 80f55e72a5SArtem Belevich static cl::opt<bool> EnableVarScope( 81f55e72a5SArtem Belevich "enable-var-scope", cl::init(false), 82f55e72a5SArtem Belevich cl::desc("Enables scope for regex variables. Variables with names that\n" 83f55e72a5SArtem Belevich "do not start with '$' will be reset at the beginning of\n" 84f55e72a5SArtem Belevich "each CHECK-LABEL block.")); 85f55e72a5SArtem Belevich 8613df4626SMatt Arsenault typedef cl::list<std::string>::const_iterator prefix_iterator; 8713df4626SMatt Arsenault 8874d50731SChris Lattner //===----------------------------------------------------------------------===// 8974d50731SChris Lattner // Pattern Handling Code. 9074d50731SChris Lattner //===----------------------------------------------------------------------===// 9174d50731SChris Lattner 9238820972SMatt Arsenault namespace Check { 9338820972SMatt Arsenault enum CheckType { 9438820972SMatt Arsenault CheckNone = 0, 9538820972SMatt Arsenault CheckPlain, 9638820972SMatt Arsenault CheckNext, 9701ac1707SDuncan P. N. Exon Smith CheckSame, 9838820972SMatt Arsenault CheckNot, 9938820972SMatt Arsenault CheckDAG, 10038820972SMatt Arsenault CheckLabel, 1010a4c44bdSChris Lattner 1024dabac20SChandler Carruth /// Indicates the pattern only matches the end of file. This is used for 1034dabac20SChandler Carruth /// trailing CHECK-NOTs. 
104a908e7bdSPaul Robinson CheckEOF, 1054dabac20SChandler Carruth 1064dabac20SChandler Carruth /// Marks when parsing found a -NOT check combined with another CHECK suffix. 107a908e7bdSPaul Robinson CheckBadNot 10838820972SMatt Arsenault }; 10938820972SMatt Arsenault } 110eba55822SJakob Stoklund Olesen 11138820972SMatt Arsenault class Pattern { 11238820972SMatt Arsenault SMLoc PatternLoc; 11391a1b2c9SMichael Liao 1144dabac20SChandler Carruth /// A fixed string to match as the pattern or empty if this pattern requires 1154dabac20SChandler Carruth /// a regex match. 116221460e0SChris Lattner StringRef FixedStr; 117b16ab0c4SChris Lattner 1184dabac20SChandler Carruth /// A regex string to match as the pattern or empty if this pattern requires 1194dabac20SChandler Carruth /// a fixed string to match. 120b16ab0c4SChris Lattner std::string RegExStr; 1218879e06dSChris Lattner 1224dabac20SChandler Carruth /// Entries in this vector map to uses of a variable in the pattern, e.g. 1234dabac20SChandler Carruth /// "foo[[bar]]baz". In this case, the RegExStr will contain "foobaz" and 1244dabac20SChandler Carruth /// we'll get an entry in this vector that tells us to insert the value of 1254dabac20SChandler Carruth /// bar at offset 3. 1268879e06dSChris Lattner std::vector<std::pair<StringRef, unsigned>> VariableUses; 1278879e06dSChris Lattner 1284dabac20SChandler Carruth /// Maps definitions of variables to their parenthesized capture numbers. 1294dabac20SChandler Carruth /// 1304dabac20SChandler Carruth /// E.g. for the pattern "foo[[bar:.*]]baz", VariableDefs will map "bar" to 1314dabac20SChandler Carruth /// 1. 132e8b8f1bcSEli Bendersky std::map<StringRef, unsigned> VariableDefs; 1338879e06dSChris Lattner 134d1e020f7SSaleem Abdulrasool Check::CheckType CheckTy; 1353b40b445SChris Lattner 1364dabac20SChandler Carruth /// Contains the number of line this pattern is in. 
137d1e020f7SSaleem Abdulrasool unsigned LineNumber; 138d1e020f7SSaleem Abdulrasool 139d1e020f7SSaleem Abdulrasool public: 140d1e020f7SSaleem Abdulrasool explicit Pattern(Check::CheckType Ty) : CheckTy(Ty) {} 14174d50731SChris Lattner 1424dabac20SChandler Carruth /// Returns the location in source code. 1430b707eb8SMichael Liao SMLoc getLoc() const { return PatternLoc; } 1440b707eb8SMichael Liao 145e8f2fb20SChandler Carruth bool ParsePattern(StringRef PatternStr, StringRef Prefix, SourceMgr &SM, 14613df4626SMatt Arsenault unsigned LineNumber); 1478879e06dSChris Lattner size_t Match(StringRef Buffer, size_t &MatchLen, 1488879e06dSChris Lattner StringMap<StringRef> &VariableTable) const; 149e0ef65abSDaniel Dunbar void PrintFailureInfo(const SourceMgr &SM, StringRef Buffer, 150e0ef65abSDaniel Dunbar const StringMap<StringRef> &VariableTable) const; 151e0ef65abSDaniel Dunbar 152e8f2fb20SChandler Carruth bool hasVariable() const { 153e8f2fb20SChandler Carruth return !(VariableUses.empty() && VariableDefs.empty()); 154e8f2fb20SChandler Carruth } 155f8bd2e5bSStephen Lin 15638820972SMatt Arsenault Check::CheckType getCheckTy() const { return CheckTy; } 15791a1b2c9SMichael Liao 158b16ab0c4SChris Lattner private: 159e8b8f1bcSEli Bendersky bool AddRegExToRegEx(StringRef RS, unsigned &CurParen, SourceMgr &SM); 160e8b8f1bcSEli Bendersky void AddBackrefToRegEx(unsigned BackrefNum); 161e8f2fb20SChandler Carruth unsigned 162e8f2fb20SChandler Carruth ComputeMatchDistance(StringRef Buffer, 163fd29d886SDaniel Dunbar const StringMap<StringRef> &VariableTable) const; 16492987fb3SAlexander Kornienko bool EvaluateExpression(StringRef Expr, std::string &Value) const; 16581e5cd9eSAdrian Prantl size_t FindRegexVarEnd(StringRef Str, SourceMgr &SM); 1663b40b445SChris Lattner }; 1673b40b445SChris Lattner 1684dabac20SChandler Carruth /// Parses the given string into the Pattern. 
1694dabac20SChandler Carruth /// 1704dabac20SChandler Carruth /// \p Prefix provides which prefix is being matched, \p SM provides the 1714dabac20SChandler Carruth /// SourceMgr used for error reports, and \p LineNumber is the line number in 1724dabac20SChandler Carruth /// the input file from which the pattern string was read. Returns true in 1734dabac20SChandler Carruth /// case of an error, false otherwise. 174e8f2fb20SChandler Carruth bool Pattern::ParsePattern(StringRef PatternStr, StringRef Prefix, 175e8f2fb20SChandler Carruth SourceMgr &SM, unsigned LineNumber) { 17685913ccaSJames Y Knight bool MatchFullLinesHere = MatchFullLines && CheckTy != Check::CheckNot; 17785913ccaSJames Y Knight 17892987fb3SAlexander Kornienko this->LineNumber = LineNumber; 1790a4c44bdSChris Lattner PatternLoc = SMLoc::getFromPointer(PatternStr.data()); 1800a4c44bdSChris Lattner 1811714676aSTom de Vries if (!(NoCanonicalizeWhiteSpace && MatchFullLines)) 18274d50731SChris Lattner // Ignore trailing whitespace. 18374d50731SChris Lattner while (!PatternStr.empty() && 18474d50731SChris Lattner (PatternStr.back() == ' ' || PatternStr.back() == '\t')) 18574d50731SChris Lattner PatternStr = PatternStr.substr(0, PatternStr.size() - 1); 18674d50731SChris Lattner 18774d50731SChris Lattner // Check that there is something on the line. 18874d50731SChris Lattner if (PatternStr.empty()) { 18903b80a40SChris Lattner SM.PrintMessage(PatternLoc, SourceMgr::DK_Error, 190e8f2fb20SChandler Carruth "found empty check string with prefix '" + Prefix + ":'"); 19174d50731SChris Lattner return true; 19274d50731SChris Lattner } 19374d50731SChris Lattner 194221460e0SChris Lattner // Check to see if this is a fixed string, or if it has regex pieces. 
19585913ccaSJames Y Knight if (!MatchFullLinesHere && 19685913ccaSJames Y Knight (PatternStr.size() < 2 || (PatternStr.find("{{") == StringRef::npos && 19785913ccaSJames Y Knight PatternStr.find("[[") == StringRef::npos))) { 198221460e0SChris Lattner FixedStr = PatternStr; 199221460e0SChris Lattner return false; 200221460e0SChris Lattner } 201221460e0SChris Lattner 20285913ccaSJames Y Knight if (MatchFullLinesHere) { 20385913ccaSJames Y Knight RegExStr += '^'; 20485913ccaSJames Y Knight if (!NoCanonicalizeWhiteSpace) 20585913ccaSJames Y Knight RegExStr += " *"; 20685913ccaSJames Y Knight } 20785913ccaSJames Y Knight 2088879e06dSChris Lattner // Paren value #0 is for the fully matched string. Any new parenthesized 20953e0679dSChris Lattner // values add from there. 2108879e06dSChris Lattner unsigned CurParen = 1; 2118879e06dSChris Lattner 212b16ab0c4SChris Lattner // Otherwise, there is at least one regex piece. Build up the regex pattern 213b16ab0c4SChris Lattner // by escaping scary characters in fixed strings, building up one big regex. 214f08d2db9SChris Lattner while (!PatternStr.empty()) { 2158879e06dSChris Lattner // RegEx matches. 21653e0679dSChris Lattner if (PatternStr.startswith("{{")) { 21743d50d4aSEli Bendersky // This is the start of a regex match. Scan for the }}. 218f08d2db9SChris Lattner size_t End = PatternStr.find("}}"); 219f08d2db9SChris Lattner if (End == StringRef::npos) { 220f08d2db9SChris Lattner SM.PrintMessage(SMLoc::getFromPointer(PatternStr.data()), 22103b80a40SChris Lattner SourceMgr::DK_Error, 22203b80a40SChris Lattner "found start of regex string with no end '}}'"); 223f08d2db9SChris Lattner return true; 224f08d2db9SChris Lattner } 225f08d2db9SChris Lattner 226e53c95f1SChris Lattner // Enclose {{}} patterns in parens just like [[]] even though we're not 227e53c95f1SChris Lattner // capturing the result for any purpose. 
This is required in case the 228e53c95f1SChris Lattner // expression contains an alternation like: CHECK: abc{{x|z}}def. We 229e53c95f1SChris Lattner // want this to turn into: "abc(x|z)def" not "abcx|zdef". 230e53c95f1SChris Lattner RegExStr += '('; 231e53c95f1SChris Lattner ++CurParen; 232e53c95f1SChris Lattner 2338879e06dSChris Lattner if (AddRegExToRegEx(PatternStr.substr(2, End - 2), CurParen, SM)) 2348879e06dSChris Lattner return true; 235e53c95f1SChris Lattner RegExStr += ')'; 23653e0679dSChris Lattner 2378879e06dSChris Lattner PatternStr = PatternStr.substr(End + 2); 2388879e06dSChris Lattner continue; 2398879e06dSChris Lattner } 2408879e06dSChris Lattner 2418879e06dSChris Lattner // Named RegEx matches. These are of two forms: [[foo:.*]] which matches .* 2428879e06dSChris Lattner // (or some other regex) and assigns it to the FileCheck variable 'foo'. The 2438879e06dSChris Lattner // second form is [[foo]] which is a reference to foo. The variable name 24457cb733bSDaniel Dunbar // itself must be of the form "[a-zA-Z_][0-9a-zA-Z_]*", otherwise we reject 2458879e06dSChris Lattner // it. This is to catch some common errors. 24653e0679dSChris Lattner if (PatternStr.startswith("[[")) { 247061d2baaSEli Bendersky // Find the closing bracket pair ending the match. End is going to be an 248061d2baaSEli Bendersky // offset relative to the beginning of the match string. 
24981e5cd9eSAdrian Prantl size_t End = FindRegexVarEnd(PatternStr.substr(2), SM); 250061d2baaSEli Bendersky 2518879e06dSChris Lattner if (End == StringRef::npos) { 2528879e06dSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(PatternStr.data()), 25303b80a40SChris Lattner SourceMgr::DK_Error, 25403b80a40SChris Lattner "invalid named regex reference, no ]] found"); 255f08d2db9SChris Lattner return true; 256f08d2db9SChris Lattner } 257f08d2db9SChris Lattner 258061d2baaSEli Bendersky StringRef MatchStr = PatternStr.substr(2, End); 259061d2baaSEli Bendersky PatternStr = PatternStr.substr(End + 4); 2608879e06dSChris Lattner 2618879e06dSChris Lattner // Get the regex name (e.g. "foo"). 2628879e06dSChris Lattner size_t NameEnd = MatchStr.find(':'); 2638879e06dSChris Lattner StringRef Name = MatchStr.substr(0, NameEnd); 2648879e06dSChris Lattner 2658879e06dSChris Lattner if (Name.empty()) { 26603b80a40SChris Lattner SM.PrintMessage(SMLoc::getFromPointer(Name.data()), SourceMgr::DK_Error, 26703b80a40SChris Lattner "invalid name in named regex: empty name"); 2688879e06dSChris Lattner return true; 2698879e06dSChris Lattner } 2708879e06dSChris Lattner 27192987fb3SAlexander Kornienko // Verify that the name/expression is well formed. FileCheck currently 27292987fb3SAlexander Kornienko // supports @LINE, @LINE+number, @LINE-number expressions. The check here 27392987fb3SAlexander Kornienko // is relaxed, more strict check is performed in \c EvaluateExpression. 
27492987fb3SAlexander Kornienko bool IsExpression = false; 27592987fb3SAlexander Kornienko for (unsigned i = 0, e = Name.size(); i != e; ++i) { 276f55e72a5SArtem Belevich if (i == 0) { 277f55e72a5SArtem Belevich if (Name[i] == '$') // Global vars start with '$' 278f55e72a5SArtem Belevich continue; 279f55e72a5SArtem Belevich if (Name[i] == '@') { 28092987fb3SAlexander Kornienko if (NameEnd != StringRef::npos) { 28192987fb3SAlexander Kornienko SM.PrintMessage(SMLoc::getFromPointer(Name.data()), 28292987fb3SAlexander Kornienko SourceMgr::DK_Error, 28392987fb3SAlexander Kornienko "invalid name in named regex definition"); 28492987fb3SAlexander Kornienko return true; 28592987fb3SAlexander Kornienko } 28692987fb3SAlexander Kornienko IsExpression = true; 28792987fb3SAlexander Kornienko continue; 28892987fb3SAlexander Kornienko } 289f55e72a5SArtem Belevich } 29092987fb3SAlexander Kornienko if (Name[i] != '_' && !isalnum(Name[i]) && 29192987fb3SAlexander Kornienko (!IsExpression || (Name[i] != '+' && Name[i] != '-'))) { 2928879e06dSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(Name.data() + i), 29303b80a40SChris Lattner SourceMgr::DK_Error, "invalid name in named regex"); 2948879e06dSChris Lattner return true; 2958879e06dSChris Lattner } 29692987fb3SAlexander Kornienko } 2978879e06dSChris Lattner 2988879e06dSChris Lattner // Name can't start with a digit. 29983c74e9fSGuy Benyei if (isdigit(static_cast<unsigned char>(Name[0]))) { 30003b80a40SChris Lattner SM.PrintMessage(SMLoc::getFromPointer(Name.data()), SourceMgr::DK_Error, 30103b80a40SChris Lattner "invalid name in named regex"); 3028879e06dSChris Lattner return true; 3038879e06dSChris Lattner } 3048879e06dSChris Lattner 3058879e06dSChris Lattner // Handle [[foo]]. 3068879e06dSChris Lattner if (NameEnd == StringRef::npos) { 307e8b8f1bcSEli Bendersky // Handle variables that were defined earlier on the same line by 308e8b8f1bcSEli Bendersky // emitting a backreference. 
309e8b8f1bcSEli Bendersky if (VariableDefs.find(Name) != VariableDefs.end()) { 310e8b8f1bcSEli Bendersky unsigned VarParenNum = VariableDefs[Name]; 311e8b8f1bcSEli Bendersky if (VarParenNum < 1 || VarParenNum > 9) { 312e8b8f1bcSEli Bendersky SM.PrintMessage(SMLoc::getFromPointer(Name.data()), 313e8b8f1bcSEli Bendersky SourceMgr::DK_Error, 314e8b8f1bcSEli Bendersky "Can't back-reference more than 9 variables"); 315e8b8f1bcSEli Bendersky return true; 316e8b8f1bcSEli Bendersky } 317e8b8f1bcSEli Bendersky AddBackrefToRegEx(VarParenNum); 318e8b8f1bcSEli Bendersky } else { 3198879e06dSChris Lattner VariableUses.push_back(std::make_pair(Name, RegExStr.size())); 320e8b8f1bcSEli Bendersky } 3218879e06dSChris Lattner continue; 3228879e06dSChris Lattner } 3238879e06dSChris Lattner 3248879e06dSChris Lattner // Handle [[foo:.*]]. 325e8b8f1bcSEli Bendersky VariableDefs[Name] = CurParen; 3268879e06dSChris Lattner RegExStr += '('; 3278879e06dSChris Lattner ++CurParen; 3288879e06dSChris Lattner 3298879e06dSChris Lattner if (AddRegExToRegEx(MatchStr.substr(NameEnd + 1), CurParen, SM)) 3308879e06dSChris Lattner return true; 3318879e06dSChris Lattner 3328879e06dSChris Lattner RegExStr += ')'; 3338879e06dSChris Lattner } 3348879e06dSChris Lattner 3358879e06dSChris Lattner // Handle fixed string matches. 3368879e06dSChris Lattner // Find the end, which is the start of the next regex. 
3378879e06dSChris Lattner size_t FixedMatchEnd = PatternStr.find("{{"); 3388879e06dSChris Lattner FixedMatchEnd = std::min(FixedMatchEnd, PatternStr.find("[[")); 3396f4f77b7SHans Wennborg RegExStr += Regex::escape(PatternStr.substr(0, FixedMatchEnd)); 3408879e06dSChris Lattner PatternStr = PatternStr.substr(FixedMatchEnd); 341f08d2db9SChris Lattner } 342f08d2db9SChris Lattner 34385913ccaSJames Y Knight if (MatchFullLinesHere) { 34485913ccaSJames Y Knight if (!NoCanonicalizeWhiteSpace) 34585913ccaSJames Y Knight RegExStr += " *"; 34685913ccaSJames Y Knight RegExStr += '$'; 34785913ccaSJames Y Knight } 34885913ccaSJames Y Knight 34974d50731SChris Lattner return false; 35074d50731SChris Lattner } 35174d50731SChris Lattner 352e8f2fb20SChandler Carruth bool Pattern::AddRegExToRegEx(StringRef RS, unsigned &CurParen, SourceMgr &SM) { 353e8b8f1bcSEli Bendersky Regex R(RS); 3548879e06dSChris Lattner std::string Error; 3558879e06dSChris Lattner if (!R.isValid(Error)) { 356e8b8f1bcSEli Bendersky SM.PrintMessage(SMLoc::getFromPointer(RS.data()), SourceMgr::DK_Error, 35703b80a40SChris Lattner "invalid regex: " + Error); 3588879e06dSChris Lattner return true; 3598879e06dSChris Lattner } 3608879e06dSChris Lattner 361e8b8f1bcSEli Bendersky RegExStr += RS.str(); 3628879e06dSChris Lattner CurParen += R.getNumMatches(); 3638879e06dSChris Lattner return false; 3648879e06dSChris Lattner } 365b16ab0c4SChris Lattner 366e8b8f1bcSEli Bendersky void Pattern::AddBackrefToRegEx(unsigned BackrefNum) { 367e8b8f1bcSEli Bendersky assert(BackrefNum >= 1 && BackrefNum <= 9 && "Invalid backref number"); 368e8f2fb20SChandler Carruth std::string Backref = std::string("\\") + std::string(1, '0' + BackrefNum); 369e8b8f1bcSEli Bendersky RegExStr += Backref; 370e8b8f1bcSEli Bendersky } 371e8b8f1bcSEli Bendersky 3724dabac20SChandler Carruth /// Evaluates expression and stores the result to \p Value. 
3734dabac20SChandler Carruth /// 3744dabac20SChandler Carruth /// Returns true on success and false when the expression has invalid syntax. 37592987fb3SAlexander Kornienko bool Pattern::EvaluateExpression(StringRef Expr, std::string &Value) const { 37692987fb3SAlexander Kornienko // The only supported expression is @LINE([\+-]\d+)? 37792987fb3SAlexander Kornienko if (!Expr.startswith("@LINE")) 37892987fb3SAlexander Kornienko return false; 37992987fb3SAlexander Kornienko Expr = Expr.substr(StringRef("@LINE").size()); 38092987fb3SAlexander Kornienko int Offset = 0; 38192987fb3SAlexander Kornienko if (!Expr.empty()) { 38292987fb3SAlexander Kornienko if (Expr[0] == '+') 38392987fb3SAlexander Kornienko Expr = Expr.substr(1); 38492987fb3SAlexander Kornienko else if (Expr[0] != '-') 38592987fb3SAlexander Kornienko return false; 38692987fb3SAlexander Kornienko if (Expr.getAsInteger(10, Offset)) 38792987fb3SAlexander Kornienko return false; 38892987fb3SAlexander Kornienko } 38992987fb3SAlexander Kornienko Value = llvm::itostr(LineNumber + Offset); 39092987fb3SAlexander Kornienko return true; 39192987fb3SAlexander Kornienko } 39292987fb3SAlexander Kornienko 3934dabac20SChandler Carruth /// Matches the pattern string against the input buffer \p Buffer 3944dabac20SChandler Carruth /// 3954dabac20SChandler Carruth /// This returns the position that is matched or npos if there is no match. If 3964dabac20SChandler Carruth /// there is a match, the size of the matched string is returned in \p 3974dabac20SChandler Carruth /// MatchLen. 3984dabac20SChandler Carruth /// 3994dabac20SChandler Carruth /// The \p VariableTable StringMap provides the current values of filecheck 4004dabac20SChandler Carruth /// variables and is updated if this match defines new values. 
4018879e06dSChris Lattner size_t Pattern::Match(StringRef Buffer, size_t &MatchLen, 4028879e06dSChris Lattner StringMap<StringRef> &VariableTable) const { 403eba55822SJakob Stoklund Olesen // If this is the EOF pattern, match it immediately. 40438820972SMatt Arsenault if (CheckTy == Check::CheckEOF) { 405eba55822SJakob Stoklund Olesen MatchLen = 0; 406eba55822SJakob Stoklund Olesen return Buffer.size(); 407eba55822SJakob Stoklund Olesen } 408eba55822SJakob Stoklund Olesen 409221460e0SChris Lattner // If this is a fixed string pattern, just match it now. 410221460e0SChris Lattner if (!FixedStr.empty()) { 411221460e0SChris Lattner MatchLen = FixedStr.size(); 412221460e0SChris Lattner return Buffer.find(FixedStr); 413221460e0SChris Lattner } 414221460e0SChris Lattner 415b16ab0c4SChris Lattner // Regex match. 4168879e06dSChris Lattner 4178879e06dSChris Lattner // If there are variable uses, we need to create a temporary string with the 4188879e06dSChris Lattner // actual value. 4198879e06dSChris Lattner StringRef RegExToMatch = RegExStr; 4208879e06dSChris Lattner std::string TmpStr; 4218879e06dSChris Lattner if (!VariableUses.empty()) { 4228879e06dSChris Lattner TmpStr = RegExStr; 4238879e06dSChris Lattner 4248879e06dSChris Lattner unsigned InsertOffset = 0; 4258f870499SBenjamin Kramer for (const auto &VariableUse : VariableUses) { 42692987fb3SAlexander Kornienko std::string Value; 42792987fb3SAlexander Kornienko 4288f870499SBenjamin Kramer if (VariableUse.first[0] == '@') { 4298f870499SBenjamin Kramer if (!EvaluateExpression(VariableUse.first, Value)) 43092987fb3SAlexander Kornienko return StringRef::npos; 43192987fb3SAlexander Kornienko } else { 432e0ef65abSDaniel Dunbar StringMap<StringRef>::iterator it = 4338f870499SBenjamin Kramer VariableTable.find(VariableUse.first); 434e0ef65abSDaniel Dunbar // If the variable is undefined, return an error. 
435e0ef65abSDaniel Dunbar if (it == VariableTable.end()) 436e0ef65abSDaniel Dunbar return StringRef::npos; 437e0ef65abSDaniel Dunbar 4386f4f77b7SHans Wennborg // Look up the value and escape it so that we can put it into the regex. 4396f4f77b7SHans Wennborg Value += Regex::escape(it->second); 44092987fb3SAlexander Kornienko } 4418879e06dSChris Lattner 4428879e06dSChris Lattner // Plop it into the regex at the adjusted offset. 4438f870499SBenjamin Kramer TmpStr.insert(TmpStr.begin() + VariableUse.second + InsertOffset, 4448879e06dSChris Lattner Value.begin(), Value.end()); 4458879e06dSChris Lattner InsertOffset += Value.size(); 4468879e06dSChris Lattner } 4478879e06dSChris Lattner 4488879e06dSChris Lattner // Match the newly constructed regex. 4498879e06dSChris Lattner RegExToMatch = TmpStr; 4508879e06dSChris Lattner } 4518879e06dSChris Lattner 452b16ab0c4SChris Lattner SmallVector<StringRef, 4> MatchInfo; 4538879e06dSChris Lattner if (!Regex(RegExToMatch, Regex::Newline).match(Buffer, &MatchInfo)) 454f08d2db9SChris Lattner return StringRef::npos; 455b16ab0c4SChris Lattner 456b16ab0c4SChris Lattner // Successful regex match. 457b16ab0c4SChris Lattner assert(!MatchInfo.empty() && "Didn't get any match"); 458b16ab0c4SChris Lattner StringRef FullMatch = MatchInfo[0]; 459b16ab0c4SChris Lattner 4608879e06dSChris Lattner // If this defines any variables, remember their values. 
4618f870499SBenjamin Kramer for (const auto &VariableDef : VariableDefs) { 4628f870499SBenjamin Kramer assert(VariableDef.second < MatchInfo.size() && "Internal paren error"); 4638f870499SBenjamin Kramer VariableTable[VariableDef.first] = MatchInfo[VariableDef.second]; 4640a4c44bdSChris Lattner } 4650a4c44bdSChris Lattner 466b16ab0c4SChris Lattner MatchLen = FullMatch.size(); 467b16ab0c4SChris Lattner return FullMatch.data() - Buffer.data(); 468f08d2db9SChris Lattner } 469f08d2db9SChris Lattner 4704dabac20SChandler Carruth 4714dabac20SChandler Carruth /// Computes an arbitrary estimate for the quality of matching this pattern at 4724dabac20SChandler Carruth /// the start of \p Buffer; a distance of zero should correspond to a perfect 4734dabac20SChandler Carruth /// match. 474e8f2fb20SChandler Carruth unsigned 475e8f2fb20SChandler Carruth Pattern::ComputeMatchDistance(StringRef Buffer, 476fd29d886SDaniel Dunbar const StringMap<StringRef> &VariableTable) const { 477fd29d886SDaniel Dunbar // Just compute the number of matching characters. For regular expressions, we 478fd29d886SDaniel Dunbar // just compare against the regex itself and hope for the best. 479fd29d886SDaniel Dunbar // 480fd29d886SDaniel Dunbar // FIXME: One easy improvement here is have the regex lib generate a single 481fd29d886SDaniel Dunbar // example regular expression which matches, and use that as the example 482fd29d886SDaniel Dunbar // string. 483fd29d886SDaniel Dunbar StringRef ExampleString(FixedStr); 484fd29d886SDaniel Dunbar if (ExampleString.empty()) 485fd29d886SDaniel Dunbar ExampleString = RegExStr; 486fd29d886SDaniel Dunbar 487e9aa36c8SDaniel Dunbar // Only compare up to the first line in the buffer, or the string size. 
488e9aa36c8SDaniel Dunbar StringRef BufferPrefix = Buffer.substr(0, ExampleString.size()); 489e9aa36c8SDaniel Dunbar BufferPrefix = BufferPrefix.split('\n').first; 490e9aa36c8SDaniel Dunbar return BufferPrefix.edit_distance(ExampleString); 491fd29d886SDaniel Dunbar } 492fd29d886SDaniel Dunbar 4934dabac20SChandler Carruth /// Prints additional information about a failure to match involving this 4944dabac20SChandler Carruth /// pattern. 495e8f2fb20SChandler Carruth void Pattern::PrintFailureInfo( 496e8f2fb20SChandler Carruth const SourceMgr &SM, StringRef Buffer, 497e0ef65abSDaniel Dunbar const StringMap<StringRef> &VariableTable) const { 498e0ef65abSDaniel Dunbar // If this was a regular expression using variables, print the current 499e0ef65abSDaniel Dunbar // variable values. 500e0ef65abSDaniel Dunbar if (!VariableUses.empty()) { 5018f870499SBenjamin Kramer for (const auto &VariableUse : VariableUses) { 502e69170a1SAlp Toker SmallString<256> Msg; 503e69170a1SAlp Toker raw_svector_ostream OS(Msg); 5048f870499SBenjamin Kramer StringRef Var = VariableUse.first; 50592987fb3SAlexander Kornienko if (Var[0] == '@') { 50692987fb3SAlexander Kornienko std::string Value; 50792987fb3SAlexander Kornienko if (EvaluateExpression(Var, Value)) { 50892987fb3SAlexander Kornienko OS << "with expression \""; 50992987fb3SAlexander Kornienko OS.write_escaped(Var) << "\" equal to \""; 51092987fb3SAlexander Kornienko OS.write_escaped(Value) << "\""; 51192987fb3SAlexander Kornienko } else { 51292987fb3SAlexander Kornienko OS << "uses incorrect expression \""; 51392987fb3SAlexander Kornienko OS.write_escaped(Var) << "\""; 51492987fb3SAlexander Kornienko } 51592987fb3SAlexander Kornienko } else { 51692987fb3SAlexander Kornienko StringMap<StringRef>::const_iterator it = VariableTable.find(Var); 517e0ef65abSDaniel Dunbar 518e0ef65abSDaniel Dunbar // Check for undefined variable references. 
519e0ef65abSDaniel Dunbar if (it == VariableTable.end()) { 520e0ef65abSDaniel Dunbar OS << "uses undefined variable \""; 52192987fb3SAlexander Kornienko OS.write_escaped(Var) << "\""; 522e0ef65abSDaniel Dunbar } else { 523e0ef65abSDaniel Dunbar OS << "with variable \""; 524e0ef65abSDaniel Dunbar OS.write_escaped(Var) << "\" equal to \""; 525e0ef65abSDaniel Dunbar OS.write_escaped(it->second) << "\""; 526e0ef65abSDaniel Dunbar } 52792987fb3SAlexander Kornienko } 528e0ef65abSDaniel Dunbar 52903b80a40SChris Lattner SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), SourceMgr::DK_Note, 53003b80a40SChris Lattner OS.str()); 531e0ef65abSDaniel Dunbar } 532e0ef65abSDaniel Dunbar } 533fd29d886SDaniel Dunbar 534fd29d886SDaniel Dunbar // Attempt to find the closest/best fuzzy match. Usually an error happens 535fd29d886SDaniel Dunbar // because some string in the output didn't exactly match. In these cases, we 536fd29d886SDaniel Dunbar // would like to show the user a best guess at what "should have" matched, to 537fd29d886SDaniel Dunbar // save them having to actually check the input manually. 538fd29d886SDaniel Dunbar size_t NumLinesForward = 0; 539fd29d886SDaniel Dunbar size_t Best = StringRef::npos; 540fd29d886SDaniel Dunbar double BestQuality = 0; 541fd29d886SDaniel Dunbar 542fd29d886SDaniel Dunbar // Use an arbitrary 4k limit on how far we will search. 5432bf486ebSDan Gohman for (size_t i = 0, e = std::min(size_t(4096), Buffer.size()); i != e; ++i) { 544fd29d886SDaniel Dunbar if (Buffer[i] == '\n') 545fd29d886SDaniel Dunbar ++NumLinesForward; 546fd29d886SDaniel Dunbar 547df22bbf7SDan Gohman // Patterns have leading whitespace stripped, so skip whitespace when 548df22bbf7SDan Gohman // looking for something which looks like a pattern. 
549df22bbf7SDan Gohman if (Buffer[i] == ' ' || Buffer[i] == '\t') 550df22bbf7SDan Gohman continue; 551df22bbf7SDan Gohman 552fd29d886SDaniel Dunbar // Compute the "quality" of this match as an arbitrary combination of the 553fd29d886SDaniel Dunbar // match distance and the number of lines skipped to get to this match. 554fd29d886SDaniel Dunbar unsigned Distance = ComputeMatchDistance(Buffer.substr(i), VariableTable); 555fd29d886SDaniel Dunbar double Quality = Distance + (NumLinesForward / 100.); 556fd29d886SDaniel Dunbar 557fd29d886SDaniel Dunbar if (Quality < BestQuality || Best == StringRef::npos) { 558fd29d886SDaniel Dunbar Best = i; 559fd29d886SDaniel Dunbar BestQuality = Quality; 560fd29d886SDaniel Dunbar } 561fd29d886SDaniel Dunbar } 562fd29d886SDaniel Dunbar 563fd29d886SDaniel Dunbar // Print the "possible intended match here" line if we found something 564c069cc8eSDaniel Dunbar // reasonable and not equal to what we showed in the "scanning from here" 565c069cc8eSDaniel Dunbar // line. 566c069cc8eSDaniel Dunbar if (Best && Best != StringRef::npos && BestQuality < 50) { 567fd29d886SDaniel Dunbar SM.PrintMessage(SMLoc::getFromPointer(Buffer.data() + Best), 56803b80a40SChris Lattner SourceMgr::DK_Note, "possible intended match here"); 569fd29d886SDaniel Dunbar 570fd29d886SDaniel Dunbar // FIXME: If we wanted to be really friendly we would show why the match 571fd29d886SDaniel Dunbar // failed, as it can be hard to spot simple one character differences. 572fd29d886SDaniel Dunbar } 573e0ef65abSDaniel Dunbar } 57474d50731SChris Lattner 5754dabac20SChandler Carruth /// Finds the closing sequence of a regex variable usage or definition. 5764dabac20SChandler Carruth /// 5774dabac20SChandler Carruth /// \p Str has to point in the beginning of the definition (right after the 5784dabac20SChandler Carruth /// opening sequence). Returns the offset of the closing sequence within Str, 5794dabac20SChandler Carruth /// or npos if it was not found. 
58081e5cd9eSAdrian Prantl size_t Pattern::FindRegexVarEnd(StringRef Str, SourceMgr &SM) { 581061d2baaSEli Bendersky // Offset keeps track of the current offset within the input Str 582061d2baaSEli Bendersky size_t Offset = 0; 583061d2baaSEli Bendersky // [...] Nesting depth 584061d2baaSEli Bendersky size_t BracketDepth = 0; 585061d2baaSEli Bendersky 586061d2baaSEli Bendersky while (!Str.empty()) { 587061d2baaSEli Bendersky if (Str.startswith("]]") && BracketDepth == 0) 588061d2baaSEli Bendersky return Offset; 589061d2baaSEli Bendersky if (Str[0] == '\\') { 590061d2baaSEli Bendersky // Backslash escapes the next char within regexes, so skip them both. 591061d2baaSEli Bendersky Str = Str.substr(2); 592061d2baaSEli Bendersky Offset += 2; 593061d2baaSEli Bendersky } else { 594061d2baaSEli Bendersky switch (Str[0]) { 595061d2baaSEli Bendersky default: 596061d2baaSEli Bendersky break; 597061d2baaSEli Bendersky case '[': 598061d2baaSEli Bendersky BracketDepth++; 599061d2baaSEli Bendersky break; 600061d2baaSEli Bendersky case ']': 60181e5cd9eSAdrian Prantl if (BracketDepth == 0) { 60281e5cd9eSAdrian Prantl SM.PrintMessage(SMLoc::getFromPointer(Str.data()), 60381e5cd9eSAdrian Prantl SourceMgr::DK_Error, 60481e5cd9eSAdrian Prantl "missing closing \"]\" for regex variable"); 60581e5cd9eSAdrian Prantl exit(1); 60681e5cd9eSAdrian Prantl } 607061d2baaSEli Bendersky BracketDepth--; 608061d2baaSEli Bendersky break; 609061d2baaSEli Bendersky } 610061d2baaSEli Bendersky Str = Str.substr(1); 611061d2baaSEli Bendersky Offset++; 612061d2baaSEli Bendersky } 613061d2baaSEli Bendersky } 614061d2baaSEli Bendersky 615061d2baaSEli Bendersky return StringRef::npos; 616061d2baaSEli Bendersky } 617061d2baaSEli Bendersky 61874d50731SChris Lattner //===----------------------------------------------------------------------===// 61974d50731SChris Lattner // Check Strings. 
62074d50731SChris Lattner //===----------------------------------------------------------------------===// 6213b40b445SChris Lattner 6224dabac20SChandler Carruth /// A check that we found in the input file. 6233b40b445SChris Lattner struct CheckString { 6244dabac20SChandler Carruth /// The pattern to match. 6253b40b445SChris Lattner Pattern Pat; 62626cccfe1SChris Lattner 6274dabac20SChandler Carruth /// Which prefix name this check matched. 62813df4626SMatt Arsenault StringRef Prefix; 62913df4626SMatt Arsenault 6304dabac20SChandler Carruth /// The location in the match file that the check string was specified. 63126cccfe1SChris Lattner SMLoc Loc; 63226cccfe1SChris Lattner 6334dabac20SChandler Carruth /// All of the strings that are disallowed from occurring between this match 6344dabac20SChandler Carruth /// string and the previous one (or start of file). 63591a1b2c9SMichael Liao std::vector<Pattern> DagNotStrings; 636236d2d5eSChris Lattner 63785913ccaSJames Y Knight CheckString(const Pattern &P, StringRef S, SMLoc L) 63885913ccaSJames Y Knight : Pat(P), Prefix(S), Loc(L) {} 639dcc7d48dSMichael Liao 640e93a3a08SStephen Lin size_t Check(const SourceMgr &SM, StringRef Buffer, bool IsLabelScanMode, 641f8bd2e5bSStephen Lin size_t &MatchLen, StringMap<StringRef> &VariableTable) const; 642dcc7d48dSMichael Liao 643dcc7d48dSMichael Liao bool CheckNext(const SourceMgr &SM, StringRef Buffer) const; 64401ac1707SDuncan P. N. 
Exon Smith bool CheckSame(const SourceMgr &SM, StringRef Buffer) const; 645dcc7d48dSMichael Liao bool CheckNot(const SourceMgr &SM, StringRef Buffer, 64691a1b2c9SMichael Liao const std::vector<const Pattern *> &NotStrings, 64791a1b2c9SMichael Liao StringMap<StringRef> &VariableTable) const; 64891a1b2c9SMichael Liao size_t CheckDag(const SourceMgr &SM, StringRef Buffer, 64991a1b2c9SMichael Liao std::vector<const Pattern *> &NotStrings, 650dcc7d48dSMichael Liao StringMap<StringRef> &VariableTable) const; 65126cccfe1SChris Lattner }; 65226cccfe1SChris Lattner 65320247900SChandler Carruth /// Canonicalize whitespaces in the file. Line endings are replaced with 65420247900SChandler Carruth /// UNIX-style '\n'. 655b03c166aSChandler Carruth static StringRef CanonicalizeFile(MemoryBuffer &MB, 65620247900SChandler Carruth SmallVectorImpl<char> &OutputBuffer) { 65720247900SChandler Carruth OutputBuffer.reserve(MB.getBufferSize()); 658a2f8fc5aSChris Lattner 65920247900SChandler Carruth for (const char *Ptr = MB.getBufferStart(), *End = MB.getBufferEnd(); 660a2f8fc5aSChris Lattner Ptr != End; ++Ptr) { 661fd781bf0SNAKAMURA Takumi // Eliminate trailing dosish \r. 662fd781bf0SNAKAMURA Takumi if (Ptr <= End - 2 && Ptr[0] == '\r' && Ptr[1] == '\n') { 663fd781bf0SNAKAMURA Takumi continue; 664fd781bf0SNAKAMURA Takumi } 665fd781bf0SNAKAMURA Takumi 6665ea04c38SGuy Benyei // If current char is not a horizontal whitespace or if horizontal 6675ea04c38SGuy Benyei // whitespace canonicalization is disabled, dump it to output as is. 668b03c166aSChandler Carruth if (NoCanonicalizeWhiteSpace || (*Ptr != ' ' && *Ptr != '\t')) { 66920247900SChandler Carruth OutputBuffer.push_back(*Ptr); 670a2f8fc5aSChris Lattner continue; 671a2f8fc5aSChris Lattner } 672a2f8fc5aSChris Lattner 673a2f8fc5aSChris Lattner // Otherwise, add one space and advance over neighboring space. 
67420247900SChandler Carruth OutputBuffer.push_back(' '); 675e8f2fb20SChandler Carruth while (Ptr + 1 != End && (Ptr[1] == ' ' || Ptr[1] == '\t')) 676a2f8fc5aSChris Lattner ++Ptr; 677a2f8fc5aSChris Lattner } 678a2f8fc5aSChris Lattner 67920247900SChandler Carruth // Add a null byte and then return all but that byte. 68020247900SChandler Carruth OutputBuffer.push_back('\0'); 68120247900SChandler Carruth return StringRef(OutputBuffer.data(), OutputBuffer.size() - 1); 682a2f8fc5aSChris Lattner } 683a2f8fc5aSChris Lattner 68438820972SMatt Arsenault static bool IsPartOfWord(char c) { 68538820972SMatt Arsenault return (isalnum(c) || c == '-' || c == '_'); 68638820972SMatt Arsenault } 68738820972SMatt Arsenault 68813df4626SMatt Arsenault // Get the size of the prefix extension. 68913df4626SMatt Arsenault static size_t CheckTypeSize(Check::CheckType Ty) { 69013df4626SMatt Arsenault switch (Ty) { 69113df4626SMatt Arsenault case Check::CheckNone: 692a908e7bdSPaul Robinson case Check::CheckBadNot: 69313df4626SMatt Arsenault return 0; 69413df4626SMatt Arsenault 69513df4626SMatt Arsenault case Check::CheckPlain: 69613df4626SMatt Arsenault return sizeof(":") - 1; 69713df4626SMatt Arsenault 69813df4626SMatt Arsenault case Check::CheckNext: 69913df4626SMatt Arsenault return sizeof("-NEXT:") - 1; 70013df4626SMatt Arsenault 70101ac1707SDuncan P. N. Exon Smith case Check::CheckSame: 70201ac1707SDuncan P. N. Exon Smith return sizeof("-SAME:") - 1; 70301ac1707SDuncan P. N. 
Exon Smith 70413df4626SMatt Arsenault case Check::CheckNot: 70513df4626SMatt Arsenault return sizeof("-NOT:") - 1; 70613df4626SMatt Arsenault 70713df4626SMatt Arsenault case Check::CheckDAG: 70813df4626SMatt Arsenault return sizeof("-DAG:") - 1; 70913df4626SMatt Arsenault 71013df4626SMatt Arsenault case Check::CheckLabel: 71113df4626SMatt Arsenault return sizeof("-LABEL:") - 1; 71213df4626SMatt Arsenault 71313df4626SMatt Arsenault case Check::CheckEOF: 71413df4626SMatt Arsenault llvm_unreachable("Should not be using EOF size"); 71513df4626SMatt Arsenault } 71613df4626SMatt Arsenault 71713df4626SMatt Arsenault llvm_unreachable("Bad check type"); 71813df4626SMatt Arsenault } 71913df4626SMatt Arsenault 72013df4626SMatt Arsenault static Check::CheckType FindCheckType(StringRef Buffer, StringRef Prefix) { 721c4d2d471SMatt Arsenault char NextChar = Buffer[Prefix.size()]; 72238820972SMatt Arsenault 72338820972SMatt Arsenault // Verify that the : is present after the prefix. 72413df4626SMatt Arsenault if (NextChar == ':') 72538820972SMatt Arsenault return Check::CheckPlain; 72638820972SMatt Arsenault 72713df4626SMatt Arsenault if (NextChar != '-') 72838820972SMatt Arsenault return Check::CheckNone; 72938820972SMatt Arsenault 730c4d2d471SMatt Arsenault StringRef Rest = Buffer.drop_front(Prefix.size() + 1); 73113df4626SMatt Arsenault if (Rest.startswith("NEXT:")) 73238820972SMatt Arsenault return Check::CheckNext; 73338820972SMatt Arsenault 73401ac1707SDuncan P. N. Exon Smith if (Rest.startswith("SAME:")) 73501ac1707SDuncan P. N. Exon Smith return Check::CheckSame; 73601ac1707SDuncan P. N. 
Exon Smith 73713df4626SMatt Arsenault if (Rest.startswith("NOT:")) 73838820972SMatt Arsenault return Check::CheckNot; 73938820972SMatt Arsenault 74013df4626SMatt Arsenault if (Rest.startswith("DAG:")) 74138820972SMatt Arsenault return Check::CheckDAG; 74238820972SMatt Arsenault 74313df4626SMatt Arsenault if (Rest.startswith("LABEL:")) 74438820972SMatt Arsenault return Check::CheckLabel; 74513df4626SMatt Arsenault 746a908e7bdSPaul Robinson // You can't combine -NOT with another suffix. 747a908e7bdSPaul Robinson if (Rest.startswith("DAG-NOT:") || Rest.startswith("NOT-DAG:") || 748a908e7bdSPaul Robinson Rest.startswith("NEXT-NOT:") || Rest.startswith("NOT-NEXT:") || 749a908e7bdSPaul Robinson Rest.startswith("SAME-NOT:") || Rest.startswith("NOT-SAME:")) 750a908e7bdSPaul Robinson return Check::CheckBadNot; 751a908e7bdSPaul Robinson 75213df4626SMatt Arsenault return Check::CheckNone; 75338820972SMatt Arsenault } 75438820972SMatt Arsenault 75513df4626SMatt Arsenault // From the given position, find the next character after the word. 75613df4626SMatt Arsenault static size_t SkipWord(StringRef Str, size_t Loc) { 75713df4626SMatt Arsenault while (Loc < Str.size() && IsPartOfWord(Str[Loc])) 75813df4626SMatt Arsenault ++Loc; 75913df4626SMatt Arsenault return Loc; 76013df4626SMatt Arsenault } 76113df4626SMatt Arsenault 762726774cbSChandler Carruth /// Search the buffer for the first prefix in the prefix regular expression. 763726774cbSChandler Carruth /// 764726774cbSChandler Carruth /// This searches the buffer using the provided regular expression, however it 765726774cbSChandler Carruth /// enforces constraints beyond that: 766726774cbSChandler Carruth /// 1) The found prefix must not be a suffix of something that looks like 767726774cbSChandler Carruth /// a valid prefix. 768726774cbSChandler Carruth /// 2) The found prefix must be followed by a valid check type suffix using \c 769726774cbSChandler Carruth /// FindCheckType above. 
770726774cbSChandler Carruth /// 771726774cbSChandler Carruth /// The first match of the regular expression to satisfy these two is returned, 772726774cbSChandler Carruth /// otherwise an empty StringRef is returned to indicate failure. 773726774cbSChandler Carruth /// 774726774cbSChandler Carruth /// If this routine returns a valid prefix, it will also shrink \p Buffer to 775726774cbSChandler Carruth /// start at the beginning of the returned prefix, increment \p LineNumber for 776726774cbSChandler Carruth /// each new line consumed from \p Buffer, and set \p CheckTy to the type of 777726774cbSChandler Carruth /// check found by examining the suffix. 778726774cbSChandler Carruth /// 779726774cbSChandler Carruth /// If no valid prefix is found, the state of Buffer, LineNumber, and CheckTy 780726774cbSChandler Carruth /// is unspecified. 781726774cbSChandler Carruth static StringRef FindFirstMatchingPrefix(Regex &PrefixRE, StringRef &Buffer, 78213df4626SMatt Arsenault unsigned &LineNumber, 783726774cbSChandler Carruth Check::CheckType &CheckTy) { 784726774cbSChandler Carruth SmallVector<StringRef, 2> Matches; 785726774cbSChandler Carruth 78613df4626SMatt Arsenault while (!Buffer.empty()) { 787726774cbSChandler Carruth // Find the first (longest) match using the RE. 788726774cbSChandler Carruth if (!PrefixRE.match(Buffer, &Matches)) 789726774cbSChandler Carruth // No match at all, bail. 
790726774cbSChandler Carruth return StringRef(); 791726774cbSChandler Carruth 792726774cbSChandler Carruth StringRef Prefix = Matches[0]; 793726774cbSChandler Carruth Matches.clear(); 794726774cbSChandler Carruth 795726774cbSChandler Carruth assert(Prefix.data() >= Buffer.data() && 796726774cbSChandler Carruth Prefix.data() < Buffer.data() + Buffer.size() && 797726774cbSChandler Carruth "Prefix doesn't start inside of buffer!"); 798726774cbSChandler Carruth size_t Loc = Prefix.data() - Buffer.data(); 799726774cbSChandler Carruth StringRef Skipped = Buffer.substr(0, Loc); 800726774cbSChandler Carruth Buffer = Buffer.drop_front(Loc); 801726774cbSChandler Carruth LineNumber += Skipped.count('\n'); 802726774cbSChandler Carruth 803726774cbSChandler Carruth // Check that the matched prefix isn't a suffix of some other check-like 804726774cbSChandler Carruth // word. 805726774cbSChandler Carruth // FIXME: This is a very ad-hoc check. it would be better handled in some 806726774cbSChandler Carruth // other way. Among other things it seems hard to distinguish between 807726774cbSChandler Carruth // intentional and unintentional uses of this feature. 808726774cbSChandler Carruth if (Skipped.empty() || !IsPartOfWord(Skipped.back())) { 809726774cbSChandler Carruth // Now extract the type. 810726774cbSChandler Carruth CheckTy = FindCheckType(Buffer, Prefix); 811726774cbSChandler Carruth 812726774cbSChandler Carruth // If we've found a valid check type for this prefix, we're done. 813726774cbSChandler Carruth if (CheckTy != Check::CheckNone) 81413df4626SMatt Arsenault return Prefix; 81513df4626SMatt Arsenault } 81613df4626SMatt Arsenault 817726774cbSChandler Carruth // If we didn't successfully find a prefix, we need to skip this invalid 818726774cbSChandler Carruth // prefix and continue scanning. We directly skip the prefix that was 819726774cbSChandler Carruth // matched and any additional parts of that check-like word. 
820726774cbSChandler Carruth Buffer = Buffer.drop_front(SkipWord(Buffer, Prefix.size())); 82113df4626SMatt Arsenault } 82213df4626SMatt Arsenault 823726774cbSChandler Carruth // We ran out of buffer while skipping partial matches so give up. 82413df4626SMatt Arsenault return StringRef(); 82538820972SMatt Arsenault } 826ee3c74fbSChris Lattner 8274dabac20SChandler Carruth /// Read the check file, which specifies the sequence of expected strings. 8284dabac20SChandler Carruth /// 8294dabac20SChandler Carruth /// The strings are added to the CheckStrings vector. Returns true in case of 8304dabac20SChandler Carruth /// an error, false otherwise. 831726774cbSChandler Carruth static bool ReadCheckFile(SourceMgr &SM, StringRef Buffer, Regex &PrefixRE, 83226cccfe1SChris Lattner std::vector<CheckString> &CheckStrings) { 83356ccdbbdSAlexander Kornienko std::vector<Pattern> ImplicitNegativeChecks; 83456ccdbbdSAlexander Kornienko for (const auto &PatternString : ImplicitCheckNot) { 83556ccdbbdSAlexander Kornienko // Create a buffer with fake command line content in order to display the 83656ccdbbdSAlexander Kornienko // command line option responsible for the specific implicit CHECK-NOT. 
837ff43d69dSDavid Blaikie std::string Prefix = (Twine("-") + ImplicitCheckNot.ArgStr + "='").str(); 83856ccdbbdSAlexander Kornienko std::string Suffix = "'"; 8393560ff2cSRafael Espindola std::unique_ptr<MemoryBuffer> CmdLine = MemoryBuffer::getMemBufferCopy( 8403560ff2cSRafael Espindola Prefix + PatternString + Suffix, "command line"); 8413560ff2cSRafael Espindola 84256ccdbbdSAlexander Kornienko StringRef PatternInBuffer = 84356ccdbbdSAlexander Kornienko CmdLine->getBuffer().substr(Prefix.size(), PatternString.size()); 8441961f14cSDavid Blaikie SM.AddNewSourceBuffer(std::move(CmdLine), SMLoc()); 84556ccdbbdSAlexander Kornienko 84656ccdbbdSAlexander Kornienko ImplicitNegativeChecks.push_back(Pattern(Check::CheckNot)); 84756ccdbbdSAlexander Kornienko ImplicitNegativeChecks.back().ParsePattern(PatternInBuffer, 84856ccdbbdSAlexander Kornienko "IMPLICIT-CHECK", SM, 0); 84956ccdbbdSAlexander Kornienko } 85056ccdbbdSAlexander Kornienko 85156ccdbbdSAlexander Kornienko std::vector<Pattern> DagNotMatches = ImplicitNegativeChecks; 852236d2d5eSChris Lattner 85343d50d4aSEli Bendersky // LineNumber keeps track of the line on which CheckPrefix instances are 85443d50d4aSEli Bendersky // found. 85592987fb3SAlexander Kornienko unsigned LineNumber = 1; 85692987fb3SAlexander Kornienko 857ee3c74fbSChris Lattner while (1) { 85813df4626SMatt Arsenault Check::CheckType CheckTy; 85913df4626SMatt Arsenault 86013df4626SMatt Arsenault // See if a prefix occurs in the memory buffer. 
861726774cbSChandler Carruth StringRef UsedPrefix = FindFirstMatchingPrefix(PrefixRE, Buffer, LineNumber, 862726774cbSChandler Carruth CheckTy); 86313df4626SMatt Arsenault if (UsedPrefix.empty()) 864ee3c74fbSChris Lattner break; 865726774cbSChandler Carruth assert(UsedPrefix.data() == Buffer.data() && 866726774cbSChandler Carruth "Failed to move Buffer's start forward, or pointed prefix outside " 867726774cbSChandler Carruth "of the buffer!"); 86892987fb3SAlexander Kornienko 86913df4626SMatt Arsenault // Location to use for error messages. 870726774cbSChandler Carruth const char *UsedPrefixStart = UsedPrefix.data(); 87192987fb3SAlexander Kornienko 872726774cbSChandler Carruth // Skip the buffer to the end. 87313df4626SMatt Arsenault Buffer = Buffer.drop_front(UsedPrefix.size() + CheckTypeSize(CheckTy)); 87410f10cedSChris Lattner 875a908e7bdSPaul Robinson // Complain about useful-looking but unsupported suffixes. 876a908e7bdSPaul Robinson if (CheckTy == Check::CheckBadNot) { 877e8f2fb20SChandler Carruth SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), SourceMgr::DK_Error, 878a908e7bdSPaul Robinson "unsupported -NOT combo on prefix '" + UsedPrefix + "'"); 879a908e7bdSPaul Robinson return true; 880a908e7bdSPaul Robinson } 881a908e7bdSPaul Robinson 88238820972SMatt Arsenault // Okay, we found the prefix, yay. Remember the rest of the line, but ignore 883a26bc914STom de Vries // leading whitespace. 8841714676aSTom de Vries if (!(NoCanonicalizeWhiteSpace && MatchFullLines)) 885236d2d5eSChris Lattner Buffer = Buffer.substr(Buffer.find_first_not_of(" \t")); 886ee3c74fbSChris Lattner 887ee3c74fbSChris Lattner // Scan ahead to the end of line. 888caa5fc0cSChris Lattner size_t EOL = Buffer.find_first_of("\n\r"); 889ee3c74fbSChris Lattner 890838fb09aSDan Gohman // Remember the location of the start of the pattern, for diagnostics. 
891838fb09aSDan Gohman SMLoc PatternLoc = SMLoc::getFromPointer(Buffer.data()); 892838fb09aSDan Gohman 89374d50731SChris Lattner // Parse the pattern. 89438820972SMatt Arsenault Pattern P(CheckTy); 89513df4626SMatt Arsenault if (P.ParsePattern(Buffer.substr(0, EOL), UsedPrefix, SM, LineNumber)) 896ee3c74fbSChris Lattner return true; 897ee3c74fbSChris Lattner 898f8bd2e5bSStephen Lin // Verify that CHECK-LABEL lines do not define or use variables 89938820972SMatt Arsenault if ((CheckTy == Check::CheckLabel) && P.hasVariable()) { 900e8f2fb20SChandler Carruth SM.PrintMessage( 901e8f2fb20SChandler Carruth SMLoc::getFromPointer(UsedPrefixStart), SourceMgr::DK_Error, 90213df4626SMatt Arsenault "found '" + UsedPrefix + "-LABEL:'" 90313df4626SMatt Arsenault " with variable definition or use"); 904f8bd2e5bSStephen Lin return true; 905f8bd2e5bSStephen Lin } 906f8bd2e5bSStephen Lin 907236d2d5eSChris Lattner Buffer = Buffer.substr(EOL); 90874d50731SChris Lattner 909da108b4eSChris Lattner // Verify that CHECK-NEXT lines have at least one CHECK line before them. 91001ac1707SDuncan P. N. Exon Smith if ((CheckTy == Check::CheckNext || CheckTy == Check::CheckSame) && 91101ac1707SDuncan P. N. Exon Smith CheckStrings.empty()) { 91201ac1707SDuncan P. N. Exon Smith StringRef Type = CheckTy == Check::CheckNext ? "NEXT" : "SAME"; 91313df4626SMatt Arsenault SM.PrintMessage(SMLoc::getFromPointer(UsedPrefixStart), 91403b80a40SChris Lattner SourceMgr::DK_Error, 915e8f2fb20SChandler Carruth "found '" + UsedPrefix + "-" + Type + 916e8f2fb20SChandler Carruth "' without previous '" + UsedPrefix + ": line"); 917da108b4eSChris Lattner return true; 918da108b4eSChris Lattner } 919da108b4eSChris Lattner 92091a1b2c9SMichael Liao // Handle CHECK-DAG/-NOT. 
92138820972SMatt Arsenault if (CheckTy == Check::CheckDAG || CheckTy == Check::CheckNot) { 92291a1b2c9SMichael Liao DagNotMatches.push_back(P); 92374d50731SChris Lattner continue; 92474d50731SChris Lattner } 92574d50731SChris Lattner 926ee3c74fbSChris Lattner // Okay, add the string we captured to the output vector and move on. 92785913ccaSJames Y Knight CheckStrings.emplace_back(P, UsedPrefix, PatternLoc); 92891a1b2c9SMichael Liao std::swap(DagNotMatches, CheckStrings.back().DagNotStrings); 92956ccdbbdSAlexander Kornienko DagNotMatches = ImplicitNegativeChecks; 930ee3c74fbSChris Lattner } 931ee3c74fbSChris Lattner 93213df4626SMatt Arsenault // Add an EOF pattern for any trailing CHECK-DAG/-NOTs, and use the first 93313df4626SMatt Arsenault // prefix as a filler for the error message. 93491a1b2c9SMichael Liao if (!DagNotMatches.empty()) { 935f5e2fc47SBenjamin Kramer CheckStrings.emplace_back(Pattern(Check::CheckEOF), *CheckPrefixes.begin(), 93685913ccaSJames Y Knight SMLoc::getFromPointer(Buffer.data())); 93791a1b2c9SMichael Liao std::swap(DagNotMatches, CheckStrings.back().DagNotStrings); 938eba55822SJakob Stoklund Olesen } 939eba55822SJakob Stoklund Olesen 940ee3c74fbSChris Lattner if (CheckStrings.empty()) { 94113df4626SMatt Arsenault errs() << "error: no check strings found with prefix" 94213df4626SMatt Arsenault << (CheckPrefixes.size() > 1 ? 
"es " : " "); 9433e3ef2f2SChris Bieneman prefix_iterator I = CheckPrefixes.begin(); 9443e3ef2f2SChris Bieneman prefix_iterator E = CheckPrefixes.end(); 9453e3ef2f2SChris Bieneman if (I != E) { 9463e3ef2f2SChris Bieneman errs() << "\'" << *I << ":'"; 9473e3ef2f2SChris Bieneman ++I; 94813df4626SMatt Arsenault } 9493e3ef2f2SChris Bieneman for (; I != E; ++I) 9503e3ef2f2SChris Bieneman errs() << ", \'" << *I << ":'"; 95113df4626SMatt Arsenault 95213df4626SMatt Arsenault errs() << '\n'; 953ee3c74fbSChris Lattner return true; 954ee3c74fbSChris Lattner } 955ee3c74fbSChris Lattner 956ee3c74fbSChris Lattner return false; 957ee3c74fbSChris Lattner } 958ee3c74fbSChris Lattner 959e8f2fb20SChandler Carruth static void PrintCheckFailed(const SourceMgr &SM, SMLoc Loc, const Pattern &Pat, 960e8f2fb20SChandler Carruth StringRef Buffer, 961e0ef65abSDaniel Dunbar StringMap<StringRef> &VariableTable) { 962da108b4eSChris Lattner // Otherwise, we have an error, emit an error message. 96391a1b2c9SMichael Liao SM.PrintMessage(Loc, SourceMgr::DK_Error, 96403b80a40SChris Lattner "expected string not found in input"); 965da108b4eSChris Lattner 966da108b4eSChris Lattner // Print the "scanning from here" line. If the current position is at the 967da108b4eSChris Lattner // end of a line, advance to the start of the next line. 968caa5fc0cSChris Lattner Buffer = Buffer.substr(Buffer.find_first_not_of(" \t\n\r")); 969da108b4eSChris Lattner 97003b80a40SChris Lattner SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), SourceMgr::DK_Note, 97103b80a40SChris Lattner "scanning from here"); 972e0ef65abSDaniel Dunbar 973e0ef65abSDaniel Dunbar // Allow the pattern to print additional information if desired. 
97491a1b2c9SMichael Liao Pat.PrintFailureInfo(SM, Buffer, VariableTable); 97591a1b2c9SMichael Liao } 97691a1b2c9SMichael Liao 97791a1b2c9SMichael Liao static void PrintCheckFailed(const SourceMgr &SM, const CheckString &CheckStr, 97891a1b2c9SMichael Liao StringRef Buffer, 97991a1b2c9SMichael Liao StringMap<StringRef> &VariableTable) { 98091a1b2c9SMichael Liao PrintCheckFailed(SM, CheckStr.Loc, CheckStr.Pat, Buffer, VariableTable); 981da108b4eSChris Lattner } 982da108b4eSChris Lattner 9834dabac20SChandler Carruth /// Count the number of newlines in the specified range. 984592fe880SRichard Smith static unsigned CountNumNewlinesBetween(StringRef Range, 985592fe880SRichard Smith const char *&FirstNewLine) { 986da108b4eSChris Lattner unsigned NumNewLines = 0; 98737183584SChris Lattner while (1) { 988da108b4eSChris Lattner // Scan for newline. 98937183584SChris Lattner Range = Range.substr(Range.find_first_of("\n\r")); 990e8f2fb20SChandler Carruth if (Range.empty()) 991e8f2fb20SChandler Carruth return NumNewLines; 992da108b4eSChris Lattner 993da108b4eSChris Lattner ++NumNewLines; 994da108b4eSChris Lattner 995da108b4eSChris Lattner // Handle \n\r and \r\n as a single newline. 996e8f2fb20SChandler Carruth if (Range.size() > 1 && (Range[1] == '\n' || Range[1] == '\r') && 99737183584SChris Lattner (Range[0] != Range[1])) 99837183584SChris Lattner Range = Range.substr(1); 99937183584SChris Lattner Range = Range.substr(1); 1000592fe880SRichard Smith 1001592fe880SRichard Smith if (NumNewLines == 1) 1002592fe880SRichard Smith FirstNewLine = Range.begin(); 1003da108b4eSChris Lattner } 1004da108b4eSChris Lattner } 1005da108b4eSChris Lattner 10064dabac20SChandler Carruth /// Match check string and its "not strings" and/or "dag strings". 
1007dcc7d48dSMichael Liao size_t CheckString::Check(const SourceMgr &SM, StringRef Buffer, 1008e93a3a08SStephen Lin bool IsLabelScanMode, size_t &MatchLen, 1009dcc7d48dSMichael Liao StringMap<StringRef> &VariableTable) const { 101091a1b2c9SMichael Liao size_t LastPos = 0; 101191a1b2c9SMichael Liao std::vector<const Pattern *> NotStrings; 101291a1b2c9SMichael Liao 1013e93a3a08SStephen Lin // IsLabelScanMode is true when we are scanning forward to find CHECK-LABEL 1014e93a3a08SStephen Lin // bounds; we have not processed variable definitions within the bounded block 1015e93a3a08SStephen Lin // yet so cannot handle any final CHECK-DAG yet; this is handled when going 1016e93a3a08SStephen Lin // over the block again (including the last CHECK-LABEL) in normal mode. 1017e93a3a08SStephen Lin if (!IsLabelScanMode) { 101891a1b2c9SMichael Liao // Match "dag strings" (with mixed "not strings" if any). 101991a1b2c9SMichael Liao LastPos = CheckDag(SM, Buffer, NotStrings, VariableTable); 102091a1b2c9SMichael Liao if (LastPos == StringRef::npos) 102191a1b2c9SMichael Liao return StringRef::npos; 1022e93a3a08SStephen Lin } 102391a1b2c9SMichael Liao 102491a1b2c9SMichael Liao // Match itself from the last position after matching CHECK-DAG. 
102591a1b2c9SMichael Liao StringRef MatchBuffer = Buffer.substr(LastPos); 102691a1b2c9SMichael Liao size_t MatchPos = Pat.Match(MatchBuffer, MatchLen, VariableTable); 1027dcc7d48dSMichael Liao if (MatchPos == StringRef::npos) { 102891a1b2c9SMichael Liao PrintCheckFailed(SM, *this, MatchBuffer, VariableTable); 1029dcc7d48dSMichael Liao return StringRef::npos; 1030dcc7d48dSMichael Liao } 1031dcc7d48dSMichael Liao 1032e93a3a08SStephen Lin // Similar to the above, in "label-scan mode" we can't yet handle CHECK-NEXT 1033e93a3a08SStephen Lin // or CHECK-NOT 1034e93a3a08SStephen Lin if (!IsLabelScanMode) { 103591a1b2c9SMichael Liao StringRef SkippedRegion = Buffer.substr(LastPos, MatchPos); 1036dcc7d48dSMichael Liao 1037dcc7d48dSMichael Liao // If this check is a "CHECK-NEXT", verify that the previous match was on 1038dcc7d48dSMichael Liao // the previous line (i.e. that there is one newline between them). 1039dcc7d48dSMichael Liao if (CheckNext(SM, SkippedRegion)) 1040dcc7d48dSMichael Liao return StringRef::npos; 1041dcc7d48dSMichael Liao 104201ac1707SDuncan P. N. Exon Smith // If this check is a "CHECK-SAME", verify that the previous match was on 104301ac1707SDuncan P. N. Exon Smith // the same line (i.e. that there is no newline between them). 104401ac1707SDuncan P. N. Exon Smith if (CheckSame(SM, SkippedRegion)) 104501ac1707SDuncan P. N. Exon Smith return StringRef::npos; 104601ac1707SDuncan P. N. Exon Smith 1047dcc7d48dSMichael Liao // If this match had "not strings", verify that they don't exist in the 1048dcc7d48dSMichael Liao // skipped region. 104991a1b2c9SMichael Liao if (CheckNot(SM, SkippedRegion, NotStrings, VariableTable)) 1050dcc7d48dSMichael Liao return StringRef::npos; 1051f8bd2e5bSStephen Lin } 1052dcc7d48dSMichael Liao 10537dfb92b9SMehdi Amini return LastPos + MatchPos; 1054dcc7d48dSMichael Liao } 1055dcc7d48dSMichael Liao 10564dabac20SChandler Carruth /// Verify there is a single line in the given buffer. 
1057dcc7d48dSMichael Liao bool CheckString::CheckNext(const SourceMgr &SM, StringRef Buffer) const { 105885913ccaSJames Y Knight if (Pat.getCheckTy() != Check::CheckNext) 1059dcc7d48dSMichael Liao return false; 1060dcc7d48dSMichael Liao 1061dcc7d48dSMichael Liao // Count the number of newlines between the previous match and this one. 1062dcc7d48dSMichael Liao assert(Buffer.data() != 1063e8f2fb20SChandler Carruth SM.getMemoryBuffer(SM.FindBufferContainingLoc( 1064e8f2fb20SChandler Carruth SMLoc::getFromPointer(Buffer.data()))) 1065e8f2fb20SChandler Carruth ->getBufferStart() && 1066dcc7d48dSMichael Liao "CHECK-NEXT can't be the first check in a file"); 1067dcc7d48dSMichael Liao 106866f09ad0SCraig Topper const char *FirstNewLine = nullptr; 1069592fe880SRichard Smith unsigned NumNewLines = CountNumNewlinesBetween(Buffer, FirstNewLine); 1070dcc7d48dSMichael Liao 1071dcc7d48dSMichael Liao if (NumNewLines == 0) { 1072e8f2fb20SChandler Carruth SM.PrintMessage(Loc, SourceMgr::DK_Error, 1073e8f2fb20SChandler Carruth Prefix + "-NEXT: is on the same line as previous match"); 1074e8f2fb20SChandler Carruth SM.PrintMessage(SMLoc::getFromPointer(Buffer.end()), SourceMgr::DK_Note, 1075e8f2fb20SChandler Carruth "'next' match was here"); 1076dcc7d48dSMichael Liao SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), SourceMgr::DK_Note, 1077dcc7d48dSMichael Liao "previous match ended here"); 1078dcc7d48dSMichael Liao return true; 1079dcc7d48dSMichael Liao } 1080dcc7d48dSMichael Liao 1081dcc7d48dSMichael Liao if (NumNewLines != 1) { 1082e8f2fb20SChandler Carruth SM.PrintMessage(Loc, SourceMgr::DK_Error, 1083e8f2fb20SChandler Carruth Prefix + 1084dcc7d48dSMichael Liao "-NEXT: is not on the line after the previous match"); 1085e8f2fb20SChandler Carruth SM.PrintMessage(SMLoc::getFromPointer(Buffer.end()), SourceMgr::DK_Note, 1086e8f2fb20SChandler Carruth "'next' match was here"); 1087dcc7d48dSMichael Liao SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), SourceMgr::DK_Note, 
1088dcc7d48dSMichael Liao "previous match ended here"); 1089592fe880SRichard Smith SM.PrintMessage(SMLoc::getFromPointer(FirstNewLine), SourceMgr::DK_Note, 1090592fe880SRichard Smith "non-matching line after previous match is here"); 1091dcc7d48dSMichael Liao return true; 1092dcc7d48dSMichael Liao } 1093dcc7d48dSMichael Liao 1094dcc7d48dSMichael Liao return false; 1095dcc7d48dSMichael Liao } 1096dcc7d48dSMichael Liao 10974dabac20SChandler Carruth /// Verify there is no newline in the given buffer. 109801ac1707SDuncan P. N. Exon Smith bool CheckString::CheckSame(const SourceMgr &SM, StringRef Buffer) const { 109985913ccaSJames Y Knight if (Pat.getCheckTy() != Check::CheckSame) 110001ac1707SDuncan P. N. Exon Smith return false; 110101ac1707SDuncan P. N. Exon Smith 110201ac1707SDuncan P. N. Exon Smith // Count the number of newlines between the previous match and this one. 110301ac1707SDuncan P. N. Exon Smith assert(Buffer.data() != 110401ac1707SDuncan P. N. Exon Smith SM.getMemoryBuffer(SM.FindBufferContainingLoc( 110501ac1707SDuncan P. N. Exon Smith SMLoc::getFromPointer(Buffer.data()))) 110601ac1707SDuncan P. N. Exon Smith ->getBufferStart() && 110701ac1707SDuncan P. N. Exon Smith "CHECK-SAME can't be the first check in a file"); 110801ac1707SDuncan P. N. Exon Smith 110901ac1707SDuncan P. N. Exon Smith const char *FirstNewLine = nullptr; 111001ac1707SDuncan P. N. Exon Smith unsigned NumNewLines = CountNumNewlinesBetween(Buffer, FirstNewLine); 111101ac1707SDuncan P. N. Exon Smith 111201ac1707SDuncan P. N. Exon Smith if (NumNewLines != 0) { 111301ac1707SDuncan P. N. Exon Smith SM.PrintMessage(Loc, SourceMgr::DK_Error, 111401ac1707SDuncan P. N. Exon Smith Prefix + 111501ac1707SDuncan P. N. Exon Smith "-SAME: is not on the same line as the previous match"); 111601ac1707SDuncan P. N. Exon Smith SM.PrintMessage(SMLoc::getFromPointer(Buffer.end()), SourceMgr::DK_Note, 111701ac1707SDuncan P. N. Exon Smith "'next' match was here"); 111801ac1707SDuncan P. N. 
Exon Smith SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), SourceMgr::DK_Note, 111901ac1707SDuncan P. N. Exon Smith "previous match ended here"); 112001ac1707SDuncan P. N. Exon Smith return true; 112101ac1707SDuncan P. N. Exon Smith } 112201ac1707SDuncan P. N. Exon Smith 112301ac1707SDuncan P. N. Exon Smith return false; 112401ac1707SDuncan P. N. Exon Smith } 112501ac1707SDuncan P. N. Exon Smith 11264dabac20SChandler Carruth /// Verify there's no "not strings" in the given buffer. 1127dcc7d48dSMichael Liao bool CheckString::CheckNot(const SourceMgr &SM, StringRef Buffer, 112891a1b2c9SMichael Liao const std::vector<const Pattern *> &NotStrings, 1129dcc7d48dSMichael Liao StringMap<StringRef> &VariableTable) const { 11308f870499SBenjamin Kramer for (const Pattern *Pat : NotStrings) { 113138820972SMatt Arsenault assert((Pat->getCheckTy() == Check::CheckNot) && "Expect CHECK-NOT!"); 113291a1b2c9SMichael Liao 1133dcc7d48dSMichael Liao size_t MatchLen = 0; 113491a1b2c9SMichael Liao size_t Pos = Pat->Match(Buffer, MatchLen, VariableTable); 1135dcc7d48dSMichael Liao 1136e8f2fb20SChandler Carruth if (Pos == StringRef::npos) 1137e8f2fb20SChandler Carruth continue; 1138dcc7d48dSMichael Liao 1139dcc7d48dSMichael Liao SM.PrintMessage(SMLoc::getFromPointer(Buffer.data() + Pos), 1140e8f2fb20SChandler Carruth SourceMgr::DK_Error, Prefix + "-NOT: string occurred!"); 114191a1b2c9SMichael Liao SM.PrintMessage(Pat->getLoc(), SourceMgr::DK_Note, 114213df4626SMatt Arsenault Prefix + "-NOT: pattern specified here"); 1143dcc7d48dSMichael Liao return true; 1144dcc7d48dSMichael Liao } 1145dcc7d48dSMichael Liao 1146dcc7d48dSMichael Liao return false; 1147dcc7d48dSMichael Liao } 1148dcc7d48dSMichael Liao 11494dabac20SChandler Carruth /// Match "dag strings" and their mixed "not strings". 
115091a1b2c9SMichael Liao size_t CheckString::CheckDag(const SourceMgr &SM, StringRef Buffer, 115191a1b2c9SMichael Liao std::vector<const Pattern *> &NotStrings, 115291a1b2c9SMichael Liao StringMap<StringRef> &VariableTable) const { 115391a1b2c9SMichael Liao if (DagNotStrings.empty()) 115491a1b2c9SMichael Liao return 0; 115591a1b2c9SMichael Liao 115691a1b2c9SMichael Liao size_t LastPos = 0; 115791a1b2c9SMichael Liao size_t StartPos = LastPos; 115891a1b2c9SMichael Liao 11598f870499SBenjamin Kramer for (const Pattern &Pat : DagNotStrings) { 116038820972SMatt Arsenault assert((Pat.getCheckTy() == Check::CheckDAG || 116138820972SMatt Arsenault Pat.getCheckTy() == Check::CheckNot) && 116291a1b2c9SMichael Liao "Invalid CHECK-DAG or CHECK-NOT!"); 116391a1b2c9SMichael Liao 116438820972SMatt Arsenault if (Pat.getCheckTy() == Check::CheckNot) { 116591a1b2c9SMichael Liao NotStrings.push_back(&Pat); 116691a1b2c9SMichael Liao continue; 116791a1b2c9SMichael Liao } 116891a1b2c9SMichael Liao 116938820972SMatt Arsenault assert((Pat.getCheckTy() == Check::CheckDAG) && "Expect CHECK-DAG!"); 117091a1b2c9SMichael Liao 117191a1b2c9SMichael Liao size_t MatchLen = 0, MatchPos; 117291a1b2c9SMichael Liao 117391a1b2c9SMichael Liao // CHECK-DAG always matches from the start. 117491a1b2c9SMichael Liao StringRef MatchBuffer = Buffer.substr(StartPos); 117591a1b2c9SMichael Liao MatchPos = Pat.Match(MatchBuffer, MatchLen, VariableTable); 117691a1b2c9SMichael Liao // With a group of CHECK-DAGs, a single mismatching means the match on 117791a1b2c9SMichael Liao // that group of CHECK-DAGs fails immediately. 117891a1b2c9SMichael Liao if (MatchPos == StringRef::npos) { 117991a1b2c9SMichael Liao PrintCheckFailed(SM, Pat.getLoc(), Pat, MatchBuffer, VariableTable); 118091a1b2c9SMichael Liao return StringRef::npos; 118191a1b2c9SMichael Liao } 118291a1b2c9SMichael Liao // Re-calc it as the offset relative to the start of the original string. 
118391a1b2c9SMichael Liao MatchPos += StartPos; 118491a1b2c9SMichael Liao 118591a1b2c9SMichael Liao if (!NotStrings.empty()) { 118691a1b2c9SMichael Liao if (MatchPos < LastPos) { 118791a1b2c9SMichael Liao // Reordered? 118891a1b2c9SMichael Liao SM.PrintMessage(SMLoc::getFromPointer(Buffer.data() + MatchPos), 118991a1b2c9SMichael Liao SourceMgr::DK_Error, 119013df4626SMatt Arsenault Prefix + "-DAG: found a match of CHECK-DAG" 119191a1b2c9SMichael Liao " reordering across a CHECK-NOT"); 119291a1b2c9SMichael Liao SM.PrintMessage(SMLoc::getFromPointer(Buffer.data() + LastPos), 119391a1b2c9SMichael Liao SourceMgr::DK_Note, 119413df4626SMatt Arsenault Prefix + "-DAG: the farthest match of CHECK-DAG" 119591a1b2c9SMichael Liao " is found here"); 119691a1b2c9SMichael Liao SM.PrintMessage(NotStrings[0]->getLoc(), SourceMgr::DK_Note, 119713df4626SMatt Arsenault Prefix + "-NOT: the crossed pattern specified" 119891a1b2c9SMichael Liao " here"); 119991a1b2c9SMichael Liao SM.PrintMessage(Pat.getLoc(), SourceMgr::DK_Note, 120013df4626SMatt Arsenault Prefix + "-DAG: the reordered pattern specified" 120191a1b2c9SMichael Liao " here"); 120291a1b2c9SMichael Liao return StringRef::npos; 120391a1b2c9SMichael Liao } 120491a1b2c9SMichael Liao // All subsequent CHECK-DAGs should be matched from the farthest 120591a1b2c9SMichael Liao // position of all precedent CHECK-DAGs (including this one.) 120691a1b2c9SMichael Liao StartPos = LastPos; 120791a1b2c9SMichael Liao // If there's CHECK-NOTs between two CHECK-DAGs or from CHECK to 120891a1b2c9SMichael Liao // CHECK-DAG, verify that there's no 'not' strings occurred in that 120991a1b2c9SMichael Liao // region. 1210cf60ab31SBenjamin Kramer StringRef SkippedRegion = Buffer.slice(LastPos, MatchPos); 1211cf708c32STim Northover if (CheckNot(SM, SkippedRegion, NotStrings, VariableTable)) 121291a1b2c9SMichael Liao return StringRef::npos; 121391a1b2c9SMichael Liao // Clear "not strings". 
121491a1b2c9SMichael Liao NotStrings.clear(); 121591a1b2c9SMichael Liao } 121691a1b2c9SMichael Liao 121791a1b2c9SMichael Liao // Update the last position with CHECK-DAG matches. 121891a1b2c9SMichael Liao LastPos = std::max(MatchPos + MatchLen, LastPos); 121991a1b2c9SMichael Liao } 122091a1b2c9SMichael Liao 122191a1b2c9SMichael Liao return LastPos; 122291a1b2c9SMichael Liao } 122391a1b2c9SMichael Liao 122413df4626SMatt Arsenault // A check prefix must contain only alphanumeric, hyphens and underscores. 122513df4626SMatt Arsenault static bool ValidateCheckPrefix(StringRef CheckPrefix) { 122613df4626SMatt Arsenault Regex Validator("^[a-zA-Z0-9_-]*$"); 122713df4626SMatt Arsenault return Validator.match(CheckPrefix); 122813df4626SMatt Arsenault } 122913df4626SMatt Arsenault 123013df4626SMatt Arsenault static bool ValidateCheckPrefixes() { 123113df4626SMatt Arsenault StringSet<> PrefixSet; 123213df4626SMatt Arsenault 12338f870499SBenjamin Kramer for (StringRef Prefix : CheckPrefixes) { 123424412b14SEli Bendersky // Reject empty prefixes. 123524412b14SEli Bendersky if (Prefix == "") 123624412b14SEli Bendersky return false; 123724412b14SEli Bendersky 12380356975cSDavid Blaikie if (!PrefixSet.insert(Prefix).second) 123913df4626SMatt Arsenault return false; 124013df4626SMatt Arsenault 124113df4626SMatt Arsenault if (!ValidateCheckPrefix(Prefix)) 124213df4626SMatt Arsenault return false; 124313df4626SMatt Arsenault } 124413df4626SMatt Arsenault 124513df4626SMatt Arsenault return true; 124613df4626SMatt Arsenault } 124713df4626SMatt Arsenault 1248726774cbSChandler Carruth // Combines the check prefixes into a single regex so that we can efficiently 1249726774cbSChandler Carruth // scan for any of the set. 1250726774cbSChandler Carruth // 1251726774cbSChandler Carruth // The semantics are that the longest-match wins which matches our regex 1252726774cbSChandler Carruth // library. 
1253726774cbSChandler Carruth static Regex buildCheckPrefixRegex() { 125413df4626SMatt Arsenault // I don't think there's a way to specify an initial value for cl::list, 125513df4626SMatt Arsenault // so if nothing was specified, add the default 125613df4626SMatt Arsenault if (CheckPrefixes.empty()) 125713df4626SMatt Arsenault CheckPrefixes.push_back("CHECK"); 1258726774cbSChandler Carruth 1259726774cbSChandler Carruth // We already validated the contents of CheckPrefixes so just concatenate 1260726774cbSChandler Carruth // them as alternatives. 1261726774cbSChandler Carruth SmallString<32> PrefixRegexStr; 1262726774cbSChandler Carruth for (StringRef Prefix : CheckPrefixes) { 1263726774cbSChandler Carruth if (Prefix != CheckPrefixes.front()) 1264726774cbSChandler Carruth PrefixRegexStr.push_back('|'); 1265726774cbSChandler Carruth 1266726774cbSChandler Carruth PrefixRegexStr.append(Prefix); 1267726774cbSChandler Carruth } 1268726774cbSChandler Carruth 1269726774cbSChandler Carruth return Regex(PrefixRegexStr); 1270c2735158SRui Ueyama } 1271c2735158SRui Ueyama 12722bd4f8b6SXinliang David Li static void DumpCommandLine(int argc, char **argv) { 12732bd4f8b6SXinliang David Li errs() << "FileCheck command line: "; 12742bd4f8b6SXinliang David Li for (int I = 0; I < argc; I++) 12752bd4f8b6SXinliang David Li errs() << " " << argv[I]; 12762bd4f8b6SXinliang David Li errs() << "\n"; 12772bd4f8b6SXinliang David Li } 12782bd4f8b6SXinliang David Li 1279f55e72a5SArtem Belevich // Remove local variables from \p VariableTable. Global variables 1280f55e72a5SArtem Belevich // (start with '$') are preserved. 
1281f55e72a5SArtem Belevich static void ClearLocalVars(StringMap<StringRef> &VariableTable) { 1282f55e72a5SArtem Belevich SmallVector<StringRef, 16> LocalVars; 1283f55e72a5SArtem Belevich for (const auto &Var : VariableTable) 1284f55e72a5SArtem Belevich if (Var.first()[0] != '$') 1285f55e72a5SArtem Belevich LocalVars.push_back(Var.first()); 1286f55e72a5SArtem Belevich 1287f55e72a5SArtem Belevich for (const auto &Var : LocalVars) 1288f55e72a5SArtem Belevich VariableTable.erase(Var); 1289f55e72a5SArtem Belevich } 1290f55e72a5SArtem Belevich 129120247900SChandler Carruth /// Check the input to FileCheck provided in the \p Buffer against the \p 129220247900SChandler Carruth /// CheckStrings read from the check file. 129320247900SChandler Carruth /// 129420247900SChandler Carruth /// Returns false if the input fails to satisfy the checks. 129520247900SChandler Carruth bool CheckInput(SourceMgr &SM, StringRef Buffer, 129620247900SChandler Carruth ArrayRef<CheckString> CheckStrings) { 129720247900SChandler Carruth bool ChecksFailed = false; 129820247900SChandler Carruth 129920247900SChandler Carruth /// VariableTable - This holds all the current filecheck variables. 
130020247900SChandler Carruth StringMap<StringRef> VariableTable; 130120247900SChandler Carruth 1302*46e1fd61SAlexander Richardson for (const auto& Def : GlobalDefines) 1303*46e1fd61SAlexander Richardson VariableTable.insert(StringRef(Def).split('=')); 1304*46e1fd61SAlexander Richardson 130520247900SChandler Carruth unsigned i = 0, j = 0, e = CheckStrings.size(); 130620247900SChandler Carruth while (true) { 130720247900SChandler Carruth StringRef CheckRegion; 130820247900SChandler Carruth if (j == e) { 130920247900SChandler Carruth CheckRegion = Buffer; 131020247900SChandler Carruth } else { 131120247900SChandler Carruth const CheckString &CheckLabelStr = CheckStrings[j]; 131220247900SChandler Carruth if (CheckLabelStr.Pat.getCheckTy() != Check::CheckLabel) { 131320247900SChandler Carruth ++j; 131420247900SChandler Carruth continue; 131520247900SChandler Carruth } 131620247900SChandler Carruth 131720247900SChandler Carruth // Scan to next CHECK-LABEL match, ignoring CHECK-NOT and CHECK-DAG 131820247900SChandler Carruth size_t MatchLabelLen = 0; 1319e8f2fb20SChandler Carruth size_t MatchLabelPos = 1320e8f2fb20SChandler Carruth CheckLabelStr.Check(SM, Buffer, true, MatchLabelLen, VariableTable); 132120247900SChandler Carruth if (MatchLabelPos == StringRef::npos) 132220247900SChandler Carruth // Immediately bail of CHECK-LABEL fails, nothing else we can do. 
132320247900SChandler Carruth return false; 132420247900SChandler Carruth 132520247900SChandler Carruth CheckRegion = Buffer.substr(0, MatchLabelPos + MatchLabelLen); 132620247900SChandler Carruth Buffer = Buffer.substr(MatchLabelPos + MatchLabelLen); 132720247900SChandler Carruth ++j; 132820247900SChandler Carruth } 132920247900SChandler Carruth 1330f55e72a5SArtem Belevich if (EnableVarScope) 1331f55e72a5SArtem Belevich ClearLocalVars(VariableTable); 1332f55e72a5SArtem Belevich 133320247900SChandler Carruth for (; i != j; ++i) { 133420247900SChandler Carruth const CheckString &CheckStr = CheckStrings[i]; 133520247900SChandler Carruth 133620247900SChandler Carruth // Check each string within the scanned region, including a second check 133720247900SChandler Carruth // of any final CHECK-LABEL (to verify CHECK-NOT and CHECK-DAG) 133820247900SChandler Carruth size_t MatchLen = 0; 1339e8f2fb20SChandler Carruth size_t MatchPos = 1340e8f2fb20SChandler Carruth CheckStr.Check(SM, CheckRegion, false, MatchLen, VariableTable); 134120247900SChandler Carruth 134220247900SChandler Carruth if (MatchPos == StringRef::npos) { 134320247900SChandler Carruth ChecksFailed = true; 134420247900SChandler Carruth i = j; 134520247900SChandler Carruth break; 134620247900SChandler Carruth } 134720247900SChandler Carruth 134820247900SChandler Carruth CheckRegion = CheckRegion.substr(MatchPos + MatchLen); 134920247900SChandler Carruth } 135020247900SChandler Carruth 135120247900SChandler Carruth if (j == e) 135220247900SChandler Carruth break; 135320247900SChandler Carruth } 135420247900SChandler Carruth 135520247900SChandler Carruth // Success if no checks failed. 
135620247900SChandler Carruth return !ChecksFailed; 135720247900SChandler Carruth } 135820247900SChandler Carruth 1359ee3c74fbSChris Lattner int main(int argc, char **argv) { 13602ad6d48bSRichard Smith sys::PrintStackTraceOnErrorSignal(argv[0]); 1361ee3c74fbSChris Lattner PrettyStackTraceProgram X(argc, argv); 1362ee3c74fbSChris Lattner cl::ParseCommandLineOptions(argc, argv); 1363ee3c74fbSChris Lattner 136413df4626SMatt Arsenault if (!ValidateCheckPrefixes()) { 136513df4626SMatt Arsenault errs() << "Supplied check-prefix is invalid! Prefixes must be unique and " 136613df4626SMatt Arsenault "start with a letter and contain only alphanumeric characters, " 136713df4626SMatt Arsenault "hyphens and underscores\n"; 1368c2735158SRui Ueyama return 2; 1369c2735158SRui Ueyama } 1370c2735158SRui Ueyama 1371726774cbSChandler Carruth Regex PrefixRE = buildCheckPrefixRegex(); 1372726774cbSChandler Carruth std::string REError; 1373726774cbSChandler Carruth if (!PrefixRE.isValid(REError)) { 1374726774cbSChandler Carruth errs() << "Unable to combine check-prefix strings into a prefix regular " 1375726774cbSChandler Carruth "expression! This is likely a bug in FileCheck's verification of " 1376726774cbSChandler Carruth "the check-prefix strings. Regular expression parsing failed " 1377726774cbSChandler Carruth "with the following error: " 1378726774cbSChandler Carruth << REError << "\n"; 1379726774cbSChandler Carruth return 2; 1380726774cbSChandler Carruth } 138113df4626SMatt Arsenault 1382ee3c74fbSChris Lattner SourceMgr SM; 1383ee3c74fbSChris Lattner 1384ee3c74fbSChris Lattner // Read the expected strings from the check file. 
138520247900SChandler Carruth ErrorOr<std::unique_ptr<MemoryBuffer>> CheckFileOrErr = 138620247900SChandler Carruth MemoryBuffer::getFileOrSTDIN(CheckFilename); 138720247900SChandler Carruth if (std::error_code EC = CheckFileOrErr.getError()) { 138820247900SChandler Carruth errs() << "Could not open check file '" << CheckFilename 138920247900SChandler Carruth << "': " << EC.message() << '\n'; 139020247900SChandler Carruth return 2; 139120247900SChandler Carruth } 139220247900SChandler Carruth MemoryBuffer &CheckFile = *CheckFileOrErr.get(); 139320247900SChandler Carruth 139420247900SChandler Carruth SmallString<4096> CheckFileBuffer; 1395b03c166aSChandler Carruth StringRef CheckFileText = CanonicalizeFile(CheckFile, CheckFileBuffer); 139620247900SChandler Carruth 139720247900SChandler Carruth SM.AddNewSourceBuffer(MemoryBuffer::getMemBuffer( 139820247900SChandler Carruth CheckFileText, CheckFile.getBufferIdentifier()), 139920247900SChandler Carruth SMLoc()); 140020247900SChandler Carruth 140126cccfe1SChris Lattner std::vector<CheckString> CheckStrings; 1402726774cbSChandler Carruth if (ReadCheckFile(SM, CheckFileText, PrefixRE, CheckStrings)) 1403ee3c74fbSChris Lattner return 2; 1404ee3c74fbSChris Lattner 1405ee3c74fbSChris Lattner // Open the file to check and add it to SourceMgr. 
140620247900SChandler Carruth ErrorOr<std::unique_ptr<MemoryBuffer>> InputFileOrErr = 1407adf21f2aSRafael Espindola MemoryBuffer::getFileOrSTDIN(InputFilename); 140820247900SChandler Carruth if (std::error_code EC = InputFileOrErr.getError()) { 1409adf21f2aSRafael Espindola errs() << "Could not open input file '" << InputFilename 1410adf21f2aSRafael Espindola << "': " << EC.message() << '\n'; 14118e1c6477SEli Bendersky return 2; 1412ee3c74fbSChris Lattner } 141320247900SChandler Carruth MemoryBuffer &InputFile = *InputFileOrErr.get(); 14142c3e5cdfSChris Lattner 141520247900SChandler Carruth if (InputFile.getBufferSize() == 0 && !AllowEmptyInput) { 1416b692bed7SChris Lattner errs() << "FileCheck error: '" << InputFilename << "' is empty.\n"; 14172bd4f8b6SXinliang David Li DumpCommandLine(argc, argv); 14188e1c6477SEli Bendersky return 2; 1419b692bed7SChris Lattner } 1420b692bed7SChris Lattner 142120247900SChandler Carruth SmallString<4096> InputFileBuffer; 1422b03c166aSChandler Carruth StringRef InputFileText = CanonicalizeFile(InputFile, InputFileBuffer); 14232c3e5cdfSChris Lattner 1424e8f2fb20SChandler Carruth SM.AddNewSourceBuffer(MemoryBuffer::getMemBuffer( 1425e8f2fb20SChandler Carruth InputFileText, InputFile.getBufferIdentifier()), 1426e8f2fb20SChandler Carruth SMLoc()); 1427ee3c74fbSChris Lattner 142820247900SChandler Carruth return CheckInput(SM, InputFileText, CheckStrings) ? EXIT_SUCCESS : 1; 1429ee3c74fbSChris Lattner } 1430