1ee3c74fbSChris Lattner //===- FileCheck.cpp - Check that File's Contents match what is expected --===// 2ee3c74fbSChris Lattner // 3ee3c74fbSChris Lattner // The LLVM Compiler Infrastructure 4ee3c74fbSChris Lattner // 5ee3c74fbSChris Lattner // This file is distributed under the University of Illinois Open Source 6ee3c74fbSChris Lattner // License. See LICENSE.TXT for details. 7ee3c74fbSChris Lattner // 8ee3c74fbSChris Lattner //===----------------------------------------------------------------------===// 9ee3c74fbSChris Lattner // 10ee3c74fbSChris Lattner // FileCheck does a line-by line check of a file that validates whether it 11ee3c74fbSChris Lattner // contains the expected content. This is useful for regression tests etc. 12ee3c74fbSChris Lattner // 13ee3c74fbSChris Lattner // This program exits with an error status of 2 on error, exit status of 0 if 14ee3c74fbSChris Lattner // the file matched the expected contents, and exit status of 1 if it did not 15ee3c74fbSChris Lattner // contain the expected contents. 16ee3c74fbSChris Lattner // 17ee3c74fbSChris Lattner //===----------------------------------------------------------------------===// 18ee3c74fbSChris Lattner 19ee3c74fbSChris Lattner #include "llvm/Support/CommandLine.h" 20ee3c74fbSChris Lattner #include "llvm/Support/MemoryBuffer.h" 21ee3c74fbSChris Lattner #include "llvm/Support/PrettyStackTrace.h" 22f08d2db9SChris Lattner #include "llvm/Support/Regex.h" 23ee3c74fbSChris Lattner #include "llvm/Support/SourceMgr.h" 24ee3c74fbSChris Lattner #include "llvm/Support/raw_ostream.h" 25ee3c74fbSChris Lattner #include "llvm/System/Signals.h" 26ee3c74fbSChris Lattner using namespace llvm; 27ee3c74fbSChris Lattner 28ee3c74fbSChris Lattner static cl::opt<std::string> 29ee3c74fbSChris Lattner CheckFilename(cl::Positional, cl::desc("<check-file>"), cl::Required); 30ee3c74fbSChris Lattner 31ee3c74fbSChris Lattner static cl::opt<std::string> 32ee3c74fbSChris Lattner InputFilename("input-file", cl::desc("File to check (defaults to stdin)"), 33ee3c74fbSChris Lattner cl::init("-"), cl::value_desc("filename")); 34ee3c74fbSChris Lattner 35ee3c74fbSChris Lattner static cl::opt<std::string> 36ee3c74fbSChris Lattner CheckPrefix("check-prefix", cl::init("CHECK"), 37ee3c74fbSChris Lattner cl::desc("Prefix to use from check file (defaults to 'CHECK')")); 38ee3c74fbSChris Lattner 392c3e5cdfSChris Lattner static cl::opt<bool> 402c3e5cdfSChris Lattner NoCanonicalizeWhiteSpace("strict-whitespace", 412c3e5cdfSChris Lattner cl::desc("Do not treat all horizontal whitespace as equivalent")); 422c3e5cdfSChris Lattner 4374d50731SChris Lattner //===----------------------------------------------------------------------===// 4474d50731SChris Lattner // Pattern Handling Code. 4574d50731SChris Lattner //===----------------------------------------------------------------------===// 4674d50731SChris Lattner 47b121a24fSChris Lattner class PatternChunk { 48b121a24fSChris Lattner StringRef Str; 49b121a24fSChris Lattner bool isRegEx; 50b121a24fSChris Lattner public: 51b121a24fSChris Lattner PatternChunk(StringRef S, bool isRE) : Str(S), isRegEx(isRE) {} 52b121a24fSChris Lattner 53b121a24fSChris Lattner size_t Match(StringRef Buffer, size_t &MatchLen) const { 54b121a24fSChris Lattner if (!isRegEx) { 55b121a24fSChris Lattner // Fixed string match. 56b121a24fSChris Lattner MatchLen = Str.size(); 57b121a24fSChris Lattner return Buffer.find(Str); 58b121a24fSChris Lattner } 59b121a24fSChris Lattner 60b121a24fSChris Lattner // Regex match. 61b121a24fSChris Lattner SmallVector<StringRef, 4> MatchInfo; 62712e8e03SChris Lattner if (!Regex(Str, Regex::Sub|Regex::Newline).match(Buffer, &MatchInfo)) 63b121a24fSChris Lattner return StringRef::npos; 64b121a24fSChris Lattner 65b121a24fSChris Lattner // Successful regex match. 66b121a24fSChris Lattner assert(!MatchInfo.empty() && "Didn't get any match"); 67b121a24fSChris Lattner StringRef FullMatch = MatchInfo[0]; 68b121a24fSChris Lattner 69b121a24fSChris Lattner MatchLen = FullMatch.size(); 70b121a24fSChris Lattner return FullMatch.data()-Buffer.data(); 71b121a24fSChris Lattner } 72b121a24fSChris Lattner }; 73b121a24fSChris Lattner 743b40b445SChris Lattner class Pattern { 75f08d2db9SChris Lattner /// Chunks - The pattern chunks to match. If the bool is false, it is a fixed 76f08d2db9SChris Lattner /// string match, if it is true, it is a regex match. 77b121a24fSChris Lattner SmallVector<PatternChunk, 4> Chunks; 78*221460e0SChris Lattner 79*221460e0SChris Lattner StringRef FixedStr; 803b40b445SChris Lattner public: 813b40b445SChris Lattner 8274d50731SChris Lattner Pattern() { } 8374d50731SChris Lattner 8474d50731SChris Lattner bool ParsePattern(StringRef PatternStr, SourceMgr &SM); 853b40b445SChris Lattner 863b40b445SChris Lattner /// Match - Match the pattern string against the input buffer Buffer. This 873b40b445SChris Lattner /// returns the position that is matched or npos if there is no match. If 883b40b445SChris Lattner /// there is a match, the size of the matched string is returned in MatchLen. 89f08d2db9SChris Lattner size_t Match(StringRef Buffer, size_t &MatchLen) const; 903b40b445SChris Lattner }; 913b40b445SChris Lattner 9274d50731SChris Lattner bool Pattern::ParsePattern(StringRef PatternStr, SourceMgr &SM) { 9374d50731SChris Lattner // Ignore trailing whitespace. 9474d50731SChris Lattner while (!PatternStr.empty() && 9574d50731SChris Lattner (PatternStr.back() == ' ' || PatternStr.back() == '\t')) 9674d50731SChris Lattner PatternStr = PatternStr.substr(0, PatternStr.size()-1); 9774d50731SChris Lattner 9874d50731SChris Lattner // Check that there is something on the line. 9974d50731SChris Lattner if (PatternStr.empty()) { 10074d50731SChris Lattner SM.PrintMessage(SMLoc::getFromPointer(PatternStr.data()), 10174d50731SChris Lattner "found empty check string with prefix '"+CheckPrefix+":'", 10274d50731SChris Lattner "error"); 10374d50731SChris Lattner return true; 10474d50731SChris Lattner } 10574d50731SChris Lattner 106*221460e0SChris Lattner // Check to see if this is a fixed string, or if it has regex pieces. 107*221460e0SChris Lattner if (PatternStr.size() < 2 || PatternStr.find("{{") == StringRef::npos) { 108*221460e0SChris Lattner FixedStr = PatternStr; 109*221460e0SChris Lattner return false; 110*221460e0SChris Lattner } 111*221460e0SChris Lattner 112*221460e0SChris Lattner // Otherwise, there is at least one regex piece. 113*221460e0SChris Lattner 114f08d2db9SChris Lattner // Scan the pattern to break it into regex and non-regex pieces. 115f08d2db9SChris Lattner while (!PatternStr.empty()) { 116f08d2db9SChris Lattner // Handle fixed string matches. 117f08d2db9SChris Lattner if (PatternStr.size() < 2 || 118f08d2db9SChris Lattner PatternStr[0] != '{' || PatternStr[1] != '{') { 119f08d2db9SChris Lattner // Find the end, which is the start of the next regex. 120f08d2db9SChris Lattner size_t FixedMatchEnd = PatternStr.find("{{"); 12174d50731SChris Lattner 122b121a24fSChris Lattner Chunks.push_back(PatternChunk(PatternStr.substr(0, FixedMatchEnd),false)); 123f08d2db9SChris Lattner PatternStr = PatternStr.substr(FixedMatchEnd); 124f08d2db9SChris Lattner continue; 125f08d2db9SChris Lattner } 12674d50731SChris Lattner 127f08d2db9SChris Lattner // Otherwise, this is the start of a regex match. Scan for the }}. 128f08d2db9SChris Lattner size_t End = PatternStr.find("}}"); 129f08d2db9SChris Lattner if (End == StringRef::npos) { 130f08d2db9SChris Lattner SM.PrintMessage(SMLoc::getFromPointer(PatternStr.data()), 131f08d2db9SChris Lattner "found start of regex string with no end '}}'", "error"); 132f08d2db9SChris Lattner return true; 133f08d2db9SChris Lattner } 134f08d2db9SChris Lattner 135f08d2db9SChris Lattner Regex R(PatternStr.substr(2, End-2)); 136f08d2db9SChris Lattner std::string Error; 137f08d2db9SChris Lattner if (!R.isValid(Error)) { 138f08d2db9SChris Lattner SM.PrintMessage(SMLoc::getFromPointer(PatternStr.data()+2), 139f08d2db9SChris Lattner "invalid regex: " + Error, "error"); 140f08d2db9SChris Lattner return true; 141f08d2db9SChris Lattner } 142f08d2db9SChris Lattner 143b121a24fSChris Lattner Chunks.push_back(PatternChunk(PatternStr.substr(2, End-2), true)); 144f08d2db9SChris Lattner PatternStr = PatternStr.substr(End+2); 145f08d2db9SChris Lattner } 146f08d2db9SChris Lattner 14774d50731SChris Lattner return false; 14874d50731SChris Lattner } 14974d50731SChris Lattner 150f08d2db9SChris Lattner /// Match - Match the pattern string against the input buffer Buffer. This 151f08d2db9SChris Lattner /// returns the position that is matched or npos if there is no match. If 152f08d2db9SChris Lattner /// there is a match, the size of the matched string is returned in MatchLen. 153f08d2db9SChris Lattner size_t Pattern::Match(StringRef Buffer, size_t &MatchLen) const { 154*221460e0SChris Lattner // If this is a fixed string pattern, just match it now. 155*221460e0SChris Lattner if (!FixedStr.empty()) { 156*221460e0SChris Lattner MatchLen = FixedStr.size(); 157*221460e0SChris Lattner return Buffer.find(FixedStr); 158*221460e0SChris Lattner } 159*221460e0SChris Lattner 160f08d2db9SChris Lattner size_t FirstMatch = StringRef::npos; 161f08d2db9SChris Lattner MatchLen = 0; 162f08d2db9SChris Lattner 163f08d2db9SChris Lattner while (!Buffer.empty()) { 164f08d2db9SChris Lattner StringRef MatchAttempt = Buffer; 165f08d2db9SChris Lattner 166f08d2db9SChris Lattner unsigned ChunkNo = 0, e = Chunks.size(); 167f08d2db9SChris Lattner for (; ChunkNo != e; ++ChunkNo) { 168b121a24fSChris Lattner size_t ThisMatch, ThisLength = StringRef::npos; 169b121a24fSChris Lattner ThisMatch = Chunks[ChunkNo].Match(MatchAttempt, ThisLength); 170f08d2db9SChris Lattner 171f08d2db9SChris Lattner // Otherwise, what we do depends on if this is the first match or not. If 172f08d2db9SChris Lattner // this is the first match, it doesn't match to match at the start of 173f08d2db9SChris Lattner // MatchAttempt. 174f08d2db9SChris Lattner if (ChunkNo == 0) { 175f08d2db9SChris Lattner // If the first match fails then this pattern will never match in 176f08d2db9SChris Lattner // Buffer. 177f08d2db9SChris Lattner if (ThisMatch == StringRef::npos) 178f08d2db9SChris Lattner return ThisMatch; 179f08d2db9SChris Lattner 180f08d2db9SChris Lattner FirstMatch = ThisMatch; 181f08d2db9SChris Lattner MatchAttempt = MatchAttempt.substr(FirstMatch); 182f08d2db9SChris Lattner ThisMatch = 0; 183f08d2db9SChris Lattner } 184f08d2db9SChris Lattner 185f08d2db9SChris Lattner // If this chunk didn't match, then the entire pattern didn't match from 186f08d2db9SChris Lattner // FirstMatch, try later in the buffer. 187f08d2db9SChris Lattner if (ThisMatch == StringRef::npos) 188f08d2db9SChris Lattner break; 189f08d2db9SChris Lattner 190f08d2db9SChris Lattner // Ok, if the match didn't match at the beginning of MatchAttempt, then we 191f08d2db9SChris Lattner // have something like "ABC{{DEF}} and something was in-between. Reject 192f08d2db9SChris Lattner // the match. 193f08d2db9SChris Lattner if (ThisMatch != 0) 194f08d2db9SChris Lattner break; 195f08d2db9SChris Lattner 196f08d2db9SChris Lattner // Otherwise, match the string and move to the next chunk. 197f08d2db9SChris Lattner MatchLen += ThisLength; 198f08d2db9SChris Lattner MatchAttempt = MatchAttempt.substr(ThisLength); 199f08d2db9SChris Lattner } 200f08d2db9SChris Lattner 201f08d2db9SChris Lattner // If the whole thing matched, we win. 202f08d2db9SChris Lattner if (ChunkNo == e) 203f08d2db9SChris Lattner return FirstMatch; 204f08d2db9SChris Lattner 205f08d2db9SChris Lattner // Otherwise, try matching again after FirstMatch to see if this pattern 206f08d2db9SChris Lattner // matches later in the buffer. 207f08d2db9SChris Lattner Buffer = Buffer.substr(FirstMatch+1); 208f08d2db9SChris Lattner } 209f08d2db9SChris Lattner 210f08d2db9SChris Lattner // If we ran out of stuff to scan, then we didn't match. 211f08d2db9SChris Lattner return StringRef::npos; 212f08d2db9SChris Lattner } 213f08d2db9SChris Lattner 21474d50731SChris Lattner 21574d50731SChris Lattner //===----------------------------------------------------------------------===// 21674d50731SChris Lattner // Check Strings. 21774d50731SChris Lattner //===----------------------------------------------------------------------===// 2183b40b445SChris Lattner 2193b40b445SChris Lattner /// CheckString - This is a check that we found in the input file. 2203b40b445SChris Lattner struct CheckString { 2213b40b445SChris Lattner /// Pat - The pattern to match. 2223b40b445SChris Lattner Pattern Pat; 22326cccfe1SChris Lattner 22426cccfe1SChris Lattner /// Loc - The location in the match file that the check string was specified. 22526cccfe1SChris Lattner SMLoc Loc; 22626cccfe1SChris Lattner 227da108b4eSChris Lattner /// IsCheckNext - This is true if this is a CHECK-NEXT: directive (as opposed 228da108b4eSChris Lattner /// to a CHECK: directive. 229da108b4eSChris Lattner bool IsCheckNext; 230da108b4eSChris Lattner 231236d2d5eSChris Lattner /// NotStrings - These are all of the strings that are disallowed from 232236d2d5eSChris Lattner /// occurring between this match string and the previous one (or start of 233236d2d5eSChris Lattner /// file). 23474d50731SChris Lattner std::vector<std::pair<SMLoc, Pattern> > NotStrings; 235236d2d5eSChris Lattner 2363b40b445SChris Lattner CheckString(const Pattern &P, SMLoc L, bool isCheckNext) 2373b40b445SChris Lattner : Pat(P), Loc(L), IsCheckNext(isCheckNext) {} 23826cccfe1SChris Lattner }; 23926cccfe1SChris Lattner 240a2f8fc5aSChris Lattner /// CanonicalizeInputFile - Remove duplicate horizontal space from the specified 241a2f8fc5aSChris Lattner /// memory buffer, free it, and return a new one. 242a2f8fc5aSChris Lattner static MemoryBuffer *CanonicalizeInputFile(MemoryBuffer *MB) { 243a2f8fc5aSChris Lattner SmallVector<char, 16> NewFile; 244a2f8fc5aSChris Lattner NewFile.reserve(MB->getBufferSize()); 245a2f8fc5aSChris Lattner 246a2f8fc5aSChris Lattner for (const char *Ptr = MB->getBufferStart(), *End = MB->getBufferEnd(); 247a2f8fc5aSChris Lattner Ptr != End; ++Ptr) { 248a2f8fc5aSChris Lattner // If C is not a horizontal whitespace, skip it. 249a2f8fc5aSChris Lattner if (*Ptr != ' ' && *Ptr != '\t') { 250a2f8fc5aSChris Lattner NewFile.push_back(*Ptr); 251a2f8fc5aSChris Lattner continue; 252a2f8fc5aSChris Lattner } 253a2f8fc5aSChris Lattner 254a2f8fc5aSChris Lattner // Otherwise, add one space and advance over neighboring space. 255a2f8fc5aSChris Lattner NewFile.push_back(' '); 256a2f8fc5aSChris Lattner while (Ptr+1 != End && 257a2f8fc5aSChris Lattner (Ptr[1] == ' ' || Ptr[1] == '\t')) 258a2f8fc5aSChris Lattner ++Ptr; 259a2f8fc5aSChris Lattner } 260a2f8fc5aSChris Lattner 261a2f8fc5aSChris Lattner // Free the old buffer and return a new one. 262a2f8fc5aSChris Lattner MemoryBuffer *MB2 = 263a2f8fc5aSChris Lattner MemoryBuffer::getMemBufferCopy(NewFile.data(), 264a2f8fc5aSChris Lattner NewFile.data() + NewFile.size(), 265a2f8fc5aSChris Lattner MB->getBufferIdentifier()); 266a2f8fc5aSChris Lattner 267a2f8fc5aSChris Lattner delete MB; 268a2f8fc5aSChris Lattner return MB2; 269a2f8fc5aSChris Lattner } 270a2f8fc5aSChris Lattner 271ee3c74fbSChris Lattner 272ee3c74fbSChris Lattner /// ReadCheckFile - Read the check file, which specifies the sequence of 273ee3c74fbSChris Lattner /// expected strings. The strings are added to the CheckStrings vector. 274ee3c74fbSChris Lattner static bool ReadCheckFile(SourceMgr &SM, 27526cccfe1SChris Lattner std::vector<CheckString> &CheckStrings) { 276ee3c74fbSChris Lattner // Open the check file, and tell SourceMgr about it. 277ee3c74fbSChris Lattner std::string ErrorStr; 278ee3c74fbSChris Lattner MemoryBuffer *F = 279ee3c74fbSChris Lattner MemoryBuffer::getFileOrSTDIN(CheckFilename.c_str(), &ErrorStr); 280ee3c74fbSChris Lattner if (F == 0) { 281ee3c74fbSChris Lattner errs() << "Could not open check file '" << CheckFilename << "': " 282ee3c74fbSChris Lattner << ErrorStr << '\n'; 283ee3c74fbSChris Lattner return true; 284ee3c74fbSChris Lattner } 285a2f8fc5aSChris Lattner 286a2f8fc5aSChris Lattner // If we want to canonicalize whitespace, strip excess whitespace from the 287a2f8fc5aSChris Lattner // buffer containing the CHECK lines. 288a2f8fc5aSChris Lattner if (!NoCanonicalizeWhiteSpace) 289a2f8fc5aSChris Lattner F = CanonicalizeInputFile(F); 290a2f8fc5aSChris Lattner 291ee3c74fbSChris Lattner SM.AddNewSourceBuffer(F, SMLoc()); 292ee3c74fbSChris Lattner 29310f10cedSChris Lattner // Find all instances of CheckPrefix followed by : in the file. 294caa5fc0cSChris Lattner StringRef Buffer = F->getBuffer(); 295ee3c74fbSChris Lattner 29674d50731SChris Lattner std::vector<std::pair<SMLoc, Pattern> > NotMatches; 297236d2d5eSChris Lattner 298ee3c74fbSChris Lattner while (1) { 299ee3c74fbSChris Lattner // See if Prefix occurs in the memory buffer. 300caa5fc0cSChris Lattner Buffer = Buffer.substr(Buffer.find(CheckPrefix)); 301ee3c74fbSChris Lattner 302ee3c74fbSChris Lattner // If we didn't find a match, we're done. 303caa5fc0cSChris Lattner if (Buffer.empty()) 304ee3c74fbSChris Lattner break; 305ee3c74fbSChris Lattner 306caa5fc0cSChris Lattner const char *CheckPrefixStart = Buffer.data(); 307da108b4eSChris Lattner 308da108b4eSChris Lattner // When we find a check prefix, keep track of whether we find CHECK: or 309da108b4eSChris Lattner // CHECK-NEXT: 310236d2d5eSChris Lattner bool IsCheckNext = false, IsCheckNot = false; 311da108b4eSChris Lattner 31210f10cedSChris Lattner // Verify that the : is present after the prefix. 313caa5fc0cSChris Lattner if (Buffer[CheckPrefix.size()] == ':') { 314caa5fc0cSChris Lattner Buffer = Buffer.substr(CheckPrefix.size()+1); 315caa5fc0cSChris Lattner } else if (Buffer.size() > CheckPrefix.size()+6 && 316caa5fc0cSChris Lattner memcmp(Buffer.data()+CheckPrefix.size(), "-NEXT:", 6) == 0) { 317caa5fc0cSChris Lattner Buffer = Buffer.substr(CheckPrefix.size()+7); 318da108b4eSChris Lattner IsCheckNext = true; 319236d2d5eSChris Lattner } else if (Buffer.size() > CheckPrefix.size()+5 && 320236d2d5eSChris Lattner memcmp(Buffer.data()+CheckPrefix.size(), "-NOT:", 5) == 0) { 321236d2d5eSChris Lattner Buffer = Buffer.substr(CheckPrefix.size()+6); 322236d2d5eSChris Lattner IsCheckNot = true; 323da108b4eSChris Lattner } else { 324caa5fc0cSChris Lattner Buffer = Buffer.substr(1); 32510f10cedSChris Lattner continue; 32610f10cedSChris Lattner } 32710f10cedSChris Lattner 328ee3c74fbSChris Lattner // Okay, we found the prefix, yay. Remember the rest of the line, but 329ee3c74fbSChris Lattner // ignore leading and trailing whitespace. 330236d2d5eSChris Lattner Buffer = Buffer.substr(Buffer.find_first_not_of(" \t")); 331ee3c74fbSChris Lattner 332ee3c74fbSChris Lattner // Scan ahead to the end of line. 333caa5fc0cSChris Lattner size_t EOL = Buffer.find_first_of("\n\r"); 334ee3c74fbSChris Lattner 33574d50731SChris Lattner // Parse the pattern. 33674d50731SChris Lattner Pattern P; 33774d50731SChris Lattner if (P.ParsePattern(Buffer.substr(0, EOL), SM)) 338ee3c74fbSChris Lattner return true; 339ee3c74fbSChris Lattner 340236d2d5eSChris Lattner Buffer = Buffer.substr(EOL); 34174d50731SChris Lattner 342236d2d5eSChris Lattner 343da108b4eSChris Lattner // Verify that CHECK-NEXT lines have at least one CHECK line before them. 344da108b4eSChris Lattner if (IsCheckNext && CheckStrings.empty()) { 345da108b4eSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(CheckPrefixStart), 346da108b4eSChris Lattner "found '"+CheckPrefix+"-NEXT:' without previous '"+ 347da108b4eSChris Lattner CheckPrefix+ ": line", "error"); 348da108b4eSChris Lattner return true; 349da108b4eSChris Lattner } 350da108b4eSChris Lattner 35174d50731SChris Lattner // Handle CHECK-NOT. 35274d50731SChris Lattner if (IsCheckNot) { 35374d50731SChris Lattner NotMatches.push_back(std::make_pair(SMLoc::getFromPointer(Buffer.data()), 35474d50731SChris Lattner P)); 35574d50731SChris Lattner continue; 35674d50731SChris Lattner } 35774d50731SChris Lattner 3583b40b445SChris Lattner 359ee3c74fbSChris Lattner // Okay, add the string we captured to the output vector and move on. 3603b40b445SChris Lattner CheckStrings.push_back(CheckString(P, 361caa5fc0cSChris Lattner SMLoc::getFromPointer(Buffer.data()), 362da108b4eSChris Lattner IsCheckNext)); 363236d2d5eSChris Lattner std::swap(NotMatches, CheckStrings.back().NotStrings); 364ee3c74fbSChris Lattner } 365ee3c74fbSChris Lattner 366ee3c74fbSChris Lattner if (CheckStrings.empty()) { 36710f10cedSChris Lattner errs() << "error: no check strings found with prefix '" << CheckPrefix 36810f10cedSChris Lattner << ":'\n"; 369ee3c74fbSChris Lattner return true; 370ee3c74fbSChris Lattner } 371ee3c74fbSChris Lattner 372236d2d5eSChris Lattner if (!NotMatches.empty()) { 373236d2d5eSChris Lattner errs() << "error: '" << CheckPrefix 374236d2d5eSChris Lattner << "-NOT:' not supported after last check line.\n"; 375236d2d5eSChris Lattner return true; 376236d2d5eSChris Lattner } 377236d2d5eSChris Lattner 378ee3c74fbSChris Lattner return false; 379ee3c74fbSChris Lattner } 380ee3c74fbSChris Lattner 381da108b4eSChris Lattner static void PrintCheckFailed(const SourceMgr &SM, const CheckString &CheckStr, 382caa5fc0cSChris Lattner StringRef Buffer) { 383da108b4eSChris Lattner // Otherwise, we have an error, emit an error message. 384da108b4eSChris Lattner SM.PrintMessage(CheckStr.Loc, "expected string not found in input", 385da108b4eSChris Lattner "error"); 386da108b4eSChris Lattner 387da108b4eSChris Lattner // Print the "scanning from here" line. If the current position is at the 388da108b4eSChris Lattner // end of a line, advance to the start of the next line. 389caa5fc0cSChris Lattner Buffer = Buffer.substr(Buffer.find_first_not_of(" \t\n\r")); 390da108b4eSChris Lattner 391caa5fc0cSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), "scanning from here", 392da108b4eSChris Lattner "note"); 393da108b4eSChris Lattner } 394da108b4eSChris Lattner 39537183584SChris Lattner /// CountNumNewlinesBetween - Count the number of newlines in the specified 39637183584SChris Lattner /// range. 39737183584SChris Lattner static unsigned CountNumNewlinesBetween(StringRef Range) { 398da108b4eSChris Lattner unsigned NumNewLines = 0; 39937183584SChris Lattner while (1) { 400da108b4eSChris Lattner // Scan for newline. 40137183584SChris Lattner Range = Range.substr(Range.find_first_of("\n\r")); 40237183584SChris Lattner if (Range.empty()) return NumNewLines; 403da108b4eSChris Lattner 404da108b4eSChris Lattner ++NumNewLines; 405da108b4eSChris Lattner 406da108b4eSChris Lattner // Handle \n\r and \r\n as a single newline. 40737183584SChris Lattner if (Range.size() > 1 && 40837183584SChris Lattner (Range[1] == '\n' || Range[1] == '\r') && 40937183584SChris Lattner (Range[0] != Range[1])) 41037183584SChris Lattner Range = Range.substr(1); 41137183584SChris Lattner Range = Range.substr(1); 412da108b4eSChris Lattner } 413da108b4eSChris Lattner } 414da108b4eSChris Lattner 415ee3c74fbSChris Lattner int main(int argc, char **argv) { 416ee3c74fbSChris Lattner sys::PrintStackTraceOnErrorSignal(); 417ee3c74fbSChris Lattner PrettyStackTraceProgram X(argc, argv); 418ee3c74fbSChris Lattner cl::ParseCommandLineOptions(argc, argv); 419ee3c74fbSChris Lattner 420ee3c74fbSChris Lattner SourceMgr SM; 421ee3c74fbSChris Lattner 422ee3c74fbSChris Lattner // Read the expected strings from the check file. 42326cccfe1SChris Lattner std::vector<CheckString> CheckStrings; 424ee3c74fbSChris Lattner if (ReadCheckFile(SM, CheckStrings)) 425ee3c74fbSChris Lattner return 2; 426ee3c74fbSChris Lattner 427ee3c74fbSChris Lattner // Open the file to check and add it to SourceMgr. 428ee3c74fbSChris Lattner std::string ErrorStr; 429ee3c74fbSChris Lattner MemoryBuffer *F = 430ee3c74fbSChris Lattner MemoryBuffer::getFileOrSTDIN(InputFilename.c_str(), &ErrorStr); 431ee3c74fbSChris Lattner if (F == 0) { 432ee3c74fbSChris Lattner errs() << "Could not open input file '" << InputFilename << "': " 433ee3c74fbSChris Lattner << ErrorStr << '\n'; 434ee3c74fbSChris Lattner return true; 435ee3c74fbSChris Lattner } 4362c3e5cdfSChris Lattner 4372c3e5cdfSChris Lattner // Remove duplicate spaces in the input file if requested. 4382c3e5cdfSChris Lattner if (!NoCanonicalizeWhiteSpace) 4392c3e5cdfSChris Lattner F = CanonicalizeInputFile(F); 4402c3e5cdfSChris Lattner 441ee3c74fbSChris Lattner SM.AddNewSourceBuffer(F, SMLoc()); 442ee3c74fbSChris Lattner 443ee3c74fbSChris Lattner // Check that we have all of the expected strings, in order, in the input 444ee3c74fbSChris Lattner // file. 445caa5fc0cSChris Lattner StringRef Buffer = F->getBuffer(); 446ee3c74fbSChris Lattner 447236d2d5eSChris Lattner const char *LastMatch = Buffer.data(); 448236d2d5eSChris Lattner 449ee3c74fbSChris Lattner for (unsigned StrNo = 0, e = CheckStrings.size(); StrNo != e; ++StrNo) { 45026cccfe1SChris Lattner const CheckString &CheckStr = CheckStrings[StrNo]; 451ee3c74fbSChris Lattner 452caa5fc0cSChris Lattner StringRef SearchFrom = Buffer; 453caa5fc0cSChris Lattner 454ee3c74fbSChris Lattner // Find StrNo in the file. 4553b40b445SChris Lattner size_t MatchLen = 0; 4563b40b445SChris Lattner Buffer = Buffer.substr(CheckStr.Pat.Match(Buffer, MatchLen)); 457ee3c74fbSChris Lattner 458da108b4eSChris Lattner // If we didn't find a match, reject the input. 459caa5fc0cSChris Lattner if (Buffer.empty()) { 460caa5fc0cSChris Lattner PrintCheckFailed(SM, CheckStr, SearchFrom); 461da108b4eSChris Lattner return 1; 462ee3c74fbSChris Lattner } 463ee3c74fbSChris Lattner 46437183584SChris Lattner StringRef SkippedRegion(LastMatch, Buffer.data()-LastMatch); 46537183584SChris Lattner 466da108b4eSChris Lattner // If this check is a "CHECK-NEXT", verify that the previous match was on 467da108b4eSChris Lattner // the previous line (i.e. that there is one newline between them). 468da108b4eSChris Lattner if (CheckStr.IsCheckNext) { 469da108b4eSChris Lattner // Count the number of newlines between the previous match and this one. 470236d2d5eSChris Lattner assert(LastMatch != F->getBufferStart() && 471236d2d5eSChris Lattner "CHECK-NEXT can't be the first check in a file"); 472da108b4eSChris Lattner 47337183584SChris Lattner unsigned NumNewLines = CountNumNewlinesBetween(SkippedRegion); 474da108b4eSChris Lattner if (NumNewLines == 0) { 475107c21eaSChris Lattner SM.PrintMessage(CheckStr.Loc, 476da108b4eSChris Lattner CheckPrefix+"-NEXT: is on the same line as previous match", 477ee3c74fbSChris Lattner "error"); 478caa5fc0cSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), 479107c21eaSChris Lattner "'next' match was here", "note"); 480da108b4eSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(LastMatch), 481da108b4eSChris Lattner "previous match was here", "note"); 482aedd8185SChris Lattner return 1; 483ee3c74fbSChris Lattner } 484ee3c74fbSChris Lattner 485da108b4eSChris Lattner if (NumNewLines != 1) { 486107c21eaSChris Lattner SM.PrintMessage(CheckStr.Loc, 487da108b4eSChris Lattner CheckPrefix+ 488da108b4eSChris Lattner "-NEXT: is not on the line after the previous match", 489da108b4eSChris Lattner "error"); 490caa5fc0cSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), 491107c21eaSChris Lattner "'next' match was here", "note"); 492da108b4eSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(LastMatch), 493da108b4eSChris Lattner "previous match was here", "note"); 494da108b4eSChris Lattner return 1; 495da108b4eSChris Lattner } 496da108b4eSChris Lattner } 497da108b4eSChris Lattner 498236d2d5eSChris Lattner // If this match had "not strings", verify that they don't exist in the 499236d2d5eSChris Lattner // skipped region. 500f08d2db9SChris Lattner for (unsigned ChunkNo = 0, e = CheckStr.NotStrings.size(); ChunkNo != e; ++ChunkNo) { 50174d50731SChris Lattner size_t MatchLen = 0; 502f08d2db9SChris Lattner size_t Pos = CheckStr.NotStrings[ChunkNo].second.Match(SkippedRegion, MatchLen); 503236d2d5eSChris Lattner if (Pos == StringRef::npos) continue; 504236d2d5eSChris Lattner 505236d2d5eSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(LastMatch+Pos), 506236d2d5eSChris Lattner CheckPrefix+"-NOT: string occurred!", "error"); 507f08d2db9SChris Lattner SM.PrintMessage(CheckStr.NotStrings[ChunkNo].first, 508236d2d5eSChris Lattner CheckPrefix+"-NOT: pattern specified here", "note"); 509236d2d5eSChris Lattner return 1; 510236d2d5eSChris Lattner } 511236d2d5eSChris Lattner 512236d2d5eSChris Lattner 513b9f2bf46SChris Lattner // Otherwise, everything is good. Step over the matched text and remember 514b9f2bf46SChris Lattner // the position after the match as the end of the last match. 5153b40b445SChris Lattner Buffer = Buffer.substr(MatchLen); 516b9f2bf46SChris Lattner LastMatch = Buffer.data(); 517da108b4eSChris Lattner } 518da108b4eSChris Lattner 519ee3c74fbSChris Lattner return 0; 520ee3c74fbSChris Lattner } 521