1ee3c74fbSChris Lattner //===- FileCheck.cpp - Check that File's Contents match what is expected --===// 2ee3c74fbSChris Lattner // 3ee3c74fbSChris Lattner // The LLVM Compiler Infrastructure 4ee3c74fbSChris Lattner // 5ee3c74fbSChris Lattner // This file is distributed under the University of Illinois Open Source 6ee3c74fbSChris Lattner // License. See LICENSE.TXT for details. 7ee3c74fbSChris Lattner // 8ee3c74fbSChris Lattner //===----------------------------------------------------------------------===// 9ee3c74fbSChris Lattner // 10ee3c74fbSChris Lattner // FileCheck does a line-by line check of a file that validates whether it 11ee3c74fbSChris Lattner // contains the expected content. This is useful for regression tests etc. 12ee3c74fbSChris Lattner // 13ee3c74fbSChris Lattner // This program exits with an error status of 2 on error, exit status of 0 if 14ee3c74fbSChris Lattner // the file matched the expected contents, and exit status of 1 if it did not 15ee3c74fbSChris Lattner // contain the expected contents. 16ee3c74fbSChris Lattner // 17ee3c74fbSChris Lattner //===----------------------------------------------------------------------===// 18ee3c74fbSChris Lattner 19ee3c74fbSChris Lattner #include "llvm/Support/CommandLine.h" 20ee3c74fbSChris Lattner #include "llvm/Support/MemoryBuffer.h" 21ee3c74fbSChris Lattner #include "llvm/Support/PrettyStackTrace.h" 22f08d2db9SChris Lattner #include "llvm/Support/Regex.h" 23ee3c74fbSChris Lattner #include "llvm/Support/SourceMgr.h" 24ee3c74fbSChris Lattner #include "llvm/Support/raw_ostream.h" 25ee3c74fbSChris Lattner #include "llvm/System/Signals.h" 26ee3c74fbSChris Lattner using namespace llvm; 27ee3c74fbSChris Lattner 28ee3c74fbSChris Lattner static cl::opt<std::string> 29ee3c74fbSChris Lattner CheckFilename(cl::Positional, cl::desc("<check-file>"), cl::Required); 30ee3c74fbSChris Lattner 31ee3c74fbSChris Lattner static cl::opt<std::string> 32ee3c74fbSChris Lattner InputFilename("input-file", cl::desc("File to check (defaults to stdin)"), 33ee3c74fbSChris Lattner cl::init("-"), cl::value_desc("filename")); 34ee3c74fbSChris Lattner 35ee3c74fbSChris Lattner static cl::opt<std::string> 36ee3c74fbSChris Lattner CheckPrefix("check-prefix", cl::init("CHECK"), 37ee3c74fbSChris Lattner cl::desc("Prefix to use from check file (defaults to 'CHECK')")); 38ee3c74fbSChris Lattner 392c3e5cdfSChris Lattner static cl::opt<bool> 402c3e5cdfSChris Lattner NoCanonicalizeWhiteSpace("strict-whitespace", 412c3e5cdfSChris Lattner cl::desc("Do not treat all horizontal whitespace as equivalent")); 422c3e5cdfSChris Lattner 4374d50731SChris Lattner //===----------------------------------------------------------------------===// 4474d50731SChris Lattner // Pattern Handling Code. 4574d50731SChris Lattner //===----------------------------------------------------------------------===// 4674d50731SChris Lattner 47b121a24fSChris Lattner class PatternChunk { 48b121a24fSChris Lattner StringRef Str; 49b121a24fSChris Lattner bool isRegEx; 50b121a24fSChris Lattner public: 51b121a24fSChris Lattner PatternChunk(StringRef S, bool isRE) : Str(S), isRegEx(isRE) {} 52b121a24fSChris Lattner 53b121a24fSChris Lattner size_t Match(StringRef Buffer, size_t &MatchLen) const { 54b121a24fSChris Lattner if (!isRegEx) { 55b121a24fSChris Lattner // Fixed string match. 56b121a24fSChris Lattner MatchLen = Str.size(); 57b121a24fSChris Lattner return Buffer.find(Str); 58b121a24fSChris Lattner } 59b121a24fSChris Lattner 60b121a24fSChris Lattner // Regex match. 61b121a24fSChris Lattner SmallVector<StringRef, 4> MatchInfo; 62*712e8e03SChris Lattner if (!Regex(Str, Regex::Sub|Regex::Newline).match(Buffer, &MatchInfo)) 63b121a24fSChris Lattner return StringRef::npos; 64b121a24fSChris Lattner 65b121a24fSChris Lattner // Successful regex match. 66b121a24fSChris Lattner assert(!MatchInfo.empty() && "Didn't get any match"); 67b121a24fSChris Lattner StringRef FullMatch = MatchInfo[0]; 68b121a24fSChris Lattner 69b121a24fSChris Lattner MatchLen = FullMatch.size(); 70b121a24fSChris Lattner return FullMatch.data()-Buffer.data(); 71b121a24fSChris Lattner } 72b121a24fSChris Lattner }; 73b121a24fSChris Lattner 743b40b445SChris Lattner class Pattern { 75f08d2db9SChris Lattner /// Chunks - The pattern chunks to match. If the bool is false, it is a fixed 76f08d2db9SChris Lattner /// string match, if it is true, it is a regex match. 77b121a24fSChris Lattner SmallVector<PatternChunk, 4> Chunks; 783b40b445SChris Lattner public: 793b40b445SChris Lattner 8074d50731SChris Lattner Pattern() { } 8174d50731SChris Lattner 8274d50731SChris Lattner bool ParsePattern(StringRef PatternStr, SourceMgr &SM); 833b40b445SChris Lattner 843b40b445SChris Lattner /// Match - Match the pattern string against the input buffer Buffer. This 853b40b445SChris Lattner /// returns the position that is matched or npos if there is no match. If 863b40b445SChris Lattner /// there is a match, the size of the matched string is returned in MatchLen. 87f08d2db9SChris Lattner size_t Match(StringRef Buffer, size_t &MatchLen) const; 883b40b445SChris Lattner }; 893b40b445SChris Lattner 9074d50731SChris Lattner bool Pattern::ParsePattern(StringRef PatternStr, SourceMgr &SM) { 9174d50731SChris Lattner // Ignore trailing whitespace. 9274d50731SChris Lattner while (!PatternStr.empty() && 9374d50731SChris Lattner (PatternStr.back() == ' ' || PatternStr.back() == '\t')) 9474d50731SChris Lattner PatternStr = PatternStr.substr(0, PatternStr.size()-1); 9574d50731SChris Lattner 9674d50731SChris Lattner // Check that there is something on the line. 9774d50731SChris Lattner if (PatternStr.empty()) { 9874d50731SChris Lattner SM.PrintMessage(SMLoc::getFromPointer(PatternStr.data()), 9974d50731SChris Lattner "found empty check string with prefix '"+CheckPrefix+":'", 10074d50731SChris Lattner "error"); 10174d50731SChris Lattner return true; 10274d50731SChris Lattner } 10374d50731SChris Lattner 104f08d2db9SChris Lattner // Scan the pattern to break it into regex and non-regex pieces. 105f08d2db9SChris Lattner while (!PatternStr.empty()) { 106f08d2db9SChris Lattner // Handle fixed string matches. 107f08d2db9SChris Lattner if (PatternStr.size() < 2 || 108f08d2db9SChris Lattner PatternStr[0] != '{' || PatternStr[1] != '{') { 109f08d2db9SChris Lattner // Find the end, which is the start of the next regex. 110f08d2db9SChris Lattner size_t FixedMatchEnd = PatternStr.find("{{"); 11174d50731SChris Lattner 112b121a24fSChris Lattner Chunks.push_back(PatternChunk(PatternStr.substr(0, FixedMatchEnd),false)); 113f08d2db9SChris Lattner PatternStr = PatternStr.substr(FixedMatchEnd); 114f08d2db9SChris Lattner continue; 115f08d2db9SChris Lattner } 11674d50731SChris Lattner 117f08d2db9SChris Lattner // Otherwise, this is the start of a regex match. Scan for the }}. 118f08d2db9SChris Lattner size_t End = PatternStr.find("}}"); 119f08d2db9SChris Lattner if (End == StringRef::npos) { 120f08d2db9SChris Lattner SM.PrintMessage(SMLoc::getFromPointer(PatternStr.data()), 121f08d2db9SChris Lattner "found start of regex string with no end '}}'", "error"); 122f08d2db9SChris Lattner return true; 123f08d2db9SChris Lattner } 124f08d2db9SChris Lattner 125f08d2db9SChris Lattner Regex R(PatternStr.substr(2, End-2)); 126f08d2db9SChris Lattner std::string Error; 127f08d2db9SChris Lattner if (!R.isValid(Error)) { 128f08d2db9SChris Lattner SM.PrintMessage(SMLoc::getFromPointer(PatternStr.data()+2), 129f08d2db9SChris Lattner "invalid regex: " + Error, "error"); 130f08d2db9SChris Lattner return true; 131f08d2db9SChris Lattner } 132f08d2db9SChris Lattner 133b121a24fSChris Lattner Chunks.push_back(PatternChunk(PatternStr.substr(2, End-2), true)); 134f08d2db9SChris Lattner PatternStr = PatternStr.substr(End+2); 135f08d2db9SChris Lattner } 136f08d2db9SChris Lattner 13774d50731SChris Lattner return false; 13874d50731SChris Lattner } 13974d50731SChris Lattner 140f08d2db9SChris Lattner /// Match - Match the pattern string against the input buffer Buffer. This 141f08d2db9SChris Lattner /// returns the position that is matched or npos if there is no match. If 142f08d2db9SChris Lattner /// there is a match, the size of the matched string is returned in MatchLen. 143f08d2db9SChris Lattner size_t Pattern::Match(StringRef Buffer, size_t &MatchLen) const { 144f08d2db9SChris Lattner size_t FirstMatch = StringRef::npos; 145f08d2db9SChris Lattner MatchLen = 0; 146f08d2db9SChris Lattner 147f08d2db9SChris Lattner while (!Buffer.empty()) { 148f08d2db9SChris Lattner StringRef MatchAttempt = Buffer; 149f08d2db9SChris Lattner 150f08d2db9SChris Lattner unsigned ChunkNo = 0, e = Chunks.size(); 151f08d2db9SChris Lattner for (; ChunkNo != e; ++ChunkNo) { 152b121a24fSChris Lattner size_t ThisMatch, ThisLength = StringRef::npos; 153b121a24fSChris Lattner ThisMatch = Chunks[ChunkNo].Match(MatchAttempt, ThisLength); 154f08d2db9SChris Lattner 155f08d2db9SChris Lattner // Otherwise, what we do depends on if this is the first match or not. If 156f08d2db9SChris Lattner // this is the first match, it doesn't match to match at the start of 157f08d2db9SChris Lattner // MatchAttempt. 158f08d2db9SChris Lattner if (ChunkNo == 0) { 159f08d2db9SChris Lattner // If the first match fails then this pattern will never match in 160f08d2db9SChris Lattner // Buffer. 161f08d2db9SChris Lattner if (ThisMatch == StringRef::npos) 162f08d2db9SChris Lattner return ThisMatch; 163f08d2db9SChris Lattner 164f08d2db9SChris Lattner FirstMatch = ThisMatch; 165f08d2db9SChris Lattner MatchAttempt = MatchAttempt.substr(FirstMatch); 166f08d2db9SChris Lattner ThisMatch = 0; 167f08d2db9SChris Lattner } 168f08d2db9SChris Lattner 169f08d2db9SChris Lattner // If this chunk didn't match, then the entire pattern didn't match from 170f08d2db9SChris Lattner // FirstMatch, try later in the buffer. 171f08d2db9SChris Lattner if (ThisMatch == StringRef::npos) 172f08d2db9SChris Lattner break; 173f08d2db9SChris Lattner 174f08d2db9SChris Lattner // Ok, if the match didn't match at the beginning of MatchAttempt, then we 175f08d2db9SChris Lattner // have something like "ABC{{DEF}} and something was in-between. Reject 176f08d2db9SChris Lattner // the match. 177f08d2db9SChris Lattner if (ThisMatch != 0) 178f08d2db9SChris Lattner break; 179f08d2db9SChris Lattner 180f08d2db9SChris Lattner // Otherwise, match the string and move to the next chunk. 181f08d2db9SChris Lattner MatchLen += ThisLength; 182f08d2db9SChris Lattner MatchAttempt = MatchAttempt.substr(ThisLength); 183f08d2db9SChris Lattner } 184f08d2db9SChris Lattner 185f08d2db9SChris Lattner // If the whole thing matched, we win. 186f08d2db9SChris Lattner if (ChunkNo == e) 187f08d2db9SChris Lattner return FirstMatch; 188f08d2db9SChris Lattner 189f08d2db9SChris Lattner // Otherwise, try matching again after FirstMatch to see if this pattern 190f08d2db9SChris Lattner // matches later in the buffer. 191f08d2db9SChris Lattner Buffer = Buffer.substr(FirstMatch+1); 192f08d2db9SChris Lattner } 193f08d2db9SChris Lattner 194f08d2db9SChris Lattner // If we ran out of stuff to scan, then we didn't match. 195f08d2db9SChris Lattner return StringRef::npos; 196f08d2db9SChris Lattner } 197f08d2db9SChris Lattner 19874d50731SChris Lattner 19974d50731SChris Lattner //===----------------------------------------------------------------------===// 20074d50731SChris Lattner // Check Strings. 20174d50731SChris Lattner //===----------------------------------------------------------------------===// 2023b40b445SChris Lattner 2033b40b445SChris Lattner /// CheckString - This is a check that we found in the input file. 2043b40b445SChris Lattner struct CheckString { 2053b40b445SChris Lattner /// Pat - The pattern to match. 2063b40b445SChris Lattner Pattern Pat; 20726cccfe1SChris Lattner 20826cccfe1SChris Lattner /// Loc - The location in the match file that the check string was specified. 20926cccfe1SChris Lattner SMLoc Loc; 21026cccfe1SChris Lattner 211da108b4eSChris Lattner /// IsCheckNext - This is true if this is a CHECK-NEXT: directive (as opposed 212da108b4eSChris Lattner /// to a CHECK: directive. 213da108b4eSChris Lattner bool IsCheckNext; 214da108b4eSChris Lattner 215236d2d5eSChris Lattner /// NotStrings - These are all of the strings that are disallowed from 216236d2d5eSChris Lattner /// occurring between this match string and the previous one (or start of 217236d2d5eSChris Lattner /// file). 21874d50731SChris Lattner std::vector<std::pair<SMLoc, Pattern> > NotStrings; 219236d2d5eSChris Lattner 2203b40b445SChris Lattner CheckString(const Pattern &P, SMLoc L, bool isCheckNext) 2213b40b445SChris Lattner : Pat(P), Loc(L), IsCheckNext(isCheckNext) {} 22226cccfe1SChris Lattner }; 22326cccfe1SChris Lattner 224a2f8fc5aSChris Lattner /// CanonicalizeInputFile - Remove duplicate horizontal space from the specified 225a2f8fc5aSChris Lattner /// memory buffer, free it, and return a new one. 226a2f8fc5aSChris Lattner static MemoryBuffer *CanonicalizeInputFile(MemoryBuffer *MB) { 227a2f8fc5aSChris Lattner SmallVector<char, 16> NewFile; 228a2f8fc5aSChris Lattner NewFile.reserve(MB->getBufferSize()); 229a2f8fc5aSChris Lattner 230a2f8fc5aSChris Lattner for (const char *Ptr = MB->getBufferStart(), *End = MB->getBufferEnd(); 231a2f8fc5aSChris Lattner Ptr != End; ++Ptr) { 232a2f8fc5aSChris Lattner // If C is not a horizontal whitespace, skip it. 233a2f8fc5aSChris Lattner if (*Ptr != ' ' && *Ptr != '\t') { 234a2f8fc5aSChris Lattner NewFile.push_back(*Ptr); 235a2f8fc5aSChris Lattner continue; 236a2f8fc5aSChris Lattner } 237a2f8fc5aSChris Lattner 238a2f8fc5aSChris Lattner // Otherwise, add one space and advance over neighboring space. 239a2f8fc5aSChris Lattner NewFile.push_back(' '); 240a2f8fc5aSChris Lattner while (Ptr+1 != End && 241a2f8fc5aSChris Lattner (Ptr[1] == ' ' || Ptr[1] == '\t')) 242a2f8fc5aSChris Lattner ++Ptr; 243a2f8fc5aSChris Lattner } 244a2f8fc5aSChris Lattner 245a2f8fc5aSChris Lattner // Free the old buffer and return a new one. 246a2f8fc5aSChris Lattner MemoryBuffer *MB2 = 247a2f8fc5aSChris Lattner MemoryBuffer::getMemBufferCopy(NewFile.data(), 248a2f8fc5aSChris Lattner NewFile.data() + NewFile.size(), 249a2f8fc5aSChris Lattner MB->getBufferIdentifier()); 250a2f8fc5aSChris Lattner 251a2f8fc5aSChris Lattner delete MB; 252a2f8fc5aSChris Lattner return MB2; 253a2f8fc5aSChris Lattner } 254a2f8fc5aSChris Lattner 255ee3c74fbSChris Lattner 256ee3c74fbSChris Lattner /// ReadCheckFile - Read the check file, which specifies the sequence of 257ee3c74fbSChris Lattner /// expected strings. The strings are added to the CheckStrings vector. 258ee3c74fbSChris Lattner static bool ReadCheckFile(SourceMgr &SM, 25926cccfe1SChris Lattner std::vector<CheckString> &CheckStrings) { 260ee3c74fbSChris Lattner // Open the check file, and tell SourceMgr about it. 261ee3c74fbSChris Lattner std::string ErrorStr; 262ee3c74fbSChris Lattner MemoryBuffer *F = 263ee3c74fbSChris Lattner MemoryBuffer::getFileOrSTDIN(CheckFilename.c_str(), &ErrorStr); 264ee3c74fbSChris Lattner if (F == 0) { 265ee3c74fbSChris Lattner errs() << "Could not open check file '" << CheckFilename << "': " 266ee3c74fbSChris Lattner << ErrorStr << '\n'; 267ee3c74fbSChris Lattner return true; 268ee3c74fbSChris Lattner } 269a2f8fc5aSChris Lattner 270a2f8fc5aSChris Lattner // If we want to canonicalize whitespace, strip excess whitespace from the 271a2f8fc5aSChris Lattner // buffer containing the CHECK lines. 272a2f8fc5aSChris Lattner if (!NoCanonicalizeWhiteSpace) 273a2f8fc5aSChris Lattner F = CanonicalizeInputFile(F); 274a2f8fc5aSChris Lattner 275ee3c74fbSChris Lattner SM.AddNewSourceBuffer(F, SMLoc()); 276ee3c74fbSChris Lattner 27710f10cedSChris Lattner // Find all instances of CheckPrefix followed by : in the file. 278caa5fc0cSChris Lattner StringRef Buffer = F->getBuffer(); 279ee3c74fbSChris Lattner 28074d50731SChris Lattner std::vector<std::pair<SMLoc, Pattern> > NotMatches; 281236d2d5eSChris Lattner 282ee3c74fbSChris Lattner while (1) { 283ee3c74fbSChris Lattner // See if Prefix occurs in the memory buffer. 284caa5fc0cSChris Lattner Buffer = Buffer.substr(Buffer.find(CheckPrefix)); 285ee3c74fbSChris Lattner 286ee3c74fbSChris Lattner // If we didn't find a match, we're done. 287caa5fc0cSChris Lattner if (Buffer.empty()) 288ee3c74fbSChris Lattner break; 289ee3c74fbSChris Lattner 290caa5fc0cSChris Lattner const char *CheckPrefixStart = Buffer.data(); 291da108b4eSChris Lattner 292da108b4eSChris Lattner // When we find a check prefix, keep track of whether we find CHECK: or 293da108b4eSChris Lattner // CHECK-NEXT: 294236d2d5eSChris Lattner bool IsCheckNext = false, IsCheckNot = false; 295da108b4eSChris Lattner 29610f10cedSChris Lattner // Verify that the : is present after the prefix. 297caa5fc0cSChris Lattner if (Buffer[CheckPrefix.size()] == ':') { 298caa5fc0cSChris Lattner Buffer = Buffer.substr(CheckPrefix.size()+1); 299caa5fc0cSChris Lattner } else if (Buffer.size() > CheckPrefix.size()+6 && 300caa5fc0cSChris Lattner memcmp(Buffer.data()+CheckPrefix.size(), "-NEXT:", 6) == 0) { 301caa5fc0cSChris Lattner Buffer = Buffer.substr(CheckPrefix.size()+7); 302da108b4eSChris Lattner IsCheckNext = true; 303236d2d5eSChris Lattner } else if (Buffer.size() > CheckPrefix.size()+5 && 304236d2d5eSChris Lattner memcmp(Buffer.data()+CheckPrefix.size(), "-NOT:", 5) == 0) { 305236d2d5eSChris Lattner Buffer = Buffer.substr(CheckPrefix.size()+6); 306236d2d5eSChris Lattner IsCheckNot = true; 307da108b4eSChris Lattner } else { 308caa5fc0cSChris Lattner Buffer = Buffer.substr(1); 30910f10cedSChris Lattner continue; 31010f10cedSChris Lattner } 31110f10cedSChris Lattner 312ee3c74fbSChris Lattner // Okay, we found the prefix, yay. Remember the rest of the line, but 313ee3c74fbSChris Lattner // ignore leading and trailing whitespace. 314236d2d5eSChris Lattner Buffer = Buffer.substr(Buffer.find_first_not_of(" \t")); 315ee3c74fbSChris Lattner 316ee3c74fbSChris Lattner // Scan ahead to the end of line. 317caa5fc0cSChris Lattner size_t EOL = Buffer.find_first_of("\n\r"); 318ee3c74fbSChris Lattner 31974d50731SChris Lattner // Parse the pattern. 32074d50731SChris Lattner Pattern P; 32174d50731SChris Lattner if (P.ParsePattern(Buffer.substr(0, EOL), SM)) 322ee3c74fbSChris Lattner return true; 323ee3c74fbSChris Lattner 324236d2d5eSChris Lattner Buffer = Buffer.substr(EOL); 32574d50731SChris Lattner 326236d2d5eSChris Lattner 327da108b4eSChris Lattner // Verify that CHECK-NEXT lines have at least one CHECK line before them. 328da108b4eSChris Lattner if (IsCheckNext && CheckStrings.empty()) { 329da108b4eSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(CheckPrefixStart), 330da108b4eSChris Lattner "found '"+CheckPrefix+"-NEXT:' without previous '"+ 331da108b4eSChris Lattner CheckPrefix+ ": line", "error"); 332da108b4eSChris Lattner return true; 333da108b4eSChris Lattner } 334da108b4eSChris Lattner 33574d50731SChris Lattner // Handle CHECK-NOT. 33674d50731SChris Lattner if (IsCheckNot) { 33774d50731SChris Lattner NotMatches.push_back(std::make_pair(SMLoc::getFromPointer(Buffer.data()), 33874d50731SChris Lattner P)); 33974d50731SChris Lattner continue; 34074d50731SChris Lattner } 34174d50731SChris Lattner 3423b40b445SChris Lattner 343ee3c74fbSChris Lattner // Okay, add the string we captured to the output vector and move on. 3443b40b445SChris Lattner CheckStrings.push_back(CheckString(P, 345caa5fc0cSChris Lattner SMLoc::getFromPointer(Buffer.data()), 346da108b4eSChris Lattner IsCheckNext)); 347236d2d5eSChris Lattner std::swap(NotMatches, CheckStrings.back().NotStrings); 348ee3c74fbSChris Lattner } 349ee3c74fbSChris Lattner 350ee3c74fbSChris Lattner if (CheckStrings.empty()) { 35110f10cedSChris Lattner errs() << "error: no check strings found with prefix '" << CheckPrefix 35210f10cedSChris Lattner << ":'\n"; 353ee3c74fbSChris Lattner return true; 354ee3c74fbSChris Lattner } 355ee3c74fbSChris Lattner 356236d2d5eSChris Lattner if (!NotMatches.empty()) { 357236d2d5eSChris Lattner errs() << "error: '" << CheckPrefix 358236d2d5eSChris Lattner << "-NOT:' not supported after last check line.\n"; 359236d2d5eSChris Lattner return true; 360236d2d5eSChris Lattner } 361236d2d5eSChris Lattner 362ee3c74fbSChris Lattner return false; 363ee3c74fbSChris Lattner } 364ee3c74fbSChris Lattner 365da108b4eSChris Lattner static void PrintCheckFailed(const SourceMgr &SM, const CheckString &CheckStr, 366caa5fc0cSChris Lattner StringRef Buffer) { 367da108b4eSChris Lattner // Otherwise, we have an error, emit an error message. 368da108b4eSChris Lattner SM.PrintMessage(CheckStr.Loc, "expected string not found in input", 369da108b4eSChris Lattner "error"); 370da108b4eSChris Lattner 371da108b4eSChris Lattner // Print the "scanning from here" line. If the current position is at the 372da108b4eSChris Lattner // end of a line, advance to the start of the next line. 373caa5fc0cSChris Lattner Buffer = Buffer.substr(Buffer.find_first_not_of(" \t\n\r")); 374da108b4eSChris Lattner 375caa5fc0cSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), "scanning from here", 376da108b4eSChris Lattner "note"); 377da108b4eSChris Lattner } 378da108b4eSChris Lattner 37937183584SChris Lattner /// CountNumNewlinesBetween - Count the number of newlines in the specified 38037183584SChris Lattner /// range. 38137183584SChris Lattner static unsigned CountNumNewlinesBetween(StringRef Range) { 382da108b4eSChris Lattner unsigned NumNewLines = 0; 38337183584SChris Lattner while (1) { 384da108b4eSChris Lattner // Scan for newline. 38537183584SChris Lattner Range = Range.substr(Range.find_first_of("\n\r")); 38637183584SChris Lattner if (Range.empty()) return NumNewLines; 387da108b4eSChris Lattner 388da108b4eSChris Lattner ++NumNewLines; 389da108b4eSChris Lattner 390da108b4eSChris Lattner // Handle \n\r and \r\n as a single newline. 39137183584SChris Lattner if (Range.size() > 1 && 39237183584SChris Lattner (Range[1] == '\n' || Range[1] == '\r') && 39337183584SChris Lattner (Range[0] != Range[1])) 39437183584SChris Lattner Range = Range.substr(1); 39537183584SChris Lattner Range = Range.substr(1); 396da108b4eSChris Lattner } 397da108b4eSChris Lattner } 398da108b4eSChris Lattner 399ee3c74fbSChris Lattner int main(int argc, char **argv) { 400ee3c74fbSChris Lattner sys::PrintStackTraceOnErrorSignal(); 401ee3c74fbSChris Lattner PrettyStackTraceProgram X(argc, argv); 402ee3c74fbSChris Lattner cl::ParseCommandLineOptions(argc, argv); 403ee3c74fbSChris Lattner 404ee3c74fbSChris Lattner SourceMgr SM; 405ee3c74fbSChris Lattner 406ee3c74fbSChris Lattner // Read the expected strings from the check file. 40726cccfe1SChris Lattner std::vector<CheckString> CheckStrings; 408ee3c74fbSChris Lattner if (ReadCheckFile(SM, CheckStrings)) 409ee3c74fbSChris Lattner return 2; 410ee3c74fbSChris Lattner 411ee3c74fbSChris Lattner // Open the file to check and add it to SourceMgr. 412ee3c74fbSChris Lattner std::string ErrorStr; 413ee3c74fbSChris Lattner MemoryBuffer *F = 414ee3c74fbSChris Lattner MemoryBuffer::getFileOrSTDIN(InputFilename.c_str(), &ErrorStr); 415ee3c74fbSChris Lattner if (F == 0) { 416ee3c74fbSChris Lattner errs() << "Could not open input file '" << InputFilename << "': " 417ee3c74fbSChris Lattner << ErrorStr << '\n'; 418ee3c74fbSChris Lattner return true; 419ee3c74fbSChris Lattner } 4202c3e5cdfSChris Lattner 4212c3e5cdfSChris Lattner // Remove duplicate spaces in the input file if requested. 4222c3e5cdfSChris Lattner if (!NoCanonicalizeWhiteSpace) 4232c3e5cdfSChris Lattner F = CanonicalizeInputFile(F); 4242c3e5cdfSChris Lattner 425ee3c74fbSChris Lattner SM.AddNewSourceBuffer(F, SMLoc()); 426ee3c74fbSChris Lattner 427ee3c74fbSChris Lattner // Check that we have all of the expected strings, in order, in the input 428ee3c74fbSChris Lattner // file. 429caa5fc0cSChris Lattner StringRef Buffer = F->getBuffer(); 430ee3c74fbSChris Lattner 431236d2d5eSChris Lattner const char *LastMatch = Buffer.data(); 432236d2d5eSChris Lattner 433ee3c74fbSChris Lattner for (unsigned StrNo = 0, e = CheckStrings.size(); StrNo != e; ++StrNo) { 43426cccfe1SChris Lattner const CheckString &CheckStr = CheckStrings[StrNo]; 435ee3c74fbSChris Lattner 436caa5fc0cSChris Lattner StringRef SearchFrom = Buffer; 437caa5fc0cSChris Lattner 438ee3c74fbSChris Lattner // Find StrNo in the file. 4393b40b445SChris Lattner size_t MatchLen = 0; 4403b40b445SChris Lattner Buffer = Buffer.substr(CheckStr.Pat.Match(Buffer, MatchLen)); 441ee3c74fbSChris Lattner 442da108b4eSChris Lattner // If we didn't find a match, reject the input. 443caa5fc0cSChris Lattner if (Buffer.empty()) { 444caa5fc0cSChris Lattner PrintCheckFailed(SM, CheckStr, SearchFrom); 445da108b4eSChris Lattner return 1; 446ee3c74fbSChris Lattner } 447ee3c74fbSChris Lattner 44837183584SChris Lattner StringRef SkippedRegion(LastMatch, Buffer.data()-LastMatch); 44937183584SChris Lattner 450da108b4eSChris Lattner // If this check is a "CHECK-NEXT", verify that the previous match was on 451da108b4eSChris Lattner // the previous line (i.e. that there is one newline between them). 452da108b4eSChris Lattner if (CheckStr.IsCheckNext) { 453da108b4eSChris Lattner // Count the number of newlines between the previous match and this one. 454236d2d5eSChris Lattner assert(LastMatch != F->getBufferStart() && 455236d2d5eSChris Lattner "CHECK-NEXT can't be the first check in a file"); 456da108b4eSChris Lattner 45737183584SChris Lattner unsigned NumNewLines = CountNumNewlinesBetween(SkippedRegion); 458da108b4eSChris Lattner if (NumNewLines == 0) { 459107c21eaSChris Lattner SM.PrintMessage(CheckStr.Loc, 460da108b4eSChris Lattner CheckPrefix+"-NEXT: is on the same line as previous match", 461ee3c74fbSChris Lattner "error"); 462caa5fc0cSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), 463107c21eaSChris Lattner "'next' match was here", "note"); 464da108b4eSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(LastMatch), 465da108b4eSChris Lattner "previous match was here", "note"); 466aedd8185SChris Lattner return 1; 467ee3c74fbSChris Lattner } 468ee3c74fbSChris Lattner 469da108b4eSChris Lattner if (NumNewLines != 1) { 470107c21eaSChris Lattner SM.PrintMessage(CheckStr.Loc, 471da108b4eSChris Lattner CheckPrefix+ 472da108b4eSChris Lattner "-NEXT: is not on the line after the previous match", 473da108b4eSChris Lattner "error"); 474caa5fc0cSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), 475107c21eaSChris Lattner "'next' match was here", "note"); 476da108b4eSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(LastMatch), 477da108b4eSChris Lattner "previous match was here", "note"); 478da108b4eSChris Lattner return 1; 479da108b4eSChris Lattner } 480da108b4eSChris Lattner } 481da108b4eSChris Lattner 482236d2d5eSChris Lattner // If this match had "not strings", verify that they don't exist in the 483236d2d5eSChris Lattner // skipped region. 484f08d2db9SChris Lattner for (unsigned ChunkNo = 0, e = CheckStr.NotStrings.size(); ChunkNo != e; ++ChunkNo) { 48574d50731SChris Lattner size_t MatchLen = 0; 486f08d2db9SChris Lattner size_t Pos = CheckStr.NotStrings[ChunkNo].second.Match(SkippedRegion, MatchLen); 487236d2d5eSChris Lattner if (Pos == StringRef::npos) continue; 488236d2d5eSChris Lattner 489236d2d5eSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(LastMatch+Pos), 490236d2d5eSChris Lattner CheckPrefix+"-NOT: string occurred!", "error"); 491f08d2db9SChris Lattner SM.PrintMessage(CheckStr.NotStrings[ChunkNo].first, 492236d2d5eSChris Lattner CheckPrefix+"-NOT: pattern specified here", "note"); 493236d2d5eSChris Lattner return 1; 494236d2d5eSChris Lattner } 495236d2d5eSChris Lattner 496236d2d5eSChris Lattner 497b9f2bf46SChris Lattner // Otherwise, everything is good. Step over the matched text and remember 498b9f2bf46SChris Lattner // the position after the match as the end of the last match. 4993b40b445SChris Lattner Buffer = Buffer.substr(MatchLen); 500b9f2bf46SChris Lattner LastMatch = Buffer.data(); 501da108b4eSChris Lattner } 502da108b4eSChris Lattner 503ee3c74fbSChris Lattner return 0; 504ee3c74fbSChris Lattner } 505