//===- FileCheck.cpp - Check that File's Contents match what is expected --===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// FileCheck does a line-by-line check of a file that validates whether it
// contains the expected content.  This is useful for regression tests etc.
//
// This program exits with an error status of 2 on error, exit status of 0 if
// the file matched the expected contents, and exit status of 1 if it did not
// contain the expected contents.
16ee3c74fbSChris Lattner // 17ee3c74fbSChris Lattner //===----------------------------------------------------------------------===// 18ee3c74fbSChris Lattner 19ee3c74fbSChris Lattner #include "llvm/Support/CommandLine.h" 20ee3c74fbSChris Lattner #include "llvm/Support/MemoryBuffer.h" 21ee3c74fbSChris Lattner #include "llvm/Support/PrettyStackTrace.h" 22f08d2db9SChris Lattner #include "llvm/Support/Regex.h" 23ee3c74fbSChris Lattner #include "llvm/Support/SourceMgr.h" 24ee3c74fbSChris Lattner #include "llvm/Support/raw_ostream.h" 25ee3c74fbSChris Lattner #include "llvm/System/Signals.h" 26ee3c74fbSChris Lattner using namespace llvm; 27ee3c74fbSChris Lattner 28ee3c74fbSChris Lattner static cl::opt<std::string> 29ee3c74fbSChris Lattner CheckFilename(cl::Positional, cl::desc("<check-file>"), cl::Required); 30ee3c74fbSChris Lattner 31ee3c74fbSChris Lattner static cl::opt<std::string> 32ee3c74fbSChris Lattner InputFilename("input-file", cl::desc("File to check (defaults to stdin)"), 33ee3c74fbSChris Lattner cl::init("-"), cl::value_desc("filename")); 34ee3c74fbSChris Lattner 35ee3c74fbSChris Lattner static cl::opt<std::string> 36ee3c74fbSChris Lattner CheckPrefix("check-prefix", cl::init("CHECK"), 37ee3c74fbSChris Lattner cl::desc("Prefix to use from check file (defaults to 'CHECK')")); 38ee3c74fbSChris Lattner 392c3e5cdfSChris Lattner static cl::opt<bool> 402c3e5cdfSChris Lattner NoCanonicalizeWhiteSpace("strict-whitespace", 412c3e5cdfSChris Lattner cl::desc("Do not treat all horizontal whitespace as equivalent")); 422c3e5cdfSChris Lattner 4374d50731SChris Lattner //===----------------------------------------------------------------------===// 4474d50731SChris Lattner // Pattern Handling Code. 
4574d50731SChris Lattner //===----------------------------------------------------------------------===// 4674d50731SChris Lattner 47*b121a24fSChris Lattner class PatternChunk { 48*b121a24fSChris Lattner StringRef Str; 49*b121a24fSChris Lattner bool isRegEx; 50*b121a24fSChris Lattner public: 51*b121a24fSChris Lattner PatternChunk(StringRef S, bool isRE) : Str(S), isRegEx(isRE) {} 52*b121a24fSChris Lattner 53*b121a24fSChris Lattner 54*b121a24fSChris Lattner size_t Match(StringRef Buffer, size_t &MatchLen) const { 55*b121a24fSChris Lattner if (!isRegEx) { 56*b121a24fSChris Lattner // Fixed string match. 57*b121a24fSChris Lattner MatchLen = Str.size(); 58*b121a24fSChris Lattner return Buffer.find(Str); 59*b121a24fSChris Lattner } 60*b121a24fSChris Lattner 61*b121a24fSChris Lattner // Regex match. 62*b121a24fSChris Lattner SmallVector<StringRef, 4> MatchInfo; 63*b121a24fSChris Lattner if (!Regex(Str, Regex::Sub).match(Buffer, &MatchInfo)) 64*b121a24fSChris Lattner return StringRef::npos; 65*b121a24fSChris Lattner 66*b121a24fSChris Lattner // Successful regex match. 67*b121a24fSChris Lattner assert(!MatchInfo.empty() && "Didn't get any match"); 68*b121a24fSChris Lattner StringRef FullMatch = MatchInfo[0]; 69*b121a24fSChris Lattner 70*b121a24fSChris Lattner MatchLen = FullMatch.size(); 71*b121a24fSChris Lattner return FullMatch.data()-Buffer.data(); 72*b121a24fSChris Lattner } 73*b121a24fSChris Lattner 74*b121a24fSChris Lattner }; 75*b121a24fSChris Lattner 763b40b445SChris Lattner class Pattern { 77f08d2db9SChris Lattner /// Chunks - The pattern chunks to match. If the bool is false, it is a fixed 78f08d2db9SChris Lattner /// string match, if it is true, it is a regex match. 
79*b121a24fSChris Lattner SmallVector<PatternChunk, 4> Chunks; 803b40b445SChris Lattner public: 813b40b445SChris Lattner 8274d50731SChris Lattner Pattern() { } 8374d50731SChris Lattner 8474d50731SChris Lattner bool ParsePattern(StringRef PatternStr, SourceMgr &SM); 853b40b445SChris Lattner 863b40b445SChris Lattner /// Match - Match the pattern string against the input buffer Buffer. This 873b40b445SChris Lattner /// returns the position that is matched or npos if there is no match. If 883b40b445SChris Lattner /// there is a match, the size of the matched string is returned in MatchLen. 89f08d2db9SChris Lattner size_t Match(StringRef Buffer, size_t &MatchLen) const; 903b40b445SChris Lattner }; 913b40b445SChris Lattner 9274d50731SChris Lattner bool Pattern::ParsePattern(StringRef PatternStr, SourceMgr &SM) { 9374d50731SChris Lattner // Ignore trailing whitespace. 9474d50731SChris Lattner while (!PatternStr.empty() && 9574d50731SChris Lattner (PatternStr.back() == ' ' || PatternStr.back() == '\t')) 9674d50731SChris Lattner PatternStr = PatternStr.substr(0, PatternStr.size()-1); 9774d50731SChris Lattner 9874d50731SChris Lattner // Check that there is something on the line. 9974d50731SChris Lattner if (PatternStr.empty()) { 10074d50731SChris Lattner SM.PrintMessage(SMLoc::getFromPointer(PatternStr.data()), 10174d50731SChris Lattner "found empty check string with prefix '"+CheckPrefix+":'", 10274d50731SChris Lattner "error"); 10374d50731SChris Lattner return true; 10474d50731SChris Lattner } 10574d50731SChris Lattner 106f08d2db9SChris Lattner // Scan the pattern to break it into regex and non-regex pieces. 107f08d2db9SChris Lattner while (!PatternStr.empty()) { 108f08d2db9SChris Lattner // Handle fixed string matches. 109f08d2db9SChris Lattner if (PatternStr.size() < 2 || 110f08d2db9SChris Lattner PatternStr[0] != '{' || PatternStr[1] != '{') { 111f08d2db9SChris Lattner // Find the end, which is the start of the next regex. 
112f08d2db9SChris Lattner size_t FixedMatchEnd = PatternStr.find("{{"); 11374d50731SChris Lattner 114*b121a24fSChris Lattner Chunks.push_back(PatternChunk(PatternStr.substr(0, FixedMatchEnd),false)); 115f08d2db9SChris Lattner PatternStr = PatternStr.substr(FixedMatchEnd); 116f08d2db9SChris Lattner continue; 117f08d2db9SChris Lattner } 11874d50731SChris Lattner 119f08d2db9SChris Lattner // Otherwise, this is the start of a regex match. Scan for the }}. 120f08d2db9SChris Lattner size_t End = PatternStr.find("}}"); 121f08d2db9SChris Lattner if (End == StringRef::npos) { 122f08d2db9SChris Lattner SM.PrintMessage(SMLoc::getFromPointer(PatternStr.data()), 123f08d2db9SChris Lattner "found start of regex string with no end '}}'", "error"); 124f08d2db9SChris Lattner return true; 125f08d2db9SChris Lattner } 126f08d2db9SChris Lattner 127f08d2db9SChris Lattner Regex R(PatternStr.substr(2, End-2)); 128f08d2db9SChris Lattner std::string Error; 129f08d2db9SChris Lattner if (!R.isValid(Error)) { 130f08d2db9SChris Lattner SM.PrintMessage(SMLoc::getFromPointer(PatternStr.data()+2), 131f08d2db9SChris Lattner "invalid regex: " + Error, "error"); 132f08d2db9SChris Lattner return true; 133f08d2db9SChris Lattner } 134f08d2db9SChris Lattner 135*b121a24fSChris Lattner Chunks.push_back(PatternChunk(PatternStr.substr(2, End-2), true)); 136f08d2db9SChris Lattner PatternStr = PatternStr.substr(End+2); 137f08d2db9SChris Lattner } 138f08d2db9SChris Lattner 13974d50731SChris Lattner return false; 14074d50731SChris Lattner } 14174d50731SChris Lattner 142f08d2db9SChris Lattner /// Match - Match the pattern string against the input buffer Buffer. This 143f08d2db9SChris Lattner /// returns the position that is matched or npos if there is no match. If 144f08d2db9SChris Lattner /// there is a match, the size of the matched string is returned in MatchLen. 
145f08d2db9SChris Lattner size_t Pattern::Match(StringRef Buffer, size_t &MatchLen) const { 146f08d2db9SChris Lattner size_t FirstMatch = StringRef::npos; 147f08d2db9SChris Lattner MatchLen = 0; 148f08d2db9SChris Lattner 149f08d2db9SChris Lattner while (!Buffer.empty()) { 150f08d2db9SChris Lattner StringRef MatchAttempt = Buffer; 151f08d2db9SChris Lattner 152f08d2db9SChris Lattner unsigned ChunkNo = 0, e = Chunks.size(); 153f08d2db9SChris Lattner for (; ChunkNo != e; ++ChunkNo) { 154*b121a24fSChris Lattner size_t ThisMatch, ThisLength = StringRef::npos; 155*b121a24fSChris Lattner ThisMatch = Chunks[ChunkNo].Match(MatchAttempt, ThisLength); 156f08d2db9SChris Lattner 157f08d2db9SChris Lattner // Otherwise, what we do depends on if this is the first match or not. If 158f08d2db9SChris Lattner // this is the first match, it doesn't match to match at the start of 159f08d2db9SChris Lattner // MatchAttempt. 160f08d2db9SChris Lattner if (ChunkNo == 0) { 161f08d2db9SChris Lattner // If the first match fails then this pattern will never match in 162f08d2db9SChris Lattner // Buffer. 163f08d2db9SChris Lattner if (ThisMatch == StringRef::npos) 164f08d2db9SChris Lattner return ThisMatch; 165f08d2db9SChris Lattner 166f08d2db9SChris Lattner FirstMatch = ThisMatch; 167f08d2db9SChris Lattner MatchAttempt = MatchAttempt.substr(FirstMatch); 168f08d2db9SChris Lattner ThisMatch = 0; 169f08d2db9SChris Lattner } 170f08d2db9SChris Lattner 171f08d2db9SChris Lattner // If this chunk didn't match, then the entire pattern didn't match from 172f08d2db9SChris Lattner // FirstMatch, try later in the buffer. 173f08d2db9SChris Lattner if (ThisMatch == StringRef::npos) 174f08d2db9SChris Lattner break; 175f08d2db9SChris Lattner 176f08d2db9SChris Lattner // Ok, if the match didn't match at the beginning of MatchAttempt, then we 177f08d2db9SChris Lattner // have something like "ABC{{DEF}} and something was in-between. Reject 178f08d2db9SChris Lattner // the match. 
179f08d2db9SChris Lattner if (ThisMatch != 0) 180f08d2db9SChris Lattner break; 181f08d2db9SChris Lattner 182f08d2db9SChris Lattner // Otherwise, match the string and move to the next chunk. 183f08d2db9SChris Lattner MatchLen += ThisLength; 184f08d2db9SChris Lattner MatchAttempt = MatchAttempt.substr(ThisLength); 185f08d2db9SChris Lattner } 186f08d2db9SChris Lattner 187f08d2db9SChris Lattner // If the whole thing matched, we win. 188f08d2db9SChris Lattner if (ChunkNo == e) 189f08d2db9SChris Lattner return FirstMatch; 190f08d2db9SChris Lattner 191f08d2db9SChris Lattner // Otherwise, try matching again after FirstMatch to see if this pattern 192f08d2db9SChris Lattner // matches later in the buffer. 193f08d2db9SChris Lattner Buffer = Buffer.substr(FirstMatch+1); 194f08d2db9SChris Lattner } 195f08d2db9SChris Lattner 196f08d2db9SChris Lattner // If we ran out of stuff to scan, then we didn't match. 197f08d2db9SChris Lattner return StringRef::npos; 198f08d2db9SChris Lattner } 199f08d2db9SChris Lattner 20074d50731SChris Lattner 20174d50731SChris Lattner //===----------------------------------------------------------------------===// 20274d50731SChris Lattner // Check Strings. 20374d50731SChris Lattner //===----------------------------------------------------------------------===// 2043b40b445SChris Lattner 2053b40b445SChris Lattner /// CheckString - This is a check that we found in the input file. 2063b40b445SChris Lattner struct CheckString { 2073b40b445SChris Lattner /// Pat - The pattern to match. 2083b40b445SChris Lattner Pattern Pat; 20926cccfe1SChris Lattner 21026cccfe1SChris Lattner /// Loc - The location in the match file that the check string was specified. 21126cccfe1SChris Lattner SMLoc Loc; 21226cccfe1SChris Lattner 213da108b4eSChris Lattner /// IsCheckNext - This is true if this is a CHECK-NEXT: directive (as opposed 214da108b4eSChris Lattner /// to a CHECK: directive. 
215da108b4eSChris Lattner bool IsCheckNext; 216da108b4eSChris Lattner 217236d2d5eSChris Lattner /// NotStrings - These are all of the strings that are disallowed from 218236d2d5eSChris Lattner /// occurring between this match string and the previous one (or start of 219236d2d5eSChris Lattner /// file). 22074d50731SChris Lattner std::vector<std::pair<SMLoc, Pattern> > NotStrings; 221236d2d5eSChris Lattner 2223b40b445SChris Lattner CheckString(const Pattern &P, SMLoc L, bool isCheckNext) 2233b40b445SChris Lattner : Pat(P), Loc(L), IsCheckNext(isCheckNext) {} 22426cccfe1SChris Lattner }; 22526cccfe1SChris Lattner 226a2f8fc5aSChris Lattner /// CanonicalizeInputFile - Remove duplicate horizontal space from the specified 227a2f8fc5aSChris Lattner /// memory buffer, free it, and return a new one. 228a2f8fc5aSChris Lattner static MemoryBuffer *CanonicalizeInputFile(MemoryBuffer *MB) { 229a2f8fc5aSChris Lattner SmallVector<char, 16> NewFile; 230a2f8fc5aSChris Lattner NewFile.reserve(MB->getBufferSize()); 231a2f8fc5aSChris Lattner 232a2f8fc5aSChris Lattner for (const char *Ptr = MB->getBufferStart(), *End = MB->getBufferEnd(); 233a2f8fc5aSChris Lattner Ptr != End; ++Ptr) { 234a2f8fc5aSChris Lattner // If C is not a horizontal whitespace, skip it. 235a2f8fc5aSChris Lattner if (*Ptr != ' ' && *Ptr != '\t') { 236a2f8fc5aSChris Lattner NewFile.push_back(*Ptr); 237a2f8fc5aSChris Lattner continue; 238a2f8fc5aSChris Lattner } 239a2f8fc5aSChris Lattner 240a2f8fc5aSChris Lattner // Otherwise, add one space and advance over neighboring space. 241a2f8fc5aSChris Lattner NewFile.push_back(' '); 242a2f8fc5aSChris Lattner while (Ptr+1 != End && 243a2f8fc5aSChris Lattner (Ptr[1] == ' ' || Ptr[1] == '\t')) 244a2f8fc5aSChris Lattner ++Ptr; 245a2f8fc5aSChris Lattner } 246a2f8fc5aSChris Lattner 247a2f8fc5aSChris Lattner // Free the old buffer and return a new one. 
248a2f8fc5aSChris Lattner MemoryBuffer *MB2 = 249a2f8fc5aSChris Lattner MemoryBuffer::getMemBufferCopy(NewFile.data(), 250a2f8fc5aSChris Lattner NewFile.data() + NewFile.size(), 251a2f8fc5aSChris Lattner MB->getBufferIdentifier()); 252a2f8fc5aSChris Lattner 253a2f8fc5aSChris Lattner delete MB; 254a2f8fc5aSChris Lattner return MB2; 255a2f8fc5aSChris Lattner } 256a2f8fc5aSChris Lattner 257ee3c74fbSChris Lattner 258ee3c74fbSChris Lattner /// ReadCheckFile - Read the check file, which specifies the sequence of 259ee3c74fbSChris Lattner /// expected strings. The strings are added to the CheckStrings vector. 260ee3c74fbSChris Lattner static bool ReadCheckFile(SourceMgr &SM, 26126cccfe1SChris Lattner std::vector<CheckString> &CheckStrings) { 262ee3c74fbSChris Lattner // Open the check file, and tell SourceMgr about it. 263ee3c74fbSChris Lattner std::string ErrorStr; 264ee3c74fbSChris Lattner MemoryBuffer *F = 265ee3c74fbSChris Lattner MemoryBuffer::getFileOrSTDIN(CheckFilename.c_str(), &ErrorStr); 266ee3c74fbSChris Lattner if (F == 0) { 267ee3c74fbSChris Lattner errs() << "Could not open check file '" << CheckFilename << "': " 268ee3c74fbSChris Lattner << ErrorStr << '\n'; 269ee3c74fbSChris Lattner return true; 270ee3c74fbSChris Lattner } 271a2f8fc5aSChris Lattner 272a2f8fc5aSChris Lattner // If we want to canonicalize whitespace, strip excess whitespace from the 273a2f8fc5aSChris Lattner // buffer containing the CHECK lines. 274a2f8fc5aSChris Lattner if (!NoCanonicalizeWhiteSpace) 275a2f8fc5aSChris Lattner F = CanonicalizeInputFile(F); 276a2f8fc5aSChris Lattner 277ee3c74fbSChris Lattner SM.AddNewSourceBuffer(F, SMLoc()); 278ee3c74fbSChris Lattner 27910f10cedSChris Lattner // Find all instances of CheckPrefix followed by : in the file. 
280caa5fc0cSChris Lattner StringRef Buffer = F->getBuffer(); 281ee3c74fbSChris Lattner 28274d50731SChris Lattner std::vector<std::pair<SMLoc, Pattern> > NotMatches; 283236d2d5eSChris Lattner 284ee3c74fbSChris Lattner while (1) { 285ee3c74fbSChris Lattner // See if Prefix occurs in the memory buffer. 286caa5fc0cSChris Lattner Buffer = Buffer.substr(Buffer.find(CheckPrefix)); 287ee3c74fbSChris Lattner 288ee3c74fbSChris Lattner // If we didn't find a match, we're done. 289caa5fc0cSChris Lattner if (Buffer.empty()) 290ee3c74fbSChris Lattner break; 291ee3c74fbSChris Lattner 292caa5fc0cSChris Lattner const char *CheckPrefixStart = Buffer.data(); 293da108b4eSChris Lattner 294da108b4eSChris Lattner // When we find a check prefix, keep track of whether we find CHECK: or 295da108b4eSChris Lattner // CHECK-NEXT: 296236d2d5eSChris Lattner bool IsCheckNext = false, IsCheckNot = false; 297da108b4eSChris Lattner 29810f10cedSChris Lattner // Verify that the : is present after the prefix. 299caa5fc0cSChris Lattner if (Buffer[CheckPrefix.size()] == ':') { 300caa5fc0cSChris Lattner Buffer = Buffer.substr(CheckPrefix.size()+1); 301caa5fc0cSChris Lattner } else if (Buffer.size() > CheckPrefix.size()+6 && 302caa5fc0cSChris Lattner memcmp(Buffer.data()+CheckPrefix.size(), "-NEXT:", 6) == 0) { 303caa5fc0cSChris Lattner Buffer = Buffer.substr(CheckPrefix.size()+7); 304da108b4eSChris Lattner IsCheckNext = true; 305236d2d5eSChris Lattner } else if (Buffer.size() > CheckPrefix.size()+5 && 306236d2d5eSChris Lattner memcmp(Buffer.data()+CheckPrefix.size(), "-NOT:", 5) == 0) { 307236d2d5eSChris Lattner Buffer = Buffer.substr(CheckPrefix.size()+6); 308236d2d5eSChris Lattner IsCheckNot = true; 309da108b4eSChris Lattner } else { 310caa5fc0cSChris Lattner Buffer = Buffer.substr(1); 31110f10cedSChris Lattner continue; 31210f10cedSChris Lattner } 31310f10cedSChris Lattner 314ee3c74fbSChris Lattner // Okay, we found the prefix, yay. 
Remember the rest of the line, but 315ee3c74fbSChris Lattner // ignore leading and trailing whitespace. 316236d2d5eSChris Lattner Buffer = Buffer.substr(Buffer.find_first_not_of(" \t")); 317ee3c74fbSChris Lattner 318ee3c74fbSChris Lattner // Scan ahead to the end of line. 319caa5fc0cSChris Lattner size_t EOL = Buffer.find_first_of("\n\r"); 320ee3c74fbSChris Lattner 32174d50731SChris Lattner // Parse the pattern. 32274d50731SChris Lattner Pattern P; 32374d50731SChris Lattner if (P.ParsePattern(Buffer.substr(0, EOL), SM)) 324ee3c74fbSChris Lattner return true; 325ee3c74fbSChris Lattner 326236d2d5eSChris Lattner Buffer = Buffer.substr(EOL); 32774d50731SChris Lattner 328236d2d5eSChris Lattner 329da108b4eSChris Lattner // Verify that CHECK-NEXT lines have at least one CHECK line before them. 330da108b4eSChris Lattner if (IsCheckNext && CheckStrings.empty()) { 331da108b4eSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(CheckPrefixStart), 332da108b4eSChris Lattner "found '"+CheckPrefix+"-NEXT:' without previous '"+ 333da108b4eSChris Lattner CheckPrefix+ ": line", "error"); 334da108b4eSChris Lattner return true; 335da108b4eSChris Lattner } 336da108b4eSChris Lattner 33774d50731SChris Lattner // Handle CHECK-NOT. 33874d50731SChris Lattner if (IsCheckNot) { 33974d50731SChris Lattner NotMatches.push_back(std::make_pair(SMLoc::getFromPointer(Buffer.data()), 34074d50731SChris Lattner P)); 34174d50731SChris Lattner continue; 34274d50731SChris Lattner } 34374d50731SChris Lattner 3443b40b445SChris Lattner 345ee3c74fbSChris Lattner // Okay, add the string we captured to the output vector and move on. 
3463b40b445SChris Lattner CheckStrings.push_back(CheckString(P, 347caa5fc0cSChris Lattner SMLoc::getFromPointer(Buffer.data()), 348da108b4eSChris Lattner IsCheckNext)); 349236d2d5eSChris Lattner std::swap(NotMatches, CheckStrings.back().NotStrings); 350ee3c74fbSChris Lattner } 351ee3c74fbSChris Lattner 352ee3c74fbSChris Lattner if (CheckStrings.empty()) { 35310f10cedSChris Lattner errs() << "error: no check strings found with prefix '" << CheckPrefix 35410f10cedSChris Lattner << ":'\n"; 355ee3c74fbSChris Lattner return true; 356ee3c74fbSChris Lattner } 357ee3c74fbSChris Lattner 358236d2d5eSChris Lattner if (!NotMatches.empty()) { 359236d2d5eSChris Lattner errs() << "error: '" << CheckPrefix 360236d2d5eSChris Lattner << "-NOT:' not supported after last check line.\n"; 361236d2d5eSChris Lattner return true; 362236d2d5eSChris Lattner } 363236d2d5eSChris Lattner 364ee3c74fbSChris Lattner return false; 365ee3c74fbSChris Lattner } 366ee3c74fbSChris Lattner 367da108b4eSChris Lattner static void PrintCheckFailed(const SourceMgr &SM, const CheckString &CheckStr, 368caa5fc0cSChris Lattner StringRef Buffer) { 369da108b4eSChris Lattner // Otherwise, we have an error, emit an error message. 370da108b4eSChris Lattner SM.PrintMessage(CheckStr.Loc, "expected string not found in input", 371da108b4eSChris Lattner "error"); 372da108b4eSChris Lattner 373da108b4eSChris Lattner // Print the "scanning from here" line. If the current position is at the 374da108b4eSChris Lattner // end of a line, advance to the start of the next line. 375caa5fc0cSChris Lattner Buffer = Buffer.substr(Buffer.find_first_not_of(" \t\n\r")); 376da108b4eSChris Lattner 377caa5fc0cSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), "scanning from here", 378da108b4eSChris Lattner "note"); 379da108b4eSChris Lattner } 380da108b4eSChris Lattner 38137183584SChris Lattner /// CountNumNewlinesBetween - Count the number of newlines in the specified 38237183584SChris Lattner /// range. 
38337183584SChris Lattner static unsigned CountNumNewlinesBetween(StringRef Range) { 384da108b4eSChris Lattner unsigned NumNewLines = 0; 38537183584SChris Lattner while (1) { 386da108b4eSChris Lattner // Scan for newline. 38737183584SChris Lattner Range = Range.substr(Range.find_first_of("\n\r")); 38837183584SChris Lattner if (Range.empty()) return NumNewLines; 389da108b4eSChris Lattner 390da108b4eSChris Lattner ++NumNewLines; 391da108b4eSChris Lattner 392da108b4eSChris Lattner // Handle \n\r and \r\n as a single newline. 39337183584SChris Lattner if (Range.size() > 1 && 39437183584SChris Lattner (Range[1] == '\n' || Range[1] == '\r') && 39537183584SChris Lattner (Range[0] != Range[1])) 39637183584SChris Lattner Range = Range.substr(1); 39737183584SChris Lattner Range = Range.substr(1); 398da108b4eSChris Lattner } 399da108b4eSChris Lattner } 400da108b4eSChris Lattner 401ee3c74fbSChris Lattner int main(int argc, char **argv) { 402ee3c74fbSChris Lattner sys::PrintStackTraceOnErrorSignal(); 403ee3c74fbSChris Lattner PrettyStackTraceProgram X(argc, argv); 404ee3c74fbSChris Lattner cl::ParseCommandLineOptions(argc, argv); 405ee3c74fbSChris Lattner 406ee3c74fbSChris Lattner SourceMgr SM; 407ee3c74fbSChris Lattner 408ee3c74fbSChris Lattner // Read the expected strings from the check file. 40926cccfe1SChris Lattner std::vector<CheckString> CheckStrings; 410ee3c74fbSChris Lattner if (ReadCheckFile(SM, CheckStrings)) 411ee3c74fbSChris Lattner return 2; 412ee3c74fbSChris Lattner 413ee3c74fbSChris Lattner // Open the file to check and add it to SourceMgr. 
414ee3c74fbSChris Lattner std::string ErrorStr; 415ee3c74fbSChris Lattner MemoryBuffer *F = 416ee3c74fbSChris Lattner MemoryBuffer::getFileOrSTDIN(InputFilename.c_str(), &ErrorStr); 417ee3c74fbSChris Lattner if (F == 0) { 418ee3c74fbSChris Lattner errs() << "Could not open input file '" << InputFilename << "': " 419ee3c74fbSChris Lattner << ErrorStr << '\n'; 420ee3c74fbSChris Lattner return true; 421ee3c74fbSChris Lattner } 4222c3e5cdfSChris Lattner 4232c3e5cdfSChris Lattner // Remove duplicate spaces in the input file if requested. 4242c3e5cdfSChris Lattner if (!NoCanonicalizeWhiteSpace) 4252c3e5cdfSChris Lattner F = CanonicalizeInputFile(F); 4262c3e5cdfSChris Lattner 427ee3c74fbSChris Lattner SM.AddNewSourceBuffer(F, SMLoc()); 428ee3c74fbSChris Lattner 429ee3c74fbSChris Lattner // Check that we have all of the expected strings, in order, in the input 430ee3c74fbSChris Lattner // file. 431caa5fc0cSChris Lattner StringRef Buffer = F->getBuffer(); 432ee3c74fbSChris Lattner 433236d2d5eSChris Lattner const char *LastMatch = Buffer.data(); 434236d2d5eSChris Lattner 435ee3c74fbSChris Lattner for (unsigned StrNo = 0, e = CheckStrings.size(); StrNo != e; ++StrNo) { 43626cccfe1SChris Lattner const CheckString &CheckStr = CheckStrings[StrNo]; 437ee3c74fbSChris Lattner 438caa5fc0cSChris Lattner StringRef SearchFrom = Buffer; 439caa5fc0cSChris Lattner 440ee3c74fbSChris Lattner // Find StrNo in the file. 4413b40b445SChris Lattner size_t MatchLen = 0; 4423b40b445SChris Lattner Buffer = Buffer.substr(CheckStr.Pat.Match(Buffer, MatchLen)); 443ee3c74fbSChris Lattner 444da108b4eSChris Lattner // If we didn't find a match, reject the input. 
445caa5fc0cSChris Lattner if (Buffer.empty()) { 446caa5fc0cSChris Lattner PrintCheckFailed(SM, CheckStr, SearchFrom); 447da108b4eSChris Lattner return 1; 448ee3c74fbSChris Lattner } 449ee3c74fbSChris Lattner 45037183584SChris Lattner StringRef SkippedRegion(LastMatch, Buffer.data()-LastMatch); 45137183584SChris Lattner 452da108b4eSChris Lattner // If this check is a "CHECK-NEXT", verify that the previous match was on 453da108b4eSChris Lattner // the previous line (i.e. that there is one newline between them). 454da108b4eSChris Lattner if (CheckStr.IsCheckNext) { 455da108b4eSChris Lattner // Count the number of newlines between the previous match and this one. 456236d2d5eSChris Lattner assert(LastMatch != F->getBufferStart() && 457236d2d5eSChris Lattner "CHECK-NEXT can't be the first check in a file"); 458da108b4eSChris Lattner 45937183584SChris Lattner unsigned NumNewLines = CountNumNewlinesBetween(SkippedRegion); 460da108b4eSChris Lattner if (NumNewLines == 0) { 461107c21eaSChris Lattner SM.PrintMessage(CheckStr.Loc, 462da108b4eSChris Lattner CheckPrefix+"-NEXT: is on the same line as previous match", 463ee3c74fbSChris Lattner "error"); 464caa5fc0cSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), 465107c21eaSChris Lattner "'next' match was here", "note"); 466da108b4eSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(LastMatch), 467da108b4eSChris Lattner "previous match was here", "note"); 468aedd8185SChris Lattner return 1; 469ee3c74fbSChris Lattner } 470ee3c74fbSChris Lattner 471da108b4eSChris Lattner if (NumNewLines != 1) { 472107c21eaSChris Lattner SM.PrintMessage(CheckStr.Loc, 473da108b4eSChris Lattner CheckPrefix+ 474da108b4eSChris Lattner "-NEXT: is not on the line after the previous match", 475da108b4eSChris Lattner "error"); 476caa5fc0cSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), 477107c21eaSChris Lattner "'next' match was here", "note"); 478da108b4eSChris Lattner 
SM.PrintMessage(SMLoc::getFromPointer(LastMatch), 479da108b4eSChris Lattner "previous match was here", "note"); 480da108b4eSChris Lattner return 1; 481da108b4eSChris Lattner } 482da108b4eSChris Lattner } 483da108b4eSChris Lattner 484236d2d5eSChris Lattner // If this match had "not strings", verify that they don't exist in the 485236d2d5eSChris Lattner // skipped region. 486f08d2db9SChris Lattner for (unsigned ChunkNo = 0, e = CheckStr.NotStrings.size(); ChunkNo != e; ++ChunkNo) { 48774d50731SChris Lattner size_t MatchLen = 0; 488f08d2db9SChris Lattner size_t Pos = CheckStr.NotStrings[ChunkNo].second.Match(SkippedRegion, MatchLen); 489236d2d5eSChris Lattner if (Pos == StringRef::npos) continue; 490236d2d5eSChris Lattner 491236d2d5eSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(LastMatch+Pos), 492236d2d5eSChris Lattner CheckPrefix+"-NOT: string occurred!", "error"); 493f08d2db9SChris Lattner SM.PrintMessage(CheckStr.NotStrings[ChunkNo].first, 494236d2d5eSChris Lattner CheckPrefix+"-NOT: pattern specified here", "note"); 495236d2d5eSChris Lattner return 1; 496236d2d5eSChris Lattner } 497236d2d5eSChris Lattner 498236d2d5eSChris Lattner 499b9f2bf46SChris Lattner // Otherwise, everything is good. Step over the matched text and remember 500b9f2bf46SChris Lattner // the position after the match as the end of the last match. 5013b40b445SChris Lattner Buffer = Buffer.substr(MatchLen); 502b9f2bf46SChris Lattner LastMatch = Buffer.data(); 503da108b4eSChris Lattner } 504da108b4eSChris Lattner 505ee3c74fbSChris Lattner return 0; 506ee3c74fbSChris Lattner } 507