//===- FileCheck.cpp - Check that File's Contents match what is expected --===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// FileCheck does a line-by-line check of a file that validates whether it
// contains the expected content.  This is useful for regression tests etc.
//
// This program exits with an error status of 2 on error, exit status of 0 if
// the file matched the expected contents, and exit status of 1 if it did not
// contain the expected contents.
16ee3c74fbSChris Lattner // 17ee3c74fbSChris Lattner //===----------------------------------------------------------------------===// 18ee3c74fbSChris Lattner 19ee3c74fbSChris Lattner #include "llvm/Support/CommandLine.h" 20ee3c74fbSChris Lattner #include "llvm/Support/MemoryBuffer.h" 21ee3c74fbSChris Lattner #include "llvm/Support/PrettyStackTrace.h" 22*f08d2db9SChris Lattner #include "llvm/Support/Regex.h" 23ee3c74fbSChris Lattner #include "llvm/Support/SourceMgr.h" 24ee3c74fbSChris Lattner #include "llvm/Support/raw_ostream.h" 25ee3c74fbSChris Lattner #include "llvm/System/Signals.h" 26ee3c74fbSChris Lattner using namespace llvm; 27ee3c74fbSChris Lattner 28ee3c74fbSChris Lattner static cl::opt<std::string> 29ee3c74fbSChris Lattner CheckFilename(cl::Positional, cl::desc("<check-file>"), cl::Required); 30ee3c74fbSChris Lattner 31ee3c74fbSChris Lattner static cl::opt<std::string> 32ee3c74fbSChris Lattner InputFilename("input-file", cl::desc("File to check (defaults to stdin)"), 33ee3c74fbSChris Lattner cl::init("-"), cl::value_desc("filename")); 34ee3c74fbSChris Lattner 35ee3c74fbSChris Lattner static cl::opt<std::string> 36ee3c74fbSChris Lattner CheckPrefix("check-prefix", cl::init("CHECK"), 37ee3c74fbSChris Lattner cl::desc("Prefix to use from check file (defaults to 'CHECK')")); 38ee3c74fbSChris Lattner 392c3e5cdfSChris Lattner static cl::opt<bool> 402c3e5cdfSChris Lattner NoCanonicalizeWhiteSpace("strict-whitespace", 412c3e5cdfSChris Lattner cl::desc("Do not treat all horizontal whitespace as equivalent")); 422c3e5cdfSChris Lattner 4374d50731SChris Lattner //===----------------------------------------------------------------------===// 4474d50731SChris Lattner // Pattern Handling Code. 4574d50731SChris Lattner //===----------------------------------------------------------------------===// 4674d50731SChris Lattner 473b40b445SChris Lattner class Pattern { 48*f08d2db9SChris Lattner /// Chunks - The pattern chunks to match. 
If the bool is false, it is a fixed 49*f08d2db9SChris Lattner /// string match, if it is true, it is a regex match. 50*f08d2db9SChris Lattner SmallVector<std::pair<StringRef, bool>, 4> Chunks; 513b40b445SChris Lattner public: 523b40b445SChris Lattner 5374d50731SChris Lattner Pattern() { } 5474d50731SChris Lattner 5574d50731SChris Lattner bool ParsePattern(StringRef PatternStr, SourceMgr &SM); 563b40b445SChris Lattner 573b40b445SChris Lattner /// Match - Match the pattern string against the input buffer Buffer. This 583b40b445SChris Lattner /// returns the position that is matched or npos if there is no match. If 593b40b445SChris Lattner /// there is a match, the size of the matched string is returned in MatchLen. 60*f08d2db9SChris Lattner size_t Match(StringRef Buffer, size_t &MatchLen) const; 613b40b445SChris Lattner }; 623b40b445SChris Lattner 6374d50731SChris Lattner bool Pattern::ParsePattern(StringRef PatternStr, SourceMgr &SM) { 6474d50731SChris Lattner // Ignore trailing whitespace. 6574d50731SChris Lattner while (!PatternStr.empty() && 6674d50731SChris Lattner (PatternStr.back() == ' ' || PatternStr.back() == '\t')) 6774d50731SChris Lattner PatternStr = PatternStr.substr(0, PatternStr.size()-1); 6874d50731SChris Lattner 6974d50731SChris Lattner // Check that there is something on the line. 7074d50731SChris Lattner if (PatternStr.empty()) { 7174d50731SChris Lattner SM.PrintMessage(SMLoc::getFromPointer(PatternStr.data()), 7274d50731SChris Lattner "found empty check string with prefix '"+CheckPrefix+":'", 7374d50731SChris Lattner "error"); 7474d50731SChris Lattner return true; 7574d50731SChris Lattner } 7674d50731SChris Lattner 77*f08d2db9SChris Lattner // Scan the pattern to break it into regex and non-regex pieces. 78*f08d2db9SChris Lattner while (!PatternStr.empty()) { 79*f08d2db9SChris Lattner // Handle fixed string matches. 
80*f08d2db9SChris Lattner if (PatternStr.size() < 2 || 81*f08d2db9SChris Lattner PatternStr[0] != '{' || PatternStr[1] != '{') { 82*f08d2db9SChris Lattner // Find the end, which is the start of the next regex. 83*f08d2db9SChris Lattner size_t FixedMatchEnd = PatternStr.find("{{"); 8474d50731SChris Lattner 85*f08d2db9SChris Lattner Chunks.push_back(std::make_pair(PatternStr.substr(0, FixedMatchEnd), 86*f08d2db9SChris Lattner false)); 87*f08d2db9SChris Lattner PatternStr = PatternStr.substr(FixedMatchEnd); 88*f08d2db9SChris Lattner continue; 89*f08d2db9SChris Lattner } 9074d50731SChris Lattner 91*f08d2db9SChris Lattner // Otherwise, this is the start of a regex match. Scan for the }}. 92*f08d2db9SChris Lattner size_t End = PatternStr.find("}}"); 93*f08d2db9SChris Lattner if (End == StringRef::npos) { 94*f08d2db9SChris Lattner SM.PrintMessage(SMLoc::getFromPointer(PatternStr.data()), 95*f08d2db9SChris Lattner "found start of regex string with no end '}}'", "error"); 96*f08d2db9SChris Lattner return true; 97*f08d2db9SChris Lattner } 98*f08d2db9SChris Lattner 99*f08d2db9SChris Lattner Regex R(PatternStr.substr(2, End-2)); 100*f08d2db9SChris Lattner std::string Error; 101*f08d2db9SChris Lattner if (!R.isValid(Error)) { 102*f08d2db9SChris Lattner SM.PrintMessage(SMLoc::getFromPointer(PatternStr.data()+2), 103*f08d2db9SChris Lattner "invalid regex: " + Error, "error"); 104*f08d2db9SChris Lattner return true; 105*f08d2db9SChris Lattner } 106*f08d2db9SChris Lattner 107*f08d2db9SChris Lattner Chunks.push_back(std::make_pair(PatternStr.substr(2, End-2), true)); 108*f08d2db9SChris Lattner PatternStr = PatternStr.substr(End+2); 109*f08d2db9SChris Lattner } 110*f08d2db9SChris Lattner 11174d50731SChris Lattner return false; 11274d50731SChris Lattner } 11374d50731SChris Lattner 114*f08d2db9SChris Lattner /// Match - Match the pattern string against the input buffer Buffer. This 115*f08d2db9SChris Lattner /// returns the position that is matched or npos if there is no match. 
If 116*f08d2db9SChris Lattner /// there is a match, the size of the matched string is returned in MatchLen. 117*f08d2db9SChris Lattner size_t Pattern::Match(StringRef Buffer, size_t &MatchLen) const { 118*f08d2db9SChris Lattner size_t FirstMatch = StringRef::npos; 119*f08d2db9SChris Lattner MatchLen = 0; 120*f08d2db9SChris Lattner 121*f08d2db9SChris Lattner SmallVector<StringRef, 4> MatchInfo; 122*f08d2db9SChris Lattner 123*f08d2db9SChris Lattner while (!Buffer.empty()) { 124*f08d2db9SChris Lattner StringRef MatchAttempt = Buffer; 125*f08d2db9SChris Lattner 126*f08d2db9SChris Lattner unsigned ChunkNo = 0, e = Chunks.size(); 127*f08d2db9SChris Lattner for (; ChunkNo != e; ++ChunkNo) { 128*f08d2db9SChris Lattner StringRef PatternStr = Chunks[ChunkNo].first; 129*f08d2db9SChris Lattner 130*f08d2db9SChris Lattner size_t ThisMatch = StringRef::npos; 131*f08d2db9SChris Lattner size_t ThisLength = StringRef::npos; 132*f08d2db9SChris Lattner if (!Chunks[ChunkNo].second) { 133*f08d2db9SChris Lattner // Fixed string match. 134*f08d2db9SChris Lattner ThisMatch = MatchAttempt.find(Chunks[ChunkNo].first); 135*f08d2db9SChris Lattner ThisLength = Chunks[ChunkNo].first.size(); 136*f08d2db9SChris Lattner } else if (Regex(Chunks[ChunkNo].first, Regex::Sub).match(MatchAttempt, &MatchInfo)) { 137*f08d2db9SChris Lattner // Successful regex match. 138*f08d2db9SChris Lattner assert(!MatchInfo.empty() && "Didn't get any match"); 139*f08d2db9SChris Lattner StringRef FullMatch = MatchInfo[0]; 140*f08d2db9SChris Lattner MatchInfo.clear(); 141*f08d2db9SChris Lattner 142*f08d2db9SChris Lattner ThisMatch = FullMatch.data()-MatchAttempt.data(); 143*f08d2db9SChris Lattner ThisLength = FullMatch.size(); 144*f08d2db9SChris Lattner } 145*f08d2db9SChris Lattner 146*f08d2db9SChris Lattner // Otherwise, what we do depends on if this is the first match or not. If 147*f08d2db9SChris Lattner // this is the first match, it doesn't match to match at the start of 148*f08d2db9SChris Lattner // MatchAttempt. 
149*f08d2db9SChris Lattner if (ChunkNo == 0) { 150*f08d2db9SChris Lattner // If the first match fails then this pattern will never match in 151*f08d2db9SChris Lattner // Buffer. 152*f08d2db9SChris Lattner if (ThisMatch == StringRef::npos) 153*f08d2db9SChris Lattner return ThisMatch; 154*f08d2db9SChris Lattner 155*f08d2db9SChris Lattner FirstMatch = ThisMatch; 156*f08d2db9SChris Lattner MatchAttempt = MatchAttempt.substr(FirstMatch); 157*f08d2db9SChris Lattner ThisMatch = 0; 158*f08d2db9SChris Lattner } 159*f08d2db9SChris Lattner 160*f08d2db9SChris Lattner // If this chunk didn't match, then the entire pattern didn't match from 161*f08d2db9SChris Lattner // FirstMatch, try later in the buffer. 162*f08d2db9SChris Lattner if (ThisMatch == StringRef::npos) 163*f08d2db9SChris Lattner break; 164*f08d2db9SChris Lattner 165*f08d2db9SChris Lattner // Ok, if the match didn't match at the beginning of MatchAttempt, then we 166*f08d2db9SChris Lattner // have something like "ABC{{DEF}} and something was in-between. Reject 167*f08d2db9SChris Lattner // the match. 168*f08d2db9SChris Lattner if (ThisMatch != 0) 169*f08d2db9SChris Lattner break; 170*f08d2db9SChris Lattner 171*f08d2db9SChris Lattner // Otherwise, match the string and move to the next chunk. 172*f08d2db9SChris Lattner MatchLen += ThisLength; 173*f08d2db9SChris Lattner MatchAttempt = MatchAttempt.substr(ThisLength); 174*f08d2db9SChris Lattner } 175*f08d2db9SChris Lattner 176*f08d2db9SChris Lattner // If the whole thing matched, we win. 177*f08d2db9SChris Lattner if (ChunkNo == e) 178*f08d2db9SChris Lattner return FirstMatch; 179*f08d2db9SChris Lattner 180*f08d2db9SChris Lattner // Otherwise, try matching again after FirstMatch to see if this pattern 181*f08d2db9SChris Lattner // matches later in the buffer. 182*f08d2db9SChris Lattner Buffer = Buffer.substr(FirstMatch+1); 183*f08d2db9SChris Lattner } 184*f08d2db9SChris Lattner 185*f08d2db9SChris Lattner // If we ran out of stuff to scan, then we didn't match. 
186*f08d2db9SChris Lattner return StringRef::npos; 187*f08d2db9SChris Lattner } 188*f08d2db9SChris Lattner 18974d50731SChris Lattner 19074d50731SChris Lattner //===----------------------------------------------------------------------===// 19174d50731SChris Lattner // Check Strings. 19274d50731SChris Lattner //===----------------------------------------------------------------------===// 1933b40b445SChris Lattner 1943b40b445SChris Lattner /// CheckString - This is a check that we found in the input file. 1953b40b445SChris Lattner struct CheckString { 1963b40b445SChris Lattner /// Pat - The pattern to match. 1973b40b445SChris Lattner Pattern Pat; 19826cccfe1SChris Lattner 19926cccfe1SChris Lattner /// Loc - The location in the match file that the check string was specified. 20026cccfe1SChris Lattner SMLoc Loc; 20126cccfe1SChris Lattner 202da108b4eSChris Lattner /// IsCheckNext - This is true if this is a CHECK-NEXT: directive (as opposed 203da108b4eSChris Lattner /// to a CHECK: directive. 204da108b4eSChris Lattner bool IsCheckNext; 205da108b4eSChris Lattner 206236d2d5eSChris Lattner /// NotStrings - These are all of the strings that are disallowed from 207236d2d5eSChris Lattner /// occurring between this match string and the previous one (or start of 208236d2d5eSChris Lattner /// file). 20974d50731SChris Lattner std::vector<std::pair<SMLoc, Pattern> > NotStrings; 210236d2d5eSChris Lattner 2113b40b445SChris Lattner CheckString(const Pattern &P, SMLoc L, bool isCheckNext) 2123b40b445SChris Lattner : Pat(P), Loc(L), IsCheckNext(isCheckNext) {} 21326cccfe1SChris Lattner }; 21426cccfe1SChris Lattner 215a2f8fc5aSChris Lattner /// CanonicalizeInputFile - Remove duplicate horizontal space from the specified 216a2f8fc5aSChris Lattner /// memory buffer, free it, and return a new one. 
217a2f8fc5aSChris Lattner static MemoryBuffer *CanonicalizeInputFile(MemoryBuffer *MB) { 218a2f8fc5aSChris Lattner SmallVector<char, 16> NewFile; 219a2f8fc5aSChris Lattner NewFile.reserve(MB->getBufferSize()); 220a2f8fc5aSChris Lattner 221a2f8fc5aSChris Lattner for (const char *Ptr = MB->getBufferStart(), *End = MB->getBufferEnd(); 222a2f8fc5aSChris Lattner Ptr != End; ++Ptr) { 223a2f8fc5aSChris Lattner // If C is not a horizontal whitespace, skip it. 224a2f8fc5aSChris Lattner if (*Ptr != ' ' && *Ptr != '\t') { 225a2f8fc5aSChris Lattner NewFile.push_back(*Ptr); 226a2f8fc5aSChris Lattner continue; 227a2f8fc5aSChris Lattner } 228a2f8fc5aSChris Lattner 229a2f8fc5aSChris Lattner // Otherwise, add one space and advance over neighboring space. 230a2f8fc5aSChris Lattner NewFile.push_back(' '); 231a2f8fc5aSChris Lattner while (Ptr+1 != End && 232a2f8fc5aSChris Lattner (Ptr[1] == ' ' || Ptr[1] == '\t')) 233a2f8fc5aSChris Lattner ++Ptr; 234a2f8fc5aSChris Lattner } 235a2f8fc5aSChris Lattner 236a2f8fc5aSChris Lattner // Free the old buffer and return a new one. 237a2f8fc5aSChris Lattner MemoryBuffer *MB2 = 238a2f8fc5aSChris Lattner MemoryBuffer::getMemBufferCopy(NewFile.data(), 239a2f8fc5aSChris Lattner NewFile.data() + NewFile.size(), 240a2f8fc5aSChris Lattner MB->getBufferIdentifier()); 241a2f8fc5aSChris Lattner 242a2f8fc5aSChris Lattner delete MB; 243a2f8fc5aSChris Lattner return MB2; 244a2f8fc5aSChris Lattner } 245a2f8fc5aSChris Lattner 246ee3c74fbSChris Lattner 247ee3c74fbSChris Lattner /// ReadCheckFile - Read the check file, which specifies the sequence of 248ee3c74fbSChris Lattner /// expected strings. The strings are added to the CheckStrings vector. 249ee3c74fbSChris Lattner static bool ReadCheckFile(SourceMgr &SM, 25026cccfe1SChris Lattner std::vector<CheckString> &CheckStrings) { 251ee3c74fbSChris Lattner // Open the check file, and tell SourceMgr about it. 
252ee3c74fbSChris Lattner std::string ErrorStr; 253ee3c74fbSChris Lattner MemoryBuffer *F = 254ee3c74fbSChris Lattner MemoryBuffer::getFileOrSTDIN(CheckFilename.c_str(), &ErrorStr); 255ee3c74fbSChris Lattner if (F == 0) { 256ee3c74fbSChris Lattner errs() << "Could not open check file '" << CheckFilename << "': " 257ee3c74fbSChris Lattner << ErrorStr << '\n'; 258ee3c74fbSChris Lattner return true; 259ee3c74fbSChris Lattner } 260a2f8fc5aSChris Lattner 261a2f8fc5aSChris Lattner // If we want to canonicalize whitespace, strip excess whitespace from the 262a2f8fc5aSChris Lattner // buffer containing the CHECK lines. 263a2f8fc5aSChris Lattner if (!NoCanonicalizeWhiteSpace) 264a2f8fc5aSChris Lattner F = CanonicalizeInputFile(F); 265a2f8fc5aSChris Lattner 266ee3c74fbSChris Lattner SM.AddNewSourceBuffer(F, SMLoc()); 267ee3c74fbSChris Lattner 26810f10cedSChris Lattner // Find all instances of CheckPrefix followed by : in the file. 269caa5fc0cSChris Lattner StringRef Buffer = F->getBuffer(); 270ee3c74fbSChris Lattner 27174d50731SChris Lattner std::vector<std::pair<SMLoc, Pattern> > NotMatches; 272236d2d5eSChris Lattner 273ee3c74fbSChris Lattner while (1) { 274ee3c74fbSChris Lattner // See if Prefix occurs in the memory buffer. 275caa5fc0cSChris Lattner Buffer = Buffer.substr(Buffer.find(CheckPrefix)); 276ee3c74fbSChris Lattner 277ee3c74fbSChris Lattner // If we didn't find a match, we're done. 278caa5fc0cSChris Lattner if (Buffer.empty()) 279ee3c74fbSChris Lattner break; 280ee3c74fbSChris Lattner 281caa5fc0cSChris Lattner const char *CheckPrefixStart = Buffer.data(); 282da108b4eSChris Lattner 283da108b4eSChris Lattner // When we find a check prefix, keep track of whether we find CHECK: or 284da108b4eSChris Lattner // CHECK-NEXT: 285236d2d5eSChris Lattner bool IsCheckNext = false, IsCheckNot = false; 286da108b4eSChris Lattner 28710f10cedSChris Lattner // Verify that the : is present after the prefix. 
288caa5fc0cSChris Lattner if (Buffer[CheckPrefix.size()] == ':') { 289caa5fc0cSChris Lattner Buffer = Buffer.substr(CheckPrefix.size()+1); 290caa5fc0cSChris Lattner } else if (Buffer.size() > CheckPrefix.size()+6 && 291caa5fc0cSChris Lattner memcmp(Buffer.data()+CheckPrefix.size(), "-NEXT:", 6) == 0) { 292caa5fc0cSChris Lattner Buffer = Buffer.substr(CheckPrefix.size()+7); 293da108b4eSChris Lattner IsCheckNext = true; 294236d2d5eSChris Lattner } else if (Buffer.size() > CheckPrefix.size()+5 && 295236d2d5eSChris Lattner memcmp(Buffer.data()+CheckPrefix.size(), "-NOT:", 5) == 0) { 296236d2d5eSChris Lattner Buffer = Buffer.substr(CheckPrefix.size()+6); 297236d2d5eSChris Lattner IsCheckNot = true; 298da108b4eSChris Lattner } else { 299caa5fc0cSChris Lattner Buffer = Buffer.substr(1); 30010f10cedSChris Lattner continue; 30110f10cedSChris Lattner } 30210f10cedSChris Lattner 303ee3c74fbSChris Lattner // Okay, we found the prefix, yay. Remember the rest of the line, but 304ee3c74fbSChris Lattner // ignore leading and trailing whitespace. 305236d2d5eSChris Lattner Buffer = Buffer.substr(Buffer.find_first_not_of(" \t")); 306ee3c74fbSChris Lattner 307ee3c74fbSChris Lattner // Scan ahead to the end of line. 308caa5fc0cSChris Lattner size_t EOL = Buffer.find_first_of("\n\r"); 309ee3c74fbSChris Lattner 31074d50731SChris Lattner // Parse the pattern. 31174d50731SChris Lattner Pattern P; 31274d50731SChris Lattner if (P.ParsePattern(Buffer.substr(0, EOL), SM)) 313ee3c74fbSChris Lattner return true; 314ee3c74fbSChris Lattner 315236d2d5eSChris Lattner Buffer = Buffer.substr(EOL); 31674d50731SChris Lattner 317236d2d5eSChris Lattner 318da108b4eSChris Lattner // Verify that CHECK-NEXT lines have at least one CHECK line before them. 
319da108b4eSChris Lattner if (IsCheckNext && CheckStrings.empty()) { 320da108b4eSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(CheckPrefixStart), 321da108b4eSChris Lattner "found '"+CheckPrefix+"-NEXT:' without previous '"+ 322da108b4eSChris Lattner CheckPrefix+ ": line", "error"); 323da108b4eSChris Lattner return true; 324da108b4eSChris Lattner } 325da108b4eSChris Lattner 32674d50731SChris Lattner // Handle CHECK-NOT. 32774d50731SChris Lattner if (IsCheckNot) { 32874d50731SChris Lattner NotMatches.push_back(std::make_pair(SMLoc::getFromPointer(Buffer.data()), 32974d50731SChris Lattner P)); 33074d50731SChris Lattner continue; 33174d50731SChris Lattner } 33274d50731SChris Lattner 3333b40b445SChris Lattner 334ee3c74fbSChris Lattner // Okay, add the string we captured to the output vector and move on. 3353b40b445SChris Lattner CheckStrings.push_back(CheckString(P, 336caa5fc0cSChris Lattner SMLoc::getFromPointer(Buffer.data()), 337da108b4eSChris Lattner IsCheckNext)); 338236d2d5eSChris Lattner std::swap(NotMatches, CheckStrings.back().NotStrings); 339ee3c74fbSChris Lattner } 340ee3c74fbSChris Lattner 341ee3c74fbSChris Lattner if (CheckStrings.empty()) { 34210f10cedSChris Lattner errs() << "error: no check strings found with prefix '" << CheckPrefix 34310f10cedSChris Lattner << ":'\n"; 344ee3c74fbSChris Lattner return true; 345ee3c74fbSChris Lattner } 346ee3c74fbSChris Lattner 347236d2d5eSChris Lattner if (!NotMatches.empty()) { 348236d2d5eSChris Lattner errs() << "error: '" << CheckPrefix 349236d2d5eSChris Lattner << "-NOT:' not supported after last check line.\n"; 350236d2d5eSChris Lattner return true; 351236d2d5eSChris Lattner } 352236d2d5eSChris Lattner 353ee3c74fbSChris Lattner return false; 354ee3c74fbSChris Lattner } 355ee3c74fbSChris Lattner 356da108b4eSChris Lattner static void PrintCheckFailed(const SourceMgr &SM, const CheckString &CheckStr, 357caa5fc0cSChris Lattner StringRef Buffer) { 358da108b4eSChris Lattner // Otherwise, we have an error, emit an 
error message. 359da108b4eSChris Lattner SM.PrintMessage(CheckStr.Loc, "expected string not found in input", 360da108b4eSChris Lattner "error"); 361da108b4eSChris Lattner 362da108b4eSChris Lattner // Print the "scanning from here" line. If the current position is at the 363da108b4eSChris Lattner // end of a line, advance to the start of the next line. 364caa5fc0cSChris Lattner Buffer = Buffer.substr(Buffer.find_first_not_of(" \t\n\r")); 365da108b4eSChris Lattner 366caa5fc0cSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), "scanning from here", 367da108b4eSChris Lattner "note"); 368da108b4eSChris Lattner } 369da108b4eSChris Lattner 37037183584SChris Lattner /// CountNumNewlinesBetween - Count the number of newlines in the specified 37137183584SChris Lattner /// range. 37237183584SChris Lattner static unsigned CountNumNewlinesBetween(StringRef Range) { 373da108b4eSChris Lattner unsigned NumNewLines = 0; 37437183584SChris Lattner while (1) { 375da108b4eSChris Lattner // Scan for newline. 37637183584SChris Lattner Range = Range.substr(Range.find_first_of("\n\r")); 37737183584SChris Lattner if (Range.empty()) return NumNewLines; 378da108b4eSChris Lattner 379da108b4eSChris Lattner ++NumNewLines; 380da108b4eSChris Lattner 381da108b4eSChris Lattner // Handle \n\r and \r\n as a single newline. 
38237183584SChris Lattner if (Range.size() > 1 && 38337183584SChris Lattner (Range[1] == '\n' || Range[1] == '\r') && 38437183584SChris Lattner (Range[0] != Range[1])) 38537183584SChris Lattner Range = Range.substr(1); 38637183584SChris Lattner Range = Range.substr(1); 387da108b4eSChris Lattner } 388da108b4eSChris Lattner } 389da108b4eSChris Lattner 390ee3c74fbSChris Lattner int main(int argc, char **argv) { 391ee3c74fbSChris Lattner sys::PrintStackTraceOnErrorSignal(); 392ee3c74fbSChris Lattner PrettyStackTraceProgram X(argc, argv); 393ee3c74fbSChris Lattner cl::ParseCommandLineOptions(argc, argv); 394ee3c74fbSChris Lattner 395ee3c74fbSChris Lattner SourceMgr SM; 396ee3c74fbSChris Lattner 397ee3c74fbSChris Lattner // Read the expected strings from the check file. 39826cccfe1SChris Lattner std::vector<CheckString> CheckStrings; 399ee3c74fbSChris Lattner if (ReadCheckFile(SM, CheckStrings)) 400ee3c74fbSChris Lattner return 2; 401ee3c74fbSChris Lattner 402ee3c74fbSChris Lattner // Open the file to check and add it to SourceMgr. 403ee3c74fbSChris Lattner std::string ErrorStr; 404ee3c74fbSChris Lattner MemoryBuffer *F = 405ee3c74fbSChris Lattner MemoryBuffer::getFileOrSTDIN(InputFilename.c_str(), &ErrorStr); 406ee3c74fbSChris Lattner if (F == 0) { 407ee3c74fbSChris Lattner errs() << "Could not open input file '" << InputFilename << "': " 408ee3c74fbSChris Lattner << ErrorStr << '\n'; 409ee3c74fbSChris Lattner return true; 410ee3c74fbSChris Lattner } 4112c3e5cdfSChris Lattner 4122c3e5cdfSChris Lattner // Remove duplicate spaces in the input file if requested. 4132c3e5cdfSChris Lattner if (!NoCanonicalizeWhiteSpace) 4142c3e5cdfSChris Lattner F = CanonicalizeInputFile(F); 4152c3e5cdfSChris Lattner 416ee3c74fbSChris Lattner SM.AddNewSourceBuffer(F, SMLoc()); 417ee3c74fbSChris Lattner 418ee3c74fbSChris Lattner // Check that we have all of the expected strings, in order, in the input 419ee3c74fbSChris Lattner // file. 
420caa5fc0cSChris Lattner StringRef Buffer = F->getBuffer(); 421ee3c74fbSChris Lattner 422236d2d5eSChris Lattner const char *LastMatch = Buffer.data(); 423236d2d5eSChris Lattner 424ee3c74fbSChris Lattner for (unsigned StrNo = 0, e = CheckStrings.size(); StrNo != e; ++StrNo) { 42526cccfe1SChris Lattner const CheckString &CheckStr = CheckStrings[StrNo]; 426ee3c74fbSChris Lattner 427caa5fc0cSChris Lattner StringRef SearchFrom = Buffer; 428caa5fc0cSChris Lattner 429ee3c74fbSChris Lattner // Find StrNo in the file. 4303b40b445SChris Lattner size_t MatchLen = 0; 4313b40b445SChris Lattner Buffer = Buffer.substr(CheckStr.Pat.Match(Buffer, MatchLen)); 432ee3c74fbSChris Lattner 433da108b4eSChris Lattner // If we didn't find a match, reject the input. 434caa5fc0cSChris Lattner if (Buffer.empty()) { 435caa5fc0cSChris Lattner PrintCheckFailed(SM, CheckStr, SearchFrom); 436da108b4eSChris Lattner return 1; 437ee3c74fbSChris Lattner } 438ee3c74fbSChris Lattner 43937183584SChris Lattner StringRef SkippedRegion(LastMatch, Buffer.data()-LastMatch); 44037183584SChris Lattner 441da108b4eSChris Lattner // If this check is a "CHECK-NEXT", verify that the previous match was on 442da108b4eSChris Lattner // the previous line (i.e. that there is one newline between them). 443da108b4eSChris Lattner if (CheckStr.IsCheckNext) { 444da108b4eSChris Lattner // Count the number of newlines between the previous match and this one. 
445236d2d5eSChris Lattner assert(LastMatch != F->getBufferStart() && 446236d2d5eSChris Lattner "CHECK-NEXT can't be the first check in a file"); 447da108b4eSChris Lattner 44837183584SChris Lattner unsigned NumNewLines = CountNumNewlinesBetween(SkippedRegion); 449da108b4eSChris Lattner if (NumNewLines == 0) { 450107c21eaSChris Lattner SM.PrintMessage(CheckStr.Loc, 451da108b4eSChris Lattner CheckPrefix+"-NEXT: is on the same line as previous match", 452ee3c74fbSChris Lattner "error"); 453caa5fc0cSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), 454107c21eaSChris Lattner "'next' match was here", "note"); 455da108b4eSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(LastMatch), 456da108b4eSChris Lattner "previous match was here", "note"); 457aedd8185SChris Lattner return 1; 458ee3c74fbSChris Lattner } 459ee3c74fbSChris Lattner 460da108b4eSChris Lattner if (NumNewLines != 1) { 461107c21eaSChris Lattner SM.PrintMessage(CheckStr.Loc, 462da108b4eSChris Lattner CheckPrefix+ 463da108b4eSChris Lattner "-NEXT: is not on the line after the previous match", 464da108b4eSChris Lattner "error"); 465caa5fc0cSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), 466107c21eaSChris Lattner "'next' match was here", "note"); 467da108b4eSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(LastMatch), 468da108b4eSChris Lattner "previous match was here", "note"); 469da108b4eSChris Lattner return 1; 470da108b4eSChris Lattner } 471da108b4eSChris Lattner } 472da108b4eSChris Lattner 473236d2d5eSChris Lattner // If this match had "not strings", verify that they don't exist in the 474236d2d5eSChris Lattner // skipped region. 
475*f08d2db9SChris Lattner for (unsigned ChunkNo = 0, e = CheckStr.NotStrings.size(); ChunkNo != e; ++ChunkNo) { 47674d50731SChris Lattner size_t MatchLen = 0; 477*f08d2db9SChris Lattner size_t Pos = CheckStr.NotStrings[ChunkNo].second.Match(SkippedRegion, MatchLen); 478236d2d5eSChris Lattner if (Pos == StringRef::npos) continue; 479236d2d5eSChris Lattner 480236d2d5eSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(LastMatch+Pos), 481236d2d5eSChris Lattner CheckPrefix+"-NOT: string occurred!", "error"); 482*f08d2db9SChris Lattner SM.PrintMessage(CheckStr.NotStrings[ChunkNo].first, 483236d2d5eSChris Lattner CheckPrefix+"-NOT: pattern specified here", "note"); 484236d2d5eSChris Lattner return 1; 485236d2d5eSChris Lattner } 486236d2d5eSChris Lattner 487236d2d5eSChris Lattner 488b9f2bf46SChris Lattner // Otherwise, everything is good. Step over the matched text and remember 489b9f2bf46SChris Lattner // the position after the match as the end of the last match. 4903b40b445SChris Lattner Buffer = Buffer.substr(MatchLen); 491b9f2bf46SChris Lattner LastMatch = Buffer.data(); 492da108b4eSChris Lattner } 493da108b4eSChris Lattner 494ee3c74fbSChris Lattner return 0; 495ee3c74fbSChris Lattner } 496