//===- FileCheck.cpp - Check that File's Contents match what is expected --===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// FileCheck does a line-by-line check of a file that validates whether it
// contains the expected content.  This is useful for regression tests etc.
//
// This program exits with an error status of 2 on error, exit status of 0 if
// the file matched the expected contents, and exit status of 1 if it did not
// contain the expected contents.
16ee3c74fbSChris Lattner // 17ee3c74fbSChris Lattner //===----------------------------------------------------------------------===// 18ee3c74fbSChris Lattner 19ee3c74fbSChris Lattner #include "llvm/Support/CommandLine.h" 20ee3c74fbSChris Lattner #include "llvm/Support/MemoryBuffer.h" 21ee3c74fbSChris Lattner #include "llvm/Support/PrettyStackTrace.h" 22f08d2db9SChris Lattner #include "llvm/Support/Regex.h" 23ee3c74fbSChris Lattner #include "llvm/Support/SourceMgr.h" 24ee3c74fbSChris Lattner #include "llvm/Support/raw_ostream.h" 25ee3c74fbSChris Lattner #include "llvm/System/Signals.h" 26ee3c74fbSChris Lattner using namespace llvm; 27ee3c74fbSChris Lattner 28ee3c74fbSChris Lattner static cl::opt<std::string> 29ee3c74fbSChris Lattner CheckFilename(cl::Positional, cl::desc("<check-file>"), cl::Required); 30ee3c74fbSChris Lattner 31ee3c74fbSChris Lattner static cl::opt<std::string> 32ee3c74fbSChris Lattner InputFilename("input-file", cl::desc("File to check (defaults to stdin)"), 33ee3c74fbSChris Lattner cl::init("-"), cl::value_desc("filename")); 34ee3c74fbSChris Lattner 35ee3c74fbSChris Lattner static cl::opt<std::string> 36ee3c74fbSChris Lattner CheckPrefix("check-prefix", cl::init("CHECK"), 37ee3c74fbSChris Lattner cl::desc("Prefix to use from check file (defaults to 'CHECK')")); 38ee3c74fbSChris Lattner 392c3e5cdfSChris Lattner static cl::opt<bool> 402c3e5cdfSChris Lattner NoCanonicalizeWhiteSpace("strict-whitespace", 412c3e5cdfSChris Lattner cl::desc("Do not treat all horizontal whitespace as equivalent")); 422c3e5cdfSChris Lattner 4374d50731SChris Lattner //===----------------------------------------------------------------------===// 4474d50731SChris Lattner // Pattern Handling Code. 
4574d50731SChris Lattner //===----------------------------------------------------------------------===// 4674d50731SChris Lattner 473b40b445SChris Lattner class Pattern { 48*b16ab0c4SChris Lattner /// FixedStr - If non-empty, this pattern is a fixed string match with the 49*b16ab0c4SChris Lattner /// specified fixed string. 50221460e0SChris Lattner StringRef FixedStr; 51*b16ab0c4SChris Lattner 52*b16ab0c4SChris Lattner /// RegEx - If non-empty, this is a regex pattern. 53*b16ab0c4SChris Lattner std::string RegExStr; 543b40b445SChris Lattner public: 553b40b445SChris Lattner 5674d50731SChris Lattner Pattern() { } 5774d50731SChris Lattner 5874d50731SChris Lattner bool ParsePattern(StringRef PatternStr, SourceMgr &SM); 593b40b445SChris Lattner 603b40b445SChris Lattner /// Match - Match the pattern string against the input buffer Buffer. This 613b40b445SChris Lattner /// returns the position that is matched or npos if there is no match. If 623b40b445SChris Lattner /// there is a match, the size of the matched string is returned in MatchLen. 63f08d2db9SChris Lattner size_t Match(StringRef Buffer, size_t &MatchLen) const; 64*b16ab0c4SChris Lattner 65*b16ab0c4SChris Lattner private: 66*b16ab0c4SChris Lattner void AddFixedStringToRegEx(StringRef FixedStr); 673b40b445SChris Lattner }; 683b40b445SChris Lattner 6974d50731SChris Lattner bool Pattern::ParsePattern(StringRef PatternStr, SourceMgr &SM) { 7074d50731SChris Lattner // Ignore trailing whitespace. 7174d50731SChris Lattner while (!PatternStr.empty() && 7274d50731SChris Lattner (PatternStr.back() == ' ' || PatternStr.back() == '\t')) 7374d50731SChris Lattner PatternStr = PatternStr.substr(0, PatternStr.size()-1); 7474d50731SChris Lattner 7574d50731SChris Lattner // Check that there is something on the line. 
7674d50731SChris Lattner if (PatternStr.empty()) { 7774d50731SChris Lattner SM.PrintMessage(SMLoc::getFromPointer(PatternStr.data()), 7874d50731SChris Lattner "found empty check string with prefix '"+CheckPrefix+":'", 7974d50731SChris Lattner "error"); 8074d50731SChris Lattner return true; 8174d50731SChris Lattner } 8274d50731SChris Lattner 83221460e0SChris Lattner // Check to see if this is a fixed string, or if it has regex pieces. 84221460e0SChris Lattner if (PatternStr.size() < 2 || PatternStr.find("{{") == StringRef::npos) { 85221460e0SChris Lattner FixedStr = PatternStr; 86221460e0SChris Lattner return false; 87221460e0SChris Lattner } 88221460e0SChris Lattner 89*b16ab0c4SChris Lattner // Otherwise, there is at least one regex piece. Build up the regex pattern 90*b16ab0c4SChris Lattner // by escaping scary characters in fixed strings, building up one big regex. 91f08d2db9SChris Lattner while (!PatternStr.empty()) { 92f08d2db9SChris Lattner // Handle fixed string matches. 93f08d2db9SChris Lattner if (PatternStr.size() < 2 || 94f08d2db9SChris Lattner PatternStr[0] != '{' || PatternStr[1] != '{') { 95f08d2db9SChris Lattner // Find the end, which is the start of the next regex. 96f08d2db9SChris Lattner size_t FixedMatchEnd = PatternStr.find("{{"); 97*b16ab0c4SChris Lattner AddFixedStringToRegEx(PatternStr.substr(0, FixedMatchEnd)); 98f08d2db9SChris Lattner PatternStr = PatternStr.substr(FixedMatchEnd); 99f08d2db9SChris Lattner continue; 100f08d2db9SChris Lattner } 10174d50731SChris Lattner 102f08d2db9SChris Lattner // Otherwise, this is the start of a regex match. Scan for the }}. 
103f08d2db9SChris Lattner size_t End = PatternStr.find("}}"); 104f08d2db9SChris Lattner if (End == StringRef::npos) { 105f08d2db9SChris Lattner SM.PrintMessage(SMLoc::getFromPointer(PatternStr.data()), 106f08d2db9SChris Lattner "found start of regex string with no end '}}'", "error"); 107f08d2db9SChris Lattner return true; 108f08d2db9SChris Lattner } 109f08d2db9SChris Lattner 110*b16ab0c4SChris Lattner StringRef RegexStr = PatternStr.substr(2, End-2); 111*b16ab0c4SChris Lattner Regex R(RegexStr); 112f08d2db9SChris Lattner std::string Error; 113f08d2db9SChris Lattner if (!R.isValid(Error)) { 114f08d2db9SChris Lattner SM.PrintMessage(SMLoc::getFromPointer(PatternStr.data()+2), 115f08d2db9SChris Lattner "invalid regex: " + Error, "error"); 116f08d2db9SChris Lattner return true; 117f08d2db9SChris Lattner } 118f08d2db9SChris Lattner 119*b16ab0c4SChris Lattner RegExStr += RegexStr.str(); 120f08d2db9SChris Lattner PatternStr = PatternStr.substr(End+2); 121f08d2db9SChris Lattner } 122f08d2db9SChris Lattner 12374d50731SChris Lattner return false; 12474d50731SChris Lattner } 12574d50731SChris Lattner 126*b16ab0c4SChris Lattner void Pattern::AddFixedStringToRegEx(StringRef FixedStr) { 127*b16ab0c4SChris Lattner // Add the characters from FixedStr to the regex, escaping as needed. This 128*b16ab0c4SChris Lattner // avoids "leaning toothpicks" in common patterns. 129*b16ab0c4SChris Lattner for (unsigned i = 0, e = FixedStr.size(); i != e; ++i) { 130*b16ab0c4SChris Lattner switch (FixedStr[i]) { 131*b16ab0c4SChris Lattner // These are the special characters matched in "p_ere_exp". 
132*b16ab0c4SChris Lattner case '(': 133*b16ab0c4SChris Lattner case ')': 134*b16ab0c4SChris Lattner case '^': 135*b16ab0c4SChris Lattner case '$': 136*b16ab0c4SChris Lattner case '|': 137*b16ab0c4SChris Lattner case '*': 138*b16ab0c4SChris Lattner case '+': 139*b16ab0c4SChris Lattner case '?': 140*b16ab0c4SChris Lattner case '.': 141*b16ab0c4SChris Lattner case '[': 142*b16ab0c4SChris Lattner case '\\': 143*b16ab0c4SChris Lattner case '{': 144*b16ab0c4SChris Lattner RegExStr += '\\'; 145*b16ab0c4SChris Lattner // FALL THROUGH. 146*b16ab0c4SChris Lattner default: 147*b16ab0c4SChris Lattner RegExStr += FixedStr[i]; 148*b16ab0c4SChris Lattner break; 149*b16ab0c4SChris Lattner } 150*b16ab0c4SChris Lattner } 151*b16ab0c4SChris Lattner } 152*b16ab0c4SChris Lattner 153*b16ab0c4SChris Lattner 154f08d2db9SChris Lattner /// Match - Match the pattern string against the input buffer Buffer. This 155f08d2db9SChris Lattner /// returns the position that is matched or npos if there is no match. If 156f08d2db9SChris Lattner /// there is a match, the size of the matched string is returned in MatchLen. 157f08d2db9SChris Lattner size_t Pattern::Match(StringRef Buffer, size_t &MatchLen) const { 158221460e0SChris Lattner // If this is a fixed string pattern, just match it now. 159221460e0SChris Lattner if (!FixedStr.empty()) { 160221460e0SChris Lattner MatchLen = FixedStr.size(); 161221460e0SChris Lattner return Buffer.find(FixedStr); 162221460e0SChris Lattner } 163221460e0SChris Lattner 164*b16ab0c4SChris Lattner // Regex match. 165*b16ab0c4SChris Lattner SmallVector<StringRef, 4> MatchInfo; 166*b16ab0c4SChris Lattner if (!Regex(RegExStr, Regex::Sub|Regex::Newline).match(Buffer, &MatchInfo)) 167f08d2db9SChris Lattner return StringRef::npos; 168*b16ab0c4SChris Lattner 169*b16ab0c4SChris Lattner // Successful regex match. 
170*b16ab0c4SChris Lattner assert(!MatchInfo.empty() && "Didn't get any match"); 171*b16ab0c4SChris Lattner StringRef FullMatch = MatchInfo[0]; 172*b16ab0c4SChris Lattner 173*b16ab0c4SChris Lattner MatchLen = FullMatch.size(); 174*b16ab0c4SChris Lattner return FullMatch.data()-Buffer.data(); 175f08d2db9SChris Lattner } 176f08d2db9SChris Lattner 17774d50731SChris Lattner 17874d50731SChris Lattner //===----------------------------------------------------------------------===// 17974d50731SChris Lattner // Check Strings. 18074d50731SChris Lattner //===----------------------------------------------------------------------===// 1813b40b445SChris Lattner 1823b40b445SChris Lattner /// CheckString - This is a check that we found in the input file. 1833b40b445SChris Lattner struct CheckString { 1843b40b445SChris Lattner /// Pat - The pattern to match. 1853b40b445SChris Lattner Pattern Pat; 18626cccfe1SChris Lattner 18726cccfe1SChris Lattner /// Loc - The location in the match file that the check string was specified. 18826cccfe1SChris Lattner SMLoc Loc; 18926cccfe1SChris Lattner 190da108b4eSChris Lattner /// IsCheckNext - This is true if this is a CHECK-NEXT: directive (as opposed 191da108b4eSChris Lattner /// to a CHECK: directive. 192da108b4eSChris Lattner bool IsCheckNext; 193da108b4eSChris Lattner 194236d2d5eSChris Lattner /// NotStrings - These are all of the strings that are disallowed from 195236d2d5eSChris Lattner /// occurring between this match string and the previous one (or start of 196236d2d5eSChris Lattner /// file). 
19774d50731SChris Lattner std::vector<std::pair<SMLoc, Pattern> > NotStrings; 198236d2d5eSChris Lattner 1993b40b445SChris Lattner CheckString(const Pattern &P, SMLoc L, bool isCheckNext) 2003b40b445SChris Lattner : Pat(P), Loc(L), IsCheckNext(isCheckNext) {} 20126cccfe1SChris Lattner }; 20226cccfe1SChris Lattner 203a2f8fc5aSChris Lattner /// CanonicalizeInputFile - Remove duplicate horizontal space from the specified 204a2f8fc5aSChris Lattner /// memory buffer, free it, and return a new one. 205a2f8fc5aSChris Lattner static MemoryBuffer *CanonicalizeInputFile(MemoryBuffer *MB) { 206a2f8fc5aSChris Lattner SmallVector<char, 16> NewFile; 207a2f8fc5aSChris Lattner NewFile.reserve(MB->getBufferSize()); 208a2f8fc5aSChris Lattner 209a2f8fc5aSChris Lattner for (const char *Ptr = MB->getBufferStart(), *End = MB->getBufferEnd(); 210a2f8fc5aSChris Lattner Ptr != End; ++Ptr) { 211a2f8fc5aSChris Lattner // If C is not a horizontal whitespace, skip it. 212a2f8fc5aSChris Lattner if (*Ptr != ' ' && *Ptr != '\t') { 213a2f8fc5aSChris Lattner NewFile.push_back(*Ptr); 214a2f8fc5aSChris Lattner continue; 215a2f8fc5aSChris Lattner } 216a2f8fc5aSChris Lattner 217a2f8fc5aSChris Lattner // Otherwise, add one space and advance over neighboring space. 218a2f8fc5aSChris Lattner NewFile.push_back(' '); 219a2f8fc5aSChris Lattner while (Ptr+1 != End && 220a2f8fc5aSChris Lattner (Ptr[1] == ' ' || Ptr[1] == '\t')) 221a2f8fc5aSChris Lattner ++Ptr; 222a2f8fc5aSChris Lattner } 223a2f8fc5aSChris Lattner 224a2f8fc5aSChris Lattner // Free the old buffer and return a new one. 
225a2f8fc5aSChris Lattner MemoryBuffer *MB2 = 226a2f8fc5aSChris Lattner MemoryBuffer::getMemBufferCopy(NewFile.data(), 227a2f8fc5aSChris Lattner NewFile.data() + NewFile.size(), 228a2f8fc5aSChris Lattner MB->getBufferIdentifier()); 229a2f8fc5aSChris Lattner 230a2f8fc5aSChris Lattner delete MB; 231a2f8fc5aSChris Lattner return MB2; 232a2f8fc5aSChris Lattner } 233a2f8fc5aSChris Lattner 234ee3c74fbSChris Lattner 235ee3c74fbSChris Lattner /// ReadCheckFile - Read the check file, which specifies the sequence of 236ee3c74fbSChris Lattner /// expected strings. The strings are added to the CheckStrings vector. 237ee3c74fbSChris Lattner static bool ReadCheckFile(SourceMgr &SM, 23826cccfe1SChris Lattner std::vector<CheckString> &CheckStrings) { 239ee3c74fbSChris Lattner // Open the check file, and tell SourceMgr about it. 240ee3c74fbSChris Lattner std::string ErrorStr; 241ee3c74fbSChris Lattner MemoryBuffer *F = 242ee3c74fbSChris Lattner MemoryBuffer::getFileOrSTDIN(CheckFilename.c_str(), &ErrorStr); 243ee3c74fbSChris Lattner if (F == 0) { 244ee3c74fbSChris Lattner errs() << "Could not open check file '" << CheckFilename << "': " 245ee3c74fbSChris Lattner << ErrorStr << '\n'; 246ee3c74fbSChris Lattner return true; 247ee3c74fbSChris Lattner } 248a2f8fc5aSChris Lattner 249a2f8fc5aSChris Lattner // If we want to canonicalize whitespace, strip excess whitespace from the 250a2f8fc5aSChris Lattner // buffer containing the CHECK lines. 251a2f8fc5aSChris Lattner if (!NoCanonicalizeWhiteSpace) 252a2f8fc5aSChris Lattner F = CanonicalizeInputFile(F); 253a2f8fc5aSChris Lattner 254ee3c74fbSChris Lattner SM.AddNewSourceBuffer(F, SMLoc()); 255ee3c74fbSChris Lattner 25610f10cedSChris Lattner // Find all instances of CheckPrefix followed by : in the file. 
257caa5fc0cSChris Lattner StringRef Buffer = F->getBuffer(); 258ee3c74fbSChris Lattner 25974d50731SChris Lattner std::vector<std::pair<SMLoc, Pattern> > NotMatches; 260236d2d5eSChris Lattner 261ee3c74fbSChris Lattner while (1) { 262ee3c74fbSChris Lattner // See if Prefix occurs in the memory buffer. 263caa5fc0cSChris Lattner Buffer = Buffer.substr(Buffer.find(CheckPrefix)); 264ee3c74fbSChris Lattner 265ee3c74fbSChris Lattner // If we didn't find a match, we're done. 266caa5fc0cSChris Lattner if (Buffer.empty()) 267ee3c74fbSChris Lattner break; 268ee3c74fbSChris Lattner 269caa5fc0cSChris Lattner const char *CheckPrefixStart = Buffer.data(); 270da108b4eSChris Lattner 271da108b4eSChris Lattner // When we find a check prefix, keep track of whether we find CHECK: or 272da108b4eSChris Lattner // CHECK-NEXT: 273236d2d5eSChris Lattner bool IsCheckNext = false, IsCheckNot = false; 274da108b4eSChris Lattner 27510f10cedSChris Lattner // Verify that the : is present after the prefix. 276caa5fc0cSChris Lattner if (Buffer[CheckPrefix.size()] == ':') { 277caa5fc0cSChris Lattner Buffer = Buffer.substr(CheckPrefix.size()+1); 278caa5fc0cSChris Lattner } else if (Buffer.size() > CheckPrefix.size()+6 && 279caa5fc0cSChris Lattner memcmp(Buffer.data()+CheckPrefix.size(), "-NEXT:", 6) == 0) { 280caa5fc0cSChris Lattner Buffer = Buffer.substr(CheckPrefix.size()+7); 281da108b4eSChris Lattner IsCheckNext = true; 282236d2d5eSChris Lattner } else if (Buffer.size() > CheckPrefix.size()+5 && 283236d2d5eSChris Lattner memcmp(Buffer.data()+CheckPrefix.size(), "-NOT:", 5) == 0) { 284236d2d5eSChris Lattner Buffer = Buffer.substr(CheckPrefix.size()+6); 285236d2d5eSChris Lattner IsCheckNot = true; 286da108b4eSChris Lattner } else { 287caa5fc0cSChris Lattner Buffer = Buffer.substr(1); 28810f10cedSChris Lattner continue; 28910f10cedSChris Lattner } 29010f10cedSChris Lattner 291ee3c74fbSChris Lattner // Okay, we found the prefix, yay. 
Remember the rest of the line, but 292ee3c74fbSChris Lattner // ignore leading and trailing whitespace. 293236d2d5eSChris Lattner Buffer = Buffer.substr(Buffer.find_first_not_of(" \t")); 294ee3c74fbSChris Lattner 295ee3c74fbSChris Lattner // Scan ahead to the end of line. 296caa5fc0cSChris Lattner size_t EOL = Buffer.find_first_of("\n\r"); 297ee3c74fbSChris Lattner 29874d50731SChris Lattner // Parse the pattern. 29974d50731SChris Lattner Pattern P; 30074d50731SChris Lattner if (P.ParsePattern(Buffer.substr(0, EOL), SM)) 301ee3c74fbSChris Lattner return true; 302ee3c74fbSChris Lattner 303236d2d5eSChris Lattner Buffer = Buffer.substr(EOL); 30474d50731SChris Lattner 305236d2d5eSChris Lattner 306da108b4eSChris Lattner // Verify that CHECK-NEXT lines have at least one CHECK line before them. 307da108b4eSChris Lattner if (IsCheckNext && CheckStrings.empty()) { 308da108b4eSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(CheckPrefixStart), 309da108b4eSChris Lattner "found '"+CheckPrefix+"-NEXT:' without previous '"+ 310da108b4eSChris Lattner CheckPrefix+ ": line", "error"); 311da108b4eSChris Lattner return true; 312da108b4eSChris Lattner } 313da108b4eSChris Lattner 31474d50731SChris Lattner // Handle CHECK-NOT. 31574d50731SChris Lattner if (IsCheckNot) { 31674d50731SChris Lattner NotMatches.push_back(std::make_pair(SMLoc::getFromPointer(Buffer.data()), 31774d50731SChris Lattner P)); 31874d50731SChris Lattner continue; 31974d50731SChris Lattner } 32074d50731SChris Lattner 3213b40b445SChris Lattner 322ee3c74fbSChris Lattner // Okay, add the string we captured to the output vector and move on. 
3233b40b445SChris Lattner CheckStrings.push_back(CheckString(P, 324caa5fc0cSChris Lattner SMLoc::getFromPointer(Buffer.data()), 325da108b4eSChris Lattner IsCheckNext)); 326236d2d5eSChris Lattner std::swap(NotMatches, CheckStrings.back().NotStrings); 327ee3c74fbSChris Lattner } 328ee3c74fbSChris Lattner 329ee3c74fbSChris Lattner if (CheckStrings.empty()) { 33010f10cedSChris Lattner errs() << "error: no check strings found with prefix '" << CheckPrefix 33110f10cedSChris Lattner << ":'\n"; 332ee3c74fbSChris Lattner return true; 333ee3c74fbSChris Lattner } 334ee3c74fbSChris Lattner 335236d2d5eSChris Lattner if (!NotMatches.empty()) { 336236d2d5eSChris Lattner errs() << "error: '" << CheckPrefix 337236d2d5eSChris Lattner << "-NOT:' not supported after last check line.\n"; 338236d2d5eSChris Lattner return true; 339236d2d5eSChris Lattner } 340236d2d5eSChris Lattner 341ee3c74fbSChris Lattner return false; 342ee3c74fbSChris Lattner } 343ee3c74fbSChris Lattner 344da108b4eSChris Lattner static void PrintCheckFailed(const SourceMgr &SM, const CheckString &CheckStr, 345caa5fc0cSChris Lattner StringRef Buffer) { 346da108b4eSChris Lattner // Otherwise, we have an error, emit an error message. 347da108b4eSChris Lattner SM.PrintMessage(CheckStr.Loc, "expected string not found in input", 348da108b4eSChris Lattner "error"); 349da108b4eSChris Lattner 350da108b4eSChris Lattner // Print the "scanning from here" line. If the current position is at the 351da108b4eSChris Lattner // end of a line, advance to the start of the next line. 352caa5fc0cSChris Lattner Buffer = Buffer.substr(Buffer.find_first_not_of(" \t\n\r")); 353da108b4eSChris Lattner 354caa5fc0cSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), "scanning from here", 355da108b4eSChris Lattner "note"); 356da108b4eSChris Lattner } 357da108b4eSChris Lattner 35837183584SChris Lattner /// CountNumNewlinesBetween - Count the number of newlines in the specified 35937183584SChris Lattner /// range. 
36037183584SChris Lattner static unsigned CountNumNewlinesBetween(StringRef Range) { 361da108b4eSChris Lattner unsigned NumNewLines = 0; 36237183584SChris Lattner while (1) { 363da108b4eSChris Lattner // Scan for newline. 36437183584SChris Lattner Range = Range.substr(Range.find_first_of("\n\r")); 36537183584SChris Lattner if (Range.empty()) return NumNewLines; 366da108b4eSChris Lattner 367da108b4eSChris Lattner ++NumNewLines; 368da108b4eSChris Lattner 369da108b4eSChris Lattner // Handle \n\r and \r\n as a single newline. 37037183584SChris Lattner if (Range.size() > 1 && 37137183584SChris Lattner (Range[1] == '\n' || Range[1] == '\r') && 37237183584SChris Lattner (Range[0] != Range[1])) 37337183584SChris Lattner Range = Range.substr(1); 37437183584SChris Lattner Range = Range.substr(1); 375da108b4eSChris Lattner } 376da108b4eSChris Lattner } 377da108b4eSChris Lattner 378ee3c74fbSChris Lattner int main(int argc, char **argv) { 379ee3c74fbSChris Lattner sys::PrintStackTraceOnErrorSignal(); 380ee3c74fbSChris Lattner PrettyStackTraceProgram X(argc, argv); 381ee3c74fbSChris Lattner cl::ParseCommandLineOptions(argc, argv); 382ee3c74fbSChris Lattner 383ee3c74fbSChris Lattner SourceMgr SM; 384ee3c74fbSChris Lattner 385ee3c74fbSChris Lattner // Read the expected strings from the check file. 38626cccfe1SChris Lattner std::vector<CheckString> CheckStrings; 387ee3c74fbSChris Lattner if (ReadCheckFile(SM, CheckStrings)) 388ee3c74fbSChris Lattner return 2; 389ee3c74fbSChris Lattner 390ee3c74fbSChris Lattner // Open the file to check and add it to SourceMgr. 
391ee3c74fbSChris Lattner std::string ErrorStr; 392ee3c74fbSChris Lattner MemoryBuffer *F = 393ee3c74fbSChris Lattner MemoryBuffer::getFileOrSTDIN(InputFilename.c_str(), &ErrorStr); 394ee3c74fbSChris Lattner if (F == 0) { 395ee3c74fbSChris Lattner errs() << "Could not open input file '" << InputFilename << "': " 396ee3c74fbSChris Lattner << ErrorStr << '\n'; 397ee3c74fbSChris Lattner return true; 398ee3c74fbSChris Lattner } 3992c3e5cdfSChris Lattner 4002c3e5cdfSChris Lattner // Remove duplicate spaces in the input file if requested. 4012c3e5cdfSChris Lattner if (!NoCanonicalizeWhiteSpace) 4022c3e5cdfSChris Lattner F = CanonicalizeInputFile(F); 4032c3e5cdfSChris Lattner 404ee3c74fbSChris Lattner SM.AddNewSourceBuffer(F, SMLoc()); 405ee3c74fbSChris Lattner 406ee3c74fbSChris Lattner // Check that we have all of the expected strings, in order, in the input 407ee3c74fbSChris Lattner // file. 408caa5fc0cSChris Lattner StringRef Buffer = F->getBuffer(); 409ee3c74fbSChris Lattner 410236d2d5eSChris Lattner const char *LastMatch = Buffer.data(); 411236d2d5eSChris Lattner 412ee3c74fbSChris Lattner for (unsigned StrNo = 0, e = CheckStrings.size(); StrNo != e; ++StrNo) { 41326cccfe1SChris Lattner const CheckString &CheckStr = CheckStrings[StrNo]; 414ee3c74fbSChris Lattner 415caa5fc0cSChris Lattner StringRef SearchFrom = Buffer; 416caa5fc0cSChris Lattner 417ee3c74fbSChris Lattner // Find StrNo in the file. 4183b40b445SChris Lattner size_t MatchLen = 0; 4193b40b445SChris Lattner Buffer = Buffer.substr(CheckStr.Pat.Match(Buffer, MatchLen)); 420ee3c74fbSChris Lattner 421da108b4eSChris Lattner // If we didn't find a match, reject the input. 
422caa5fc0cSChris Lattner if (Buffer.empty()) { 423caa5fc0cSChris Lattner PrintCheckFailed(SM, CheckStr, SearchFrom); 424da108b4eSChris Lattner return 1; 425ee3c74fbSChris Lattner } 426ee3c74fbSChris Lattner 42737183584SChris Lattner StringRef SkippedRegion(LastMatch, Buffer.data()-LastMatch); 42837183584SChris Lattner 429da108b4eSChris Lattner // If this check is a "CHECK-NEXT", verify that the previous match was on 430da108b4eSChris Lattner // the previous line (i.e. that there is one newline between them). 431da108b4eSChris Lattner if (CheckStr.IsCheckNext) { 432da108b4eSChris Lattner // Count the number of newlines between the previous match and this one. 433236d2d5eSChris Lattner assert(LastMatch != F->getBufferStart() && 434236d2d5eSChris Lattner "CHECK-NEXT can't be the first check in a file"); 435da108b4eSChris Lattner 43637183584SChris Lattner unsigned NumNewLines = CountNumNewlinesBetween(SkippedRegion); 437da108b4eSChris Lattner if (NumNewLines == 0) { 438107c21eaSChris Lattner SM.PrintMessage(CheckStr.Loc, 439da108b4eSChris Lattner CheckPrefix+"-NEXT: is on the same line as previous match", 440ee3c74fbSChris Lattner "error"); 441caa5fc0cSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), 442107c21eaSChris Lattner "'next' match was here", "note"); 443da108b4eSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(LastMatch), 444da108b4eSChris Lattner "previous match was here", "note"); 445aedd8185SChris Lattner return 1; 446ee3c74fbSChris Lattner } 447ee3c74fbSChris Lattner 448da108b4eSChris Lattner if (NumNewLines != 1) { 449107c21eaSChris Lattner SM.PrintMessage(CheckStr.Loc, 450da108b4eSChris Lattner CheckPrefix+ 451da108b4eSChris Lattner "-NEXT: is not on the line after the previous match", 452da108b4eSChris Lattner "error"); 453caa5fc0cSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), 454107c21eaSChris Lattner "'next' match was here", "note"); 455da108b4eSChris Lattner 
SM.PrintMessage(SMLoc::getFromPointer(LastMatch), 456da108b4eSChris Lattner "previous match was here", "note"); 457da108b4eSChris Lattner return 1; 458da108b4eSChris Lattner } 459da108b4eSChris Lattner } 460da108b4eSChris Lattner 461236d2d5eSChris Lattner // If this match had "not strings", verify that they don't exist in the 462236d2d5eSChris Lattner // skipped region. 463f08d2db9SChris Lattner for (unsigned ChunkNo = 0, e = CheckStr.NotStrings.size(); ChunkNo != e; ++ChunkNo) { 46474d50731SChris Lattner size_t MatchLen = 0; 465f08d2db9SChris Lattner size_t Pos = CheckStr.NotStrings[ChunkNo].second.Match(SkippedRegion, MatchLen); 466236d2d5eSChris Lattner if (Pos == StringRef::npos) continue; 467236d2d5eSChris Lattner 468236d2d5eSChris Lattner SM.PrintMessage(SMLoc::getFromPointer(LastMatch+Pos), 469236d2d5eSChris Lattner CheckPrefix+"-NOT: string occurred!", "error"); 470f08d2db9SChris Lattner SM.PrintMessage(CheckStr.NotStrings[ChunkNo].first, 471236d2d5eSChris Lattner CheckPrefix+"-NOT: pattern specified here", "note"); 472236d2d5eSChris Lattner return 1; 473236d2d5eSChris Lattner } 474236d2d5eSChris Lattner 475236d2d5eSChris Lattner 476b9f2bf46SChris Lattner // Otherwise, everything is good. Step over the matched text and remember 477b9f2bf46SChris Lattner // the position after the match as the end of the last match. 4783b40b445SChris Lattner Buffer = Buffer.substr(MatchLen); 479b9f2bf46SChris Lattner LastMatch = Buffer.data(); 480da108b4eSChris Lattner } 481da108b4eSChris Lattner 482ee3c74fbSChris Lattner return 0; 483ee3c74fbSChris Lattner } 484