//===- FileCheck.cpp - Check that File's Contents match what is expected --===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// FileCheck does a line-by-line check of a file that validates whether it
// contains the expected content.  This is useful for regression tests etc.
//
// This file implements most of the API that will be used by the FileCheck utility
// as well as various unittests.
//===----------------------------------------------------------------------===//
155ffd940aSRaphael Isemann 
165ffd940aSRaphael Isemann #include "llvm/FileCheck/FileCheck.h"
175ffd940aSRaphael Isemann #include "FileCheckImpl.h"
185ffd940aSRaphael Isemann #include "llvm/ADT/STLExtras.h"
195ffd940aSRaphael Isemann #include "llvm/ADT/StringSet.h"
205ffd940aSRaphael Isemann #include "llvm/ADT/Twine.h"
215ffd940aSRaphael Isemann #include "llvm/Support/CheckedArithmetic.h"
225ffd940aSRaphael Isemann #include "llvm/Support/FormatVariadic.h"
235ffd940aSRaphael Isemann #include <cstdint>
245ffd940aSRaphael Isemann #include <list>
25871d658cSMircea Trofin #include <set>
265ffd940aSRaphael Isemann #include <tuple>
275ffd940aSRaphael Isemann #include <utility>
285ffd940aSRaphael Isemann 
295ffd940aSRaphael Isemann using namespace llvm;
305ffd940aSRaphael Isemann 
315ffd940aSRaphael Isemann StringRef ExpressionFormat::toString() const {
325ffd940aSRaphael Isemann   switch (Value) {
335ffd940aSRaphael Isemann   case Kind::NoFormat:
345ffd940aSRaphael Isemann     return StringRef("<none>");
355ffd940aSRaphael Isemann   case Kind::Unsigned:
365ffd940aSRaphael Isemann     return StringRef("%u");
375ffd940aSRaphael Isemann   case Kind::Signed:
385ffd940aSRaphael Isemann     return StringRef("%d");
395ffd940aSRaphael Isemann   case Kind::HexUpper:
405ffd940aSRaphael Isemann     return StringRef("%X");
415ffd940aSRaphael Isemann   case Kind::HexLower:
425ffd940aSRaphael Isemann     return StringRef("%x");
435ffd940aSRaphael Isemann   }
445ffd940aSRaphael Isemann   llvm_unreachable("unknown expression format");
455ffd940aSRaphael Isemann }
465ffd940aSRaphael Isemann 
475ffd940aSRaphael Isemann Expected<std::string> ExpressionFormat::getWildcardRegex() const {
485ffd940aSRaphael Isemann   auto CreatePrecisionRegex = [this](StringRef S) {
495ffd940aSRaphael Isemann     return (S + Twine('{') + Twine(Precision) + "}").str();
505ffd940aSRaphael Isemann   };
515ffd940aSRaphael Isemann 
525ffd940aSRaphael Isemann   switch (Value) {
535ffd940aSRaphael Isemann   case Kind::Unsigned:
545ffd940aSRaphael Isemann     if (Precision)
555ffd940aSRaphael Isemann       return CreatePrecisionRegex("([1-9][0-9]*)?[0-9]");
565ffd940aSRaphael Isemann     return std::string("[0-9]+");
575ffd940aSRaphael Isemann   case Kind::Signed:
585ffd940aSRaphael Isemann     if (Precision)
595ffd940aSRaphael Isemann       return CreatePrecisionRegex("-?([1-9][0-9]*)?[0-9]");
605ffd940aSRaphael Isemann     return std::string("-?[0-9]+");
615ffd940aSRaphael Isemann   case Kind::HexUpper:
625ffd940aSRaphael Isemann     if (Precision)
635ffd940aSRaphael Isemann       return CreatePrecisionRegex("([1-9A-F][0-9A-F]*)?[0-9A-F]");
645ffd940aSRaphael Isemann     return std::string("[0-9A-F]+");
655ffd940aSRaphael Isemann   case Kind::HexLower:
665ffd940aSRaphael Isemann     if (Precision)
675ffd940aSRaphael Isemann       return CreatePrecisionRegex("([1-9a-f][0-9a-f]*)?[0-9a-f]");
685ffd940aSRaphael Isemann     return std::string("[0-9a-f]+");
695ffd940aSRaphael Isemann   default:
705ffd940aSRaphael Isemann     return createStringError(std::errc::invalid_argument,
715ffd940aSRaphael Isemann                              "trying to match value with invalid format");
725ffd940aSRaphael Isemann   }
735ffd940aSRaphael Isemann }
745ffd940aSRaphael Isemann 
755ffd940aSRaphael Isemann Expected<std::string>
765ffd940aSRaphael Isemann ExpressionFormat::getMatchingString(ExpressionValue IntegerValue) const {
775ffd940aSRaphael Isemann   uint64_t AbsoluteValue;
785ffd940aSRaphael Isemann   StringRef SignPrefix = IntegerValue.isNegative() ? "-" : "";
795ffd940aSRaphael Isemann 
805ffd940aSRaphael Isemann   if (Value == Kind::Signed) {
815ffd940aSRaphael Isemann     Expected<int64_t> SignedValue = IntegerValue.getSignedValue();
825ffd940aSRaphael Isemann     if (!SignedValue)
835ffd940aSRaphael Isemann       return SignedValue.takeError();
845ffd940aSRaphael Isemann     if (*SignedValue < 0)
855ffd940aSRaphael Isemann       AbsoluteValue = cantFail(IntegerValue.getAbsolute().getUnsignedValue());
865ffd940aSRaphael Isemann     else
875ffd940aSRaphael Isemann       AbsoluteValue = *SignedValue;
885ffd940aSRaphael Isemann   } else {
895ffd940aSRaphael Isemann     Expected<uint64_t> UnsignedValue = IntegerValue.getUnsignedValue();
905ffd940aSRaphael Isemann     if (!UnsignedValue)
915ffd940aSRaphael Isemann       return UnsignedValue.takeError();
925ffd940aSRaphael Isemann     AbsoluteValue = *UnsignedValue;
935ffd940aSRaphael Isemann   }
945ffd940aSRaphael Isemann 
955ffd940aSRaphael Isemann   std::string AbsoluteValueStr;
965ffd940aSRaphael Isemann   switch (Value) {
975ffd940aSRaphael Isemann   case Kind::Unsigned:
985ffd940aSRaphael Isemann   case Kind::Signed:
995ffd940aSRaphael Isemann     AbsoluteValueStr = utostr(AbsoluteValue);
1005ffd940aSRaphael Isemann     break;
1015ffd940aSRaphael Isemann   case Kind::HexUpper:
1025ffd940aSRaphael Isemann   case Kind::HexLower:
1035ffd940aSRaphael Isemann     AbsoluteValueStr = utohexstr(AbsoluteValue, Value == Kind::HexLower);
1045ffd940aSRaphael Isemann     break;
1055ffd940aSRaphael Isemann   default:
1065ffd940aSRaphael Isemann     return createStringError(std::errc::invalid_argument,
1075ffd940aSRaphael Isemann                              "trying to match value with invalid format");
1085ffd940aSRaphael Isemann   }
1095ffd940aSRaphael Isemann 
1105ffd940aSRaphael Isemann   if (Precision > AbsoluteValueStr.size()) {
1115ffd940aSRaphael Isemann     unsigned LeadingZeros = Precision - AbsoluteValueStr.size();
1125ffd940aSRaphael Isemann     return (Twine(SignPrefix) + std::string(LeadingZeros, '0') +
1135ffd940aSRaphael Isemann             AbsoluteValueStr)
1145ffd940aSRaphael Isemann         .str();
1155ffd940aSRaphael Isemann   }
1165ffd940aSRaphael Isemann 
1175ffd940aSRaphael Isemann   return (Twine(SignPrefix) + AbsoluteValueStr).str();
1185ffd940aSRaphael Isemann }
1195ffd940aSRaphael Isemann 
1205ffd940aSRaphael Isemann Expected<ExpressionValue>
1215ffd940aSRaphael Isemann ExpressionFormat::valueFromStringRepr(StringRef StrVal,
1225ffd940aSRaphael Isemann                                       const SourceMgr &SM) const {
1235ffd940aSRaphael Isemann   bool ValueIsSigned = Value == Kind::Signed;
1245ffd940aSRaphael Isemann   StringRef OverflowErrorStr = "unable to represent numeric value";
1255ffd940aSRaphael Isemann   if (ValueIsSigned) {
1265ffd940aSRaphael Isemann     int64_t SignedValue;
1275ffd940aSRaphael Isemann 
1285ffd940aSRaphael Isemann     if (StrVal.getAsInteger(10, SignedValue))
1295ffd940aSRaphael Isemann       return ErrorDiagnostic::get(SM, StrVal, OverflowErrorStr);
1305ffd940aSRaphael Isemann 
1315ffd940aSRaphael Isemann     return ExpressionValue(SignedValue);
1325ffd940aSRaphael Isemann   }
1335ffd940aSRaphael Isemann 
1345ffd940aSRaphael Isemann   bool Hex = Value == Kind::HexUpper || Value == Kind::HexLower;
1355ffd940aSRaphael Isemann   uint64_t UnsignedValue;
1365ffd940aSRaphael Isemann   if (StrVal.getAsInteger(Hex ? 16 : 10, UnsignedValue))
1375ffd940aSRaphael Isemann     return ErrorDiagnostic::get(SM, StrVal, OverflowErrorStr);
1385ffd940aSRaphael Isemann 
1395ffd940aSRaphael Isemann   return ExpressionValue(UnsignedValue);
1405ffd940aSRaphael Isemann }
1415ffd940aSRaphael Isemann 
/// Reinterprets the bit pattern of \p UnsignedValue as an int64_t.
static int64_t getAsSigned(uint64_t UnsignedValue) {
  // A plain cast to the signed type is implementation-defined when the value
  // does not fit, and type punning through a union violates the aliasing
  // rules, so copy the raw bytes instead.
  int64_t Reinterpreted;
  memcpy(&Reinterpreted, &UnsignedValue, sizeof(Reinterpreted));
  return Reinterpreted;
}
1515ffd940aSRaphael Isemann 
1525ffd940aSRaphael Isemann Expected<int64_t> ExpressionValue::getSignedValue() const {
1535ffd940aSRaphael Isemann   if (Negative)
1545ffd940aSRaphael Isemann     return getAsSigned(Value);
1555ffd940aSRaphael Isemann 
1565ffd940aSRaphael Isemann   if (Value > (uint64_t)std::numeric_limits<int64_t>::max())
1575ffd940aSRaphael Isemann     return make_error<OverflowError>();
1585ffd940aSRaphael Isemann 
1595ffd940aSRaphael Isemann   // Value is in the representable range of int64_t so we can use cast.
1605ffd940aSRaphael Isemann   return static_cast<int64_t>(Value);
1615ffd940aSRaphael Isemann }
1625ffd940aSRaphael Isemann 
1635ffd940aSRaphael Isemann Expected<uint64_t> ExpressionValue::getUnsignedValue() const {
1645ffd940aSRaphael Isemann   if (Negative)
1655ffd940aSRaphael Isemann     return make_error<OverflowError>();
1665ffd940aSRaphael Isemann 
1675ffd940aSRaphael Isemann   return Value;
1685ffd940aSRaphael Isemann }
1695ffd940aSRaphael Isemann 
1705ffd940aSRaphael Isemann ExpressionValue ExpressionValue::getAbsolute() const {
1715ffd940aSRaphael Isemann   if (!Negative)
1725ffd940aSRaphael Isemann     return *this;
1735ffd940aSRaphael Isemann 
1745ffd940aSRaphael Isemann   int64_t SignedValue = getAsSigned(Value);
1755ffd940aSRaphael Isemann   int64_t MaxInt64 = std::numeric_limits<int64_t>::max();
1765ffd940aSRaphael Isemann   // Absolute value can be represented as int64_t.
1775ffd940aSRaphael Isemann   if (SignedValue >= -MaxInt64)
1785ffd940aSRaphael Isemann     return ExpressionValue(-getAsSigned(Value));
1795ffd940aSRaphael Isemann 
1805ffd940aSRaphael Isemann   // -X == -(max int64_t + Rem), negate each component independently.
1815ffd940aSRaphael Isemann   SignedValue += MaxInt64;
1825ffd940aSRaphael Isemann   uint64_t RemainingValueAbsolute = -SignedValue;
1835ffd940aSRaphael Isemann   return ExpressionValue(MaxInt64 + RemainingValueAbsolute);
1845ffd940aSRaphael Isemann }
1855ffd940aSRaphael Isemann 
1865ffd940aSRaphael Isemann Expected<ExpressionValue> llvm::operator+(const ExpressionValue &LeftOperand,
1875ffd940aSRaphael Isemann                                           const ExpressionValue &RightOperand) {
1885ffd940aSRaphael Isemann   if (LeftOperand.isNegative() && RightOperand.isNegative()) {
1895ffd940aSRaphael Isemann     int64_t LeftValue = cantFail(LeftOperand.getSignedValue());
1905ffd940aSRaphael Isemann     int64_t RightValue = cantFail(RightOperand.getSignedValue());
1915ffd940aSRaphael Isemann     Optional<int64_t> Result = checkedAdd<int64_t>(LeftValue, RightValue);
1925ffd940aSRaphael Isemann     if (!Result)
1935ffd940aSRaphael Isemann       return make_error<OverflowError>();
1945ffd940aSRaphael Isemann 
1955ffd940aSRaphael Isemann     return ExpressionValue(*Result);
1965ffd940aSRaphael Isemann   }
1975ffd940aSRaphael Isemann 
1985ffd940aSRaphael Isemann   // (-A) + B == B - A.
1995ffd940aSRaphael Isemann   if (LeftOperand.isNegative())
2005ffd940aSRaphael Isemann     return RightOperand - LeftOperand.getAbsolute();
2015ffd940aSRaphael Isemann 
2025ffd940aSRaphael Isemann   // A + (-B) == A - B.
2035ffd940aSRaphael Isemann   if (RightOperand.isNegative())
2045ffd940aSRaphael Isemann     return LeftOperand - RightOperand.getAbsolute();
2055ffd940aSRaphael Isemann 
2065ffd940aSRaphael Isemann   // Both values are positive at this point.
2075ffd940aSRaphael Isemann   uint64_t LeftValue = cantFail(LeftOperand.getUnsignedValue());
2085ffd940aSRaphael Isemann   uint64_t RightValue = cantFail(RightOperand.getUnsignedValue());
2095ffd940aSRaphael Isemann   Optional<uint64_t> Result =
2105ffd940aSRaphael Isemann       checkedAddUnsigned<uint64_t>(LeftValue, RightValue);
2115ffd940aSRaphael Isemann   if (!Result)
2125ffd940aSRaphael Isemann     return make_error<OverflowError>();
2135ffd940aSRaphael Isemann 
2145ffd940aSRaphael Isemann   return ExpressionValue(*Result);
2155ffd940aSRaphael Isemann }
2165ffd940aSRaphael Isemann 
2175ffd940aSRaphael Isemann Expected<ExpressionValue> llvm::operator-(const ExpressionValue &LeftOperand,
2185ffd940aSRaphael Isemann                                           const ExpressionValue &RightOperand) {
2195ffd940aSRaphael Isemann   // Result will be negative and thus might underflow.
2205ffd940aSRaphael Isemann   if (LeftOperand.isNegative() && !RightOperand.isNegative()) {
2215ffd940aSRaphael Isemann     int64_t LeftValue = cantFail(LeftOperand.getSignedValue());
2225ffd940aSRaphael Isemann     uint64_t RightValue = cantFail(RightOperand.getUnsignedValue());
2235ffd940aSRaphael Isemann     // Result <= -1 - (max int64_t) which overflows on 1- and 2-complement.
2245ffd940aSRaphael Isemann     if (RightValue > (uint64_t)std::numeric_limits<int64_t>::max())
2255ffd940aSRaphael Isemann       return make_error<OverflowError>();
2265ffd940aSRaphael Isemann     Optional<int64_t> Result =
2275ffd940aSRaphael Isemann         checkedSub(LeftValue, static_cast<int64_t>(RightValue));
2285ffd940aSRaphael Isemann     if (!Result)
2295ffd940aSRaphael Isemann       return make_error<OverflowError>();
2305ffd940aSRaphael Isemann 
2315ffd940aSRaphael Isemann     return ExpressionValue(*Result);
2325ffd940aSRaphael Isemann   }
2335ffd940aSRaphael Isemann 
2345ffd940aSRaphael Isemann   // (-A) - (-B) == B - A.
2355ffd940aSRaphael Isemann   if (LeftOperand.isNegative())
2365ffd940aSRaphael Isemann     return RightOperand.getAbsolute() - LeftOperand.getAbsolute();
2375ffd940aSRaphael Isemann 
2385ffd940aSRaphael Isemann   // A - (-B) == A + B.
2395ffd940aSRaphael Isemann   if (RightOperand.isNegative())
2405ffd940aSRaphael Isemann     return LeftOperand + RightOperand.getAbsolute();
2415ffd940aSRaphael Isemann 
2425ffd940aSRaphael Isemann   // Both values are positive at this point.
2435ffd940aSRaphael Isemann   uint64_t LeftValue = cantFail(LeftOperand.getUnsignedValue());
2445ffd940aSRaphael Isemann   uint64_t RightValue = cantFail(RightOperand.getUnsignedValue());
2455ffd940aSRaphael Isemann   if (LeftValue >= RightValue)
2465ffd940aSRaphael Isemann     return ExpressionValue(LeftValue - RightValue);
2475ffd940aSRaphael Isemann   else {
2485ffd940aSRaphael Isemann     uint64_t AbsoluteDifference = RightValue - LeftValue;
2495ffd940aSRaphael Isemann     uint64_t MaxInt64 = std::numeric_limits<int64_t>::max();
2505ffd940aSRaphael Isemann     // Value might underflow.
2515ffd940aSRaphael Isemann     if (AbsoluteDifference > MaxInt64) {
2525ffd940aSRaphael Isemann       AbsoluteDifference -= MaxInt64;
2535ffd940aSRaphael Isemann       int64_t Result = -MaxInt64;
2545ffd940aSRaphael Isemann       int64_t MinInt64 = std::numeric_limits<int64_t>::min();
2555ffd940aSRaphael Isemann       // Underflow, tested by:
2565ffd940aSRaphael Isemann       //   abs(Result + (max int64_t)) > abs((min int64_t) + (max int64_t))
2575ffd940aSRaphael Isemann       if (AbsoluteDifference > static_cast<uint64_t>(-(MinInt64 - Result)))
2585ffd940aSRaphael Isemann         return make_error<OverflowError>();
2595ffd940aSRaphael Isemann       Result -= static_cast<int64_t>(AbsoluteDifference);
2605ffd940aSRaphael Isemann       return ExpressionValue(Result);
2615ffd940aSRaphael Isemann     }
2625ffd940aSRaphael Isemann 
2635ffd940aSRaphael Isemann     return ExpressionValue(-static_cast<int64_t>(AbsoluteDifference));
2645ffd940aSRaphael Isemann   }
2655ffd940aSRaphael Isemann }
2665ffd940aSRaphael Isemann 
2675ffd940aSRaphael Isemann Expected<ExpressionValue> llvm::operator*(const ExpressionValue &LeftOperand,
2685ffd940aSRaphael Isemann                                           const ExpressionValue &RightOperand) {
2695ffd940aSRaphael Isemann   // -A * -B == A * B
2705ffd940aSRaphael Isemann   if (LeftOperand.isNegative() && RightOperand.isNegative())
2715ffd940aSRaphael Isemann     return LeftOperand.getAbsolute() * RightOperand.getAbsolute();
2725ffd940aSRaphael Isemann 
2735ffd940aSRaphael Isemann   // A * -B == -B * A
2745ffd940aSRaphael Isemann   if (RightOperand.isNegative())
2755ffd940aSRaphael Isemann     return RightOperand * LeftOperand;
2765ffd940aSRaphael Isemann 
2775ffd940aSRaphael Isemann   assert(!RightOperand.isNegative() && "Unexpected negative operand!");
2785ffd940aSRaphael Isemann 
2795ffd940aSRaphael Isemann   // Result will be negative and can underflow.
2805ffd940aSRaphael Isemann   if (LeftOperand.isNegative()) {
2815ffd940aSRaphael Isemann     auto Result = LeftOperand.getAbsolute() * RightOperand.getAbsolute();
2825ffd940aSRaphael Isemann     if (!Result)
2835ffd940aSRaphael Isemann       return Result;
2845ffd940aSRaphael Isemann 
2855ffd940aSRaphael Isemann     return ExpressionValue(0) - *Result;
2865ffd940aSRaphael Isemann   }
2875ffd940aSRaphael Isemann 
2885ffd940aSRaphael Isemann   // Result will be positive and can overflow.
2895ffd940aSRaphael Isemann   uint64_t LeftValue = cantFail(LeftOperand.getUnsignedValue());
2905ffd940aSRaphael Isemann   uint64_t RightValue = cantFail(RightOperand.getUnsignedValue());
2915ffd940aSRaphael Isemann   Optional<uint64_t> Result =
2925ffd940aSRaphael Isemann       checkedMulUnsigned<uint64_t>(LeftValue, RightValue);
2935ffd940aSRaphael Isemann   if (!Result)
2945ffd940aSRaphael Isemann     return make_error<OverflowError>();
2955ffd940aSRaphael Isemann 
2965ffd940aSRaphael Isemann   return ExpressionValue(*Result);
2975ffd940aSRaphael Isemann }
2985ffd940aSRaphael Isemann 
2995ffd940aSRaphael Isemann Expected<ExpressionValue> llvm::operator/(const ExpressionValue &LeftOperand,
3005ffd940aSRaphael Isemann                                           const ExpressionValue &RightOperand) {
3015ffd940aSRaphael Isemann   // -A / -B == A / B
3025ffd940aSRaphael Isemann   if (LeftOperand.isNegative() && RightOperand.isNegative())
3035ffd940aSRaphael Isemann     return LeftOperand.getAbsolute() / RightOperand.getAbsolute();
3045ffd940aSRaphael Isemann 
3055ffd940aSRaphael Isemann   // Check for divide by zero.
3065ffd940aSRaphael Isemann   if (RightOperand == ExpressionValue(0))
3075ffd940aSRaphael Isemann     return make_error<OverflowError>();
3085ffd940aSRaphael Isemann 
3095ffd940aSRaphael Isemann   // Result will be negative and can underflow.
3105ffd940aSRaphael Isemann   if (LeftOperand.isNegative() || RightOperand.isNegative())
3115ffd940aSRaphael Isemann     return ExpressionValue(0) -
3125ffd940aSRaphael Isemann            cantFail(LeftOperand.getAbsolute() / RightOperand.getAbsolute());
3135ffd940aSRaphael Isemann 
3145ffd940aSRaphael Isemann   uint64_t LeftValue = cantFail(LeftOperand.getUnsignedValue());
3155ffd940aSRaphael Isemann   uint64_t RightValue = cantFail(RightOperand.getUnsignedValue());
3165ffd940aSRaphael Isemann   return ExpressionValue(LeftValue / RightValue);
3175ffd940aSRaphael Isemann }
3185ffd940aSRaphael Isemann 
3195ffd940aSRaphael Isemann Expected<ExpressionValue> llvm::max(const ExpressionValue &LeftOperand,
3205ffd940aSRaphael Isemann                                     const ExpressionValue &RightOperand) {
3215ffd940aSRaphael Isemann   if (LeftOperand.isNegative() && RightOperand.isNegative()) {
3225ffd940aSRaphael Isemann     int64_t LeftValue = cantFail(LeftOperand.getSignedValue());
3235ffd940aSRaphael Isemann     int64_t RightValue = cantFail(RightOperand.getSignedValue());
3245ffd940aSRaphael Isemann     return ExpressionValue(std::max(LeftValue, RightValue));
3255ffd940aSRaphael Isemann   }
3265ffd940aSRaphael Isemann 
3275ffd940aSRaphael Isemann   if (!LeftOperand.isNegative() && !RightOperand.isNegative()) {
3285ffd940aSRaphael Isemann     uint64_t LeftValue = cantFail(LeftOperand.getUnsignedValue());
3295ffd940aSRaphael Isemann     uint64_t RightValue = cantFail(RightOperand.getUnsignedValue());
3305ffd940aSRaphael Isemann     return ExpressionValue(std::max(LeftValue, RightValue));
3315ffd940aSRaphael Isemann   }
3325ffd940aSRaphael Isemann 
3335ffd940aSRaphael Isemann   if (LeftOperand.isNegative())
3345ffd940aSRaphael Isemann     return RightOperand;
3355ffd940aSRaphael Isemann 
3365ffd940aSRaphael Isemann   return LeftOperand;
3375ffd940aSRaphael Isemann }
3385ffd940aSRaphael Isemann 
3395ffd940aSRaphael Isemann Expected<ExpressionValue> llvm::min(const ExpressionValue &LeftOperand,
3405ffd940aSRaphael Isemann                                     const ExpressionValue &RightOperand) {
3415ffd940aSRaphael Isemann   if (cantFail(max(LeftOperand, RightOperand)) == LeftOperand)
3425ffd940aSRaphael Isemann     return RightOperand;
3435ffd940aSRaphael Isemann 
3445ffd940aSRaphael Isemann   return LeftOperand;
3455ffd940aSRaphael Isemann }
3465ffd940aSRaphael Isemann 
3475ffd940aSRaphael Isemann Expected<ExpressionValue> NumericVariableUse::eval() const {
3485ffd940aSRaphael Isemann   Optional<ExpressionValue> Value = Variable->getValue();
3495ffd940aSRaphael Isemann   if (Value)
3505ffd940aSRaphael Isemann     return *Value;
3515ffd940aSRaphael Isemann 
3525ffd940aSRaphael Isemann   return make_error<UndefVarError>(getExpressionStr());
3535ffd940aSRaphael Isemann }
3545ffd940aSRaphael Isemann 
3555ffd940aSRaphael Isemann Expected<ExpressionValue> BinaryOperation::eval() const {
3565ffd940aSRaphael Isemann   Expected<ExpressionValue> LeftOp = LeftOperand->eval();
3575ffd940aSRaphael Isemann   Expected<ExpressionValue> RightOp = RightOperand->eval();
3585ffd940aSRaphael Isemann 
3595ffd940aSRaphael Isemann   // Bubble up any error (e.g. undefined variables) in the recursive
3605ffd940aSRaphael Isemann   // evaluation.
3615ffd940aSRaphael Isemann   if (!LeftOp || !RightOp) {
3625ffd940aSRaphael Isemann     Error Err = Error::success();
3635ffd940aSRaphael Isemann     if (!LeftOp)
3645ffd940aSRaphael Isemann       Err = joinErrors(std::move(Err), LeftOp.takeError());
3655ffd940aSRaphael Isemann     if (!RightOp)
3665ffd940aSRaphael Isemann       Err = joinErrors(std::move(Err), RightOp.takeError());
3675ffd940aSRaphael Isemann     return std::move(Err);
3685ffd940aSRaphael Isemann   }
3695ffd940aSRaphael Isemann 
3705ffd940aSRaphael Isemann   return EvalBinop(*LeftOp, *RightOp);
3715ffd940aSRaphael Isemann }
3725ffd940aSRaphael Isemann 
3735ffd940aSRaphael Isemann Expected<ExpressionFormat>
3745ffd940aSRaphael Isemann BinaryOperation::getImplicitFormat(const SourceMgr &SM) const {
3755ffd940aSRaphael Isemann   Expected<ExpressionFormat> LeftFormat = LeftOperand->getImplicitFormat(SM);
3765ffd940aSRaphael Isemann   Expected<ExpressionFormat> RightFormat = RightOperand->getImplicitFormat(SM);
3775ffd940aSRaphael Isemann   if (!LeftFormat || !RightFormat) {
3785ffd940aSRaphael Isemann     Error Err = Error::success();
3795ffd940aSRaphael Isemann     if (!LeftFormat)
3805ffd940aSRaphael Isemann       Err = joinErrors(std::move(Err), LeftFormat.takeError());
3815ffd940aSRaphael Isemann     if (!RightFormat)
3825ffd940aSRaphael Isemann       Err = joinErrors(std::move(Err), RightFormat.takeError());
3835ffd940aSRaphael Isemann     return std::move(Err);
3845ffd940aSRaphael Isemann   }
3855ffd940aSRaphael Isemann 
3865ffd940aSRaphael Isemann   if (*LeftFormat != ExpressionFormat::Kind::NoFormat &&
3875ffd940aSRaphael Isemann       *RightFormat != ExpressionFormat::Kind::NoFormat &&
3885ffd940aSRaphael Isemann       *LeftFormat != *RightFormat)
3895ffd940aSRaphael Isemann     return ErrorDiagnostic::get(
3905ffd940aSRaphael Isemann         SM, getExpressionStr(),
3915ffd940aSRaphael Isemann         "implicit format conflict between '" + LeftOperand->getExpressionStr() +
3925ffd940aSRaphael Isemann             "' (" + LeftFormat->toString() + ") and '" +
3935ffd940aSRaphael Isemann             RightOperand->getExpressionStr() + "' (" + RightFormat->toString() +
3945ffd940aSRaphael Isemann             "), need an explicit format specifier");
3955ffd940aSRaphael Isemann 
3965ffd940aSRaphael Isemann   return *LeftFormat != ExpressionFormat::Kind::NoFormat ? *LeftFormat
3975ffd940aSRaphael Isemann                                                          : *RightFormat;
3985ffd940aSRaphael Isemann }
3995ffd940aSRaphael Isemann 
4005ffd940aSRaphael Isemann Expected<std::string> NumericSubstitution::getResult() const {
4015ffd940aSRaphael Isemann   assert(ExpressionPointer->getAST() != nullptr &&
4025ffd940aSRaphael Isemann          "Substituting empty expression");
4035ffd940aSRaphael Isemann   Expected<ExpressionValue> EvaluatedValue =
4045ffd940aSRaphael Isemann       ExpressionPointer->getAST()->eval();
4055ffd940aSRaphael Isemann   if (!EvaluatedValue)
4065ffd940aSRaphael Isemann     return EvaluatedValue.takeError();
4075ffd940aSRaphael Isemann   ExpressionFormat Format = ExpressionPointer->getFormat();
4085ffd940aSRaphael Isemann   return Format.getMatchingString(*EvaluatedValue);
4095ffd940aSRaphael Isemann }
4105ffd940aSRaphael Isemann 
4115ffd940aSRaphael Isemann Expected<std::string> StringSubstitution::getResult() const {
4125ffd940aSRaphael Isemann   // Look up the value and escape it so that we can put it into the regex.
4135ffd940aSRaphael Isemann   Expected<StringRef> VarVal = Context->getPatternVarValue(FromStr);
4145ffd940aSRaphael Isemann   if (!VarVal)
4155ffd940aSRaphael Isemann     return VarVal.takeError();
4165ffd940aSRaphael Isemann   return Regex::escape(*VarVal);
4175ffd940aSRaphael Isemann }
4185ffd940aSRaphael Isemann 
4195ffd940aSRaphael Isemann bool Pattern::isValidVarNameStart(char C) { return C == '_' || isAlpha(C); }
4205ffd940aSRaphael Isemann 
4215ffd940aSRaphael Isemann Expected<Pattern::VariableProperties>
4225ffd940aSRaphael Isemann Pattern::parseVariable(StringRef &Str, const SourceMgr &SM) {
4235ffd940aSRaphael Isemann   if (Str.empty())
4245ffd940aSRaphael Isemann     return ErrorDiagnostic::get(SM, Str, "empty variable name");
4255ffd940aSRaphael Isemann 
4265ffd940aSRaphael Isemann   size_t I = 0;
4275ffd940aSRaphael Isemann   bool IsPseudo = Str[0] == '@';
4285ffd940aSRaphael Isemann 
4295ffd940aSRaphael Isemann   // Global vars start with '$'.
4305ffd940aSRaphael Isemann   if (Str[0] == '$' || IsPseudo)
4315ffd940aSRaphael Isemann     ++I;
4325ffd940aSRaphael Isemann 
4335ffd940aSRaphael Isemann   if (!isValidVarNameStart(Str[I++]))
4345ffd940aSRaphael Isemann     return ErrorDiagnostic::get(SM, Str, "invalid variable name");
4355ffd940aSRaphael Isemann 
4365ffd940aSRaphael Isemann   for (size_t E = Str.size(); I != E; ++I)
4375ffd940aSRaphael Isemann     // Variable names are composed of alphanumeric characters and underscores.
4385ffd940aSRaphael Isemann     if (Str[I] != '_' && !isAlnum(Str[I]))
4395ffd940aSRaphael Isemann       break;
4405ffd940aSRaphael Isemann 
4415ffd940aSRaphael Isemann   StringRef Name = Str.take_front(I);
4425ffd940aSRaphael Isemann   Str = Str.substr(I);
4435ffd940aSRaphael Isemann   return VariableProperties {Name, IsPseudo};
4445ffd940aSRaphael Isemann }
4455ffd940aSRaphael Isemann 
4465ffd940aSRaphael Isemann // StringRef holding all characters considered as horizontal whitespaces by
4475ffd940aSRaphael Isemann // FileCheck input canonicalization.
4485ffd940aSRaphael Isemann constexpr StringLiteral SpaceChars = " \t";
4495ffd940aSRaphael Isemann 
4505ffd940aSRaphael Isemann // Parsing helper function that strips the first character in S and returns it.
4515ffd940aSRaphael Isemann static char popFront(StringRef &S) {
4525ffd940aSRaphael Isemann   char C = S.front();
4535ffd940aSRaphael Isemann   S = S.drop_front();
4545ffd940aSRaphael Isemann   return C;
4555ffd940aSRaphael Isemann }
4565ffd940aSRaphael Isemann 
4575ffd940aSRaphael Isemann char OverflowError::ID = 0;
4585ffd940aSRaphael Isemann char UndefVarError::ID = 0;
4595ffd940aSRaphael Isemann char ErrorDiagnostic::ID = 0;
4605ffd940aSRaphael Isemann char NotFoundError::ID = 0;
4615ffd940aSRaphael Isemann 
4625ffd940aSRaphael Isemann Expected<NumericVariable *> Pattern::parseNumericVariableDefinition(
4635ffd940aSRaphael Isemann     StringRef &Expr, FileCheckPatternContext *Context,
4645ffd940aSRaphael Isemann     Optional<size_t> LineNumber, ExpressionFormat ImplicitFormat,
4655ffd940aSRaphael Isemann     const SourceMgr &SM) {
4665ffd940aSRaphael Isemann   Expected<VariableProperties> ParseVarResult = parseVariable(Expr, SM);
4675ffd940aSRaphael Isemann   if (!ParseVarResult)
4685ffd940aSRaphael Isemann     return ParseVarResult.takeError();
4695ffd940aSRaphael Isemann   StringRef Name = ParseVarResult->Name;
4705ffd940aSRaphael Isemann 
4715ffd940aSRaphael Isemann   if (ParseVarResult->IsPseudo)
4725ffd940aSRaphael Isemann     return ErrorDiagnostic::get(
4735ffd940aSRaphael Isemann         SM, Name, "definition of pseudo numeric variable unsupported");
4745ffd940aSRaphael Isemann 
4755ffd940aSRaphael Isemann   // Detect collisions between string and numeric variables when the latter
4765ffd940aSRaphael Isemann   // is created later than the former.
4775ffd940aSRaphael Isemann   if (Context->DefinedVariableTable.find(Name) !=
4785ffd940aSRaphael Isemann       Context->DefinedVariableTable.end())
4795ffd940aSRaphael Isemann     return ErrorDiagnostic::get(
4805ffd940aSRaphael Isemann         SM, Name, "string variable with name '" + Name + "' already exists");
4815ffd940aSRaphael Isemann 
4825ffd940aSRaphael Isemann   Expr = Expr.ltrim(SpaceChars);
4835ffd940aSRaphael Isemann   if (!Expr.empty())
4845ffd940aSRaphael Isemann     return ErrorDiagnostic::get(
4855ffd940aSRaphael Isemann         SM, Expr, "unexpected characters after numeric variable name");
4865ffd940aSRaphael Isemann 
4875ffd940aSRaphael Isemann   NumericVariable *DefinedNumericVariable;
4885ffd940aSRaphael Isemann   auto VarTableIter = Context->GlobalNumericVariableTable.find(Name);
4895ffd940aSRaphael Isemann   if (VarTableIter != Context->GlobalNumericVariableTable.end()) {
4905ffd940aSRaphael Isemann     DefinedNumericVariable = VarTableIter->second;
4915ffd940aSRaphael Isemann     if (DefinedNumericVariable->getImplicitFormat() != ImplicitFormat)
4925ffd940aSRaphael Isemann       return ErrorDiagnostic::get(
4935ffd940aSRaphael Isemann           SM, Expr, "format different from previous variable definition");
4945ffd940aSRaphael Isemann   } else
4955ffd940aSRaphael Isemann     DefinedNumericVariable =
4965ffd940aSRaphael Isemann         Context->makeNumericVariable(Name, ImplicitFormat, LineNumber);
4975ffd940aSRaphael Isemann 
4985ffd940aSRaphael Isemann   return DefinedNumericVariable;
4995ffd940aSRaphael Isemann }
5005ffd940aSRaphael Isemann 
5015ffd940aSRaphael Isemann Expected<std::unique_ptr<NumericVariableUse>> Pattern::parseNumericVariableUse(
5025ffd940aSRaphael Isemann     StringRef Name, bool IsPseudo, Optional<size_t> LineNumber,
5035ffd940aSRaphael Isemann     FileCheckPatternContext *Context, const SourceMgr &SM) {
5045ffd940aSRaphael Isemann   if (IsPseudo && !Name.equals("@LINE"))
5055ffd940aSRaphael Isemann     return ErrorDiagnostic::get(
5065ffd940aSRaphael Isemann         SM, Name, "invalid pseudo numeric variable '" + Name + "'");
5075ffd940aSRaphael Isemann 
5085ffd940aSRaphael Isemann   // Numeric variable definitions and uses are parsed in the order in which
5095ffd940aSRaphael Isemann   // they appear in the CHECK patterns. For each definition, the pointer to the
5105ffd940aSRaphael Isemann   // class instance of the corresponding numeric variable definition is stored
5115ffd940aSRaphael Isemann   // in GlobalNumericVariableTable in parsePattern. Therefore, if the pointer
5125ffd940aSRaphael Isemann   // we get below is null, it means no such variable was defined before. When
5135ffd940aSRaphael Isemann   // that happens, we create a dummy variable so that parsing can continue. All
5145ffd940aSRaphael Isemann   // uses of undefined variables, whether string or numeric, are then diagnosed
5155ffd940aSRaphael Isemann   // in printSubstitutions() after failing to match.
5165ffd940aSRaphael Isemann   auto VarTableIter = Context->GlobalNumericVariableTable.find(Name);
5175ffd940aSRaphael Isemann   NumericVariable *NumericVariable;
5185ffd940aSRaphael Isemann   if (VarTableIter != Context->GlobalNumericVariableTable.end())
5195ffd940aSRaphael Isemann     NumericVariable = VarTableIter->second;
5205ffd940aSRaphael Isemann   else {
5215ffd940aSRaphael Isemann     NumericVariable = Context->makeNumericVariable(
5225ffd940aSRaphael Isemann         Name, ExpressionFormat(ExpressionFormat::Kind::Unsigned));
5235ffd940aSRaphael Isemann     Context->GlobalNumericVariableTable[Name] = NumericVariable;
5245ffd940aSRaphael Isemann   }
5255ffd940aSRaphael Isemann 
5265ffd940aSRaphael Isemann   Optional<size_t> DefLineNumber = NumericVariable->getDefLineNumber();
5275ffd940aSRaphael Isemann   if (DefLineNumber && LineNumber && *DefLineNumber == *LineNumber)
5285ffd940aSRaphael Isemann     return ErrorDiagnostic::get(
5295ffd940aSRaphael Isemann         SM, Name,
5305ffd940aSRaphael Isemann         "numeric variable '" + Name +
5315ffd940aSRaphael Isemann             "' defined earlier in the same CHECK directive");
5325ffd940aSRaphael Isemann 
5335ffd940aSRaphael Isemann   return std::make_unique<NumericVariableUse>(Name, NumericVariable);
5345ffd940aSRaphael Isemann }
5355ffd940aSRaphael Isemann 
5365ffd940aSRaphael Isemann Expected<std::unique_ptr<ExpressionAST>> Pattern::parseNumericOperand(
5375ffd940aSRaphael Isemann     StringRef &Expr, AllowedOperand AO, bool MaybeInvalidConstraint,
5385ffd940aSRaphael Isemann     Optional<size_t> LineNumber, FileCheckPatternContext *Context,
5395ffd940aSRaphael Isemann     const SourceMgr &SM) {
5405ffd940aSRaphael Isemann   if (Expr.startswith("(")) {
5415ffd940aSRaphael Isemann     if (AO != AllowedOperand::Any)
5425ffd940aSRaphael Isemann       return ErrorDiagnostic::get(
5435ffd940aSRaphael Isemann           SM, Expr, "parenthesized expression not permitted here");
5445ffd940aSRaphael Isemann     return parseParenExpr(Expr, LineNumber, Context, SM);
5455ffd940aSRaphael Isemann   }
5465ffd940aSRaphael Isemann 
5475ffd940aSRaphael Isemann   if (AO == AllowedOperand::LineVar || AO == AllowedOperand::Any) {
5485ffd940aSRaphael Isemann     // Try to parse as a numeric variable use.
5495ffd940aSRaphael Isemann     Expected<Pattern::VariableProperties> ParseVarResult =
5505ffd940aSRaphael Isemann         parseVariable(Expr, SM);
5515ffd940aSRaphael Isemann     if (ParseVarResult) {
5525ffd940aSRaphael Isemann       // Try to parse a function call.
5535ffd940aSRaphael Isemann       if (Expr.ltrim(SpaceChars).startswith("(")) {
5545ffd940aSRaphael Isemann         if (AO != AllowedOperand::Any)
5555ffd940aSRaphael Isemann           return ErrorDiagnostic::get(SM, ParseVarResult->Name,
5565ffd940aSRaphael Isemann                                       "unexpected function call");
5575ffd940aSRaphael Isemann 
5585ffd940aSRaphael Isemann         return parseCallExpr(Expr, ParseVarResult->Name, LineNumber, Context,
5595ffd940aSRaphael Isemann                              SM);
5605ffd940aSRaphael Isemann       }
5615ffd940aSRaphael Isemann 
5625ffd940aSRaphael Isemann       return parseNumericVariableUse(ParseVarResult->Name,
5635ffd940aSRaphael Isemann                                      ParseVarResult->IsPseudo, LineNumber,
5645ffd940aSRaphael Isemann                                      Context, SM);
5655ffd940aSRaphael Isemann     }
5665ffd940aSRaphael Isemann 
5675ffd940aSRaphael Isemann     if (AO == AllowedOperand::LineVar)
5685ffd940aSRaphael Isemann       return ParseVarResult.takeError();
5695ffd940aSRaphael Isemann     // Ignore the error and retry parsing as a literal.
5705ffd940aSRaphael Isemann     consumeError(ParseVarResult.takeError());
5715ffd940aSRaphael Isemann   }
5725ffd940aSRaphael Isemann 
5735ffd940aSRaphael Isemann   // Otherwise, parse it as a literal.
5745ffd940aSRaphael Isemann   int64_t SignedLiteralValue;
5755ffd940aSRaphael Isemann   uint64_t UnsignedLiteralValue;
5765ffd940aSRaphael Isemann   StringRef SaveExpr = Expr;
5775ffd940aSRaphael Isemann   // Accept both signed and unsigned literal, default to signed literal.
5785ffd940aSRaphael Isemann   if (!Expr.consumeInteger((AO == AllowedOperand::LegacyLiteral) ? 10 : 0,
5795ffd940aSRaphael Isemann                            UnsignedLiteralValue))
5805ffd940aSRaphael Isemann     return std::make_unique<ExpressionLiteral>(SaveExpr.drop_back(Expr.size()),
5815ffd940aSRaphael Isemann                                                UnsignedLiteralValue);
5825ffd940aSRaphael Isemann   Expr = SaveExpr;
5835ffd940aSRaphael Isemann   if (AO == AllowedOperand::Any && !Expr.consumeInteger(0, SignedLiteralValue))
5845ffd940aSRaphael Isemann     return std::make_unique<ExpressionLiteral>(SaveExpr.drop_back(Expr.size()),
5855ffd940aSRaphael Isemann                                                SignedLiteralValue);
5865ffd940aSRaphael Isemann 
5875ffd940aSRaphael Isemann   return ErrorDiagnostic::get(
5885ffd940aSRaphael Isemann       SM, Expr,
5895ffd940aSRaphael Isemann       Twine("invalid ") +
5905ffd940aSRaphael Isemann           (MaybeInvalidConstraint ? "matching constraint or " : "") +
5915ffd940aSRaphael Isemann           "operand format");
5925ffd940aSRaphael Isemann }
5935ffd940aSRaphael Isemann 
5945ffd940aSRaphael Isemann Expected<std::unique_ptr<ExpressionAST>>
5955ffd940aSRaphael Isemann Pattern::parseParenExpr(StringRef &Expr, Optional<size_t> LineNumber,
5965ffd940aSRaphael Isemann                         FileCheckPatternContext *Context, const SourceMgr &SM) {
5975ffd940aSRaphael Isemann   Expr = Expr.ltrim(SpaceChars);
5985ffd940aSRaphael Isemann   assert(Expr.startswith("("));
5995ffd940aSRaphael Isemann 
6005ffd940aSRaphael Isemann   // Parse right operand.
6015ffd940aSRaphael Isemann   Expr.consume_front("(");
6025ffd940aSRaphael Isemann   Expr = Expr.ltrim(SpaceChars);
6035ffd940aSRaphael Isemann   if (Expr.empty())
6045ffd940aSRaphael Isemann     return ErrorDiagnostic::get(SM, Expr, "missing operand in expression");
6055ffd940aSRaphael Isemann 
6065ffd940aSRaphael Isemann   // Note: parseNumericOperand handles nested opening parentheses.
6075ffd940aSRaphael Isemann   Expected<std::unique_ptr<ExpressionAST>> SubExprResult = parseNumericOperand(
6085ffd940aSRaphael Isemann       Expr, AllowedOperand::Any, /*MaybeInvalidConstraint=*/false, LineNumber,
6095ffd940aSRaphael Isemann       Context, SM);
6105ffd940aSRaphael Isemann   Expr = Expr.ltrim(SpaceChars);
6115ffd940aSRaphael Isemann   while (SubExprResult && !Expr.empty() && !Expr.startswith(")")) {
6125ffd940aSRaphael Isemann     StringRef OrigExpr = Expr;
6135ffd940aSRaphael Isemann     SubExprResult = parseBinop(OrigExpr, Expr, std::move(*SubExprResult), false,
6145ffd940aSRaphael Isemann                                LineNumber, Context, SM);
6155ffd940aSRaphael Isemann     Expr = Expr.ltrim(SpaceChars);
6165ffd940aSRaphael Isemann   }
6175ffd940aSRaphael Isemann   if (!SubExprResult)
6185ffd940aSRaphael Isemann     return SubExprResult;
6195ffd940aSRaphael Isemann 
6205ffd940aSRaphael Isemann   if (!Expr.consume_front(")")) {
6215ffd940aSRaphael Isemann     return ErrorDiagnostic::get(SM, Expr,
6225ffd940aSRaphael Isemann                                 "missing ')' at end of nested expression");
6235ffd940aSRaphael Isemann   }
6245ffd940aSRaphael Isemann   return SubExprResult;
6255ffd940aSRaphael Isemann }
6265ffd940aSRaphael Isemann 
6275ffd940aSRaphael Isemann Expected<std::unique_ptr<ExpressionAST>>
6285ffd940aSRaphael Isemann Pattern::parseBinop(StringRef Expr, StringRef &RemainingExpr,
6295ffd940aSRaphael Isemann                     std::unique_ptr<ExpressionAST> LeftOp,
6305ffd940aSRaphael Isemann                     bool IsLegacyLineExpr, Optional<size_t> LineNumber,
6315ffd940aSRaphael Isemann                     FileCheckPatternContext *Context, const SourceMgr &SM) {
6325ffd940aSRaphael Isemann   RemainingExpr = RemainingExpr.ltrim(SpaceChars);
6335ffd940aSRaphael Isemann   if (RemainingExpr.empty())
6345ffd940aSRaphael Isemann     return std::move(LeftOp);
6355ffd940aSRaphael Isemann 
6365ffd940aSRaphael Isemann   // Check if this is a supported operation and select a function to perform
6375ffd940aSRaphael Isemann   // it.
6385ffd940aSRaphael Isemann   SMLoc OpLoc = SMLoc::getFromPointer(RemainingExpr.data());
6395ffd940aSRaphael Isemann   char Operator = popFront(RemainingExpr);
6405ffd940aSRaphael Isemann   binop_eval_t EvalBinop;
6415ffd940aSRaphael Isemann   switch (Operator) {
6425ffd940aSRaphael Isemann   case '+':
6435ffd940aSRaphael Isemann     EvalBinop = operator+;
6445ffd940aSRaphael Isemann     break;
6455ffd940aSRaphael Isemann   case '-':
6465ffd940aSRaphael Isemann     EvalBinop = operator-;
6475ffd940aSRaphael Isemann     break;
6485ffd940aSRaphael Isemann   default:
6495ffd940aSRaphael Isemann     return ErrorDiagnostic::get(
6505ffd940aSRaphael Isemann         SM, OpLoc, Twine("unsupported operation '") + Twine(Operator) + "'");
6515ffd940aSRaphael Isemann   }
6525ffd940aSRaphael Isemann 
6535ffd940aSRaphael Isemann   // Parse right operand.
6545ffd940aSRaphael Isemann   RemainingExpr = RemainingExpr.ltrim(SpaceChars);
6555ffd940aSRaphael Isemann   if (RemainingExpr.empty())
6565ffd940aSRaphael Isemann     return ErrorDiagnostic::get(SM, RemainingExpr,
6575ffd940aSRaphael Isemann                                 "missing operand in expression");
6585ffd940aSRaphael Isemann   // The second operand in a legacy @LINE expression is always a literal.
6595ffd940aSRaphael Isemann   AllowedOperand AO =
6605ffd940aSRaphael Isemann       IsLegacyLineExpr ? AllowedOperand::LegacyLiteral : AllowedOperand::Any;
6615ffd940aSRaphael Isemann   Expected<std::unique_ptr<ExpressionAST>> RightOpResult =
6625ffd940aSRaphael Isemann       parseNumericOperand(RemainingExpr, AO, /*MaybeInvalidConstraint=*/false,
6635ffd940aSRaphael Isemann                           LineNumber, Context, SM);
6645ffd940aSRaphael Isemann   if (!RightOpResult)
6655ffd940aSRaphael Isemann     return RightOpResult;
6665ffd940aSRaphael Isemann 
6675ffd940aSRaphael Isemann   Expr = Expr.drop_back(RemainingExpr.size());
6685ffd940aSRaphael Isemann   return std::make_unique<BinaryOperation>(Expr, EvalBinop, std::move(LeftOp),
6695ffd940aSRaphael Isemann                                            std::move(*RightOpResult));
6705ffd940aSRaphael Isemann }
6715ffd940aSRaphael Isemann 
6725ffd940aSRaphael Isemann Expected<std::unique_ptr<ExpressionAST>>
6735ffd940aSRaphael Isemann Pattern::parseCallExpr(StringRef &Expr, StringRef FuncName,
6745ffd940aSRaphael Isemann                        Optional<size_t> LineNumber,
6755ffd940aSRaphael Isemann                        FileCheckPatternContext *Context, const SourceMgr &SM) {
6765ffd940aSRaphael Isemann   Expr = Expr.ltrim(SpaceChars);
6775ffd940aSRaphael Isemann   assert(Expr.startswith("("));
6785ffd940aSRaphael Isemann 
6795ffd940aSRaphael Isemann   auto OptFunc = StringSwitch<Optional<binop_eval_t>>(FuncName)
6805ffd940aSRaphael Isemann                      .Case("add", operator+)
6815ffd940aSRaphael Isemann                      .Case("div", operator/)
6825ffd940aSRaphael Isemann                      .Case("max", max)
6835ffd940aSRaphael Isemann                      .Case("min", min)
6845ffd940aSRaphael Isemann                      .Case("mul", operator*)
6855ffd940aSRaphael Isemann                      .Case("sub", operator-)
6865ffd940aSRaphael Isemann                      .Default(None);
6875ffd940aSRaphael Isemann 
6885ffd940aSRaphael Isemann   if (!OptFunc)
6895ffd940aSRaphael Isemann     return ErrorDiagnostic::get(
6905ffd940aSRaphael Isemann         SM, FuncName, Twine("call to undefined function '") + FuncName + "'");
6915ffd940aSRaphael Isemann 
6925ffd940aSRaphael Isemann   Expr.consume_front("(");
6935ffd940aSRaphael Isemann   Expr = Expr.ltrim(SpaceChars);
6945ffd940aSRaphael Isemann 
6955ffd940aSRaphael Isemann   // Parse call arguments, which are comma separated.
6965ffd940aSRaphael Isemann   SmallVector<std::unique_ptr<ExpressionAST>, 4> Args;
6975ffd940aSRaphael Isemann   while (!Expr.empty() && !Expr.startswith(")")) {
6985ffd940aSRaphael Isemann     if (Expr.startswith(","))
6995ffd940aSRaphael Isemann       return ErrorDiagnostic::get(SM, Expr, "missing argument");
7005ffd940aSRaphael Isemann 
7015ffd940aSRaphael Isemann     // Parse the argument, which is an arbitary expression.
7025ffd940aSRaphael Isemann     StringRef OuterBinOpExpr = Expr;
7035ffd940aSRaphael Isemann     Expected<std::unique_ptr<ExpressionAST>> Arg = parseNumericOperand(
7045ffd940aSRaphael Isemann         Expr, AllowedOperand::Any, /*MaybeInvalidConstraint=*/false, LineNumber,
7055ffd940aSRaphael Isemann         Context, SM);
7065ffd940aSRaphael Isemann     while (Arg && !Expr.empty()) {
7075ffd940aSRaphael Isemann       Expr = Expr.ltrim(SpaceChars);
7085ffd940aSRaphael Isemann       // Have we reached an argument terminator?
7095ffd940aSRaphael Isemann       if (Expr.startswith(",") || Expr.startswith(")"))
7105ffd940aSRaphael Isemann         break;
7115ffd940aSRaphael Isemann 
7125ffd940aSRaphael Isemann       // Arg = Arg <op> <expr>
7135ffd940aSRaphael Isemann       Arg = parseBinop(OuterBinOpExpr, Expr, std::move(*Arg), false, LineNumber,
7145ffd940aSRaphael Isemann                        Context, SM);
7155ffd940aSRaphael Isemann     }
7165ffd940aSRaphael Isemann 
7175ffd940aSRaphael Isemann     // Prefer an expression error over a generic invalid argument message.
7185ffd940aSRaphael Isemann     if (!Arg)
7195ffd940aSRaphael Isemann       return Arg.takeError();
7205ffd940aSRaphael Isemann     Args.push_back(std::move(*Arg));
7215ffd940aSRaphael Isemann 
7225ffd940aSRaphael Isemann     // Have we parsed all available arguments?
7235ffd940aSRaphael Isemann     Expr = Expr.ltrim(SpaceChars);
7245ffd940aSRaphael Isemann     if (!Expr.consume_front(","))
7255ffd940aSRaphael Isemann       break;
7265ffd940aSRaphael Isemann 
7275ffd940aSRaphael Isemann     Expr = Expr.ltrim(SpaceChars);
7285ffd940aSRaphael Isemann     if (Expr.startswith(")"))
7295ffd940aSRaphael Isemann       return ErrorDiagnostic::get(SM, Expr, "missing argument");
7305ffd940aSRaphael Isemann   }
7315ffd940aSRaphael Isemann 
7325ffd940aSRaphael Isemann   if (!Expr.consume_front(")"))
7335ffd940aSRaphael Isemann     return ErrorDiagnostic::get(SM, Expr,
7345ffd940aSRaphael Isemann                                 "missing ')' at end of call expression");
7355ffd940aSRaphael Isemann 
7365ffd940aSRaphael Isemann   const unsigned NumArgs = Args.size();
7375ffd940aSRaphael Isemann   if (NumArgs == 2)
7385ffd940aSRaphael Isemann     return std::make_unique<BinaryOperation>(Expr, *OptFunc, std::move(Args[0]),
7395ffd940aSRaphael Isemann                                              std::move(Args[1]));
7405ffd940aSRaphael Isemann 
7415ffd940aSRaphael Isemann   // TODO: Support more than binop_eval_t.
7425ffd940aSRaphael Isemann   return ErrorDiagnostic::get(SM, FuncName,
7435ffd940aSRaphael Isemann                               Twine("function '") + FuncName +
7445ffd940aSRaphael Isemann                                   Twine("' takes 2 arguments but ") +
7455ffd940aSRaphael Isemann                                   Twine(NumArgs) + " given");
7465ffd940aSRaphael Isemann }
7475ffd940aSRaphael Isemann 
7485ffd940aSRaphael Isemann Expected<std::unique_ptr<Expression>> Pattern::parseNumericSubstitutionBlock(
7495ffd940aSRaphael Isemann     StringRef Expr, Optional<NumericVariable *> &DefinedNumericVariable,
7505ffd940aSRaphael Isemann     bool IsLegacyLineExpr, Optional<size_t> LineNumber,
7515ffd940aSRaphael Isemann     FileCheckPatternContext *Context, const SourceMgr &SM) {
7525ffd940aSRaphael Isemann   std::unique_ptr<ExpressionAST> ExpressionASTPointer = nullptr;
7535ffd940aSRaphael Isemann   StringRef DefExpr = StringRef();
7545ffd940aSRaphael Isemann   DefinedNumericVariable = None;
7555ffd940aSRaphael Isemann   ExpressionFormat ExplicitFormat = ExpressionFormat();
7565ffd940aSRaphael Isemann   unsigned Precision = 0;
7575ffd940aSRaphael Isemann 
7585ffd940aSRaphael Isemann   // Parse format specifier (NOTE: ',' is also an argument seperator).
7595ffd940aSRaphael Isemann   size_t FormatSpecEnd = Expr.find(',');
7605ffd940aSRaphael Isemann   size_t FunctionStart = Expr.find('(');
7615ffd940aSRaphael Isemann   if (FormatSpecEnd != StringRef::npos && FormatSpecEnd < FunctionStart) {
7625ffd940aSRaphael Isemann     StringRef FormatExpr = Expr.take_front(FormatSpecEnd);
7635ffd940aSRaphael Isemann     Expr = Expr.drop_front(FormatSpecEnd + 1);
7645ffd940aSRaphael Isemann     FormatExpr = FormatExpr.trim(SpaceChars);
7655ffd940aSRaphael Isemann     if (!FormatExpr.consume_front("%"))
7665ffd940aSRaphael Isemann       return ErrorDiagnostic::get(
7675ffd940aSRaphael Isemann           SM, FormatExpr,
7685ffd940aSRaphael Isemann           "invalid matching format specification in expression");
7695ffd940aSRaphael Isemann 
7705ffd940aSRaphael Isemann     // Parse precision.
7715ffd940aSRaphael Isemann     if (FormatExpr.consume_front(".")) {
7725ffd940aSRaphael Isemann       if (FormatExpr.consumeInteger(10, Precision))
7735ffd940aSRaphael Isemann         return ErrorDiagnostic::get(SM, FormatExpr,
7745ffd940aSRaphael Isemann                                     "invalid precision in format specifier");
7755ffd940aSRaphael Isemann     }
7765ffd940aSRaphael Isemann 
7775ffd940aSRaphael Isemann     if (!FormatExpr.empty()) {
7785ffd940aSRaphael Isemann       // Check for unknown matching format specifier and set matching format in
7795ffd940aSRaphael Isemann       // class instance representing this expression.
7805ffd940aSRaphael Isemann       SMLoc FmtLoc = SMLoc::getFromPointer(FormatExpr.data());
7815ffd940aSRaphael Isemann       switch (popFront(FormatExpr)) {
7825ffd940aSRaphael Isemann       case 'u':
7835ffd940aSRaphael Isemann         ExplicitFormat =
7845ffd940aSRaphael Isemann             ExpressionFormat(ExpressionFormat::Kind::Unsigned, Precision);
7855ffd940aSRaphael Isemann         break;
7865ffd940aSRaphael Isemann       case 'd':
7875ffd940aSRaphael Isemann         ExplicitFormat =
7885ffd940aSRaphael Isemann             ExpressionFormat(ExpressionFormat::Kind::Signed, Precision);
7895ffd940aSRaphael Isemann         break;
7905ffd940aSRaphael Isemann       case 'x':
7915ffd940aSRaphael Isemann         ExplicitFormat =
7925ffd940aSRaphael Isemann             ExpressionFormat(ExpressionFormat::Kind::HexLower, Precision);
7935ffd940aSRaphael Isemann         break;
7945ffd940aSRaphael Isemann       case 'X':
7955ffd940aSRaphael Isemann         ExplicitFormat =
7965ffd940aSRaphael Isemann             ExpressionFormat(ExpressionFormat::Kind::HexUpper, Precision);
7975ffd940aSRaphael Isemann         break;
7985ffd940aSRaphael Isemann       default:
7995ffd940aSRaphael Isemann         return ErrorDiagnostic::get(SM, FmtLoc,
8005ffd940aSRaphael Isemann                                     "invalid format specifier in expression");
8015ffd940aSRaphael Isemann       }
8025ffd940aSRaphael Isemann     }
8035ffd940aSRaphael Isemann 
8045ffd940aSRaphael Isemann     FormatExpr = FormatExpr.ltrim(SpaceChars);
8055ffd940aSRaphael Isemann     if (!FormatExpr.empty())
8065ffd940aSRaphael Isemann       return ErrorDiagnostic::get(
8075ffd940aSRaphael Isemann           SM, FormatExpr,
8085ffd940aSRaphael Isemann           "invalid matching format specification in expression");
8095ffd940aSRaphael Isemann   }
8105ffd940aSRaphael Isemann 
8115ffd940aSRaphael Isemann   // Save variable definition expression if any.
8125ffd940aSRaphael Isemann   size_t DefEnd = Expr.find(':');
8135ffd940aSRaphael Isemann   if (DefEnd != StringRef::npos) {
8145ffd940aSRaphael Isemann     DefExpr = Expr.substr(0, DefEnd);
8155ffd940aSRaphael Isemann     Expr = Expr.substr(DefEnd + 1);
8165ffd940aSRaphael Isemann   }
8175ffd940aSRaphael Isemann 
8185ffd940aSRaphael Isemann   // Parse matching constraint.
8195ffd940aSRaphael Isemann   Expr = Expr.ltrim(SpaceChars);
8205ffd940aSRaphael Isemann   bool HasParsedValidConstraint = false;
8215ffd940aSRaphael Isemann   if (Expr.consume_front("=="))
8225ffd940aSRaphael Isemann     HasParsedValidConstraint = true;
8235ffd940aSRaphael Isemann 
8245ffd940aSRaphael Isemann   // Parse the expression itself.
8255ffd940aSRaphael Isemann   Expr = Expr.ltrim(SpaceChars);
8265ffd940aSRaphael Isemann   if (Expr.empty()) {
8275ffd940aSRaphael Isemann     if (HasParsedValidConstraint)
8285ffd940aSRaphael Isemann       return ErrorDiagnostic::get(
8295ffd940aSRaphael Isemann           SM, Expr, "empty numeric expression should not have a constraint");
8305ffd940aSRaphael Isemann   } else {
8315ffd940aSRaphael Isemann     Expr = Expr.rtrim(SpaceChars);
8325ffd940aSRaphael Isemann     StringRef OuterBinOpExpr = Expr;
8335ffd940aSRaphael Isemann     // The first operand in a legacy @LINE expression is always the @LINE
8345ffd940aSRaphael Isemann     // pseudo variable.
8355ffd940aSRaphael Isemann     AllowedOperand AO =
8365ffd940aSRaphael Isemann         IsLegacyLineExpr ? AllowedOperand::LineVar : AllowedOperand::Any;
8375ffd940aSRaphael Isemann     Expected<std::unique_ptr<ExpressionAST>> ParseResult = parseNumericOperand(
8385ffd940aSRaphael Isemann         Expr, AO, !HasParsedValidConstraint, LineNumber, Context, SM);
8395ffd940aSRaphael Isemann     while (ParseResult && !Expr.empty()) {
8405ffd940aSRaphael Isemann       ParseResult = parseBinop(OuterBinOpExpr, Expr, std::move(*ParseResult),
8415ffd940aSRaphael Isemann                                IsLegacyLineExpr, LineNumber, Context, SM);
8425ffd940aSRaphael Isemann       // Legacy @LINE expressions only allow 2 operands.
8435ffd940aSRaphael Isemann       if (ParseResult && IsLegacyLineExpr && !Expr.empty())
8445ffd940aSRaphael Isemann         return ErrorDiagnostic::get(
8455ffd940aSRaphael Isemann             SM, Expr,
8465ffd940aSRaphael Isemann             "unexpected characters at end of expression '" + Expr + "'");
8475ffd940aSRaphael Isemann     }
8485ffd940aSRaphael Isemann     if (!ParseResult)
8495ffd940aSRaphael Isemann       return ParseResult.takeError();
8505ffd940aSRaphael Isemann     ExpressionASTPointer = std::move(*ParseResult);
8515ffd940aSRaphael Isemann   }
8525ffd940aSRaphael Isemann 
8535ffd940aSRaphael Isemann   // Select format of the expression, i.e. (i) its explicit format, if any,
8545ffd940aSRaphael Isemann   // otherwise (ii) its implicit format, if any, otherwise (iii) the default
8555ffd940aSRaphael Isemann   // format (unsigned). Error out in case of conflicting implicit format
8565ffd940aSRaphael Isemann   // without explicit format.
8575ffd940aSRaphael Isemann   ExpressionFormat Format;
8585ffd940aSRaphael Isemann   if (ExplicitFormat)
8595ffd940aSRaphael Isemann     Format = ExplicitFormat;
8605ffd940aSRaphael Isemann   else if (ExpressionASTPointer) {
8615ffd940aSRaphael Isemann     Expected<ExpressionFormat> ImplicitFormat =
8625ffd940aSRaphael Isemann         ExpressionASTPointer->getImplicitFormat(SM);
8635ffd940aSRaphael Isemann     if (!ImplicitFormat)
8645ffd940aSRaphael Isemann       return ImplicitFormat.takeError();
8655ffd940aSRaphael Isemann     Format = *ImplicitFormat;
8665ffd940aSRaphael Isemann   }
8675ffd940aSRaphael Isemann   if (!Format)
8685ffd940aSRaphael Isemann     Format = ExpressionFormat(ExpressionFormat::Kind::Unsigned, Precision);
8695ffd940aSRaphael Isemann 
8705ffd940aSRaphael Isemann   std::unique_ptr<Expression> ExpressionPointer =
8715ffd940aSRaphael Isemann       std::make_unique<Expression>(std::move(ExpressionASTPointer), Format);
8725ffd940aSRaphael Isemann 
8735ffd940aSRaphael Isemann   // Parse the numeric variable definition.
8745ffd940aSRaphael Isemann   if (DefEnd != StringRef::npos) {
8755ffd940aSRaphael Isemann     DefExpr = DefExpr.ltrim(SpaceChars);
8765ffd940aSRaphael Isemann     Expected<NumericVariable *> ParseResult = parseNumericVariableDefinition(
8775ffd940aSRaphael Isemann         DefExpr, Context, LineNumber, ExpressionPointer->getFormat(), SM);
8785ffd940aSRaphael Isemann 
8795ffd940aSRaphael Isemann     if (!ParseResult)
8805ffd940aSRaphael Isemann       return ParseResult.takeError();
8815ffd940aSRaphael Isemann     DefinedNumericVariable = *ParseResult;
8825ffd940aSRaphael Isemann   }
8835ffd940aSRaphael Isemann 
8845ffd940aSRaphael Isemann   return std::move(ExpressionPointer);
8855ffd940aSRaphael Isemann }
8865ffd940aSRaphael Isemann 
8875ffd940aSRaphael Isemann bool Pattern::parsePattern(StringRef PatternStr, StringRef Prefix,
8885ffd940aSRaphael Isemann                            SourceMgr &SM, const FileCheckRequest &Req) {
8895ffd940aSRaphael Isemann   bool MatchFullLinesHere = Req.MatchFullLines && CheckTy != Check::CheckNot;
8905ffd940aSRaphael Isemann   IgnoreCase = Req.IgnoreCase;
8915ffd940aSRaphael Isemann 
8925ffd940aSRaphael Isemann   PatternLoc = SMLoc::getFromPointer(PatternStr.data());
8935ffd940aSRaphael Isemann 
8945ffd940aSRaphael Isemann   if (!(Req.NoCanonicalizeWhiteSpace && Req.MatchFullLines))
8955ffd940aSRaphael Isemann     // Ignore trailing whitespace.
8965ffd940aSRaphael Isemann     while (!PatternStr.empty() &&
8975ffd940aSRaphael Isemann            (PatternStr.back() == ' ' || PatternStr.back() == '\t'))
8985ffd940aSRaphael Isemann       PatternStr = PatternStr.substr(0, PatternStr.size() - 1);
8995ffd940aSRaphael Isemann 
9005ffd940aSRaphael Isemann   // Check that there is something on the line.
9015ffd940aSRaphael Isemann   if (PatternStr.empty() && CheckTy != Check::CheckEmpty) {
9025ffd940aSRaphael Isemann     SM.PrintMessage(PatternLoc, SourceMgr::DK_Error,
9035ffd940aSRaphael Isemann                     "found empty check string with prefix '" + Prefix + ":'");
9045ffd940aSRaphael Isemann     return true;
9055ffd940aSRaphael Isemann   }
9065ffd940aSRaphael Isemann 
9075ffd940aSRaphael Isemann   if (!PatternStr.empty() && CheckTy == Check::CheckEmpty) {
9085ffd940aSRaphael Isemann     SM.PrintMessage(
9095ffd940aSRaphael Isemann         PatternLoc, SourceMgr::DK_Error,
9105ffd940aSRaphael Isemann         "found non-empty check string for empty check with prefix '" + Prefix +
9115ffd940aSRaphael Isemann             ":'");
9125ffd940aSRaphael Isemann     return true;
9135ffd940aSRaphael Isemann   }
9145ffd940aSRaphael Isemann 
9155ffd940aSRaphael Isemann   if (CheckTy == Check::CheckEmpty) {
9165ffd940aSRaphael Isemann     RegExStr = "(\n$)";
9175ffd940aSRaphael Isemann     return false;
9185ffd940aSRaphael Isemann   }
9195ffd940aSRaphael Isemann 
92044f399ccSJacques Pienaar   // If literal check, set fixed string.
92144f399ccSJacques Pienaar   if (CheckTy.isLiteralMatch()) {
92244f399ccSJacques Pienaar     FixedStr = PatternStr;
92344f399ccSJacques Pienaar     return false;
92444f399ccSJacques Pienaar   }
92544f399ccSJacques Pienaar 
9265ffd940aSRaphael Isemann   // Check to see if this is a fixed string, or if it has regex pieces.
9275ffd940aSRaphael Isemann   if (!MatchFullLinesHere &&
9285ffd940aSRaphael Isemann       (PatternStr.size() < 2 || (PatternStr.find("{{") == StringRef::npos &&
9295ffd940aSRaphael Isemann                                  PatternStr.find("[[") == StringRef::npos))) {
9305ffd940aSRaphael Isemann     FixedStr = PatternStr;
9315ffd940aSRaphael Isemann     return false;
9325ffd940aSRaphael Isemann   }
9335ffd940aSRaphael Isemann 
9345ffd940aSRaphael Isemann   if (MatchFullLinesHere) {
9355ffd940aSRaphael Isemann     RegExStr += '^';
9365ffd940aSRaphael Isemann     if (!Req.NoCanonicalizeWhiteSpace)
9375ffd940aSRaphael Isemann       RegExStr += " *";
9385ffd940aSRaphael Isemann   }
9395ffd940aSRaphael Isemann 
9405ffd940aSRaphael Isemann   // Paren value #0 is for the fully matched string.  Any new parenthesized
9415ffd940aSRaphael Isemann   // values add from there.
9425ffd940aSRaphael Isemann   unsigned CurParen = 1;
9435ffd940aSRaphael Isemann 
9445ffd940aSRaphael Isemann   // Otherwise, there is at least one regex piece.  Build up the regex pattern
9455ffd940aSRaphael Isemann   // by escaping scary characters in fixed strings, building up one big regex.
9465ffd940aSRaphael Isemann   while (!PatternStr.empty()) {
9475ffd940aSRaphael Isemann     // RegEx matches.
9485ffd940aSRaphael Isemann     if (PatternStr.startswith("{{")) {
9495ffd940aSRaphael Isemann       // This is the start of a regex match.  Scan for the }}.
9505ffd940aSRaphael Isemann       size_t End = PatternStr.find("}}");
9515ffd940aSRaphael Isemann       if (End == StringRef::npos) {
9525ffd940aSRaphael Isemann         SM.PrintMessage(SMLoc::getFromPointer(PatternStr.data()),
9535ffd940aSRaphael Isemann                         SourceMgr::DK_Error,
9545ffd940aSRaphael Isemann                         "found start of regex string with no end '}}'");
9555ffd940aSRaphael Isemann         return true;
9565ffd940aSRaphael Isemann       }
9575ffd940aSRaphael Isemann 
9585ffd940aSRaphael Isemann       // Enclose {{}} patterns in parens just like [[]] even though we're not
9595ffd940aSRaphael Isemann       // capturing the result for any purpose.  This is required in case the
9605ffd940aSRaphael Isemann       // expression contains an alternation like: CHECK:  abc{{x|z}}def.  We
9615ffd940aSRaphael Isemann       // want this to turn into: "abc(x|z)def" not "abcx|zdef".
9625ffd940aSRaphael Isemann       RegExStr += '(';
9635ffd940aSRaphael Isemann       ++CurParen;
9645ffd940aSRaphael Isemann 
9655ffd940aSRaphael Isemann       if (AddRegExToRegEx(PatternStr.substr(2, End - 2), CurParen, SM))
9665ffd940aSRaphael Isemann         return true;
9675ffd940aSRaphael Isemann       RegExStr += ')';
9685ffd940aSRaphael Isemann 
9695ffd940aSRaphael Isemann       PatternStr = PatternStr.substr(End + 2);
9705ffd940aSRaphael Isemann       continue;
9715ffd940aSRaphael Isemann     }
9725ffd940aSRaphael Isemann 
9735ffd940aSRaphael Isemann     // String and numeric substitution blocks. Pattern substitution blocks come
9745ffd940aSRaphael Isemann     // in two forms: [[foo:.*]] and [[foo]]. The former matches .* (or some
9755ffd940aSRaphael Isemann     // other regex) and assigns it to the string variable 'foo'. The latter
9765ffd940aSRaphael Isemann     // substitutes foo's value. Numeric substitution blocks recognize the same
9775ffd940aSRaphael Isemann     // form as string ones, but start with a '#' sign after the double
9785ffd940aSRaphael Isemann     // brackets. They also accept a combined form which sets a numeric variable
9795ffd940aSRaphael Isemann     // to the evaluation of an expression. Both string and numeric variable
9805ffd940aSRaphael Isemann     // names must satisfy the regular expression "[a-zA-Z_][0-9a-zA-Z_]*" to be
9815ffd940aSRaphael Isemann     // valid, as this helps catch some common errors.
9825ffd940aSRaphael Isemann     if (PatternStr.startswith("[[")) {
9835ffd940aSRaphael Isemann       StringRef UnparsedPatternStr = PatternStr.substr(2);
9845ffd940aSRaphael Isemann       // Find the closing bracket pair ending the match.  End is going to be an
9855ffd940aSRaphael Isemann       // offset relative to the beginning of the match string.
9865ffd940aSRaphael Isemann       size_t End = FindRegexVarEnd(UnparsedPatternStr, SM);
9875ffd940aSRaphael Isemann       StringRef MatchStr = UnparsedPatternStr.substr(0, End);
9885ffd940aSRaphael Isemann       bool IsNumBlock = MatchStr.consume_front("#");
9895ffd940aSRaphael Isemann 
9905ffd940aSRaphael Isemann       if (End == StringRef::npos) {
9915ffd940aSRaphael Isemann         SM.PrintMessage(SMLoc::getFromPointer(PatternStr.data()),
9925ffd940aSRaphael Isemann                         SourceMgr::DK_Error,
9935ffd940aSRaphael Isemann                         "Invalid substitution block, no ]] found");
9945ffd940aSRaphael Isemann         return true;
9955ffd940aSRaphael Isemann       }
9965ffd940aSRaphael Isemann       // Strip the substitution block we are parsing. End points to the start
9975ffd940aSRaphael Isemann       // of the "]]" closing the expression so account for it in computing the
9985ffd940aSRaphael Isemann       // index of the first unparsed character.
9995ffd940aSRaphael Isemann       PatternStr = UnparsedPatternStr.substr(End + 2);
10005ffd940aSRaphael Isemann 
10015ffd940aSRaphael Isemann       bool IsDefinition = false;
10025ffd940aSRaphael Isemann       bool SubstNeeded = false;
10035ffd940aSRaphael Isemann       // Whether the substitution block is a legacy use of @LINE with string
10045ffd940aSRaphael Isemann       // substitution block syntax.
10055ffd940aSRaphael Isemann       bool IsLegacyLineExpr = false;
10065ffd940aSRaphael Isemann       StringRef DefName;
10075ffd940aSRaphael Isemann       StringRef SubstStr;
10085ffd940aSRaphael Isemann       std::string MatchRegexp;
10095ffd940aSRaphael Isemann       size_t SubstInsertIdx = RegExStr.size();
10105ffd940aSRaphael Isemann 
10115ffd940aSRaphael Isemann       // Parse string variable or legacy @LINE expression.
10125ffd940aSRaphael Isemann       if (!IsNumBlock) {
1013c70f3686SFangrui Song         size_t VarEndIdx = MatchStr.find(':');
10145ffd940aSRaphael Isemann         size_t SpacePos = MatchStr.substr(0, VarEndIdx).find_first_of(" \t");
10155ffd940aSRaphael Isemann         if (SpacePos != StringRef::npos) {
10165ffd940aSRaphael Isemann           SM.PrintMessage(SMLoc::getFromPointer(MatchStr.data() + SpacePos),
10175ffd940aSRaphael Isemann                           SourceMgr::DK_Error, "unexpected whitespace");
10185ffd940aSRaphael Isemann           return true;
10195ffd940aSRaphael Isemann         }
10205ffd940aSRaphael Isemann 
10215ffd940aSRaphael Isemann         // Get the name (e.g. "foo") and verify it is well formed.
10225ffd940aSRaphael Isemann         StringRef OrigMatchStr = MatchStr;
10235ffd940aSRaphael Isemann         Expected<Pattern::VariableProperties> ParseVarResult =
10245ffd940aSRaphael Isemann             parseVariable(MatchStr, SM);
10255ffd940aSRaphael Isemann         if (!ParseVarResult) {
10265ffd940aSRaphael Isemann           logAllUnhandledErrors(ParseVarResult.takeError(), errs());
10275ffd940aSRaphael Isemann           return true;
10285ffd940aSRaphael Isemann         }
10295ffd940aSRaphael Isemann         StringRef Name = ParseVarResult->Name;
10305ffd940aSRaphael Isemann         bool IsPseudo = ParseVarResult->IsPseudo;
10315ffd940aSRaphael Isemann 
10325ffd940aSRaphael Isemann         IsDefinition = (VarEndIdx != StringRef::npos);
10335ffd940aSRaphael Isemann         SubstNeeded = !IsDefinition;
10345ffd940aSRaphael Isemann         if (IsDefinition) {
10355ffd940aSRaphael Isemann           if ((IsPseudo || !MatchStr.consume_front(":"))) {
10365ffd940aSRaphael Isemann             SM.PrintMessage(SMLoc::getFromPointer(Name.data()),
10375ffd940aSRaphael Isemann                             SourceMgr::DK_Error,
10385ffd940aSRaphael Isemann                             "invalid name in string variable definition");
10395ffd940aSRaphael Isemann             return true;
10405ffd940aSRaphael Isemann           }
10415ffd940aSRaphael Isemann 
10425ffd940aSRaphael Isemann           // Detect collisions between string and numeric variables when the
10435ffd940aSRaphael Isemann           // former is created later than the latter.
10445ffd940aSRaphael Isemann           if (Context->GlobalNumericVariableTable.find(Name) !=
10455ffd940aSRaphael Isemann               Context->GlobalNumericVariableTable.end()) {
10465ffd940aSRaphael Isemann             SM.PrintMessage(
10475ffd940aSRaphael Isemann                 SMLoc::getFromPointer(Name.data()), SourceMgr::DK_Error,
10485ffd940aSRaphael Isemann                 "numeric variable with name '" + Name + "' already exists");
10495ffd940aSRaphael Isemann             return true;
10505ffd940aSRaphael Isemann           }
10515ffd940aSRaphael Isemann           DefName = Name;
10525ffd940aSRaphael Isemann           MatchRegexp = MatchStr.str();
10535ffd940aSRaphael Isemann         } else {
10545ffd940aSRaphael Isemann           if (IsPseudo) {
10555ffd940aSRaphael Isemann             MatchStr = OrigMatchStr;
10565ffd940aSRaphael Isemann             IsLegacyLineExpr = IsNumBlock = true;
10575ffd940aSRaphael Isemann           } else
10585ffd940aSRaphael Isemann             SubstStr = Name;
10595ffd940aSRaphael Isemann         }
10605ffd940aSRaphael Isemann       }
10615ffd940aSRaphael Isemann 
10625ffd940aSRaphael Isemann       // Parse numeric substitution block.
10635ffd940aSRaphael Isemann       std::unique_ptr<Expression> ExpressionPointer;
10645ffd940aSRaphael Isemann       Optional<NumericVariable *> DefinedNumericVariable;
10655ffd940aSRaphael Isemann       if (IsNumBlock) {
10665ffd940aSRaphael Isemann         Expected<std::unique_ptr<Expression>> ParseResult =
10675ffd940aSRaphael Isemann             parseNumericSubstitutionBlock(MatchStr, DefinedNumericVariable,
10685ffd940aSRaphael Isemann                                           IsLegacyLineExpr, LineNumber, Context,
10695ffd940aSRaphael Isemann                                           SM);
10705ffd940aSRaphael Isemann         if (!ParseResult) {
10715ffd940aSRaphael Isemann           logAllUnhandledErrors(ParseResult.takeError(), errs());
10725ffd940aSRaphael Isemann           return true;
10735ffd940aSRaphael Isemann         }
10745ffd940aSRaphael Isemann         ExpressionPointer = std::move(*ParseResult);
10755ffd940aSRaphael Isemann         SubstNeeded = ExpressionPointer->getAST() != nullptr;
10765ffd940aSRaphael Isemann         if (DefinedNumericVariable) {
10775ffd940aSRaphael Isemann           IsDefinition = true;
10785ffd940aSRaphael Isemann           DefName = (*DefinedNumericVariable)->getName();
10795ffd940aSRaphael Isemann         }
10805ffd940aSRaphael Isemann         if (SubstNeeded)
10815ffd940aSRaphael Isemann           SubstStr = MatchStr;
10825ffd940aSRaphael Isemann         else {
10835ffd940aSRaphael Isemann           ExpressionFormat Format = ExpressionPointer->getFormat();
10845ffd940aSRaphael Isemann           MatchRegexp = cantFail(Format.getWildcardRegex());
10855ffd940aSRaphael Isemann         }
10865ffd940aSRaphael Isemann       }
10875ffd940aSRaphael Isemann 
10885ffd940aSRaphael Isemann       // Handle variable definition: [[<def>:(...)]] and [[#(...)<def>:(...)]].
10895ffd940aSRaphael Isemann       if (IsDefinition) {
10905ffd940aSRaphael Isemann         RegExStr += '(';
10915ffd940aSRaphael Isemann         ++SubstInsertIdx;
10925ffd940aSRaphael Isemann 
10935ffd940aSRaphael Isemann         if (IsNumBlock) {
10945ffd940aSRaphael Isemann           NumericVariableMatch NumericVariableDefinition = {
10955ffd940aSRaphael Isemann               *DefinedNumericVariable, CurParen};
10965ffd940aSRaphael Isemann           NumericVariableDefs[DefName] = NumericVariableDefinition;
10975ffd940aSRaphael Isemann           // This store is done here rather than in match() to allow
10985ffd940aSRaphael Isemann           // parseNumericVariableUse() to get the pointer to the class instance
10995ffd940aSRaphael Isemann           // of the right variable definition corresponding to a given numeric
11005ffd940aSRaphael Isemann           // variable use.
11015ffd940aSRaphael Isemann           Context->GlobalNumericVariableTable[DefName] =
11025ffd940aSRaphael Isemann               *DefinedNumericVariable;
11035ffd940aSRaphael Isemann         } else {
11045ffd940aSRaphael Isemann           VariableDefs[DefName] = CurParen;
11055ffd940aSRaphael Isemann           // Mark string variable as defined to detect collisions between
11065ffd940aSRaphael Isemann           // string and numeric variables in parseNumericVariableUse() and
11075ffd940aSRaphael Isemann           // defineCmdlineVariables() when the latter is created later than the
11085ffd940aSRaphael Isemann           // former. We cannot reuse GlobalVariableTable for this by populating
11095ffd940aSRaphael Isemann           // it with an empty string since we would then lose the ability to
11105ffd940aSRaphael Isemann           // detect the use of an undefined variable in match().
11115ffd940aSRaphael Isemann           Context->DefinedVariableTable[DefName] = true;
11125ffd940aSRaphael Isemann         }
11135ffd940aSRaphael Isemann 
11145ffd940aSRaphael Isemann         ++CurParen;
11155ffd940aSRaphael Isemann       }
11165ffd940aSRaphael Isemann 
11175ffd940aSRaphael Isemann       if (!MatchRegexp.empty() && AddRegExToRegEx(MatchRegexp, CurParen, SM))
11185ffd940aSRaphael Isemann         return true;
11195ffd940aSRaphael Isemann 
11205ffd940aSRaphael Isemann       if (IsDefinition)
11215ffd940aSRaphael Isemann         RegExStr += ')';
11225ffd940aSRaphael Isemann 
11235ffd940aSRaphael Isemann       // Handle substitutions: [[foo]] and [[#<foo expr>]].
11245ffd940aSRaphael Isemann       if (SubstNeeded) {
11255ffd940aSRaphael Isemann         // Handle substitution of string variables that were defined earlier on
11265ffd940aSRaphael Isemann         // the same line by emitting a backreference. Expressions do not
11275ffd940aSRaphael Isemann         // support substituting a numeric variable defined on the same line.
11285ffd940aSRaphael Isemann         if (!IsNumBlock && VariableDefs.find(SubstStr) != VariableDefs.end()) {
11295ffd940aSRaphael Isemann           unsigned CaptureParenGroup = VariableDefs[SubstStr];
11305ffd940aSRaphael Isemann           if (CaptureParenGroup < 1 || CaptureParenGroup > 9) {
11315ffd940aSRaphael Isemann             SM.PrintMessage(SMLoc::getFromPointer(SubstStr.data()),
11325ffd940aSRaphael Isemann                             SourceMgr::DK_Error,
11335ffd940aSRaphael Isemann                             "Can't back-reference more than 9 variables");
11345ffd940aSRaphael Isemann             return true;
11355ffd940aSRaphael Isemann           }
11365ffd940aSRaphael Isemann           AddBackrefToRegEx(CaptureParenGroup);
11375ffd940aSRaphael Isemann         } else {
11385ffd940aSRaphael Isemann           // Handle substitution of string variables ([[<var>]]) defined in
11395ffd940aSRaphael Isemann           // previous CHECK patterns, and substitution of expressions.
11405ffd940aSRaphael Isemann           Substitution *Substitution =
11415ffd940aSRaphael Isemann               IsNumBlock
11425ffd940aSRaphael Isemann                   ? Context->makeNumericSubstitution(
11435ffd940aSRaphael Isemann                         SubstStr, std::move(ExpressionPointer), SubstInsertIdx)
11445ffd940aSRaphael Isemann                   : Context->makeStringSubstitution(SubstStr, SubstInsertIdx);
11455ffd940aSRaphael Isemann           Substitutions.push_back(Substitution);
11465ffd940aSRaphael Isemann         }
11475ffd940aSRaphael Isemann       }
11485ffd940aSRaphael Isemann     }
11495ffd940aSRaphael Isemann 
11505ffd940aSRaphael Isemann     // Handle fixed string matches.
11515ffd940aSRaphael Isemann     // Find the end, which is the start of the next regex.
11525ffd940aSRaphael Isemann     size_t FixedMatchEnd = PatternStr.find("{{");
11535ffd940aSRaphael Isemann     FixedMatchEnd = std::min(FixedMatchEnd, PatternStr.find("[["));
11545ffd940aSRaphael Isemann     RegExStr += Regex::escape(PatternStr.substr(0, FixedMatchEnd));
11555ffd940aSRaphael Isemann     PatternStr = PatternStr.substr(FixedMatchEnd);
11565ffd940aSRaphael Isemann   }
11575ffd940aSRaphael Isemann 
11585ffd940aSRaphael Isemann   if (MatchFullLinesHere) {
11595ffd940aSRaphael Isemann     if (!Req.NoCanonicalizeWhiteSpace)
11605ffd940aSRaphael Isemann       RegExStr += " *";
11615ffd940aSRaphael Isemann     RegExStr += '$';
11625ffd940aSRaphael Isemann   }
11635ffd940aSRaphael Isemann 
11645ffd940aSRaphael Isemann   return false;
11655ffd940aSRaphael Isemann }
11665ffd940aSRaphael Isemann 
11675ffd940aSRaphael Isemann bool Pattern::AddRegExToRegEx(StringRef RS, unsigned &CurParen, SourceMgr &SM) {
11685ffd940aSRaphael Isemann   Regex R(RS);
11695ffd940aSRaphael Isemann   std::string Error;
11705ffd940aSRaphael Isemann   if (!R.isValid(Error)) {
11715ffd940aSRaphael Isemann     SM.PrintMessage(SMLoc::getFromPointer(RS.data()), SourceMgr::DK_Error,
11725ffd940aSRaphael Isemann                     "invalid regex: " + Error);
11735ffd940aSRaphael Isemann     return true;
11745ffd940aSRaphael Isemann   }
11755ffd940aSRaphael Isemann 
11765ffd940aSRaphael Isemann   RegExStr += RS.str();
11775ffd940aSRaphael Isemann   CurParen += R.getNumMatches();
11785ffd940aSRaphael Isemann   return false;
11795ffd940aSRaphael Isemann }
11805ffd940aSRaphael Isemann 
11815ffd940aSRaphael Isemann void Pattern::AddBackrefToRegEx(unsigned BackrefNum) {
11825ffd940aSRaphael Isemann   assert(BackrefNum >= 1 && BackrefNum <= 9 && "Invalid backref number");
11835ffd940aSRaphael Isemann   std::string Backref = std::string("\\") + std::string(1, '0' + BackrefNum);
11845ffd940aSRaphael Isemann   RegExStr += Backref;
11855ffd940aSRaphael Isemann }
11865ffd940aSRaphael Isemann 
/// Matches this pattern against \p Buffer.
///
/// On success, returns the offset into \p Buffer at which the match starts and
/// stores the length of the match in \p MatchLen. On failure, returns an
/// error: NotFoundError when nothing matches, or whatever error a substitution
/// or a numeric value conversion produced.
///
/// As a side effect of a successful regex match, the values captured for the
/// string and numeric variables defined by this pattern are stored in
/// \p Context / the corresponding NumericVariable objects.
Expected<size_t> Pattern::match(StringRef Buffer, size_t &MatchLen,
                                const SourceMgr &SM) const {
  // If this is the EOF pattern, match it immediately.
  if (CheckTy == Check::CheckEOF) {
    MatchLen = 0;
    return Buffer.size();
  }

  // If this is a fixed string pattern, just match it now.
  if (!FixedStr.empty()) {
    // Note that MatchLen is written before the search, so it is set to the
    // fixed string's length even when NotFoundError is returned below.
    MatchLen = FixedStr.size();
    size_t Pos =
        IgnoreCase ? Buffer.find_lower(FixedStr) : Buffer.find(FixedStr);
    if (Pos == StringRef::npos)
      return make_error<NotFoundError>();
    return Pos;
  }

  // Regex match.

  // If there are substitutions, we need to create a temporary string with the
  // actual value.
  StringRef RegExToMatch = RegExStr;
  std::string TmpStr;
  if (!Substitutions.empty()) {
    TmpStr = RegExStr;
    // Make the line number of this pattern available to the substitutions
    // evaluated below.
    if (LineNumber)
      Context->LineVariable->setValue(ExpressionValue(*LineNumber));

    // Each substitution's index is relative to the unmodified RegExStr, so the
    // total length of the values already inserted has to be added to it.
    // NOTE(review): this presumes Substitutions is ordered by increasing
    // index -- confirm against the code that populates it.
    size_t InsertOffset = 0;
    // Substitute all string variables and expressions whose values are only
    // now known. Use of string variables defined on the same line are handled
    // by back-references.
    for (const auto &Substitution : Substitutions) {
      // Substitute and check for failure (e.g. use of undefined variable).
      Expected<std::string> Value = Substitution->getResult();
      if (!Value) {
        // Convert to an ErrorDiagnostic to get location information. This is
        // done here rather than PrintNoMatch since now we know which
        // substitution block caused the overflow.
        // Only OverflowError has a handler here; presumably errors of any
        // other type are passed through by handleErrors() unchanged -- see the
        // LLVM Error API.
        Error Err =
            handleErrors(Value.takeError(), [&](const OverflowError &E) {
              return ErrorDiagnostic::get(SM, Substitution->getFromString(),
                                          "unable to substitute variable or "
                                          "numeric expression: overflow error");
            });
        return std::move(Err);
      }

      // Plop it into the regex at the adjusted offset.
      TmpStr.insert(TmpStr.begin() + Substitution->getIndex() + InsertOffset,
                    Value->begin(), Value->end());
      InsertOffset += Value->size();
    }

    // Match the newly constructed regex.
    RegExToMatch = TmpStr;
  }

  // MatchInfo[0] receives the whole match; the following entries are indexed
  // by the paren group numbers recorded in VariableDefs and
  // NumericVariableDefs.
  SmallVector<StringRef, 4> MatchInfo;
  unsigned int Flags = Regex::Newline;
  if (IgnoreCase)
    Flags |= Regex::IgnoreCase;
  if (!Regex(RegExToMatch, Flags).match(Buffer, &MatchInfo))
    return make_error<NotFoundError>();

  // Successful regex match.
  assert(!MatchInfo.empty() && "Didn't get any match");
  StringRef FullMatch = MatchInfo[0];

  // If this defines any string variables, remember their values.
  for (const auto &VariableDef : VariableDefs) {
    assert(VariableDef.second < MatchInfo.size() && "Internal paren error");
    Context->GlobalVariableTable[VariableDef.first] =
        MatchInfo[VariableDef.second];
  }

  // If this defines any numeric variables, remember their values.
  // Note that string variables have already been stored above by the time a
  // numeric value conversion fails and an error is returned from this loop.
  for (const auto &NumericVariableDef : NumericVariableDefs) {
    const NumericVariableMatch &NumericVariableMatch =
        NumericVariableDef.getValue();
    unsigned CaptureParenGroup = NumericVariableMatch.CaptureParenGroup;
    assert(CaptureParenGroup < MatchInfo.size() && "Internal paren error");
    NumericVariable *DefinedNumericVariable =
        NumericVariableMatch.DefinedNumericVariable;

    // Convert the captured text to a value using the variable's implicit
    // format, and keep the captured text alongside the value.
    StringRef MatchedValue = MatchInfo[CaptureParenGroup];
    ExpressionFormat Format = DefinedNumericVariable->getImplicitFormat();
    Expected<ExpressionValue> Value =
        Format.valueFromStringRepr(MatchedValue, SM);
    if (!Value)
      return Value.takeError();
    DefinedNumericVariable->setValue(*Value, MatchedValue);
  }

  // Like CHECK-NEXT, CHECK-EMPTY's match range is considered to start after
  // the required preceding newline, which is consumed by the pattern in the
  // case of CHECK-EMPTY but not CHECK-NEXT.
  size_t MatchStartSkip = CheckTy == Check::CheckEmpty;
  MatchLen = FullMatch.size() - MatchStartSkip;
  return FullMatch.data() - Buffer.data() + MatchStartSkip;
}
12895ffd940aSRaphael Isemann 
12905ffd940aSRaphael Isemann unsigned Pattern::computeMatchDistance(StringRef Buffer) const {
12915ffd940aSRaphael Isemann   // Just compute the number of matching characters. For regular expressions, we
12925ffd940aSRaphael Isemann   // just compare against the regex itself and hope for the best.
12935ffd940aSRaphael Isemann   //
12945ffd940aSRaphael Isemann   // FIXME: One easy improvement here is have the regex lib generate a single
12955ffd940aSRaphael Isemann   // example regular expression which matches, and use that as the example
12965ffd940aSRaphael Isemann   // string.
12975ffd940aSRaphael Isemann   StringRef ExampleString(FixedStr);
12985ffd940aSRaphael Isemann   if (ExampleString.empty())
12995ffd940aSRaphael Isemann     ExampleString = RegExStr;
13005ffd940aSRaphael Isemann 
13015ffd940aSRaphael Isemann   // Only compare up to the first line in the buffer, or the string size.
13025ffd940aSRaphael Isemann   StringRef BufferPrefix = Buffer.substr(0, ExampleString.size());
13035ffd940aSRaphael Isemann   BufferPrefix = BufferPrefix.split('\n').first;
13045ffd940aSRaphael Isemann   return BufferPrefix.edit_distance(ExampleString);
13055ffd940aSRaphael Isemann }
13065ffd940aSRaphael Isemann 
13075ffd940aSRaphael Isemann void Pattern::printSubstitutions(const SourceMgr &SM, StringRef Buffer,
13085ffd940aSRaphael Isemann                                  SMRange Range,
13095ffd940aSRaphael Isemann                                  FileCheckDiag::MatchType MatchTy,
13105ffd940aSRaphael Isemann                                  std::vector<FileCheckDiag> *Diags) const {
13115ffd940aSRaphael Isemann   // Print what we know about substitutions.
13125ffd940aSRaphael Isemann   if (!Substitutions.empty()) {
13135ffd940aSRaphael Isemann     for (const auto &Substitution : Substitutions) {
13145ffd940aSRaphael Isemann       SmallString<256> Msg;
13155ffd940aSRaphael Isemann       raw_svector_ostream OS(Msg);
13165ffd940aSRaphael Isemann       Expected<std::string> MatchedValue = Substitution->getResult();
13175ffd940aSRaphael Isemann 
13185ffd940aSRaphael Isemann       // Substitution failed or is not known at match time, print the undefined
13195ffd940aSRaphael Isemann       // variables it uses.
13205ffd940aSRaphael Isemann       if (!MatchedValue) {
13215ffd940aSRaphael Isemann         bool UndefSeen = false;
13225ffd940aSRaphael Isemann         handleAllErrors(
13235ffd940aSRaphael Isemann             MatchedValue.takeError(), [](const NotFoundError &E) {},
13245ffd940aSRaphael Isemann             // Handled in PrintNoMatch().
13255ffd940aSRaphael Isemann             [](const ErrorDiagnostic &E) {},
13265ffd940aSRaphael Isemann             // Handled in match().
13275ffd940aSRaphael Isemann             [](const OverflowError &E) {},
13285ffd940aSRaphael Isemann             [&](const UndefVarError &E) {
13295ffd940aSRaphael Isemann               if (!UndefSeen) {
13305ffd940aSRaphael Isemann                 OS << "uses undefined variable(s):";
13315ffd940aSRaphael Isemann                 UndefSeen = true;
13325ffd940aSRaphael Isemann               }
13335ffd940aSRaphael Isemann               OS << " ";
13345ffd940aSRaphael Isemann               E.log(OS);
13355ffd940aSRaphael Isemann             });
13365ffd940aSRaphael Isemann       } else {
13375ffd940aSRaphael Isemann         // Substitution succeeded. Print substituted value.
13385ffd940aSRaphael Isemann         OS << "with \"";
13395ffd940aSRaphael Isemann         OS.write_escaped(Substitution->getFromString()) << "\" equal to \"";
13405ffd940aSRaphael Isemann         OS.write_escaped(*MatchedValue) << "\"";
13415ffd940aSRaphael Isemann       }
13425ffd940aSRaphael Isemann 
13435ffd940aSRaphael Isemann       // We report only the start of the match/search range to suggest we are
13445ffd940aSRaphael Isemann       // reporting the substitutions as set at the start of the match/search.
13455ffd940aSRaphael Isemann       // Indicating a non-zero-length range might instead seem to imply that the
13465ffd940aSRaphael Isemann       // substitution matches or was captured from exactly that range.
13475ffd940aSRaphael Isemann       if (Diags)
13485ffd940aSRaphael Isemann         Diags->emplace_back(SM, CheckTy, getLoc(), MatchTy,
13495ffd940aSRaphael Isemann                             SMRange(Range.Start, Range.Start), OS.str());
13505ffd940aSRaphael Isemann       else
13515ffd940aSRaphael Isemann         SM.PrintMessage(Range.Start, SourceMgr::DK_Note, OS.str());
13525ffd940aSRaphael Isemann     }
13535ffd940aSRaphael Isemann   }
13545ffd940aSRaphael Isemann }
13555ffd940aSRaphael Isemann 
13565ffd940aSRaphael Isemann void Pattern::printVariableDefs(const SourceMgr &SM,
13575ffd940aSRaphael Isemann                                 FileCheckDiag::MatchType MatchTy,
13585ffd940aSRaphael Isemann                                 std::vector<FileCheckDiag> *Diags) const {
13595ffd940aSRaphael Isemann   if (VariableDefs.empty() && NumericVariableDefs.empty())
13605ffd940aSRaphael Isemann     return;
13615ffd940aSRaphael Isemann   // Build list of variable captures.
13625ffd940aSRaphael Isemann   struct VarCapture {
13635ffd940aSRaphael Isemann     StringRef Name;
13645ffd940aSRaphael Isemann     SMRange Range;
13655ffd940aSRaphael Isemann   };
13665ffd940aSRaphael Isemann   SmallVector<VarCapture, 2> VarCaptures;
13675ffd940aSRaphael Isemann   for (const auto &VariableDef : VariableDefs) {
13685ffd940aSRaphael Isemann     VarCapture VC;
13695ffd940aSRaphael Isemann     VC.Name = VariableDef.first;
13705ffd940aSRaphael Isemann     StringRef Value = Context->GlobalVariableTable[VC.Name];
13715ffd940aSRaphael Isemann     SMLoc Start = SMLoc::getFromPointer(Value.data());
13725ffd940aSRaphael Isemann     SMLoc End = SMLoc::getFromPointer(Value.data() + Value.size());
13735ffd940aSRaphael Isemann     VC.Range = SMRange(Start, End);
13745ffd940aSRaphael Isemann     VarCaptures.push_back(VC);
13755ffd940aSRaphael Isemann   }
13765ffd940aSRaphael Isemann   for (const auto &VariableDef : NumericVariableDefs) {
13775ffd940aSRaphael Isemann     VarCapture VC;
13785ffd940aSRaphael Isemann     VC.Name = VariableDef.getKey();
13795ffd940aSRaphael Isemann     StringRef StrValue = VariableDef.getValue()
13805ffd940aSRaphael Isemann                              .DefinedNumericVariable->getStringValue()
13815ffd940aSRaphael Isemann                              .getValue();
13825ffd940aSRaphael Isemann     SMLoc Start = SMLoc::getFromPointer(StrValue.data());
13835ffd940aSRaphael Isemann     SMLoc End = SMLoc::getFromPointer(StrValue.data() + StrValue.size());
13845ffd940aSRaphael Isemann     VC.Range = SMRange(Start, End);
13855ffd940aSRaphael Isemann     VarCaptures.push_back(VC);
13865ffd940aSRaphael Isemann   }
13875ffd940aSRaphael Isemann   // Sort variable captures by the order in which they matched the input.
13885ffd940aSRaphael Isemann   // Ranges shouldn't be overlapping, so we can just compare the start.
1389*352fcfc6SKazu Hirata   llvm::sort(VarCaptures, [](const VarCapture &A, const VarCapture &B) {
13905ffd940aSRaphael Isemann     assert(A.Range.Start != B.Range.Start &&
13915ffd940aSRaphael Isemann            "unexpected overlapping variable captures");
13925ffd940aSRaphael Isemann     return A.Range.Start.getPointer() < B.Range.Start.getPointer();
13935ffd940aSRaphael Isemann   });
13945ffd940aSRaphael Isemann   // Create notes for the sorted captures.
13955ffd940aSRaphael Isemann   for (const VarCapture &VC : VarCaptures) {
13965ffd940aSRaphael Isemann     SmallString<256> Msg;
13975ffd940aSRaphael Isemann     raw_svector_ostream OS(Msg);
13985ffd940aSRaphael Isemann     OS << "captured var \"" << VC.Name << "\"";
13995ffd940aSRaphael Isemann     if (Diags)
14005ffd940aSRaphael Isemann       Diags->emplace_back(SM, CheckTy, getLoc(), MatchTy, VC.Range, OS.str());
14015ffd940aSRaphael Isemann     else
14025ffd940aSRaphael Isemann       SM.PrintMessage(VC.Range.Start, SourceMgr::DK_Note, OS.str(), VC.Range);
14035ffd940aSRaphael Isemann   }
14045ffd940aSRaphael Isemann }
14055ffd940aSRaphael Isemann 
14065ffd940aSRaphael Isemann static SMRange ProcessMatchResult(FileCheckDiag::MatchType MatchTy,
14075ffd940aSRaphael Isemann                                   const SourceMgr &SM, SMLoc Loc,
14085ffd940aSRaphael Isemann                                   Check::FileCheckType CheckTy,
14095ffd940aSRaphael Isemann                                   StringRef Buffer, size_t Pos, size_t Len,
14105ffd940aSRaphael Isemann                                   std::vector<FileCheckDiag> *Diags,
14115ffd940aSRaphael Isemann                                   bool AdjustPrevDiags = false) {
14125ffd940aSRaphael Isemann   SMLoc Start = SMLoc::getFromPointer(Buffer.data() + Pos);
14135ffd940aSRaphael Isemann   SMLoc End = SMLoc::getFromPointer(Buffer.data() + Pos + Len);
14145ffd940aSRaphael Isemann   SMRange Range(Start, End);
14155ffd940aSRaphael Isemann   if (Diags) {
14165ffd940aSRaphael Isemann     if (AdjustPrevDiags) {
14175ffd940aSRaphael Isemann       SMLoc CheckLoc = Diags->rbegin()->CheckLoc;
14185ffd940aSRaphael Isemann       for (auto I = Diags->rbegin(), E = Diags->rend();
14195ffd940aSRaphael Isemann            I != E && I->CheckLoc == CheckLoc; ++I)
14205ffd940aSRaphael Isemann         I->MatchTy = MatchTy;
14215ffd940aSRaphael Isemann     } else
14225ffd940aSRaphael Isemann       Diags->emplace_back(SM, CheckTy, Loc, MatchTy, Range);
14235ffd940aSRaphael Isemann   }
14245ffd940aSRaphael Isemann   return Range;
14255ffd940aSRaphael Isemann }
14265ffd940aSRaphael Isemann 
14275ffd940aSRaphael Isemann void Pattern::printFuzzyMatch(const SourceMgr &SM, StringRef Buffer,
14285ffd940aSRaphael Isemann                               std::vector<FileCheckDiag> *Diags) const {
14295ffd940aSRaphael Isemann   // Attempt to find the closest/best fuzzy match.  Usually an error happens
14305ffd940aSRaphael Isemann   // because some string in the output didn't exactly match. In these cases, we
14315ffd940aSRaphael Isemann   // would like to show the user a best guess at what "should have" matched, to
14325ffd940aSRaphael Isemann   // save them having to actually check the input manually.
14335ffd940aSRaphael Isemann   size_t NumLinesForward = 0;
14345ffd940aSRaphael Isemann   size_t Best = StringRef::npos;
14355ffd940aSRaphael Isemann   double BestQuality = 0;
14365ffd940aSRaphael Isemann 
14375ffd940aSRaphael Isemann   // Use an arbitrary 4k limit on how far we will search.
14385ffd940aSRaphael Isemann   for (size_t i = 0, e = std::min(size_t(4096), Buffer.size()); i != e; ++i) {
14395ffd940aSRaphael Isemann     if (Buffer[i] == '\n')
14405ffd940aSRaphael Isemann       ++NumLinesForward;
14415ffd940aSRaphael Isemann 
14425ffd940aSRaphael Isemann     // Patterns have leading whitespace stripped, so skip whitespace when
14435ffd940aSRaphael Isemann     // looking for something which looks like a pattern.
14445ffd940aSRaphael Isemann     if (Buffer[i] == ' ' || Buffer[i] == '\t')
14455ffd940aSRaphael Isemann       continue;
14465ffd940aSRaphael Isemann 
14475ffd940aSRaphael Isemann     // Compute the "quality" of this match as an arbitrary combination of the
14485ffd940aSRaphael Isemann     // match distance and the number of lines skipped to get to this match.
14495ffd940aSRaphael Isemann     unsigned Distance = computeMatchDistance(Buffer.substr(i));
14505ffd940aSRaphael Isemann     double Quality = Distance + (NumLinesForward / 100.);
14515ffd940aSRaphael Isemann 
14525ffd940aSRaphael Isemann     if (Quality < BestQuality || Best == StringRef::npos) {
14535ffd940aSRaphael Isemann       Best = i;
14545ffd940aSRaphael Isemann       BestQuality = Quality;
14555ffd940aSRaphael Isemann     }
14565ffd940aSRaphael Isemann   }
14575ffd940aSRaphael Isemann 
14585ffd940aSRaphael Isemann   // Print the "possible intended match here" line if we found something
14595ffd940aSRaphael Isemann   // reasonable and not equal to what we showed in the "scanning from here"
14605ffd940aSRaphael Isemann   // line.
14615ffd940aSRaphael Isemann   if (Best && Best != StringRef::npos && BestQuality < 50) {
14625ffd940aSRaphael Isemann     SMRange MatchRange =
14635ffd940aSRaphael Isemann         ProcessMatchResult(FileCheckDiag::MatchFuzzy, SM, getLoc(),
14645ffd940aSRaphael Isemann                            getCheckTy(), Buffer, Best, 0, Diags);
14655ffd940aSRaphael Isemann     SM.PrintMessage(MatchRange.Start, SourceMgr::DK_Note,
14665ffd940aSRaphael Isemann                     "possible intended match here");
14675ffd940aSRaphael Isemann 
14685ffd940aSRaphael Isemann     // FIXME: If we wanted to be really friendly we would show why the match
14695ffd940aSRaphael Isemann     // failed, as it can be hard to spot simple one character differences.
14705ffd940aSRaphael Isemann   }
14715ffd940aSRaphael Isemann }
14725ffd940aSRaphael Isemann 
14735ffd940aSRaphael Isemann Expected<StringRef>
14745ffd940aSRaphael Isemann FileCheckPatternContext::getPatternVarValue(StringRef VarName) {
14755ffd940aSRaphael Isemann   auto VarIter = GlobalVariableTable.find(VarName);
14765ffd940aSRaphael Isemann   if (VarIter == GlobalVariableTable.end())
14775ffd940aSRaphael Isemann     return make_error<UndefVarError>(VarName);
14785ffd940aSRaphael Isemann 
14795ffd940aSRaphael Isemann   return VarIter->second;
14805ffd940aSRaphael Isemann }
14815ffd940aSRaphael Isemann 
14825ffd940aSRaphael Isemann template <class... Types>
14835ffd940aSRaphael Isemann NumericVariable *FileCheckPatternContext::makeNumericVariable(Types... args) {
14845ffd940aSRaphael Isemann   NumericVariables.push_back(std::make_unique<NumericVariable>(args...));
14855ffd940aSRaphael Isemann   return NumericVariables.back().get();
14865ffd940aSRaphael Isemann }
14875ffd940aSRaphael Isemann 
14885ffd940aSRaphael Isemann Substitution *
14895ffd940aSRaphael Isemann FileCheckPatternContext::makeStringSubstitution(StringRef VarName,
14905ffd940aSRaphael Isemann                                                 size_t InsertIdx) {
14915ffd940aSRaphael Isemann   Substitutions.push_back(
14925ffd940aSRaphael Isemann       std::make_unique<StringSubstitution>(this, VarName, InsertIdx));
14935ffd940aSRaphael Isemann   return Substitutions.back().get();
14945ffd940aSRaphael Isemann }
14955ffd940aSRaphael Isemann 
14965ffd940aSRaphael Isemann Substitution *FileCheckPatternContext::makeNumericSubstitution(
14975ffd940aSRaphael Isemann     StringRef ExpressionStr, std::unique_ptr<Expression> Expression,
14985ffd940aSRaphael Isemann     size_t InsertIdx) {
14995ffd940aSRaphael Isemann   Substitutions.push_back(std::make_unique<NumericSubstitution>(
15005ffd940aSRaphael Isemann       this, ExpressionStr, std::move(Expression), InsertIdx));
15015ffd940aSRaphael Isemann   return Substitutions.back().get();
15025ffd940aSRaphael Isemann }
15035ffd940aSRaphael Isemann 
15045ffd940aSRaphael Isemann size_t Pattern::FindRegexVarEnd(StringRef Str, SourceMgr &SM) {
15055ffd940aSRaphael Isemann   // Offset keeps track of the current offset within the input Str
15065ffd940aSRaphael Isemann   size_t Offset = 0;
15075ffd940aSRaphael Isemann   // [...] Nesting depth
15085ffd940aSRaphael Isemann   size_t BracketDepth = 0;
15095ffd940aSRaphael Isemann 
15105ffd940aSRaphael Isemann   while (!Str.empty()) {
15115ffd940aSRaphael Isemann     if (Str.startswith("]]") && BracketDepth == 0)
15125ffd940aSRaphael Isemann       return Offset;
15135ffd940aSRaphael Isemann     if (Str[0] == '\\') {
15145ffd940aSRaphael Isemann       // Backslash escapes the next char within regexes, so skip them both.
15155ffd940aSRaphael Isemann       Str = Str.substr(2);
15165ffd940aSRaphael Isemann       Offset += 2;
15175ffd940aSRaphael Isemann     } else {
15185ffd940aSRaphael Isemann       switch (Str[0]) {
15195ffd940aSRaphael Isemann       default:
15205ffd940aSRaphael Isemann         break;
15215ffd940aSRaphael Isemann       case '[':
15225ffd940aSRaphael Isemann         BracketDepth++;
15235ffd940aSRaphael Isemann         break;
15245ffd940aSRaphael Isemann       case ']':
15255ffd940aSRaphael Isemann         if (BracketDepth == 0) {
15265ffd940aSRaphael Isemann           SM.PrintMessage(SMLoc::getFromPointer(Str.data()),
15275ffd940aSRaphael Isemann                           SourceMgr::DK_Error,
15285ffd940aSRaphael Isemann                           "missing closing \"]\" for regex variable");
15295ffd940aSRaphael Isemann           exit(1);
15305ffd940aSRaphael Isemann         }
15315ffd940aSRaphael Isemann         BracketDepth--;
15325ffd940aSRaphael Isemann         break;
15335ffd940aSRaphael Isemann       }
15345ffd940aSRaphael Isemann       Str = Str.substr(1);
15355ffd940aSRaphael Isemann       Offset++;
15365ffd940aSRaphael Isemann     }
15375ffd940aSRaphael Isemann   }
15385ffd940aSRaphael Isemann 
15395ffd940aSRaphael Isemann   return StringRef::npos;
15405ffd940aSRaphael Isemann }
15415ffd940aSRaphael Isemann 
15425ffd940aSRaphael Isemann StringRef FileCheck::CanonicalizeFile(MemoryBuffer &MB,
15435ffd940aSRaphael Isemann                                       SmallVectorImpl<char> &OutputBuffer) {
15445ffd940aSRaphael Isemann   OutputBuffer.reserve(MB.getBufferSize());
15455ffd940aSRaphael Isemann 
15465ffd940aSRaphael Isemann   for (const char *Ptr = MB.getBufferStart(), *End = MB.getBufferEnd();
15475ffd940aSRaphael Isemann        Ptr != End; ++Ptr) {
15485ffd940aSRaphael Isemann     // Eliminate trailing dosish \r.
15495ffd940aSRaphael Isemann     if (Ptr <= End - 2 && Ptr[0] == '\r' && Ptr[1] == '\n') {
15505ffd940aSRaphael Isemann       continue;
15515ffd940aSRaphael Isemann     }
15525ffd940aSRaphael Isemann 
15535ffd940aSRaphael Isemann     // If current char is not a horizontal whitespace or if horizontal
15545ffd940aSRaphael Isemann     // whitespace canonicalization is disabled, dump it to output as is.
15555ffd940aSRaphael Isemann     if (Req.NoCanonicalizeWhiteSpace || (*Ptr != ' ' && *Ptr != '\t')) {
15565ffd940aSRaphael Isemann       OutputBuffer.push_back(*Ptr);
15575ffd940aSRaphael Isemann       continue;
15585ffd940aSRaphael Isemann     }
15595ffd940aSRaphael Isemann 
15605ffd940aSRaphael Isemann     // Otherwise, add one space and advance over neighboring space.
15615ffd940aSRaphael Isemann     OutputBuffer.push_back(' ');
15625ffd940aSRaphael Isemann     while (Ptr + 1 != End && (Ptr[1] == ' ' || Ptr[1] == '\t'))
15635ffd940aSRaphael Isemann       ++Ptr;
15645ffd940aSRaphael Isemann   }
15655ffd940aSRaphael Isemann 
15665ffd940aSRaphael Isemann   // Add a null byte and then return all but that byte.
15675ffd940aSRaphael Isemann   OutputBuffer.push_back('\0');
15685ffd940aSRaphael Isemann   return StringRef(OutputBuffer.data(), OutputBuffer.size() - 1);
15695ffd940aSRaphael Isemann }
15705ffd940aSRaphael Isemann 
15715ffd940aSRaphael Isemann FileCheckDiag::FileCheckDiag(const SourceMgr &SM,
15725ffd940aSRaphael Isemann                              const Check::FileCheckType &CheckTy,
15735ffd940aSRaphael Isemann                              SMLoc CheckLoc, MatchType MatchTy,
15745ffd940aSRaphael Isemann                              SMRange InputRange, StringRef Note)
15755ffd940aSRaphael Isemann     : CheckTy(CheckTy), CheckLoc(CheckLoc), MatchTy(MatchTy), Note(Note) {
15765ffd940aSRaphael Isemann   auto Start = SM.getLineAndColumn(InputRange.Start);
15775ffd940aSRaphael Isemann   auto End = SM.getLineAndColumn(InputRange.End);
15785ffd940aSRaphael Isemann   InputStartLine = Start.first;
15795ffd940aSRaphael Isemann   InputStartCol = Start.second;
15805ffd940aSRaphael Isemann   InputEndLine = End.first;
15815ffd940aSRaphael Isemann   InputEndCol = End.second;
15825ffd940aSRaphael Isemann }
15835ffd940aSRaphael Isemann 
15845ffd940aSRaphael Isemann static bool IsPartOfWord(char c) {
15855ffd940aSRaphael Isemann   return (isAlnum(c) || c == '-' || c == '_');
15865ffd940aSRaphael Isemann }
15875ffd940aSRaphael Isemann 
15885ffd940aSRaphael Isemann Check::FileCheckType &Check::FileCheckType::setCount(int C) {
15895ffd940aSRaphael Isemann   assert(Count > 0 && "zero and negative counts are not supported");
15905ffd940aSRaphael Isemann   assert((C == 1 || Kind == CheckPlain) &&
15915ffd940aSRaphael Isemann          "count supported only for plain CHECK directives");
15925ffd940aSRaphael Isemann   Count = C;
15935ffd940aSRaphael Isemann   return *this;
15945ffd940aSRaphael Isemann }
15955ffd940aSRaphael Isemann 
159644f399ccSJacques Pienaar std::string Check::FileCheckType::getModifiersDescription() const {
159744f399ccSJacques Pienaar   if (Modifiers.none())
159844f399ccSJacques Pienaar     return "";
159944f399ccSJacques Pienaar   std::string Ret;
160044f399ccSJacques Pienaar   raw_string_ostream OS(Ret);
160144f399ccSJacques Pienaar   OS << '{';
160244f399ccSJacques Pienaar   if (isLiteralMatch())
160344f399ccSJacques Pienaar     OS << "LITERAL";
160444f399ccSJacques Pienaar   OS << '}';
160544f399ccSJacques Pienaar   return OS.str();
160644f399ccSJacques Pienaar }
160744f399ccSJacques Pienaar 
16085ffd940aSRaphael Isemann std::string Check::FileCheckType::getDescription(StringRef Prefix) const {
160944f399ccSJacques Pienaar   // Append directive modifiers.
161044f399ccSJacques Pienaar   auto WithModifiers = [this, Prefix](StringRef Str) -> std::string {
161144f399ccSJacques Pienaar     return (Prefix + Str + getModifiersDescription()).str();
161244f399ccSJacques Pienaar   };
161344f399ccSJacques Pienaar 
16145ffd940aSRaphael Isemann   switch (Kind) {
16155ffd940aSRaphael Isemann   case Check::CheckNone:
16165ffd940aSRaphael Isemann     return "invalid";
16175ffd940aSRaphael Isemann   case Check::CheckPlain:
16185ffd940aSRaphael Isemann     if (Count > 1)
161944f399ccSJacques Pienaar       return WithModifiers("-COUNT");
162044f399ccSJacques Pienaar     return WithModifiers("");
16215ffd940aSRaphael Isemann   case Check::CheckNext:
162244f399ccSJacques Pienaar     return WithModifiers("-NEXT");
16235ffd940aSRaphael Isemann   case Check::CheckSame:
162444f399ccSJacques Pienaar     return WithModifiers("-SAME");
16255ffd940aSRaphael Isemann   case Check::CheckNot:
162644f399ccSJacques Pienaar     return WithModifiers("-NOT");
16275ffd940aSRaphael Isemann   case Check::CheckDAG:
162844f399ccSJacques Pienaar     return WithModifiers("-DAG");
16295ffd940aSRaphael Isemann   case Check::CheckLabel:
163044f399ccSJacques Pienaar     return WithModifiers("-LABEL");
16315ffd940aSRaphael Isemann   case Check::CheckEmpty:
163244f399ccSJacques Pienaar     return WithModifiers("-EMPTY");
16335ffd940aSRaphael Isemann   case Check::CheckComment:
16345ffd940aSRaphael Isemann     return std::string(Prefix);
16355ffd940aSRaphael Isemann   case Check::CheckEOF:
16365ffd940aSRaphael Isemann     return "implicit EOF";
16375ffd940aSRaphael Isemann   case Check::CheckBadNot:
16385ffd940aSRaphael Isemann     return "bad NOT";
16395ffd940aSRaphael Isemann   case Check::CheckBadCount:
16405ffd940aSRaphael Isemann     return "bad COUNT";
16415ffd940aSRaphael Isemann   }
16425ffd940aSRaphael Isemann   llvm_unreachable("unknown FileCheckType");
16435ffd940aSRaphael Isemann }
16445ffd940aSRaphael Isemann 
16455ffd940aSRaphael Isemann static std::pair<Check::FileCheckType, StringRef>
16465ffd940aSRaphael Isemann FindCheckType(const FileCheckRequest &Req, StringRef Buffer, StringRef Prefix) {
16475ffd940aSRaphael Isemann   if (Buffer.size() <= Prefix.size())
16485ffd940aSRaphael Isemann     return {Check::CheckNone, StringRef()};
16495ffd940aSRaphael Isemann 
165044f399ccSJacques Pienaar   StringRef Rest = Buffer.drop_front(Prefix.size());
16515ffd940aSRaphael Isemann   // Check for comment.
16525ffd940aSRaphael Isemann   if (llvm::is_contained(Req.CommentPrefixes, Prefix)) {
165344f399ccSJacques Pienaar     if (Rest.consume_front(":"))
16545ffd940aSRaphael Isemann       return {Check::CheckComment, Rest};
16555ffd940aSRaphael Isemann     // Ignore a comment prefix if it has a suffix like "-NOT".
16565ffd940aSRaphael Isemann     return {Check::CheckNone, StringRef()};
16575ffd940aSRaphael Isemann   }
16585ffd940aSRaphael Isemann 
165944f399ccSJacques Pienaar   auto ConsumeModifiers = [&](Check::FileCheckType Ret)
166044f399ccSJacques Pienaar       -> std::pair<Check::FileCheckType, StringRef> {
166144f399ccSJacques Pienaar     if (Rest.consume_front(":"))
166244f399ccSJacques Pienaar       return {Ret, Rest};
166344f399ccSJacques Pienaar     if (!Rest.consume_front("{"))
166444f399ccSJacques Pienaar       return {Check::CheckNone, StringRef()};
16655ffd940aSRaphael Isemann 
166644f399ccSJacques Pienaar     // Parse the modifiers, speparated by commas.
166744f399ccSJacques Pienaar     do {
166844f399ccSJacques Pienaar       // Allow whitespace in modifiers list.
166944f399ccSJacques Pienaar       Rest = Rest.ltrim();
167044f399ccSJacques Pienaar       if (Rest.consume_front("LITERAL"))
167144f399ccSJacques Pienaar         Ret.setLiteralMatch();
167244f399ccSJacques Pienaar       else
167344f399ccSJacques Pienaar         return {Check::CheckNone, Rest};
167444f399ccSJacques Pienaar       // Allow whitespace in modifiers list.
167544f399ccSJacques Pienaar       Rest = Rest.ltrim();
167644f399ccSJacques Pienaar     } while (Rest.consume_front(","));
167744f399ccSJacques Pienaar     if (!Rest.consume_front("}:"))
167844f399ccSJacques Pienaar       return {Check::CheckNone, Rest};
167944f399ccSJacques Pienaar     return {Ret, Rest};
168044f399ccSJacques Pienaar   };
168144f399ccSJacques Pienaar 
168244f399ccSJacques Pienaar   // Verify that the prefix is followed by directive modifiers or a colon.
168344f399ccSJacques Pienaar   if (Rest.consume_front(":"))
168444f399ccSJacques Pienaar     return {Check::CheckPlain, Rest};
168544f399ccSJacques Pienaar   if (Rest.front() == '{')
168644f399ccSJacques Pienaar     return ConsumeModifiers(Check::CheckPlain);
168744f399ccSJacques Pienaar 
168844f399ccSJacques Pienaar   if (!Rest.consume_front("-"))
16895ffd940aSRaphael Isemann     return {Check::CheckNone, StringRef()};
16905ffd940aSRaphael Isemann 
16915ffd940aSRaphael Isemann   if (Rest.consume_front("COUNT-")) {
16925ffd940aSRaphael Isemann     int64_t Count;
16935ffd940aSRaphael Isemann     if (Rest.consumeInteger(10, Count))
16945ffd940aSRaphael Isemann       // Error happened in parsing integer.
16955ffd940aSRaphael Isemann       return {Check::CheckBadCount, Rest};
16965ffd940aSRaphael Isemann     if (Count <= 0 || Count > INT32_MAX)
16975ffd940aSRaphael Isemann       return {Check::CheckBadCount, Rest};
169844f399ccSJacques Pienaar     if (Rest.front() != ':' && Rest.front() != '{')
16995ffd940aSRaphael Isemann       return {Check::CheckBadCount, Rest};
170044f399ccSJacques Pienaar     return ConsumeModifiers(
170144f399ccSJacques Pienaar         Check::FileCheckType(Check::CheckPlain).setCount(Count));
17025ffd940aSRaphael Isemann   }
17035ffd940aSRaphael Isemann 
17045ffd940aSRaphael Isemann   // You can't combine -NOT with another suffix.
17055ffd940aSRaphael Isemann   if (Rest.startswith("DAG-NOT:") || Rest.startswith("NOT-DAG:") ||
17065ffd940aSRaphael Isemann       Rest.startswith("NEXT-NOT:") || Rest.startswith("NOT-NEXT:") ||
17075ffd940aSRaphael Isemann       Rest.startswith("SAME-NOT:") || Rest.startswith("NOT-SAME:") ||
17085ffd940aSRaphael Isemann       Rest.startswith("EMPTY-NOT:") || Rest.startswith("NOT-EMPTY:"))
17095ffd940aSRaphael Isemann     return {Check::CheckBadNot, Rest};
17105ffd940aSRaphael Isemann 
171144f399ccSJacques Pienaar   if (Rest.consume_front("NEXT"))
171244f399ccSJacques Pienaar     return ConsumeModifiers(Check::CheckNext);
171344f399ccSJacques Pienaar 
171444f399ccSJacques Pienaar   if (Rest.consume_front("SAME"))
171544f399ccSJacques Pienaar     return ConsumeModifiers(Check::CheckSame);
171644f399ccSJacques Pienaar 
171744f399ccSJacques Pienaar   if (Rest.consume_front("NOT"))
171844f399ccSJacques Pienaar     return ConsumeModifiers(Check::CheckNot);
171944f399ccSJacques Pienaar 
172044f399ccSJacques Pienaar   if (Rest.consume_front("DAG"))
172144f399ccSJacques Pienaar     return ConsumeModifiers(Check::CheckDAG);
172244f399ccSJacques Pienaar 
172344f399ccSJacques Pienaar   if (Rest.consume_front("LABEL"))
172444f399ccSJacques Pienaar     return ConsumeModifiers(Check::CheckLabel);
172544f399ccSJacques Pienaar 
172644f399ccSJacques Pienaar   if (Rest.consume_front("EMPTY"))
172744f399ccSJacques Pienaar     return ConsumeModifiers(Check::CheckEmpty);
172844f399ccSJacques Pienaar 
17295ffd940aSRaphael Isemann   return {Check::CheckNone, Rest};
17305ffd940aSRaphael Isemann }
17315ffd940aSRaphael Isemann 
17325ffd940aSRaphael Isemann // From the given position, find the next character after the word.
17335ffd940aSRaphael Isemann static size_t SkipWord(StringRef Str, size_t Loc) {
17345ffd940aSRaphael Isemann   while (Loc < Str.size() && IsPartOfWord(Str[Loc]))
17355ffd940aSRaphael Isemann     ++Loc;
17365ffd940aSRaphael Isemann   return Loc;
17375ffd940aSRaphael Isemann }
17385ffd940aSRaphael Isemann 
17395ffd940aSRaphael Isemann /// Searches the buffer for the first prefix in the prefix regular expression.
17405ffd940aSRaphael Isemann ///
17415ffd940aSRaphael Isemann /// This searches the buffer using the provided regular expression, however it
17425ffd940aSRaphael Isemann /// enforces constraints beyond that:
17435ffd940aSRaphael Isemann /// 1) The found prefix must not be a suffix of something that looks like
17445ffd940aSRaphael Isemann ///    a valid prefix.
17455ffd940aSRaphael Isemann /// 2) The found prefix must be followed by a valid check type suffix using \c
17465ffd940aSRaphael Isemann ///    FindCheckType above.
17475ffd940aSRaphael Isemann ///
17485ffd940aSRaphael Isemann /// \returns a pair of StringRefs into the Buffer, which combines:
17495ffd940aSRaphael Isemann ///   - the first match of the regular expression to satisfy these two is
17505ffd940aSRaphael Isemann ///   returned,
17515ffd940aSRaphael Isemann ///     otherwise an empty StringRef is returned to indicate failure.
17525ffd940aSRaphael Isemann ///   - buffer rewound to the location right after parsed suffix, for parsing
17535ffd940aSRaphael Isemann ///     to continue from
17545ffd940aSRaphael Isemann ///
17555ffd940aSRaphael Isemann /// If this routine returns a valid prefix, it will also shrink \p Buffer to
17565ffd940aSRaphael Isemann /// start at the beginning of the returned prefix, increment \p LineNumber for
17575ffd940aSRaphael Isemann /// each new line consumed from \p Buffer, and set \p CheckTy to the type of
17585ffd940aSRaphael Isemann /// check found by examining the suffix.
17595ffd940aSRaphael Isemann ///
17605ffd940aSRaphael Isemann /// If no valid prefix is found, the state of Buffer, LineNumber, and CheckTy
17615ffd940aSRaphael Isemann /// is unspecified.
17625ffd940aSRaphael Isemann static std::pair<StringRef, StringRef>
17635ffd940aSRaphael Isemann FindFirstMatchingPrefix(const FileCheckRequest &Req, Regex &PrefixRE,
17645ffd940aSRaphael Isemann                         StringRef &Buffer, unsigned &LineNumber,
17655ffd940aSRaphael Isemann                         Check::FileCheckType &CheckTy) {
17665ffd940aSRaphael Isemann   SmallVector<StringRef, 2> Matches;
17675ffd940aSRaphael Isemann 
17685ffd940aSRaphael Isemann   while (!Buffer.empty()) {
17695ffd940aSRaphael Isemann     // Find the first (longest) match using the RE.
17705ffd940aSRaphael Isemann     if (!PrefixRE.match(Buffer, &Matches))
17715ffd940aSRaphael Isemann       // No match at all, bail.
17725ffd940aSRaphael Isemann       return {StringRef(), StringRef()};
17735ffd940aSRaphael Isemann 
17745ffd940aSRaphael Isemann     StringRef Prefix = Matches[0];
17755ffd940aSRaphael Isemann     Matches.clear();
17765ffd940aSRaphael Isemann 
17775ffd940aSRaphael Isemann     assert(Prefix.data() >= Buffer.data() &&
17785ffd940aSRaphael Isemann            Prefix.data() < Buffer.data() + Buffer.size() &&
17795ffd940aSRaphael Isemann            "Prefix doesn't start inside of buffer!");
17805ffd940aSRaphael Isemann     size_t Loc = Prefix.data() - Buffer.data();
17815ffd940aSRaphael Isemann     StringRef Skipped = Buffer.substr(0, Loc);
17825ffd940aSRaphael Isemann     Buffer = Buffer.drop_front(Loc);
17835ffd940aSRaphael Isemann     LineNumber += Skipped.count('\n');
17845ffd940aSRaphael Isemann 
17855ffd940aSRaphael Isemann     // Check that the matched prefix isn't a suffix of some other check-like
17865ffd940aSRaphael Isemann     // word.
17875ffd940aSRaphael Isemann     // FIXME: This is a very ad-hoc check. it would be better handled in some
17885ffd940aSRaphael Isemann     // other way. Among other things it seems hard to distinguish between
17895ffd940aSRaphael Isemann     // intentional and unintentional uses of this feature.
17905ffd940aSRaphael Isemann     if (Skipped.empty() || !IsPartOfWord(Skipped.back())) {
17915ffd940aSRaphael Isemann       // Now extract the type.
17925ffd940aSRaphael Isemann       StringRef AfterSuffix;
17935ffd940aSRaphael Isemann       std::tie(CheckTy, AfterSuffix) = FindCheckType(Req, Buffer, Prefix);
17945ffd940aSRaphael Isemann 
17955ffd940aSRaphael Isemann       // If we've found a valid check type for this prefix, we're done.
17965ffd940aSRaphael Isemann       if (CheckTy != Check::CheckNone)
17975ffd940aSRaphael Isemann         return {Prefix, AfterSuffix};
17985ffd940aSRaphael Isemann     }
17995ffd940aSRaphael Isemann 
18005ffd940aSRaphael Isemann     // If we didn't successfully find a prefix, we need to skip this invalid
18015ffd940aSRaphael Isemann     // prefix and continue scanning. We directly skip the prefix that was
18025ffd940aSRaphael Isemann     // matched and any additional parts of that check-like word.
18035ffd940aSRaphael Isemann     Buffer = Buffer.drop_front(SkipWord(Buffer, Prefix.size()));
18045ffd940aSRaphael Isemann   }
18055ffd940aSRaphael Isemann 
18065ffd940aSRaphael Isemann   // We ran out of buffer while skipping partial matches so give up.
18075ffd940aSRaphael Isemann   return {StringRef(), StringRef()};
18085ffd940aSRaphael Isemann }
18095ffd940aSRaphael Isemann 
18105ffd940aSRaphael Isemann void FileCheckPatternContext::createLineVariable() {
18115ffd940aSRaphael Isemann   assert(!LineVariable && "@LINE pseudo numeric variable already created");
18125ffd940aSRaphael Isemann   StringRef LineName = "@LINE";
18135ffd940aSRaphael Isemann   LineVariable = makeNumericVariable(
18145ffd940aSRaphael Isemann       LineName, ExpressionFormat(ExpressionFormat::Kind::Unsigned));
18155ffd940aSRaphael Isemann   GlobalNumericVariableTable[LineName] = LineVariable;
18165ffd940aSRaphael Isemann }
18175ffd940aSRaphael Isemann 
18185ffd940aSRaphael Isemann FileCheck::FileCheck(FileCheckRequest Req)
18195ffd940aSRaphael Isemann     : Req(Req), PatternContext(std::make_unique<FileCheckPatternContext>()),
18205ffd940aSRaphael Isemann       CheckStrings(std::make_unique<std::vector<FileCheckString>>()) {}
18215ffd940aSRaphael Isemann 
18225ffd940aSRaphael Isemann FileCheck::~FileCheck() = default;
18235ffd940aSRaphael Isemann 
18245ffd940aSRaphael Isemann bool FileCheck::readCheckFile(
18255ffd940aSRaphael Isemann     SourceMgr &SM, StringRef Buffer, Regex &PrefixRE,
18265ffd940aSRaphael Isemann     std::pair<unsigned, unsigned> *ImpPatBufferIDRange) {
18275ffd940aSRaphael Isemann   if (ImpPatBufferIDRange)
18285ffd940aSRaphael Isemann     ImpPatBufferIDRange->first = ImpPatBufferIDRange->second = 0;
18295ffd940aSRaphael Isemann 
18305ffd940aSRaphael Isemann   Error DefineError =
18315ffd940aSRaphael Isemann       PatternContext->defineCmdlineVariables(Req.GlobalDefines, SM);
18325ffd940aSRaphael Isemann   if (DefineError) {
18335ffd940aSRaphael Isemann     logAllUnhandledErrors(std::move(DefineError), errs());
18345ffd940aSRaphael Isemann     return true;
18355ffd940aSRaphael Isemann   }
18365ffd940aSRaphael Isemann 
18375ffd940aSRaphael Isemann   PatternContext->createLineVariable();
18385ffd940aSRaphael Isemann 
18395ffd940aSRaphael Isemann   std::vector<Pattern> ImplicitNegativeChecks;
18405ffd940aSRaphael Isemann   for (StringRef PatternString : Req.ImplicitCheckNot) {
18415ffd940aSRaphael Isemann     // Create a buffer with fake command line content in order to display the
18425ffd940aSRaphael Isemann     // command line option responsible for the specific implicit CHECK-NOT.
18435ffd940aSRaphael Isemann     std::string Prefix = "-implicit-check-not='";
18445ffd940aSRaphael Isemann     std::string Suffix = "'";
18455ffd940aSRaphael Isemann     std::unique_ptr<MemoryBuffer> CmdLine = MemoryBuffer::getMemBufferCopy(
18465ffd940aSRaphael Isemann         (Prefix + PatternString + Suffix).str(), "command line");
18475ffd940aSRaphael Isemann 
18485ffd940aSRaphael Isemann     StringRef PatternInBuffer =
18495ffd940aSRaphael Isemann         CmdLine->getBuffer().substr(Prefix.size(), PatternString.size());
18505ffd940aSRaphael Isemann     unsigned BufferID = SM.AddNewSourceBuffer(std::move(CmdLine), SMLoc());
18515ffd940aSRaphael Isemann     if (ImpPatBufferIDRange) {
18525ffd940aSRaphael Isemann       if (ImpPatBufferIDRange->first == ImpPatBufferIDRange->second) {
18535ffd940aSRaphael Isemann         ImpPatBufferIDRange->first = BufferID;
18545ffd940aSRaphael Isemann         ImpPatBufferIDRange->second = BufferID + 1;
18555ffd940aSRaphael Isemann       } else {
18565ffd940aSRaphael Isemann         assert(BufferID == ImpPatBufferIDRange->second &&
18575ffd940aSRaphael Isemann                "expected consecutive source buffer IDs");
18585ffd940aSRaphael Isemann         ++ImpPatBufferIDRange->second;
18595ffd940aSRaphael Isemann       }
18605ffd940aSRaphael Isemann     }
18615ffd940aSRaphael Isemann 
18625ffd940aSRaphael Isemann     ImplicitNegativeChecks.push_back(
18635ffd940aSRaphael Isemann         Pattern(Check::CheckNot, PatternContext.get()));
18645ffd940aSRaphael Isemann     ImplicitNegativeChecks.back().parsePattern(PatternInBuffer,
18655ffd940aSRaphael Isemann                                                "IMPLICIT-CHECK", SM, Req);
18665ffd940aSRaphael Isemann   }
18675ffd940aSRaphael Isemann 
18685ffd940aSRaphael Isemann   std::vector<Pattern> DagNotMatches = ImplicitNegativeChecks;
18695ffd940aSRaphael Isemann 
18705ffd940aSRaphael Isemann   // LineNumber keeps track of the line on which CheckPrefix instances are
18715ffd940aSRaphael Isemann   // found.
18725ffd940aSRaphael Isemann   unsigned LineNumber = 1;
18735ffd940aSRaphael Isemann 
1874871d658cSMircea Trofin   std::set<StringRef> PrefixesNotFound(Req.CheckPrefixes.begin(),
1875871d658cSMircea Trofin                                        Req.CheckPrefixes.end());
1876871d658cSMircea Trofin   const size_t DistinctPrefixes = PrefixesNotFound.size();
1877871d658cSMircea Trofin   while (true) {
18785ffd940aSRaphael Isemann     Check::FileCheckType CheckTy;
18795ffd940aSRaphael Isemann 
18805ffd940aSRaphael Isemann     // See if a prefix occurs in the memory buffer.
18815ffd940aSRaphael Isemann     StringRef UsedPrefix;
18825ffd940aSRaphael Isemann     StringRef AfterSuffix;
18835ffd940aSRaphael Isemann     std::tie(UsedPrefix, AfterSuffix) =
18845ffd940aSRaphael Isemann         FindFirstMatchingPrefix(Req, PrefixRE, Buffer, LineNumber, CheckTy);
18855ffd940aSRaphael Isemann     if (UsedPrefix.empty())
18865ffd940aSRaphael Isemann       break;
18875ffd940aSRaphael Isemann     if (CheckTy != Check::CheckComment)
1888871d658cSMircea Trofin       PrefixesNotFound.erase(UsedPrefix);
18895ffd940aSRaphael Isemann 
18905ffd940aSRaphael Isemann     assert(UsedPrefix.data() == Buffer.data() &&
18915ffd940aSRaphael Isemann            "Failed to move Buffer's start forward, or pointed prefix outside "
18925ffd940aSRaphael Isemann            "of the buffer!");
18935ffd940aSRaphael Isemann     assert(AfterSuffix.data() >= Buffer.data() &&
18945ffd940aSRaphael Isemann            AfterSuffix.data() < Buffer.data() + Buffer.size() &&
18955ffd940aSRaphael Isemann            "Parsing after suffix doesn't start inside of buffer!");
18965ffd940aSRaphael Isemann 
18975ffd940aSRaphael Isemann     // Location to use for error messages.
18985ffd940aSRaphael Isemann     const char *UsedPrefixStart = UsedPrefix.data();
18995ffd940aSRaphael Isemann 
19005ffd940aSRaphael Isemann     // Skip the buffer to the end of parsed suffix (or just prefix, if no good
19015ffd940aSRaphael Isemann     // suffix was processed).
19025ffd940aSRaphael Isemann     Buffer = AfterSuffix.empty() ? Buffer.drop_front(UsedPrefix.size())
19035ffd940aSRaphael Isemann                                  : AfterSuffix;
19045ffd940aSRaphael Isemann 
19055ffd940aSRaphael Isemann     // Complain about useful-looking but unsupported suffixes.
19065ffd940aSRaphael Isemann     if (CheckTy == Check::CheckBadNot) {
19075ffd940aSRaphael Isemann       SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), SourceMgr::DK_Error,
19085ffd940aSRaphael Isemann                       "unsupported -NOT combo on prefix '" + UsedPrefix + "'");
19095ffd940aSRaphael Isemann       return true;
19105ffd940aSRaphael Isemann     }
19115ffd940aSRaphael Isemann 
19125ffd940aSRaphael Isemann     // Complain about invalid count specification.
19135ffd940aSRaphael Isemann     if (CheckTy == Check::CheckBadCount) {
19145ffd940aSRaphael Isemann       SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), SourceMgr::DK_Error,
19155ffd940aSRaphael Isemann                       "invalid count in -COUNT specification on prefix '" +
19165ffd940aSRaphael Isemann                           UsedPrefix + "'");
19175ffd940aSRaphael Isemann       return true;
19185ffd940aSRaphael Isemann     }
19195ffd940aSRaphael Isemann 
19205ffd940aSRaphael Isemann     // Okay, we found the prefix, yay. Remember the rest of the line, but ignore
19215ffd940aSRaphael Isemann     // leading whitespace.
19225ffd940aSRaphael Isemann     if (!(Req.NoCanonicalizeWhiteSpace && Req.MatchFullLines))
19235ffd940aSRaphael Isemann       Buffer = Buffer.substr(Buffer.find_first_not_of(" \t"));
19245ffd940aSRaphael Isemann 
19255ffd940aSRaphael Isemann     // Scan ahead to the end of line.
19265ffd940aSRaphael Isemann     size_t EOL = Buffer.find_first_of("\n\r");
19275ffd940aSRaphael Isemann 
19285ffd940aSRaphael Isemann     // Remember the location of the start of the pattern, for diagnostics.
19295ffd940aSRaphael Isemann     SMLoc PatternLoc = SMLoc::getFromPointer(Buffer.data());
19305ffd940aSRaphael Isemann 
19315ffd940aSRaphael Isemann     // Extract the pattern from the buffer.
19325ffd940aSRaphael Isemann     StringRef PatternBuffer = Buffer.substr(0, EOL);
19335ffd940aSRaphael Isemann     Buffer = Buffer.substr(EOL);
19345ffd940aSRaphael Isemann 
19355ffd940aSRaphael Isemann     // If this is a comment, we're done.
19365ffd940aSRaphael Isemann     if (CheckTy == Check::CheckComment)
19375ffd940aSRaphael Isemann       continue;
19385ffd940aSRaphael Isemann 
19395ffd940aSRaphael Isemann     // Parse the pattern.
19405ffd940aSRaphael Isemann     Pattern P(CheckTy, PatternContext.get(), LineNumber);
19415ffd940aSRaphael Isemann     if (P.parsePattern(PatternBuffer, UsedPrefix, SM, Req))
19425ffd940aSRaphael Isemann       return true;
19435ffd940aSRaphael Isemann 
19445ffd940aSRaphael Isemann     // Verify that CHECK-LABEL lines do not define or use variables
19455ffd940aSRaphael Isemann     if ((CheckTy == Check::CheckLabel) && P.hasVariable()) {
19465ffd940aSRaphael Isemann       SM.PrintMessage(
19475ffd940aSRaphael Isemann           SMLoc::getFromPointer(UsedPrefixStart), SourceMgr::DK_Error,
19485ffd940aSRaphael Isemann           "found '" + UsedPrefix + "-LABEL:'"
19495ffd940aSRaphael Isemann                                    " with variable definition or use");
19505ffd940aSRaphael Isemann       return true;
19515ffd940aSRaphael Isemann     }
19525ffd940aSRaphael Isemann 
19535ffd940aSRaphael Isemann     // Verify that CHECK-NEXT/SAME/EMPTY lines have at least one CHECK line before them.
19545ffd940aSRaphael Isemann     if ((CheckTy == Check::CheckNext || CheckTy == Check::CheckSame ||
19555ffd940aSRaphael Isemann          CheckTy == Check::CheckEmpty) &&
19565ffd940aSRaphael Isemann         CheckStrings->empty()) {
19575ffd940aSRaphael Isemann       StringRef Type = CheckTy == Check::CheckNext
19585ffd940aSRaphael Isemann                            ? "NEXT"
19595ffd940aSRaphael Isemann                            : CheckTy == Check::CheckEmpty ? "EMPTY" : "SAME";
19605ffd940aSRaphael Isemann       SM.PrintMessage(SMLoc::getFromPointer(UsedPrefixStart),
19615ffd940aSRaphael Isemann                       SourceMgr::DK_Error,
19625ffd940aSRaphael Isemann                       "found '" + UsedPrefix + "-" + Type +
19635ffd940aSRaphael Isemann                           "' without previous '" + UsedPrefix + ": line");
19645ffd940aSRaphael Isemann       return true;
19655ffd940aSRaphael Isemann     }
19665ffd940aSRaphael Isemann 
19675ffd940aSRaphael Isemann     // Handle CHECK-DAG/-NOT.
19685ffd940aSRaphael Isemann     if (CheckTy == Check::CheckDAG || CheckTy == Check::CheckNot) {
19695ffd940aSRaphael Isemann       DagNotMatches.push_back(P);
19705ffd940aSRaphael Isemann       continue;
19715ffd940aSRaphael Isemann     }
19725ffd940aSRaphael Isemann 
19735ffd940aSRaphael Isemann     // Okay, add the string we captured to the output vector and move on.
19745ffd940aSRaphael Isemann     CheckStrings->emplace_back(P, UsedPrefix, PatternLoc);
19755ffd940aSRaphael Isemann     std::swap(DagNotMatches, CheckStrings->back().DagNotStrings);
19765ffd940aSRaphael Isemann     DagNotMatches = ImplicitNegativeChecks;
19775ffd940aSRaphael Isemann   }
19785ffd940aSRaphael Isemann 
19795ffd940aSRaphael Isemann   // When there are no used prefixes we report an error except in the case that
19805ffd940aSRaphael Isemann   // no prefix is specified explicitly but -implicit-check-not is specified.
1981871d658cSMircea Trofin   const bool NoPrefixesFound = PrefixesNotFound.size() == DistinctPrefixes;
1982871d658cSMircea Trofin   const bool SomePrefixesUnexpectedlyNotUsed =
1983871d658cSMircea Trofin       !Req.AllowUnusedPrefixes && !PrefixesNotFound.empty();
1984871d658cSMircea Trofin   if ((NoPrefixesFound || SomePrefixesUnexpectedlyNotUsed) &&
19855ffd940aSRaphael Isemann       (ImplicitNegativeChecks.empty() || !Req.IsDefaultCheckPrefix)) {
19865ffd940aSRaphael Isemann     errs() << "error: no check strings found with prefix"
1987871d658cSMircea Trofin            << (PrefixesNotFound.size() > 1 ? "es " : " ");
1988871d658cSMircea Trofin     bool First = true;
1989871d658cSMircea Trofin     for (StringRef MissingPrefix : PrefixesNotFound) {
1990871d658cSMircea Trofin       if (!First)
19915ffd940aSRaphael Isemann         errs() << ", ";
1992871d658cSMircea Trofin       errs() << "\'" << MissingPrefix << ":'";
1993871d658cSMircea Trofin       First = false;
19945ffd940aSRaphael Isemann     }
19955ffd940aSRaphael Isemann     errs() << '\n';
19965ffd940aSRaphael Isemann     return true;
19975ffd940aSRaphael Isemann   }
19985ffd940aSRaphael Isemann 
19995ffd940aSRaphael Isemann   // Add an EOF pattern for any trailing --implicit-check-not/CHECK-DAG/-NOTs,
20005ffd940aSRaphael Isemann   // and use the first prefix as a filler for the error message.
20015ffd940aSRaphael Isemann   if (!DagNotMatches.empty()) {
20025ffd940aSRaphael Isemann     CheckStrings->emplace_back(
20035ffd940aSRaphael Isemann         Pattern(Check::CheckEOF, PatternContext.get(), LineNumber + 1),
20045ffd940aSRaphael Isemann         *Req.CheckPrefixes.begin(), SMLoc::getFromPointer(Buffer.data()));
20055ffd940aSRaphael Isemann     std::swap(DagNotMatches, CheckStrings->back().DagNotStrings);
20065ffd940aSRaphael Isemann   }
20075ffd940aSRaphael Isemann 
20085ffd940aSRaphael Isemann   return false;
20095ffd940aSRaphael Isemann }
20105ffd940aSRaphael Isemann 
20115ffd940aSRaphael Isemann static void PrintMatch(bool ExpectedMatch, const SourceMgr &SM,
20125ffd940aSRaphael Isemann                        StringRef Prefix, SMLoc Loc, const Pattern &Pat,
20135ffd940aSRaphael Isemann                        int MatchedCount, StringRef Buffer, size_t MatchPos,
20145ffd940aSRaphael Isemann                        size_t MatchLen, const FileCheckRequest &Req,
20155ffd940aSRaphael Isemann                        std::vector<FileCheckDiag> *Diags) {
20165ffd940aSRaphael Isemann   bool PrintDiag = true;
20175ffd940aSRaphael Isemann   if (ExpectedMatch) {
20185ffd940aSRaphael Isemann     if (!Req.Verbose)
20195ffd940aSRaphael Isemann       return;
20205ffd940aSRaphael Isemann     if (!Req.VerboseVerbose && Pat.getCheckTy() == Check::CheckEOF)
20215ffd940aSRaphael Isemann       return;
20225ffd940aSRaphael Isemann     // Due to their verbosity, we don't print verbose diagnostics here if we're
20235ffd940aSRaphael Isemann     // gathering them for a different rendering, but we always print other
20245ffd940aSRaphael Isemann     // diagnostics.
20255ffd940aSRaphael Isemann     PrintDiag = !Diags;
20265ffd940aSRaphael Isemann   }
20275ffd940aSRaphael Isemann   FileCheckDiag::MatchType MatchTy = ExpectedMatch
20285ffd940aSRaphael Isemann                                          ? FileCheckDiag::MatchFoundAndExpected
20295ffd940aSRaphael Isemann                                          : FileCheckDiag::MatchFoundButExcluded;
20305ffd940aSRaphael Isemann   SMRange MatchRange = ProcessMatchResult(MatchTy, SM, Loc, Pat.getCheckTy(),
20315ffd940aSRaphael Isemann                                           Buffer, MatchPos, MatchLen, Diags);
20325ffd940aSRaphael Isemann   if (Diags) {
20335ffd940aSRaphael Isemann     Pat.printSubstitutions(SM, Buffer, MatchRange, MatchTy, Diags);
20345ffd940aSRaphael Isemann     Pat.printVariableDefs(SM, MatchTy, Diags);
20355ffd940aSRaphael Isemann   }
20365ffd940aSRaphael Isemann   if (!PrintDiag)
20375ffd940aSRaphael Isemann     return;
20385ffd940aSRaphael Isemann 
20395ffd940aSRaphael Isemann   std::string Message = formatv("{0}: {1} string found in input",
20405ffd940aSRaphael Isemann                                 Pat.getCheckTy().getDescription(Prefix),
20415ffd940aSRaphael Isemann                                 (ExpectedMatch ? "expected" : "excluded"))
20425ffd940aSRaphael Isemann                             .str();
20435ffd940aSRaphael Isemann   if (Pat.getCount() > 1)
20445ffd940aSRaphael Isemann     Message += formatv(" ({0} out of {1})", MatchedCount, Pat.getCount()).str();
20455ffd940aSRaphael Isemann 
20465ffd940aSRaphael Isemann   SM.PrintMessage(
20475ffd940aSRaphael Isemann       Loc, ExpectedMatch ? SourceMgr::DK_Remark : SourceMgr::DK_Error, Message);
20485ffd940aSRaphael Isemann   SM.PrintMessage(MatchRange.Start, SourceMgr::DK_Note, "found here",
20495ffd940aSRaphael Isemann                   {MatchRange});
20505ffd940aSRaphael Isemann   Pat.printSubstitutions(SM, Buffer, MatchRange, MatchTy, nullptr);
20515ffd940aSRaphael Isemann   Pat.printVariableDefs(SM, MatchTy, nullptr);
20525ffd940aSRaphael Isemann }
20535ffd940aSRaphael Isemann 
20545ffd940aSRaphael Isemann static void PrintMatch(bool ExpectedMatch, const SourceMgr &SM,
20555ffd940aSRaphael Isemann                        const FileCheckString &CheckStr, int MatchedCount,
20565ffd940aSRaphael Isemann                        StringRef Buffer, size_t MatchPos, size_t MatchLen,
20575ffd940aSRaphael Isemann                        FileCheckRequest &Req,
20585ffd940aSRaphael Isemann                        std::vector<FileCheckDiag> *Diags) {
20595ffd940aSRaphael Isemann   PrintMatch(ExpectedMatch, SM, CheckStr.Prefix, CheckStr.Loc, CheckStr.Pat,
20605ffd940aSRaphael Isemann              MatchedCount, Buffer, MatchPos, MatchLen, Req, Diags);
20615ffd940aSRaphael Isemann }
20625ffd940aSRaphael Isemann 
20635ffd940aSRaphael Isemann static void PrintNoMatch(bool ExpectedMatch, const SourceMgr &SM,
20645ffd940aSRaphael Isemann                          StringRef Prefix, SMLoc Loc, const Pattern &Pat,
20655ffd940aSRaphael Isemann                          int MatchedCount, StringRef Buffer,
20665ffd940aSRaphael Isemann                          bool VerboseVerbose, std::vector<FileCheckDiag> *Diags,
20675ffd940aSRaphael Isemann                          Error MatchErrors) {
20685ffd940aSRaphael Isemann   assert(MatchErrors && "Called on successful match");
20695ffd940aSRaphael Isemann   bool PrintDiag = true;
20705ffd940aSRaphael Isemann   if (!ExpectedMatch) {
20715ffd940aSRaphael Isemann     if (!VerboseVerbose) {
20725ffd940aSRaphael Isemann       consumeError(std::move(MatchErrors));
20735ffd940aSRaphael Isemann       return;
20745ffd940aSRaphael Isemann     }
20755ffd940aSRaphael Isemann     // Due to their verbosity, we don't print verbose diagnostics here if we're
20765ffd940aSRaphael Isemann     // gathering them for a different rendering, but we always print other
20775ffd940aSRaphael Isemann     // diagnostics.
20785ffd940aSRaphael Isemann     PrintDiag = !Diags;
20795ffd940aSRaphael Isemann   }
20805ffd940aSRaphael Isemann 
20815ffd940aSRaphael Isemann   // If the current position is at the end of a line, advance to the start of
20825ffd940aSRaphael Isemann   // the next line.
20835ffd940aSRaphael Isemann   Buffer = Buffer.substr(Buffer.find_first_not_of(" \t\n\r"));
20845ffd940aSRaphael Isemann   FileCheckDiag::MatchType MatchTy = ExpectedMatch
20855ffd940aSRaphael Isemann                                          ? FileCheckDiag::MatchNoneButExpected
20865ffd940aSRaphael Isemann                                          : FileCheckDiag::MatchNoneAndExcluded;
20875ffd940aSRaphael Isemann   SMRange SearchRange = ProcessMatchResult(MatchTy, SM, Loc, Pat.getCheckTy(),
20885ffd940aSRaphael Isemann                                            Buffer, 0, Buffer.size(), Diags);
20895ffd940aSRaphael Isemann   if (Diags)
20905ffd940aSRaphael Isemann     Pat.printSubstitutions(SM, Buffer, SearchRange, MatchTy, Diags);
20915ffd940aSRaphael Isemann   if (!PrintDiag) {
20925ffd940aSRaphael Isemann     consumeError(std::move(MatchErrors));
20935ffd940aSRaphael Isemann     return;
20945ffd940aSRaphael Isemann   }
20955ffd940aSRaphael Isemann 
20965ffd940aSRaphael Isemann   MatchErrors = handleErrors(std::move(MatchErrors),
20975ffd940aSRaphael Isemann                              [](const ErrorDiagnostic &E) { E.log(errs()); });
20985ffd940aSRaphael Isemann 
20995ffd940aSRaphael Isemann   // No problem matching the string per se.
21005ffd940aSRaphael Isemann   if (!MatchErrors)
21015ffd940aSRaphael Isemann     return;
21025ffd940aSRaphael Isemann   consumeError(std::move(MatchErrors));
21035ffd940aSRaphael Isemann 
21045ffd940aSRaphael Isemann   // Print "not found" diagnostic.
21055ffd940aSRaphael Isemann   std::string Message = formatv("{0}: {1} string not found in input",
21065ffd940aSRaphael Isemann                                 Pat.getCheckTy().getDescription(Prefix),
21075ffd940aSRaphael Isemann                                 (ExpectedMatch ? "expected" : "excluded"))
21085ffd940aSRaphael Isemann                             .str();
21095ffd940aSRaphael Isemann   if (Pat.getCount() > 1)
21105ffd940aSRaphael Isemann     Message += formatv(" ({0} out of {1})", MatchedCount, Pat.getCount()).str();
21115ffd940aSRaphael Isemann   SM.PrintMessage(
21125ffd940aSRaphael Isemann       Loc, ExpectedMatch ? SourceMgr::DK_Error : SourceMgr::DK_Remark, Message);
21135ffd940aSRaphael Isemann 
21145ffd940aSRaphael Isemann   // Print the "scanning from here" line.
21155ffd940aSRaphael Isemann   SM.PrintMessage(SearchRange.Start, SourceMgr::DK_Note, "scanning from here");
21165ffd940aSRaphael Isemann 
21175ffd940aSRaphael Isemann   // Allow the pattern to print additional information if desired.
21185ffd940aSRaphael Isemann   Pat.printSubstitutions(SM, Buffer, SearchRange, MatchTy, nullptr);
21195ffd940aSRaphael Isemann 
21205ffd940aSRaphael Isemann   if (ExpectedMatch)
21215ffd940aSRaphael Isemann     Pat.printFuzzyMatch(SM, Buffer, Diags);
21225ffd940aSRaphael Isemann }
21235ffd940aSRaphael Isemann 
21245ffd940aSRaphael Isemann static void PrintNoMatch(bool ExpectedMatch, const SourceMgr &SM,
21255ffd940aSRaphael Isemann                          const FileCheckString &CheckStr, int MatchedCount,
21265ffd940aSRaphael Isemann                          StringRef Buffer, bool VerboseVerbose,
21275ffd940aSRaphael Isemann                          std::vector<FileCheckDiag> *Diags, Error MatchErrors) {
21285ffd940aSRaphael Isemann   PrintNoMatch(ExpectedMatch, SM, CheckStr.Prefix, CheckStr.Loc, CheckStr.Pat,
21295ffd940aSRaphael Isemann                MatchedCount, Buffer, VerboseVerbose, Diags,
21305ffd940aSRaphael Isemann                std::move(MatchErrors));
21315ffd940aSRaphael Isemann }
21325ffd940aSRaphael Isemann 
21335ffd940aSRaphael Isemann /// Counts the number of newlines in the specified range.
21345ffd940aSRaphael Isemann static unsigned CountNumNewlinesBetween(StringRef Range,
21355ffd940aSRaphael Isemann                                         const char *&FirstNewLine) {
21365ffd940aSRaphael Isemann   unsigned NumNewLines = 0;
21375ffd940aSRaphael Isemann   while (1) {
21385ffd940aSRaphael Isemann     // Scan for newline.
21395ffd940aSRaphael Isemann     Range = Range.substr(Range.find_first_of("\n\r"));
21405ffd940aSRaphael Isemann     if (Range.empty())
21415ffd940aSRaphael Isemann       return NumNewLines;
21425ffd940aSRaphael Isemann 
21435ffd940aSRaphael Isemann     ++NumNewLines;
21445ffd940aSRaphael Isemann 
21455ffd940aSRaphael Isemann     // Handle \n\r and \r\n as a single newline.
21465ffd940aSRaphael Isemann     if (Range.size() > 1 && (Range[1] == '\n' || Range[1] == '\r') &&
21475ffd940aSRaphael Isemann         (Range[0] != Range[1]))
21485ffd940aSRaphael Isemann       Range = Range.substr(1);
21495ffd940aSRaphael Isemann     Range = Range.substr(1);
21505ffd940aSRaphael Isemann 
21515ffd940aSRaphael Isemann     if (NumNewLines == 1)
21525ffd940aSRaphael Isemann       FirstNewLine = Range.begin();
21535ffd940aSRaphael Isemann   }
21545ffd940aSRaphael Isemann }
21555ffd940aSRaphael Isemann 
21565ffd940aSRaphael Isemann size_t FileCheckString::Check(const SourceMgr &SM, StringRef Buffer,
21575ffd940aSRaphael Isemann                               bool IsLabelScanMode, size_t &MatchLen,
21585ffd940aSRaphael Isemann                               FileCheckRequest &Req,
21595ffd940aSRaphael Isemann                               std::vector<FileCheckDiag> *Diags) const {
21605ffd940aSRaphael Isemann   size_t LastPos = 0;
21615ffd940aSRaphael Isemann   std::vector<const Pattern *> NotStrings;
21625ffd940aSRaphael Isemann 
21635ffd940aSRaphael Isemann   // IsLabelScanMode is true when we are scanning forward to find CHECK-LABEL
21645ffd940aSRaphael Isemann   // bounds; we have not processed variable definitions within the bounded block
21655ffd940aSRaphael Isemann   // yet so cannot handle any final CHECK-DAG yet; this is handled when going
21665ffd940aSRaphael Isemann   // over the block again (including the last CHECK-LABEL) in normal mode.
21675ffd940aSRaphael Isemann   if (!IsLabelScanMode) {
21685ffd940aSRaphael Isemann     // Match "dag strings" (with mixed "not strings" if any).
21695ffd940aSRaphael Isemann     LastPos = CheckDag(SM, Buffer, NotStrings, Req, Diags);
21705ffd940aSRaphael Isemann     if (LastPos == StringRef::npos)
21715ffd940aSRaphael Isemann       return StringRef::npos;
21725ffd940aSRaphael Isemann   }
21735ffd940aSRaphael Isemann 
21745ffd940aSRaphael Isemann   // Match itself from the last position after matching CHECK-DAG.
21755ffd940aSRaphael Isemann   size_t LastMatchEnd = LastPos;
21765ffd940aSRaphael Isemann   size_t FirstMatchPos = 0;
21775ffd940aSRaphael Isemann   // Go match the pattern Count times. Majority of patterns only match with
21785ffd940aSRaphael Isemann   // count 1 though.
21795ffd940aSRaphael Isemann   assert(Pat.getCount() != 0 && "pattern count can not be zero");
21805ffd940aSRaphael Isemann   for (int i = 1; i <= Pat.getCount(); i++) {
21815ffd940aSRaphael Isemann     StringRef MatchBuffer = Buffer.substr(LastMatchEnd);
21825ffd940aSRaphael Isemann     size_t CurrentMatchLen;
21835ffd940aSRaphael Isemann     // get a match at current start point
21845ffd940aSRaphael Isemann     Expected<size_t> MatchResult = Pat.match(MatchBuffer, CurrentMatchLen, SM);
21855ffd940aSRaphael Isemann 
21865ffd940aSRaphael Isemann     // report
21875ffd940aSRaphael Isemann     if (!MatchResult) {
21885ffd940aSRaphael Isemann       PrintNoMatch(true, SM, *this, i, MatchBuffer, Req.VerboseVerbose, Diags,
21895ffd940aSRaphael Isemann                    MatchResult.takeError());
21905ffd940aSRaphael Isemann       return StringRef::npos;
21915ffd940aSRaphael Isemann     }
21925ffd940aSRaphael Isemann     size_t MatchPos = *MatchResult;
21935ffd940aSRaphael Isemann     PrintMatch(true, SM, *this, i, MatchBuffer, MatchPos, CurrentMatchLen, Req,
21945ffd940aSRaphael Isemann                Diags);
21955ffd940aSRaphael Isemann     if (i == 1)
21965ffd940aSRaphael Isemann       FirstMatchPos = LastPos + MatchPos;
21975ffd940aSRaphael Isemann 
21985ffd940aSRaphael Isemann     // move start point after the match
21995ffd940aSRaphael Isemann     LastMatchEnd += MatchPos + CurrentMatchLen;
22005ffd940aSRaphael Isemann   }
22015ffd940aSRaphael Isemann   // Full match len counts from first match pos.
22025ffd940aSRaphael Isemann   MatchLen = LastMatchEnd - FirstMatchPos;
22035ffd940aSRaphael Isemann 
22045ffd940aSRaphael Isemann   // Similar to the above, in "label-scan mode" we can't yet handle CHECK-NEXT
22055ffd940aSRaphael Isemann   // or CHECK-NOT
22065ffd940aSRaphael Isemann   if (!IsLabelScanMode) {
22075ffd940aSRaphael Isemann     size_t MatchPos = FirstMatchPos - LastPos;
22085ffd940aSRaphael Isemann     StringRef MatchBuffer = Buffer.substr(LastPos);
22095ffd940aSRaphael Isemann     StringRef SkippedRegion = Buffer.substr(LastPos, MatchPos);
22105ffd940aSRaphael Isemann 
22115ffd940aSRaphael Isemann     // If this check is a "CHECK-NEXT", verify that the previous match was on
22125ffd940aSRaphael Isemann     // the previous line (i.e. that there is one newline between them).
22135ffd940aSRaphael Isemann     if (CheckNext(SM, SkippedRegion)) {
22145ffd940aSRaphael Isemann       ProcessMatchResult(FileCheckDiag::MatchFoundButWrongLine, SM, Loc,
22155ffd940aSRaphael Isemann                          Pat.getCheckTy(), MatchBuffer, MatchPos, MatchLen,
22165ffd940aSRaphael Isemann                          Diags, Req.Verbose);
22175ffd940aSRaphael Isemann       return StringRef::npos;
22185ffd940aSRaphael Isemann     }
22195ffd940aSRaphael Isemann 
22205ffd940aSRaphael Isemann     // If this check is a "CHECK-SAME", verify that the previous match was on
22215ffd940aSRaphael Isemann     // the same line (i.e. that there is no newline between them).
22225ffd940aSRaphael Isemann     if (CheckSame(SM, SkippedRegion)) {
22235ffd940aSRaphael Isemann       ProcessMatchResult(FileCheckDiag::MatchFoundButWrongLine, SM, Loc,
22245ffd940aSRaphael Isemann                          Pat.getCheckTy(), MatchBuffer, MatchPos, MatchLen,
22255ffd940aSRaphael Isemann                          Diags, Req.Verbose);
22265ffd940aSRaphael Isemann       return StringRef::npos;
22275ffd940aSRaphael Isemann     }
22285ffd940aSRaphael Isemann 
22295ffd940aSRaphael Isemann     // If this match had "not strings", verify that they don't exist in the
22305ffd940aSRaphael Isemann     // skipped region.
22315ffd940aSRaphael Isemann     if (CheckNot(SM, SkippedRegion, NotStrings, Req, Diags))
22325ffd940aSRaphael Isemann       return StringRef::npos;
22335ffd940aSRaphael Isemann   }
22345ffd940aSRaphael Isemann 
22355ffd940aSRaphael Isemann   return FirstMatchPos;
22365ffd940aSRaphael Isemann }
22375ffd940aSRaphael Isemann 
22385ffd940aSRaphael Isemann bool FileCheckString::CheckNext(const SourceMgr &SM, StringRef Buffer) const {
22395ffd940aSRaphael Isemann   if (Pat.getCheckTy() != Check::CheckNext &&
22405ffd940aSRaphael Isemann       Pat.getCheckTy() != Check::CheckEmpty)
22415ffd940aSRaphael Isemann     return false;
22425ffd940aSRaphael Isemann 
22435ffd940aSRaphael Isemann   Twine CheckName =
22445ffd940aSRaphael Isemann       Prefix +
22455ffd940aSRaphael Isemann       Twine(Pat.getCheckTy() == Check::CheckEmpty ? "-EMPTY" : "-NEXT");
22465ffd940aSRaphael Isemann 
22475ffd940aSRaphael Isemann   // Count the number of newlines between the previous match and this one.
22485ffd940aSRaphael Isemann   const char *FirstNewLine = nullptr;
22495ffd940aSRaphael Isemann   unsigned NumNewLines = CountNumNewlinesBetween(Buffer, FirstNewLine);
22505ffd940aSRaphael Isemann 
22515ffd940aSRaphael Isemann   if (NumNewLines == 0) {
22525ffd940aSRaphael Isemann     SM.PrintMessage(Loc, SourceMgr::DK_Error,
22535ffd940aSRaphael Isemann                     CheckName + ": is on the same line as previous match");
22545ffd940aSRaphael Isemann     SM.PrintMessage(SMLoc::getFromPointer(Buffer.end()), SourceMgr::DK_Note,
22555ffd940aSRaphael Isemann                     "'next' match was here");
22565ffd940aSRaphael Isemann     SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), SourceMgr::DK_Note,
22575ffd940aSRaphael Isemann                     "previous match ended here");
22585ffd940aSRaphael Isemann     return true;
22595ffd940aSRaphael Isemann   }
22605ffd940aSRaphael Isemann 
22615ffd940aSRaphael Isemann   if (NumNewLines != 1) {
22625ffd940aSRaphael Isemann     SM.PrintMessage(Loc, SourceMgr::DK_Error,
22635ffd940aSRaphael Isemann                     CheckName +
22645ffd940aSRaphael Isemann                         ": is not on the line after the previous match");
22655ffd940aSRaphael Isemann     SM.PrintMessage(SMLoc::getFromPointer(Buffer.end()), SourceMgr::DK_Note,
22665ffd940aSRaphael Isemann                     "'next' match was here");
22675ffd940aSRaphael Isemann     SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), SourceMgr::DK_Note,
22685ffd940aSRaphael Isemann                     "previous match ended here");
22695ffd940aSRaphael Isemann     SM.PrintMessage(SMLoc::getFromPointer(FirstNewLine), SourceMgr::DK_Note,
22705ffd940aSRaphael Isemann                     "non-matching line after previous match is here");
22715ffd940aSRaphael Isemann     return true;
22725ffd940aSRaphael Isemann   }
22735ffd940aSRaphael Isemann 
22745ffd940aSRaphael Isemann   return false;
22755ffd940aSRaphael Isemann }
22765ffd940aSRaphael Isemann 
22775ffd940aSRaphael Isemann bool FileCheckString::CheckSame(const SourceMgr &SM, StringRef Buffer) const {
22785ffd940aSRaphael Isemann   if (Pat.getCheckTy() != Check::CheckSame)
22795ffd940aSRaphael Isemann     return false;
22805ffd940aSRaphael Isemann 
22815ffd940aSRaphael Isemann   // Count the number of newlines between the previous match and this one.
22825ffd940aSRaphael Isemann   const char *FirstNewLine = nullptr;
22835ffd940aSRaphael Isemann   unsigned NumNewLines = CountNumNewlinesBetween(Buffer, FirstNewLine);
22845ffd940aSRaphael Isemann 
22855ffd940aSRaphael Isemann   if (NumNewLines != 0) {
22865ffd940aSRaphael Isemann     SM.PrintMessage(Loc, SourceMgr::DK_Error,
22875ffd940aSRaphael Isemann                     Prefix +
22885ffd940aSRaphael Isemann                         "-SAME: is not on the same line as the previous match");
22895ffd940aSRaphael Isemann     SM.PrintMessage(SMLoc::getFromPointer(Buffer.end()), SourceMgr::DK_Note,
22905ffd940aSRaphael Isemann                     "'next' match was here");
22915ffd940aSRaphael Isemann     SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), SourceMgr::DK_Note,
22925ffd940aSRaphael Isemann                     "previous match ended here");
22935ffd940aSRaphael Isemann     return true;
22945ffd940aSRaphael Isemann   }
22955ffd940aSRaphael Isemann 
22965ffd940aSRaphael Isemann   return false;
22975ffd940aSRaphael Isemann }
22985ffd940aSRaphael Isemann 
22995ffd940aSRaphael Isemann bool FileCheckString::CheckNot(const SourceMgr &SM, StringRef Buffer,
23005ffd940aSRaphael Isemann                                const std::vector<const Pattern *> &NotStrings,
23015ffd940aSRaphael Isemann                                const FileCheckRequest &Req,
23025ffd940aSRaphael Isemann                                std::vector<FileCheckDiag> *Diags) const {
23035ffd940aSRaphael Isemann   bool DirectiveFail = false;
23045ffd940aSRaphael Isemann   for (const Pattern *Pat : NotStrings) {
23055ffd940aSRaphael Isemann     assert((Pat->getCheckTy() == Check::CheckNot) && "Expect CHECK-NOT!");
23065ffd940aSRaphael Isemann 
23075ffd940aSRaphael Isemann     size_t MatchLen = 0;
23085ffd940aSRaphael Isemann     Expected<size_t> MatchResult = Pat->match(Buffer, MatchLen, SM);
23095ffd940aSRaphael Isemann 
23105ffd940aSRaphael Isemann     if (!MatchResult) {
23115ffd940aSRaphael Isemann       PrintNoMatch(false, SM, Prefix, Pat->getLoc(), *Pat, 1, Buffer,
23125ffd940aSRaphael Isemann                    Req.VerboseVerbose, Diags, MatchResult.takeError());
23135ffd940aSRaphael Isemann       continue;
23145ffd940aSRaphael Isemann     }
23155ffd940aSRaphael Isemann     size_t Pos = *MatchResult;
23165ffd940aSRaphael Isemann 
23175ffd940aSRaphael Isemann     PrintMatch(false, SM, Prefix, Pat->getLoc(), *Pat, 1, Buffer, Pos, MatchLen,
23185ffd940aSRaphael Isemann                Req, Diags);
23195ffd940aSRaphael Isemann     DirectiveFail = true;
23205ffd940aSRaphael Isemann   }
23215ffd940aSRaphael Isemann 
23225ffd940aSRaphael Isemann   return DirectiveFail;
23235ffd940aSRaphael Isemann }
23245ffd940aSRaphael Isemann 
23255ffd940aSRaphael Isemann size_t FileCheckString::CheckDag(const SourceMgr &SM, StringRef Buffer,
23265ffd940aSRaphael Isemann                                  std::vector<const Pattern *> &NotStrings,
23275ffd940aSRaphael Isemann                                  const FileCheckRequest &Req,
23285ffd940aSRaphael Isemann                                  std::vector<FileCheckDiag> *Diags) const {
23295ffd940aSRaphael Isemann   if (DagNotStrings.empty())
23305ffd940aSRaphael Isemann     return 0;
23315ffd940aSRaphael Isemann 
23325ffd940aSRaphael Isemann   // The start of the search range.
23335ffd940aSRaphael Isemann   size_t StartPos = 0;
23345ffd940aSRaphael Isemann 
23355ffd940aSRaphael Isemann   struct MatchRange {
23365ffd940aSRaphael Isemann     size_t Pos;
23375ffd940aSRaphael Isemann     size_t End;
23385ffd940aSRaphael Isemann   };
23395ffd940aSRaphael Isemann   // A sorted list of ranges for non-overlapping CHECK-DAG matches.  Match
23405ffd940aSRaphael Isemann   // ranges are erased from this list once they are no longer in the search
23415ffd940aSRaphael Isemann   // range.
23425ffd940aSRaphael Isemann   std::list<MatchRange> MatchRanges;
23435ffd940aSRaphael Isemann 
23445ffd940aSRaphael Isemann   // We need PatItr and PatEnd later for detecting the end of a CHECK-DAG
23455ffd940aSRaphael Isemann   // group, so we don't use a range-based for loop here.
23465ffd940aSRaphael Isemann   for (auto PatItr = DagNotStrings.begin(), PatEnd = DagNotStrings.end();
23475ffd940aSRaphael Isemann        PatItr != PatEnd; ++PatItr) {
23485ffd940aSRaphael Isemann     const Pattern &Pat = *PatItr;
23495ffd940aSRaphael Isemann     assert((Pat.getCheckTy() == Check::CheckDAG ||
23505ffd940aSRaphael Isemann             Pat.getCheckTy() == Check::CheckNot) &&
23515ffd940aSRaphael Isemann            "Invalid CHECK-DAG or CHECK-NOT!");
23525ffd940aSRaphael Isemann 
23535ffd940aSRaphael Isemann     if (Pat.getCheckTy() == Check::CheckNot) {
23545ffd940aSRaphael Isemann       NotStrings.push_back(&Pat);
23555ffd940aSRaphael Isemann       continue;
23565ffd940aSRaphael Isemann     }
23575ffd940aSRaphael Isemann 
23585ffd940aSRaphael Isemann     assert((Pat.getCheckTy() == Check::CheckDAG) && "Expect CHECK-DAG!");
23595ffd940aSRaphael Isemann 
23605ffd940aSRaphael Isemann     // CHECK-DAG always matches from the start.
23615ffd940aSRaphael Isemann     size_t MatchLen = 0, MatchPos = StartPos;
23625ffd940aSRaphael Isemann 
23635ffd940aSRaphael Isemann     // Search for a match that doesn't overlap a previous match in this
23645ffd940aSRaphael Isemann     // CHECK-DAG group.
23655ffd940aSRaphael Isemann     for (auto MI = MatchRanges.begin(), ME = MatchRanges.end(); true; ++MI) {
23665ffd940aSRaphael Isemann       StringRef MatchBuffer = Buffer.substr(MatchPos);
23675ffd940aSRaphael Isemann       Expected<size_t> MatchResult = Pat.match(MatchBuffer, MatchLen, SM);
23685ffd940aSRaphael Isemann       // With a group of CHECK-DAGs, a single mismatching means the match on
23695ffd940aSRaphael Isemann       // that group of CHECK-DAGs fails immediately.
23705ffd940aSRaphael Isemann       if (!MatchResult) {
23715ffd940aSRaphael Isemann         PrintNoMatch(true, SM, Prefix, Pat.getLoc(), Pat, 1, MatchBuffer,
23725ffd940aSRaphael Isemann                      Req.VerboseVerbose, Diags, MatchResult.takeError());
23735ffd940aSRaphael Isemann         return StringRef::npos;
23745ffd940aSRaphael Isemann       }
23755ffd940aSRaphael Isemann       size_t MatchPosBuf = *MatchResult;
23765ffd940aSRaphael Isemann       // Re-calc it as the offset relative to the start of the original string.
23775ffd940aSRaphael Isemann       MatchPos += MatchPosBuf;
23785ffd940aSRaphael Isemann       if (Req.VerboseVerbose)
23795ffd940aSRaphael Isemann         PrintMatch(true, SM, Prefix, Pat.getLoc(), Pat, 1, Buffer, MatchPos,
23805ffd940aSRaphael Isemann                    MatchLen, Req, Diags);
23815ffd940aSRaphael Isemann       MatchRange M{MatchPos, MatchPos + MatchLen};
23825ffd940aSRaphael Isemann       if (Req.AllowDeprecatedDagOverlap) {
23835ffd940aSRaphael Isemann         // We don't need to track all matches in this mode, so we just maintain
23845ffd940aSRaphael Isemann         // one match range that encompasses the current CHECK-DAG group's
23855ffd940aSRaphael Isemann         // matches.
23865ffd940aSRaphael Isemann         if (MatchRanges.empty())
23875ffd940aSRaphael Isemann           MatchRanges.insert(MatchRanges.end(), M);
23885ffd940aSRaphael Isemann         else {
23895ffd940aSRaphael Isemann           auto Block = MatchRanges.begin();
23905ffd940aSRaphael Isemann           Block->Pos = std::min(Block->Pos, M.Pos);
23915ffd940aSRaphael Isemann           Block->End = std::max(Block->End, M.End);
23925ffd940aSRaphael Isemann         }
23935ffd940aSRaphael Isemann         break;
23945ffd940aSRaphael Isemann       }
23955ffd940aSRaphael Isemann       // Iterate previous matches until overlapping match or insertion point.
23965ffd940aSRaphael Isemann       bool Overlap = false;
23975ffd940aSRaphael Isemann       for (; MI != ME; ++MI) {
23985ffd940aSRaphael Isemann         if (M.Pos < MI->End) {
23995ffd940aSRaphael Isemann           // !Overlap => New match has no overlap and is before this old match.
24005ffd940aSRaphael Isemann           // Overlap => New match overlaps this old match.
24015ffd940aSRaphael Isemann           Overlap = MI->Pos < M.End;
24025ffd940aSRaphael Isemann           break;
24035ffd940aSRaphael Isemann         }
24045ffd940aSRaphael Isemann       }
24055ffd940aSRaphael Isemann       if (!Overlap) {
24065ffd940aSRaphael Isemann         // Insert non-overlapping match into list.
24075ffd940aSRaphael Isemann         MatchRanges.insert(MI, M);
24085ffd940aSRaphael Isemann         break;
24095ffd940aSRaphael Isemann       }
24105ffd940aSRaphael Isemann       if (Req.VerboseVerbose) {
24115ffd940aSRaphael Isemann         // Due to their verbosity, we don't print verbose diagnostics here if
24125ffd940aSRaphael Isemann         // we're gathering them for a different rendering, but we always print
24135ffd940aSRaphael Isemann         // other diagnostics.
24145ffd940aSRaphael Isemann         if (!Diags) {
24155ffd940aSRaphael Isemann           SMLoc OldStart = SMLoc::getFromPointer(Buffer.data() + MI->Pos);
24165ffd940aSRaphael Isemann           SMLoc OldEnd = SMLoc::getFromPointer(Buffer.data() + MI->End);
24175ffd940aSRaphael Isemann           SMRange OldRange(OldStart, OldEnd);
24185ffd940aSRaphael Isemann           SM.PrintMessage(OldStart, SourceMgr::DK_Note,
24195ffd940aSRaphael Isemann                           "match discarded, overlaps earlier DAG match here",
24205ffd940aSRaphael Isemann                           {OldRange});
24215ffd940aSRaphael Isemann         } else {
24225ffd940aSRaphael Isemann           SMLoc CheckLoc = Diags->rbegin()->CheckLoc;
24235ffd940aSRaphael Isemann           for (auto I = Diags->rbegin(), E = Diags->rend();
24245ffd940aSRaphael Isemann                I != E && I->CheckLoc == CheckLoc; ++I)
24255ffd940aSRaphael Isemann             I->MatchTy = FileCheckDiag::MatchFoundButDiscarded;
24265ffd940aSRaphael Isemann         }
24275ffd940aSRaphael Isemann       }
24285ffd940aSRaphael Isemann       MatchPos = MI->End;
24295ffd940aSRaphael Isemann     }
24305ffd940aSRaphael Isemann     if (!Req.VerboseVerbose)
24315ffd940aSRaphael Isemann       PrintMatch(true, SM, Prefix, Pat.getLoc(), Pat, 1, Buffer, MatchPos,
24325ffd940aSRaphael Isemann                  MatchLen, Req, Diags);
24335ffd940aSRaphael Isemann 
24345ffd940aSRaphael Isemann     // Handle the end of a CHECK-DAG group.
24355ffd940aSRaphael Isemann     if (std::next(PatItr) == PatEnd ||
24365ffd940aSRaphael Isemann         std::next(PatItr)->getCheckTy() == Check::CheckNot) {
24375ffd940aSRaphael Isemann       if (!NotStrings.empty()) {
24385ffd940aSRaphael Isemann         // If there are CHECK-NOTs between two CHECK-DAGs or from CHECK to
24395ffd940aSRaphael Isemann         // CHECK-DAG, verify that there are no 'not' strings occurred in that
24405ffd940aSRaphael Isemann         // region.
24415ffd940aSRaphael Isemann         StringRef SkippedRegion =
24425ffd940aSRaphael Isemann             Buffer.slice(StartPos, MatchRanges.begin()->Pos);
24435ffd940aSRaphael Isemann         if (CheckNot(SM, SkippedRegion, NotStrings, Req, Diags))
24445ffd940aSRaphael Isemann           return StringRef::npos;
24455ffd940aSRaphael Isemann         // Clear "not strings".
24465ffd940aSRaphael Isemann         NotStrings.clear();
24475ffd940aSRaphael Isemann       }
24485ffd940aSRaphael Isemann       // All subsequent CHECK-DAGs and CHECK-NOTs should be matched from the
24495ffd940aSRaphael Isemann       // end of this CHECK-DAG group's match range.
24505ffd940aSRaphael Isemann       StartPos = MatchRanges.rbegin()->End;
24515ffd940aSRaphael Isemann       // Don't waste time checking for (impossible) overlaps before that.
24525ffd940aSRaphael Isemann       MatchRanges.clear();
24535ffd940aSRaphael Isemann     }
24545ffd940aSRaphael Isemann   }
24555ffd940aSRaphael Isemann 
24565ffd940aSRaphael Isemann   return StartPos;
24575ffd940aSRaphael Isemann }
24585ffd940aSRaphael Isemann 
24595ffd940aSRaphael Isemann static bool ValidatePrefixes(StringRef Kind, StringSet<> &UniquePrefixes,
24605ffd940aSRaphael Isemann                              ArrayRef<StringRef> SuppliedPrefixes) {
24615ffd940aSRaphael Isemann   for (StringRef Prefix : SuppliedPrefixes) {
24625ffd940aSRaphael Isemann     if (Prefix.empty()) {
24635ffd940aSRaphael Isemann       errs() << "error: supplied " << Kind << " prefix must not be the empty "
24645ffd940aSRaphael Isemann              << "string\n";
24655ffd940aSRaphael Isemann       return false;
24665ffd940aSRaphael Isemann     }
24675ffd940aSRaphael Isemann     static const Regex Validator("^[a-zA-Z0-9_-]*$");
24685ffd940aSRaphael Isemann     if (!Validator.match(Prefix)) {
24695ffd940aSRaphael Isemann       errs() << "error: supplied " << Kind << " prefix must start with a "
24705ffd940aSRaphael Isemann              << "letter and contain only alphanumeric characters, hyphens, and "
24715ffd940aSRaphael Isemann              << "underscores: '" << Prefix << "'\n";
24725ffd940aSRaphael Isemann       return false;
24735ffd940aSRaphael Isemann     }
24745ffd940aSRaphael Isemann     if (!UniquePrefixes.insert(Prefix).second) {
24755ffd940aSRaphael Isemann       errs() << "error: supplied " << Kind << " prefix must be unique among "
24765ffd940aSRaphael Isemann              << "check and comment prefixes: '" << Prefix << "'\n";
24775ffd940aSRaphael Isemann       return false;
24785ffd940aSRaphael Isemann     }
24795ffd940aSRaphael Isemann   }
24805ffd940aSRaphael Isemann   return true;
24815ffd940aSRaphael Isemann }
24825ffd940aSRaphael Isemann 
/// Check prefixes used when Req.CheckPrefixes is empty.
24835ffd940aSRaphael Isemann static const char *DefaultCheckPrefixes[] = {"CHECK"};
/// Comment prefixes used when Req.CommentPrefixes is empty.
24845ffd940aSRaphael Isemann static const char *DefaultCommentPrefixes[] = {"COM", "RUN"};
24855ffd940aSRaphael Isemann 
24865ffd940aSRaphael Isemann bool FileCheck::ValidateCheckPrefixes() {
24875ffd940aSRaphael Isemann   StringSet<> UniquePrefixes;
24885ffd940aSRaphael Isemann   // Add default prefixes to catch user-supplied duplicates of them below.
24895ffd940aSRaphael Isemann   if (Req.CheckPrefixes.empty()) {
24905ffd940aSRaphael Isemann     for (const char *Prefix : DefaultCheckPrefixes)
24915ffd940aSRaphael Isemann       UniquePrefixes.insert(Prefix);
24925ffd940aSRaphael Isemann   }
24935ffd940aSRaphael Isemann   if (Req.CommentPrefixes.empty()) {
24945ffd940aSRaphael Isemann     for (const char *Prefix : DefaultCommentPrefixes)
24955ffd940aSRaphael Isemann       UniquePrefixes.insert(Prefix);
24965ffd940aSRaphael Isemann   }
24975ffd940aSRaphael Isemann   // Do not validate the default prefixes, or diagnostics about duplicates might
24985ffd940aSRaphael Isemann   // incorrectly indicate that they were supplied by the user.
24995ffd940aSRaphael Isemann   if (!ValidatePrefixes("check", UniquePrefixes, Req.CheckPrefixes))
25005ffd940aSRaphael Isemann     return false;
25015ffd940aSRaphael Isemann   if (!ValidatePrefixes("comment", UniquePrefixes, Req.CommentPrefixes))
25025ffd940aSRaphael Isemann     return false;
25035ffd940aSRaphael Isemann   return true;
25045ffd940aSRaphael Isemann }
25055ffd940aSRaphael Isemann 
25065ffd940aSRaphael Isemann Regex FileCheck::buildCheckPrefixRegex() {
25075ffd940aSRaphael Isemann   if (Req.CheckPrefixes.empty()) {
25085ffd940aSRaphael Isemann     for (const char *Prefix : DefaultCheckPrefixes)
25095ffd940aSRaphael Isemann       Req.CheckPrefixes.push_back(Prefix);
25105ffd940aSRaphael Isemann     Req.IsDefaultCheckPrefix = true;
25115ffd940aSRaphael Isemann   }
25125ffd940aSRaphael Isemann   if (Req.CommentPrefixes.empty()) {
25135ffd940aSRaphael Isemann     for (const char *Prefix : DefaultCommentPrefixes)
25145ffd940aSRaphael Isemann       Req.CommentPrefixes.push_back(Prefix);
25155ffd940aSRaphael Isemann   }
25165ffd940aSRaphael Isemann 
25175ffd940aSRaphael Isemann   // We already validated the contents of CheckPrefixes and CommentPrefixes so
25185ffd940aSRaphael Isemann   // just concatenate them as alternatives.
25195ffd940aSRaphael Isemann   SmallString<32> PrefixRegexStr;
25205ffd940aSRaphael Isemann   for (size_t I = 0, E = Req.CheckPrefixes.size(); I != E; ++I) {
25215ffd940aSRaphael Isemann     if (I != 0)
25225ffd940aSRaphael Isemann       PrefixRegexStr.push_back('|');
25235ffd940aSRaphael Isemann     PrefixRegexStr.append(Req.CheckPrefixes[I]);
25245ffd940aSRaphael Isemann   }
25255ffd940aSRaphael Isemann   for (StringRef Prefix : Req.CommentPrefixes) {
25265ffd940aSRaphael Isemann     PrefixRegexStr.push_back('|');
25275ffd940aSRaphael Isemann     PrefixRegexStr.append(Prefix);
25285ffd940aSRaphael Isemann   }
25295ffd940aSRaphael Isemann 
25305ffd940aSRaphael Isemann   return Regex(PrefixRegexStr);
25315ffd940aSRaphael Isemann }
25325ffd940aSRaphael Isemann 
25335ffd940aSRaphael Isemann Error FileCheckPatternContext::defineCmdlineVariables(
25345ffd940aSRaphael Isemann     ArrayRef<StringRef> CmdlineDefines, SourceMgr &SM) {
25355ffd940aSRaphael Isemann   assert(GlobalVariableTable.empty() && GlobalNumericVariableTable.empty() &&
25365ffd940aSRaphael Isemann          "Overriding defined variable with command-line variable definitions");
25375ffd940aSRaphael Isemann 
25385ffd940aSRaphael Isemann   if (CmdlineDefines.empty())
25395ffd940aSRaphael Isemann     return Error::success();
25405ffd940aSRaphael Isemann 
25415ffd940aSRaphael Isemann   // Create a string representing the vector of command-line definitions. Each
25425ffd940aSRaphael Isemann   // definition is on its own line and prefixed with a definition number to
25435ffd940aSRaphael Isemann   // clarify which definition a given diagnostic corresponds to.
25445ffd940aSRaphael Isemann   unsigned I = 0;
25455ffd940aSRaphael Isemann   Error Errs = Error::success();
25465ffd940aSRaphael Isemann   std::string CmdlineDefsDiag;
25475ffd940aSRaphael Isemann   SmallVector<std::pair<size_t, size_t>, 4> CmdlineDefsIndices;
25485ffd940aSRaphael Isemann   for (StringRef CmdlineDef : CmdlineDefines) {
25495ffd940aSRaphael Isemann     std::string DefPrefix = ("Global define #" + Twine(++I) + ": ").str();
25505ffd940aSRaphael Isemann     size_t EqIdx = CmdlineDef.find('=');
25515ffd940aSRaphael Isemann     if (EqIdx == StringRef::npos) {
25525ffd940aSRaphael Isemann       CmdlineDefsIndices.push_back(std::make_pair(CmdlineDefsDiag.size(), 0));
25535ffd940aSRaphael Isemann       continue;
25545ffd940aSRaphael Isemann     }
25555ffd940aSRaphael Isemann     // Numeric variable definition.
25565ffd940aSRaphael Isemann     if (CmdlineDef[0] == '#') {
25575ffd940aSRaphael Isemann       // Append a copy of the command-line definition adapted to use the same
25585ffd940aSRaphael Isemann       // format as in the input file to be able to reuse
25595ffd940aSRaphael Isemann       // parseNumericSubstitutionBlock.
25605ffd940aSRaphael Isemann       CmdlineDefsDiag += (DefPrefix + CmdlineDef + " (parsed as: [[").str();
25615ffd940aSRaphael Isemann       std::string SubstitutionStr = std::string(CmdlineDef);
25625ffd940aSRaphael Isemann       SubstitutionStr[EqIdx] = ':';
25635ffd940aSRaphael Isemann       CmdlineDefsIndices.push_back(
25645ffd940aSRaphael Isemann           std::make_pair(CmdlineDefsDiag.size(), SubstitutionStr.size()));
25655ffd940aSRaphael Isemann       CmdlineDefsDiag += (SubstitutionStr + Twine("]])\n")).str();
25665ffd940aSRaphael Isemann     } else {
25675ffd940aSRaphael Isemann       CmdlineDefsDiag += DefPrefix;
25685ffd940aSRaphael Isemann       CmdlineDefsIndices.push_back(
25695ffd940aSRaphael Isemann           std::make_pair(CmdlineDefsDiag.size(), CmdlineDef.size()));
25705ffd940aSRaphael Isemann       CmdlineDefsDiag += (CmdlineDef + "\n").str();
25715ffd940aSRaphael Isemann     }
25725ffd940aSRaphael Isemann   }
25735ffd940aSRaphael Isemann 
25745ffd940aSRaphael Isemann   // Create a buffer with fake command line content in order to display
25755ffd940aSRaphael Isemann   // parsing diagnostic with location information and point to the
25765ffd940aSRaphael Isemann   // global definition with invalid syntax.
25775ffd940aSRaphael Isemann   std::unique_ptr<MemoryBuffer> CmdLineDefsDiagBuffer =
25785ffd940aSRaphael Isemann       MemoryBuffer::getMemBufferCopy(CmdlineDefsDiag, "Global defines");
25795ffd940aSRaphael Isemann   StringRef CmdlineDefsDiagRef = CmdLineDefsDiagBuffer->getBuffer();
25805ffd940aSRaphael Isemann   SM.AddNewSourceBuffer(std::move(CmdLineDefsDiagBuffer), SMLoc());
25815ffd940aSRaphael Isemann 
25825ffd940aSRaphael Isemann   for (std::pair<size_t, size_t> CmdlineDefIndices : CmdlineDefsIndices) {
25835ffd940aSRaphael Isemann     StringRef CmdlineDef = CmdlineDefsDiagRef.substr(CmdlineDefIndices.first,
25845ffd940aSRaphael Isemann                                                      CmdlineDefIndices.second);
25855ffd940aSRaphael Isemann     if (CmdlineDef.empty()) {
25865ffd940aSRaphael Isemann       Errs = joinErrors(
25875ffd940aSRaphael Isemann           std::move(Errs),
25885ffd940aSRaphael Isemann           ErrorDiagnostic::get(SM, CmdlineDef,
25895ffd940aSRaphael Isemann                                "missing equal sign in global definition"));
25905ffd940aSRaphael Isemann       continue;
25915ffd940aSRaphael Isemann     }
25925ffd940aSRaphael Isemann 
25935ffd940aSRaphael Isemann     // Numeric variable definition.
25945ffd940aSRaphael Isemann     if (CmdlineDef[0] == '#') {
25955ffd940aSRaphael Isemann       // Now parse the definition both to check that the syntax is correct and
25965ffd940aSRaphael Isemann       // to create the necessary class instance.
25975ffd940aSRaphael Isemann       StringRef CmdlineDefExpr = CmdlineDef.substr(1);
25985ffd940aSRaphael Isemann       Optional<NumericVariable *> DefinedNumericVariable;
25995ffd940aSRaphael Isemann       Expected<std::unique_ptr<Expression>> ExpressionResult =
26005ffd940aSRaphael Isemann           Pattern::parseNumericSubstitutionBlock(
26015ffd940aSRaphael Isemann               CmdlineDefExpr, DefinedNumericVariable, false, None, this, SM);
26025ffd940aSRaphael Isemann       if (!ExpressionResult) {
26035ffd940aSRaphael Isemann         Errs = joinErrors(std::move(Errs), ExpressionResult.takeError());
26045ffd940aSRaphael Isemann         continue;
26055ffd940aSRaphael Isemann       }
26065ffd940aSRaphael Isemann       std::unique_ptr<Expression> Expression = std::move(*ExpressionResult);
26075ffd940aSRaphael Isemann       // Now evaluate the expression whose value this variable should be set
26085ffd940aSRaphael Isemann       // to, since the expression of a command-line variable definition should
26095ffd940aSRaphael Isemann       // only use variables defined earlier on the command-line. If not, this
26105ffd940aSRaphael Isemann       // is an error and we report it.
26115ffd940aSRaphael Isemann       Expected<ExpressionValue> Value = Expression->getAST()->eval();
26125ffd940aSRaphael Isemann       if (!Value) {
26135ffd940aSRaphael Isemann         Errs = joinErrors(std::move(Errs), Value.takeError());
26145ffd940aSRaphael Isemann         continue;
26155ffd940aSRaphael Isemann       }
26165ffd940aSRaphael Isemann 
26175ffd940aSRaphael Isemann       assert(DefinedNumericVariable && "No variable defined");
26185ffd940aSRaphael Isemann       (*DefinedNumericVariable)->setValue(*Value);
26195ffd940aSRaphael Isemann 
26205ffd940aSRaphael Isemann       // Record this variable definition.
26215ffd940aSRaphael Isemann       GlobalNumericVariableTable[(*DefinedNumericVariable)->getName()] =
26225ffd940aSRaphael Isemann           *DefinedNumericVariable;
26235ffd940aSRaphael Isemann     } else {
26245ffd940aSRaphael Isemann       // String variable definition.
26255ffd940aSRaphael Isemann       std::pair<StringRef, StringRef> CmdlineNameVal = CmdlineDef.split('=');
26265ffd940aSRaphael Isemann       StringRef CmdlineName = CmdlineNameVal.first;
26275ffd940aSRaphael Isemann       StringRef OrigCmdlineName = CmdlineName;
26285ffd940aSRaphael Isemann       Expected<Pattern::VariableProperties> ParseVarResult =
26295ffd940aSRaphael Isemann           Pattern::parseVariable(CmdlineName, SM);
26305ffd940aSRaphael Isemann       if (!ParseVarResult) {
26315ffd940aSRaphael Isemann         Errs = joinErrors(std::move(Errs), ParseVarResult.takeError());
26325ffd940aSRaphael Isemann         continue;
26335ffd940aSRaphael Isemann       }
26345ffd940aSRaphael Isemann       // Check that CmdlineName does not denote a pseudo variable is only
26355ffd940aSRaphael Isemann       // composed of the parsed numeric variable. This catches cases like
26365ffd940aSRaphael Isemann       // "FOO+2" in a "FOO+2=10" definition.
26375ffd940aSRaphael Isemann       if (ParseVarResult->IsPseudo || !CmdlineName.empty()) {
26385ffd940aSRaphael Isemann         Errs = joinErrors(std::move(Errs),
26395ffd940aSRaphael Isemann                           ErrorDiagnostic::get(
26405ffd940aSRaphael Isemann                               SM, OrigCmdlineName,
26415ffd940aSRaphael Isemann                               "invalid name in string variable definition '" +
26425ffd940aSRaphael Isemann                                   OrigCmdlineName + "'"));
26435ffd940aSRaphael Isemann         continue;
26445ffd940aSRaphael Isemann       }
26455ffd940aSRaphael Isemann       StringRef Name = ParseVarResult->Name;
26465ffd940aSRaphael Isemann 
26475ffd940aSRaphael Isemann       // Detect collisions between string and numeric variables when the former
26485ffd940aSRaphael Isemann       // is created later than the latter.
26495ffd940aSRaphael Isemann       if (GlobalNumericVariableTable.find(Name) !=
26505ffd940aSRaphael Isemann           GlobalNumericVariableTable.end()) {
26515ffd940aSRaphael Isemann         Errs = joinErrors(std::move(Errs),
26525ffd940aSRaphael Isemann                           ErrorDiagnostic::get(SM, Name,
26535ffd940aSRaphael Isemann                                                "numeric variable with name '" +
26545ffd940aSRaphael Isemann                                                    Name + "' already exists"));
26555ffd940aSRaphael Isemann         continue;
26565ffd940aSRaphael Isemann       }
26575ffd940aSRaphael Isemann       GlobalVariableTable.insert(CmdlineNameVal);
26585ffd940aSRaphael Isemann       // Mark the string variable as defined to detect collisions between
26595ffd940aSRaphael Isemann       // string and numeric variables in defineCmdlineVariables when the latter
26605ffd940aSRaphael Isemann       // is created later than the former. We cannot reuse GlobalVariableTable
26615ffd940aSRaphael Isemann       // for this by populating it with an empty string since we would then
26625ffd940aSRaphael Isemann       // lose the ability to detect the use of an undefined variable in
26635ffd940aSRaphael Isemann       // match().
26645ffd940aSRaphael Isemann       DefinedVariableTable[Name] = true;
26655ffd940aSRaphael Isemann     }
26665ffd940aSRaphael Isemann   }
26675ffd940aSRaphael Isemann 
26685ffd940aSRaphael Isemann   return Errs;
26695ffd940aSRaphael Isemann }
26705ffd940aSRaphael Isemann 
26715ffd940aSRaphael Isemann void FileCheckPatternContext::clearLocalVars() {
26725ffd940aSRaphael Isemann   SmallVector<StringRef, 16> LocalPatternVars, LocalNumericVars;
26735ffd940aSRaphael Isemann   for (const StringMapEntry<StringRef> &Var : GlobalVariableTable)
26745ffd940aSRaphael Isemann     if (Var.first()[0] != '$')
26755ffd940aSRaphael Isemann       LocalPatternVars.push_back(Var.first());
26765ffd940aSRaphael Isemann 
26775ffd940aSRaphael Isemann   // Numeric substitution reads the value of a variable directly, not via
26785ffd940aSRaphael Isemann   // GlobalNumericVariableTable. Therefore, we clear local variables by
26795ffd940aSRaphael Isemann   // clearing their value which will lead to a numeric substitution failure. We
26805ffd940aSRaphael Isemann   // also mark the variable for removal from GlobalNumericVariableTable since
26815ffd940aSRaphael Isemann   // this is what defineCmdlineVariables checks to decide that no global
26825ffd940aSRaphael Isemann   // variable has been defined.
26835ffd940aSRaphael Isemann   for (const auto &Var : GlobalNumericVariableTable)
26845ffd940aSRaphael Isemann     if (Var.first()[0] != '$') {
26855ffd940aSRaphael Isemann       Var.getValue()->clearValue();
26865ffd940aSRaphael Isemann       LocalNumericVars.push_back(Var.first());
26875ffd940aSRaphael Isemann     }
26885ffd940aSRaphael Isemann 
26895ffd940aSRaphael Isemann   for (const auto &Var : LocalPatternVars)
26905ffd940aSRaphael Isemann     GlobalVariableTable.erase(Var);
26915ffd940aSRaphael Isemann   for (const auto &Var : LocalNumericVars)
26925ffd940aSRaphael Isemann     GlobalNumericVariableTable.erase(Var);
26935ffd940aSRaphael Isemann }
26945ffd940aSRaphael Isemann 
26955ffd940aSRaphael Isemann bool FileCheck::checkInput(SourceMgr &SM, StringRef Buffer,
26965ffd940aSRaphael Isemann                            std::vector<FileCheckDiag> *Diags) {
26975ffd940aSRaphael Isemann   bool ChecksFailed = false;
26985ffd940aSRaphael Isemann 
26995ffd940aSRaphael Isemann   unsigned i = 0, j = 0, e = CheckStrings->size();
27005ffd940aSRaphael Isemann   while (true) {
27015ffd940aSRaphael Isemann     StringRef CheckRegion;
27025ffd940aSRaphael Isemann     if (j == e) {
27035ffd940aSRaphael Isemann       CheckRegion = Buffer;
27045ffd940aSRaphael Isemann     } else {
27055ffd940aSRaphael Isemann       const FileCheckString &CheckLabelStr = (*CheckStrings)[j];
27065ffd940aSRaphael Isemann       if (CheckLabelStr.Pat.getCheckTy() != Check::CheckLabel) {
27075ffd940aSRaphael Isemann         ++j;
27085ffd940aSRaphael Isemann         continue;
27095ffd940aSRaphael Isemann       }
27105ffd940aSRaphael Isemann 
27115ffd940aSRaphael Isemann       // Scan to next CHECK-LABEL match, ignoring CHECK-NOT and CHECK-DAG
27125ffd940aSRaphael Isemann       size_t MatchLabelLen = 0;
27135ffd940aSRaphael Isemann       size_t MatchLabelPos =
27145ffd940aSRaphael Isemann           CheckLabelStr.Check(SM, Buffer, true, MatchLabelLen, Req, Diags);
27155ffd940aSRaphael Isemann       if (MatchLabelPos == StringRef::npos)
27165ffd940aSRaphael Isemann         // Immediately bail if CHECK-LABEL fails, nothing else we can do.
27175ffd940aSRaphael Isemann         return false;
27185ffd940aSRaphael Isemann 
27195ffd940aSRaphael Isemann       CheckRegion = Buffer.substr(0, MatchLabelPos + MatchLabelLen);
27205ffd940aSRaphael Isemann       Buffer = Buffer.substr(MatchLabelPos + MatchLabelLen);
27215ffd940aSRaphael Isemann       ++j;
27225ffd940aSRaphael Isemann     }
27235ffd940aSRaphael Isemann 
27245ffd940aSRaphael Isemann     // Do not clear the first region as it's the one before the first
27255ffd940aSRaphael Isemann     // CHECK-LABEL and it would clear variables defined on the command-line
27265ffd940aSRaphael Isemann     // before they get used.
27275ffd940aSRaphael Isemann     if (i != 0 && Req.EnableVarScope)
27285ffd940aSRaphael Isemann       PatternContext->clearLocalVars();
27295ffd940aSRaphael Isemann 
27305ffd940aSRaphael Isemann     for (; i != j; ++i) {
27315ffd940aSRaphael Isemann       const FileCheckString &CheckStr = (*CheckStrings)[i];
27325ffd940aSRaphael Isemann 
27335ffd940aSRaphael Isemann       // Check each string within the scanned region, including a second check
27345ffd940aSRaphael Isemann       // of any final CHECK-LABEL (to verify CHECK-NOT and CHECK-DAG)
27355ffd940aSRaphael Isemann       size_t MatchLen = 0;
27365ffd940aSRaphael Isemann       size_t MatchPos =
27375ffd940aSRaphael Isemann           CheckStr.Check(SM, CheckRegion, false, MatchLen, Req, Diags);
27385ffd940aSRaphael Isemann 
27395ffd940aSRaphael Isemann       if (MatchPos == StringRef::npos) {
27405ffd940aSRaphael Isemann         ChecksFailed = true;
27415ffd940aSRaphael Isemann         i = j;
27425ffd940aSRaphael Isemann         break;
27435ffd940aSRaphael Isemann       }
27445ffd940aSRaphael Isemann 
27455ffd940aSRaphael Isemann       CheckRegion = CheckRegion.substr(MatchPos + MatchLen);
27465ffd940aSRaphael Isemann     }
27475ffd940aSRaphael Isemann 
27485ffd940aSRaphael Isemann     if (j == e)
27495ffd940aSRaphael Isemann       break;
27505ffd940aSRaphael Isemann   }
27515ffd940aSRaphael Isemann 
27525ffd940aSRaphael Isemann   // Success if no checks failed.
27535ffd940aSRaphael Isemann   return !ChecksFailed;
27545ffd940aSRaphael Isemann }
2755