xref: /llvm-project/llvm/lib/FileCheck/FileCheck.cpp (revision d3d605b7cdee132929d32f8b71b01641eb1d6d37)
15ffd940aSRaphael Isemann //===- FileCheck.cpp - Check that File's Contents match what is expected --===//
25ffd940aSRaphael Isemann //
35ffd940aSRaphael Isemann // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
45ffd940aSRaphael Isemann // See https://llvm.org/LICENSE.txt for license information.
55ffd940aSRaphael Isemann // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
65ffd940aSRaphael Isemann //
75ffd940aSRaphael Isemann //===----------------------------------------------------------------------===//
85ffd940aSRaphael Isemann //
// FileCheck does a line-by-line check of a file that validates whether it
105ffd940aSRaphael Isemann // contains the expected content.  This is useful for regression tests etc.
115ffd940aSRaphael Isemann //
125ffd940aSRaphael Isemann // This file implements most of the API that will be used by the FileCheck utility
135ffd940aSRaphael Isemann // as well as various unittests.
145ffd940aSRaphael Isemann //===----------------------------------------------------------------------===//
155ffd940aSRaphael Isemann 
165ffd940aSRaphael Isemann #include "llvm/FileCheck/FileCheck.h"
175ffd940aSRaphael Isemann #include "FileCheckImpl.h"
185ffd940aSRaphael Isemann #include "llvm/ADT/STLExtras.h"
19b0abd489SElliot Goodrich #include "llvm/ADT/StringExtras.h"
205ffd940aSRaphael Isemann #include "llvm/ADT/StringSet.h"
215ffd940aSRaphael Isemann #include "llvm/ADT/Twine.h"
225ffd940aSRaphael Isemann #include "llvm/Support/CheckedArithmetic.h"
235ffd940aSRaphael Isemann #include "llvm/Support/FormatVariadic.h"
245ffd940aSRaphael Isemann #include <cstdint>
255ffd940aSRaphael Isemann #include <list>
26871d658cSMircea Trofin #include <set>
275ffd940aSRaphael Isemann #include <tuple>
285ffd940aSRaphael Isemann #include <utility>
295ffd940aSRaphael Isemann 
305ffd940aSRaphael Isemann using namespace llvm;
315ffd940aSRaphael Isemann 
325ffd940aSRaphael Isemann StringRef ExpressionFormat::toString() const {
335ffd940aSRaphael Isemann   switch (Value) {
345ffd940aSRaphael Isemann   case Kind::NoFormat:
355ffd940aSRaphael Isemann     return StringRef("<none>");
365ffd940aSRaphael Isemann   case Kind::Unsigned:
375ffd940aSRaphael Isemann     return StringRef("%u");
385ffd940aSRaphael Isemann   case Kind::Signed:
395ffd940aSRaphael Isemann     return StringRef("%d");
405ffd940aSRaphael Isemann   case Kind::HexUpper:
415ffd940aSRaphael Isemann     return StringRef("%X");
425ffd940aSRaphael Isemann   case Kind::HexLower:
435ffd940aSRaphael Isemann     return StringRef("%x");
445ffd940aSRaphael Isemann   }
455ffd940aSRaphael Isemann   llvm_unreachable("unknown expression format");
465ffd940aSRaphael Isemann }
475ffd940aSRaphael Isemann 
485ffd940aSRaphael Isemann Expected<std::string> ExpressionFormat::getWildcardRegex() const {
49f9e2a62cSThomas Preud'homme   StringRef AlternateFormPrefix = AlternateForm ? StringRef("0x") : StringRef();
50f9e2a62cSThomas Preud'homme 
51f9e2a62cSThomas Preud'homme   auto CreatePrecisionRegex = [&](StringRef S) {
52f9e2a62cSThomas Preud'homme     return (Twine(AlternateFormPrefix) + S + Twine('{') + Twine(Precision) +
53f9e2a62cSThomas Preud'homme             "}")
54f9e2a62cSThomas Preud'homme         .str();
555ffd940aSRaphael Isemann   };
565ffd940aSRaphael Isemann 
575ffd940aSRaphael Isemann   switch (Value) {
585ffd940aSRaphael Isemann   case Kind::Unsigned:
595ffd940aSRaphael Isemann     if (Precision)
605ffd940aSRaphael Isemann       return CreatePrecisionRegex("([1-9][0-9]*)?[0-9]");
615ffd940aSRaphael Isemann     return std::string("[0-9]+");
625ffd940aSRaphael Isemann   case Kind::Signed:
635ffd940aSRaphael Isemann     if (Precision)
645ffd940aSRaphael Isemann       return CreatePrecisionRegex("-?([1-9][0-9]*)?[0-9]");
655ffd940aSRaphael Isemann     return std::string("-?[0-9]+");
665ffd940aSRaphael Isemann   case Kind::HexUpper:
675ffd940aSRaphael Isemann     if (Precision)
685ffd940aSRaphael Isemann       return CreatePrecisionRegex("([1-9A-F][0-9A-F]*)?[0-9A-F]");
69f9e2a62cSThomas Preud'homme     return (Twine(AlternateFormPrefix) + Twine("[0-9A-F]+")).str();
705ffd940aSRaphael Isemann   case Kind::HexLower:
715ffd940aSRaphael Isemann     if (Precision)
725ffd940aSRaphael Isemann       return CreatePrecisionRegex("([1-9a-f][0-9a-f]*)?[0-9a-f]");
73f9e2a62cSThomas Preud'homme     return (Twine(AlternateFormPrefix) + Twine("[0-9a-f]+")).str();
745ffd940aSRaphael Isemann   default:
755ffd940aSRaphael Isemann     return createStringError(std::errc::invalid_argument,
765ffd940aSRaphael Isemann                              "trying to match value with invalid format");
775ffd940aSRaphael Isemann   }
785ffd940aSRaphael Isemann }
795ffd940aSRaphael Isemann 
805ffd940aSRaphael Isemann Expected<std::string>
81e15e969aSThomas Preud'homme ExpressionFormat::getMatchingString(APInt IntValue) const {
820726cb00SThomas Preud'homme   if (Value != Kind::Signed && IntValue.isNegative())
83fc0d1c05SThomas Preud'homme     return make_error<OverflowError>();
845ffd940aSRaphael Isemann 
85fc0d1c05SThomas Preud'homme   unsigned Radix;
86fc0d1c05SThomas Preud'homme   bool UpperCase = false;
87fc0d1c05SThomas Preud'homme   SmallString<8> AbsoluteValueStr;
88fc0d1c05SThomas Preud'homme   StringRef SignPrefix = IntValue.isNegative() ? "-" : "";
895ffd940aSRaphael Isemann   switch (Value) {
905ffd940aSRaphael Isemann   case Kind::Unsigned:
915ffd940aSRaphael Isemann   case Kind::Signed:
92fc0d1c05SThomas Preud'homme     Radix = 10;
935ffd940aSRaphael Isemann     break;
945ffd940aSRaphael Isemann   case Kind::HexUpper:
95fc0d1c05SThomas Preud'homme     UpperCase = true;
96fc0d1c05SThomas Preud'homme     Radix = 16;
97fc0d1c05SThomas Preud'homme     break;
985ffd940aSRaphael Isemann   case Kind::HexLower:
99fc0d1c05SThomas Preud'homme     Radix = 16;
100fc0d1c05SThomas Preud'homme     UpperCase = false;
1015ffd940aSRaphael Isemann     break;
1025ffd940aSRaphael Isemann   default:
1035ffd940aSRaphael Isemann     return createStringError(std::errc::invalid_argument,
1045ffd940aSRaphael Isemann                              "trying to match value with invalid format");
1055ffd940aSRaphael Isemann   }
106fc0d1c05SThomas Preud'homme   IntValue.abs().toString(AbsoluteValueStr, Radix, /*Signed=*/false,
107fc0d1c05SThomas Preud'homme                           /*formatAsCLiteral=*/false,
108fc0d1c05SThomas Preud'homme                           /*UpperCase=*/UpperCase);
1095ffd940aSRaphael Isemann 
110f9e2a62cSThomas Preud'homme   StringRef AlternateFormPrefix = AlternateForm ? StringRef("0x") : StringRef();
111f9e2a62cSThomas Preud'homme 
1125ffd940aSRaphael Isemann   if (Precision > AbsoluteValueStr.size()) {
1135ffd940aSRaphael Isemann     unsigned LeadingZeros = Precision - AbsoluteValueStr.size();
114f9e2a62cSThomas Preud'homme     return (Twine(SignPrefix) + Twine(AlternateFormPrefix) +
115f9e2a62cSThomas Preud'homme             std::string(LeadingZeros, '0') + AbsoluteValueStr)
1165ffd940aSRaphael Isemann         .str();
1175ffd940aSRaphael Isemann   }
1185ffd940aSRaphael Isemann 
119f9e2a62cSThomas Preud'homme   return (Twine(SignPrefix) + Twine(AlternateFormPrefix) + AbsoluteValueStr)
120f9e2a62cSThomas Preud'homme       .str();
1215ffd940aSRaphael Isemann }
1225ffd940aSRaphael Isemann 
1230726cb00SThomas Preud'homme static unsigned nextAPIntBitWidth(unsigned BitWidth) {
1240726cb00SThomas Preud'homme   return (BitWidth < APInt::APINT_BITS_PER_WORD) ? APInt::APINT_BITS_PER_WORD
1250726cb00SThomas Preud'homme                                                  : BitWidth * 2;
1260726cb00SThomas Preud'homme }
1270726cb00SThomas Preud'homme 
1280726cb00SThomas Preud'homme static APInt toSigned(APInt AbsVal, bool Negative) {
1290726cb00SThomas Preud'homme   if (AbsVal.isSignBitSet())
1300726cb00SThomas Preud'homme     AbsVal = AbsVal.zext(nextAPIntBitWidth(AbsVal.getBitWidth()));
1310726cb00SThomas Preud'homme   APInt Result = AbsVal;
1320726cb00SThomas Preud'homme   if (Negative)
1330726cb00SThomas Preud'homme     Result.negate();
1340726cb00SThomas Preud'homme   return Result;
1350726cb00SThomas Preud'homme }
1360726cb00SThomas Preud'homme 
137b743c193SThomas Preud'homme APInt ExpressionFormat::valueFromStringRepr(StringRef StrVal,
1385ffd940aSRaphael Isemann                                             const SourceMgr &SM) const {
1395ffd940aSRaphael Isemann   bool ValueIsSigned = Value == Kind::Signed;
1400726cb00SThomas Preud'homme   bool Negative = StrVal.consume_front("-");
1415ffd940aSRaphael Isemann   bool Hex = Value == Kind::HexUpper || Value == Kind::HexLower;
1420726cb00SThomas Preud'homme   bool MissingFormPrefix =
1430726cb00SThomas Preud'homme       !ValueIsSigned && AlternateForm && !StrVal.consume_front("0x");
14413eb298dSThomas Preud'homme   (void)MissingFormPrefix;
14513eb298dSThomas Preud'homme   assert(!MissingFormPrefix && "missing alternate form prefix");
1460726cb00SThomas Preud'homme   APInt ResultValue;
147b743c193SThomas Preud'homme   [[maybe_unused]] bool ParseFailure =
148b743c193SThomas Preud'homme       StrVal.getAsInteger(Hex ? 16 : 10, ResultValue);
149b743c193SThomas Preud'homme   // Both the FileCheck utility and library only call this method with a valid
150b743c193SThomas Preud'homme   // value in StrVal. This is guaranteed by the regex returned by
151b743c193SThomas Preud'homme   // getWildcardRegex() above.
152b743c193SThomas Preud'homme   assert(!ParseFailure && "unable to represent numeric value");
153e15e969aSThomas Preud'homme   return toSigned(ResultValue, Negative);
1545ffd940aSRaphael Isemann }
1555ffd940aSRaphael Isemann 
156e15e969aSThomas Preud'homme Expected<APInt> llvm::exprAdd(const APInt &LeftOperand,
157e15e969aSThomas Preud'homme                               const APInt &RightOperand, bool &Overflow) {
158e15e969aSThomas Preud'homme   return LeftOperand.sadd_ov(RightOperand, Overflow);
1595ffd940aSRaphael Isemann }
1605ffd940aSRaphael Isemann 
161e15e969aSThomas Preud'homme Expected<APInt> llvm::exprSub(const APInt &LeftOperand,
162e15e969aSThomas Preud'homme                               const APInt &RightOperand, bool &Overflow) {
163e15e969aSThomas Preud'homme   return LeftOperand.ssub_ov(RightOperand, Overflow);
1645ffd940aSRaphael Isemann }
1655ffd940aSRaphael Isemann 
166e15e969aSThomas Preud'homme Expected<APInt> llvm::exprMul(const APInt &LeftOperand,
167e15e969aSThomas Preud'homme                               const APInt &RightOperand, bool &Overflow) {
168e15e969aSThomas Preud'homme   return LeftOperand.smul_ov(RightOperand, Overflow);
1695ffd940aSRaphael Isemann }
1705ffd940aSRaphael Isemann 
171e15e969aSThomas Preud'homme Expected<APInt> llvm::exprDiv(const APInt &LeftOperand,
172e15e969aSThomas Preud'homme                               const APInt &RightOperand, bool &Overflow) {
173fc0d1c05SThomas Preud'homme   // Check for division by zero.
174e15e969aSThomas Preud'homme   if (RightOperand.isZero())
1755ffd940aSRaphael Isemann     return make_error<OverflowError>();
1765ffd940aSRaphael Isemann 
177e15e969aSThomas Preud'homme   return LeftOperand.sdiv_ov(RightOperand, Overflow);
1785ffd940aSRaphael Isemann }
1795ffd940aSRaphael Isemann 
180e15e969aSThomas Preud'homme Expected<APInt> llvm::exprMax(const APInt &LeftOperand,
181e15e969aSThomas Preud'homme                               const APInt &RightOperand, bool &Overflow) {
1820726cb00SThomas Preud'homme   Overflow = false;
183e15e969aSThomas Preud'homme   return LeftOperand.slt(RightOperand) ? RightOperand : LeftOperand;
1845ffd940aSRaphael Isemann }
1855ffd940aSRaphael Isemann 
186e15e969aSThomas Preud'homme Expected<APInt> llvm::exprMin(const APInt &LeftOperand,
187e15e969aSThomas Preud'homme                               const APInt &RightOperand, bool &Overflow) {
1880726cb00SThomas Preud'homme   Overflow = false;
189e15e969aSThomas Preud'homme   if (cantFail(exprMax(LeftOperand, RightOperand, Overflow)) == LeftOperand)
1905ffd940aSRaphael Isemann     return RightOperand;
1915ffd940aSRaphael Isemann 
1925ffd940aSRaphael Isemann   return LeftOperand;
1935ffd940aSRaphael Isemann }
1945ffd940aSRaphael Isemann 
195e15e969aSThomas Preud'homme Expected<APInt> NumericVariableUse::eval() const {
196e15e969aSThomas Preud'homme   std::optional<APInt> Value = Variable->getValue();
1975ffd940aSRaphael Isemann   if (Value)
1985ffd940aSRaphael Isemann     return *Value;
1995ffd940aSRaphael Isemann 
2005ffd940aSRaphael Isemann   return make_error<UndefVarError>(getExpressionStr());
2015ffd940aSRaphael Isemann }
2025ffd940aSRaphael Isemann 
203e15e969aSThomas Preud'homme Expected<APInt> BinaryOperation::eval() const {
204e15e969aSThomas Preud'homme   Expected<APInt> MaybeLeftOp = LeftOperand->eval();
205e15e969aSThomas Preud'homme   Expected<APInt> MaybeRightOp = RightOperand->eval();
2065ffd940aSRaphael Isemann 
2075ffd940aSRaphael Isemann   // Bubble up any error (e.g. undefined variables) in the recursive
2085ffd940aSRaphael Isemann   // evaluation.
2090726cb00SThomas Preud'homme   if (!MaybeLeftOp || !MaybeRightOp) {
2105ffd940aSRaphael Isemann     Error Err = Error::success();
2110726cb00SThomas Preud'homme     if (!MaybeLeftOp)
2120726cb00SThomas Preud'homme       Err = joinErrors(std::move(Err), MaybeLeftOp.takeError());
2130726cb00SThomas Preud'homme     if (!MaybeRightOp)
2140726cb00SThomas Preud'homme       Err = joinErrors(std::move(Err), MaybeRightOp.takeError());
2155ffd940aSRaphael Isemann     return std::move(Err);
2165ffd940aSRaphael Isemann   }
2175ffd940aSRaphael Isemann 
218e15e969aSThomas Preud'homme   APInt LeftOp = *MaybeLeftOp;
219e15e969aSThomas Preud'homme   APInt RightOp = *MaybeRightOp;
2200726cb00SThomas Preud'homme   bool Overflow;
2210726cb00SThomas Preud'homme   // Ensure both operands have the same bitwidth.
2220726cb00SThomas Preud'homme   unsigned LeftBitWidth = LeftOp.getBitWidth();
2230726cb00SThomas Preud'homme   unsigned RightBitWidth = RightOp.getBitWidth();
2240726cb00SThomas Preud'homme   unsigned NewBitWidth = std::max(LeftBitWidth, RightBitWidth);
2250726cb00SThomas Preud'homme   LeftOp = LeftOp.sext(NewBitWidth);
2260726cb00SThomas Preud'homme   RightOp = RightOp.sext(NewBitWidth);
2270726cb00SThomas Preud'homme   do {
228e15e969aSThomas Preud'homme     Expected<APInt> MaybeResult = EvalBinop(LeftOp, RightOp, Overflow);
2290726cb00SThomas Preud'homme     if (!MaybeResult)
2300726cb00SThomas Preud'homme       return MaybeResult.takeError();
2310726cb00SThomas Preud'homme 
2320726cb00SThomas Preud'homme     if (!Overflow)
2330726cb00SThomas Preud'homme       return MaybeResult;
2340726cb00SThomas Preud'homme 
2350726cb00SThomas Preud'homme     NewBitWidth = nextAPIntBitWidth(NewBitWidth);
2360726cb00SThomas Preud'homme     LeftOp = LeftOp.sext(NewBitWidth);
2370726cb00SThomas Preud'homme     RightOp = RightOp.sext(NewBitWidth);
2380726cb00SThomas Preud'homme   } while (true);
2395ffd940aSRaphael Isemann }
2405ffd940aSRaphael Isemann 
2415ffd940aSRaphael Isemann Expected<ExpressionFormat>
2425ffd940aSRaphael Isemann BinaryOperation::getImplicitFormat(const SourceMgr &SM) const {
2435ffd940aSRaphael Isemann   Expected<ExpressionFormat> LeftFormat = LeftOperand->getImplicitFormat(SM);
2445ffd940aSRaphael Isemann   Expected<ExpressionFormat> RightFormat = RightOperand->getImplicitFormat(SM);
2455ffd940aSRaphael Isemann   if (!LeftFormat || !RightFormat) {
2465ffd940aSRaphael Isemann     Error Err = Error::success();
2475ffd940aSRaphael Isemann     if (!LeftFormat)
2485ffd940aSRaphael Isemann       Err = joinErrors(std::move(Err), LeftFormat.takeError());
2495ffd940aSRaphael Isemann     if (!RightFormat)
2505ffd940aSRaphael Isemann       Err = joinErrors(std::move(Err), RightFormat.takeError());
2515ffd940aSRaphael Isemann     return std::move(Err);
2525ffd940aSRaphael Isemann   }
2535ffd940aSRaphael Isemann 
2545ffd940aSRaphael Isemann   if (*LeftFormat != ExpressionFormat::Kind::NoFormat &&
2555ffd940aSRaphael Isemann       *RightFormat != ExpressionFormat::Kind::NoFormat &&
2565ffd940aSRaphael Isemann       *LeftFormat != *RightFormat)
2575ffd940aSRaphael Isemann     return ErrorDiagnostic::get(
2585ffd940aSRaphael Isemann         SM, getExpressionStr(),
2595ffd940aSRaphael Isemann         "implicit format conflict between '" + LeftOperand->getExpressionStr() +
2605ffd940aSRaphael Isemann             "' (" + LeftFormat->toString() + ") and '" +
2615ffd940aSRaphael Isemann             RightOperand->getExpressionStr() + "' (" + RightFormat->toString() +
2625ffd940aSRaphael Isemann             "), need an explicit format specifier");
2635ffd940aSRaphael Isemann 
2645ffd940aSRaphael Isemann   return *LeftFormat != ExpressionFormat::Kind::NoFormat ? *LeftFormat
2655ffd940aSRaphael Isemann                                                          : *RightFormat;
2665ffd940aSRaphael Isemann }
2675ffd940aSRaphael Isemann 
2685ffd940aSRaphael Isemann Expected<std::string> NumericSubstitution::getResult() const {
2695ffd940aSRaphael Isemann   assert(ExpressionPointer->getAST() != nullptr &&
2705ffd940aSRaphael Isemann          "Substituting empty expression");
271e15e969aSThomas Preud'homme   Expected<APInt> EvaluatedValue = ExpressionPointer->getAST()->eval();
2725ffd940aSRaphael Isemann   if (!EvaluatedValue)
2735ffd940aSRaphael Isemann     return EvaluatedValue.takeError();
2745ffd940aSRaphael Isemann   ExpressionFormat Format = ExpressionPointer->getFormat();
2755ffd940aSRaphael Isemann   return Format.getMatchingString(*EvaluatedValue);
2765ffd940aSRaphael Isemann }
2775ffd940aSRaphael Isemann 
2785ffd940aSRaphael Isemann Expected<std::string> StringSubstitution::getResult() const {
2795ffd940aSRaphael Isemann   // Look up the value and escape it so that we can put it into the regex.
2805ffd940aSRaphael Isemann   Expected<StringRef> VarVal = Context->getPatternVarValue(FromStr);
2815ffd940aSRaphael Isemann   if (!VarVal)
2825ffd940aSRaphael Isemann     return VarVal.takeError();
2835ffd940aSRaphael Isemann   return Regex::escape(*VarVal);
2845ffd940aSRaphael Isemann }
2855ffd940aSRaphael Isemann 
2865ffd940aSRaphael Isemann bool Pattern::isValidVarNameStart(char C) { return C == '_' || isAlpha(C); }
2875ffd940aSRaphael Isemann 
2885ffd940aSRaphael Isemann Expected<Pattern::VariableProperties>
2895ffd940aSRaphael Isemann Pattern::parseVariable(StringRef &Str, const SourceMgr &SM) {
2905ffd940aSRaphael Isemann   if (Str.empty())
2915ffd940aSRaphael Isemann     return ErrorDiagnostic::get(SM, Str, "empty variable name");
2925ffd940aSRaphael Isemann 
2935ffd940aSRaphael Isemann   size_t I = 0;
2945ffd940aSRaphael Isemann   bool IsPseudo = Str[0] == '@';
2955ffd940aSRaphael Isemann 
2965ffd940aSRaphael Isemann   // Global vars start with '$'.
2975ffd940aSRaphael Isemann   if (Str[0] == '$' || IsPseudo)
2985ffd940aSRaphael Isemann     ++I;
2995ffd940aSRaphael Isemann 
3003105cfe7SDaniil Kovalev   if (I == Str.size())
30122e55ba3SKazu Hirata     return ErrorDiagnostic::get(SM, Str.substr(I),
3023105cfe7SDaniil Kovalev                                 StringRef("empty ") +
3033105cfe7SDaniil Kovalev                                     (IsPseudo ? "pseudo " : "global ") +
3043105cfe7SDaniil Kovalev                                     "variable name");
3053105cfe7SDaniil Kovalev 
3065ffd940aSRaphael Isemann   if (!isValidVarNameStart(Str[I++]))
3075ffd940aSRaphael Isemann     return ErrorDiagnostic::get(SM, Str, "invalid variable name");
3085ffd940aSRaphael Isemann 
3095ffd940aSRaphael Isemann   for (size_t E = Str.size(); I != E; ++I)
3105ffd940aSRaphael Isemann     // Variable names are composed of alphanumeric characters and underscores.
3115ffd940aSRaphael Isemann     if (Str[I] != '_' && !isAlnum(Str[I]))
3125ffd940aSRaphael Isemann       break;
3135ffd940aSRaphael Isemann 
3145ffd940aSRaphael Isemann   StringRef Name = Str.take_front(I);
3155ffd940aSRaphael Isemann   Str = Str.substr(I);
3165ffd940aSRaphael Isemann   return VariableProperties {Name, IsPseudo};
3175ffd940aSRaphael Isemann }
3185ffd940aSRaphael Isemann 
// Characters considered horizontal whitespace by FileCheck input
// canonicalization: space and tab. The parsing code in this file uses it to
// skip blanks between tokens.
constexpr StringLiteral SpaceChars = " \t";
3225ffd940aSRaphael Isemann 
3235ffd940aSRaphael Isemann // Parsing helper function that strips the first character in S and returns it.
3245ffd940aSRaphael Isemann static char popFront(StringRef &S) {
3255ffd940aSRaphael Isemann   char C = S.front();
3265ffd940aSRaphael Isemann   S = S.drop_front();
3275ffd940aSRaphael Isemann   return C;
3285ffd940aSRaphael Isemann }
3295ffd940aSRaphael Isemann 
// Out-of-line definitions of the static ID members of the error classes used
// by FileCheck.
// NOTE(review): presumably these are the per-class identifiers that
// llvm::ErrorInfo-derived classes must provide -- confirm against the class
// declarations in the headers.
char OverflowError::ID = 0;
char UndefVarError::ID = 0;
char ErrorDiagnostic::ID = 0;
char NotFoundError::ID = 0;
char ErrorReported::ID = 0;
3355ffd940aSRaphael Isemann 
3365ffd940aSRaphael Isemann Expected<NumericVariable *> Pattern::parseNumericVariableDefinition(
3375ffd940aSRaphael Isemann     StringRef &Expr, FileCheckPatternContext *Context,
33894081642SFangrui Song     std::optional<size_t> LineNumber, ExpressionFormat ImplicitFormat,
3395ffd940aSRaphael Isemann     const SourceMgr &SM) {
3405ffd940aSRaphael Isemann   Expected<VariableProperties> ParseVarResult = parseVariable(Expr, SM);
3415ffd940aSRaphael Isemann   if (!ParseVarResult)
3425ffd940aSRaphael Isemann     return ParseVarResult.takeError();
3435ffd940aSRaphael Isemann   StringRef Name = ParseVarResult->Name;
3445ffd940aSRaphael Isemann 
3455ffd940aSRaphael Isemann   if (ParseVarResult->IsPseudo)
3465ffd940aSRaphael Isemann     return ErrorDiagnostic::get(
3475ffd940aSRaphael Isemann         SM, Name, "definition of pseudo numeric variable unsupported");
3485ffd940aSRaphael Isemann 
3495ffd940aSRaphael Isemann   // Detect collisions between string and numeric variables when the latter
3505ffd940aSRaphael Isemann   // is created later than the former.
351b595eb83SKazu Hirata   if (Context->DefinedVariableTable.contains(Name))
3525ffd940aSRaphael Isemann     return ErrorDiagnostic::get(
3535ffd940aSRaphael Isemann         SM, Name, "string variable with name '" + Name + "' already exists");
3545ffd940aSRaphael Isemann 
3555ffd940aSRaphael Isemann   Expr = Expr.ltrim(SpaceChars);
3565ffd940aSRaphael Isemann   if (!Expr.empty())
3575ffd940aSRaphael Isemann     return ErrorDiagnostic::get(
3585ffd940aSRaphael Isemann         SM, Expr, "unexpected characters after numeric variable name");
3595ffd940aSRaphael Isemann 
3605ffd940aSRaphael Isemann   NumericVariable *DefinedNumericVariable;
3615ffd940aSRaphael Isemann   auto VarTableIter = Context->GlobalNumericVariableTable.find(Name);
3625ffd940aSRaphael Isemann   if (VarTableIter != Context->GlobalNumericVariableTable.end()) {
3635ffd940aSRaphael Isemann     DefinedNumericVariable = VarTableIter->second;
3645ffd940aSRaphael Isemann     if (DefinedNumericVariable->getImplicitFormat() != ImplicitFormat)
3655ffd940aSRaphael Isemann       return ErrorDiagnostic::get(
3665ffd940aSRaphael Isemann           SM, Expr, "format different from previous variable definition");
3675ffd940aSRaphael Isemann   } else
3685ffd940aSRaphael Isemann     DefinedNumericVariable =
3695ffd940aSRaphael Isemann         Context->makeNumericVariable(Name, ImplicitFormat, LineNumber);
3705ffd940aSRaphael Isemann 
3715ffd940aSRaphael Isemann   return DefinedNumericVariable;
3725ffd940aSRaphael Isemann }
3735ffd940aSRaphael Isemann 
3745ffd940aSRaphael Isemann Expected<std::unique_ptr<NumericVariableUse>> Pattern::parseNumericVariableUse(
37594081642SFangrui Song     StringRef Name, bool IsPseudo, std::optional<size_t> LineNumber,
3765ffd940aSRaphael Isemann     FileCheckPatternContext *Context, const SourceMgr &SM) {
377bb6df080SKazu Hirata   if (IsPseudo && Name != "@LINE")
3785ffd940aSRaphael Isemann     return ErrorDiagnostic::get(
3795ffd940aSRaphael Isemann         SM, Name, "invalid pseudo numeric variable '" + Name + "'");
3805ffd940aSRaphael Isemann 
3815ffd940aSRaphael Isemann   // Numeric variable definitions and uses are parsed in the order in which
3825ffd940aSRaphael Isemann   // they appear in the CHECK patterns. For each definition, the pointer to the
3835ffd940aSRaphael Isemann   // class instance of the corresponding numeric variable definition is stored
3845ffd940aSRaphael Isemann   // in GlobalNumericVariableTable in parsePattern. Therefore, if the pointer
3855ffd940aSRaphael Isemann   // we get below is null, it means no such variable was defined before. When
3865ffd940aSRaphael Isemann   // that happens, we create a dummy variable so that parsing can continue. All
3875ffd940aSRaphael Isemann   // uses of undefined variables, whether string or numeric, are then diagnosed
388fd941036SThomas Preud'homme   // in printNoMatch() after failing to match.
3895ffd940aSRaphael Isemann   auto VarTableIter = Context->GlobalNumericVariableTable.find(Name);
3905ffd940aSRaphael Isemann   NumericVariable *NumericVariable;
3915ffd940aSRaphael Isemann   if (VarTableIter != Context->GlobalNumericVariableTable.end())
3925ffd940aSRaphael Isemann     NumericVariable = VarTableIter->second;
3935ffd940aSRaphael Isemann   else {
3945ffd940aSRaphael Isemann     NumericVariable = Context->makeNumericVariable(
3955ffd940aSRaphael Isemann         Name, ExpressionFormat(ExpressionFormat::Kind::Unsigned));
3965ffd940aSRaphael Isemann     Context->GlobalNumericVariableTable[Name] = NumericVariable;
3975ffd940aSRaphael Isemann   }
3985ffd940aSRaphael Isemann 
39994081642SFangrui Song   std::optional<size_t> DefLineNumber = NumericVariable->getDefLineNumber();
4005ffd940aSRaphael Isemann   if (DefLineNumber && LineNumber && *DefLineNumber == *LineNumber)
4015ffd940aSRaphael Isemann     return ErrorDiagnostic::get(
4025ffd940aSRaphael Isemann         SM, Name,
4035ffd940aSRaphael Isemann         "numeric variable '" + Name +
4045ffd940aSRaphael Isemann             "' defined earlier in the same CHECK directive");
4055ffd940aSRaphael Isemann 
4065ffd940aSRaphael Isemann   return std::make_unique<NumericVariableUse>(Name, NumericVariable);
4075ffd940aSRaphael Isemann }
4085ffd940aSRaphael Isemann 
4095ffd940aSRaphael Isemann Expected<std::unique_ptr<ExpressionAST>> Pattern::parseNumericOperand(
4105ffd940aSRaphael Isemann     StringRef &Expr, AllowedOperand AO, bool MaybeInvalidConstraint,
41194081642SFangrui Song     std::optional<size_t> LineNumber, FileCheckPatternContext *Context,
4125ffd940aSRaphael Isemann     const SourceMgr &SM) {
413586ecdf2SKazu Hirata   if (Expr.starts_with("(")) {
4145ffd940aSRaphael Isemann     if (AO != AllowedOperand::Any)
4155ffd940aSRaphael Isemann       return ErrorDiagnostic::get(
4165ffd940aSRaphael Isemann           SM, Expr, "parenthesized expression not permitted here");
4175ffd940aSRaphael Isemann     return parseParenExpr(Expr, LineNumber, Context, SM);
4185ffd940aSRaphael Isemann   }
4195ffd940aSRaphael Isemann 
4205ffd940aSRaphael Isemann   if (AO == AllowedOperand::LineVar || AO == AllowedOperand::Any) {
4215ffd940aSRaphael Isemann     // Try to parse as a numeric variable use.
4225ffd940aSRaphael Isemann     Expected<Pattern::VariableProperties> ParseVarResult =
4235ffd940aSRaphael Isemann         parseVariable(Expr, SM);
4245ffd940aSRaphael Isemann     if (ParseVarResult) {
4255ffd940aSRaphael Isemann       // Try to parse a function call.
426586ecdf2SKazu Hirata       if (Expr.ltrim(SpaceChars).starts_with("(")) {
4275ffd940aSRaphael Isemann         if (AO != AllowedOperand::Any)
4285ffd940aSRaphael Isemann           return ErrorDiagnostic::get(SM, ParseVarResult->Name,
4295ffd940aSRaphael Isemann                                       "unexpected function call");
4305ffd940aSRaphael Isemann 
4315ffd940aSRaphael Isemann         return parseCallExpr(Expr, ParseVarResult->Name, LineNumber, Context,
4325ffd940aSRaphael Isemann                              SM);
4335ffd940aSRaphael Isemann       }
4345ffd940aSRaphael Isemann 
4355ffd940aSRaphael Isemann       return parseNumericVariableUse(ParseVarResult->Name,
4365ffd940aSRaphael Isemann                                      ParseVarResult->IsPseudo, LineNumber,
4375ffd940aSRaphael Isemann                                      Context, SM);
4385ffd940aSRaphael Isemann     }
4395ffd940aSRaphael Isemann 
4405ffd940aSRaphael Isemann     if (AO == AllowedOperand::LineVar)
4415ffd940aSRaphael Isemann       return ParseVarResult.takeError();
4425ffd940aSRaphael Isemann     // Ignore the error and retry parsing as a literal.
4435ffd940aSRaphael Isemann     consumeError(ParseVarResult.takeError());
4445ffd940aSRaphael Isemann   }
4455ffd940aSRaphael Isemann 
4465ffd940aSRaphael Isemann   // Otherwise, parse it as a literal.
4470726cb00SThomas Preud'homme   APInt LiteralValue;
4485ffd940aSRaphael Isemann   StringRef SaveExpr = Expr;
4490726cb00SThomas Preud'homme   bool Negative = Expr.consume_front("-");
4505ffd940aSRaphael Isemann   if (!Expr.consumeInteger((AO == AllowedOperand::LegacyLiteral) ? 10 : 0,
4510726cb00SThomas Preud'homme                            LiteralValue)) {
4520726cb00SThomas Preud'homme     LiteralValue = toSigned(LiteralValue, Negative);
4535ffd940aSRaphael Isemann     return std::make_unique<ExpressionLiteral>(SaveExpr.drop_back(Expr.size()),
4540726cb00SThomas Preud'homme                                                LiteralValue);
4550726cb00SThomas Preud'homme   }
4565ffd940aSRaphael Isemann   return ErrorDiagnostic::get(
4570726cb00SThomas Preud'homme       SM, SaveExpr,
4585ffd940aSRaphael Isemann       Twine("invalid ") +
4595ffd940aSRaphael Isemann           (MaybeInvalidConstraint ? "matching constraint or " : "") +
4605ffd940aSRaphael Isemann           "operand format");
4615ffd940aSRaphael Isemann }
4625ffd940aSRaphael Isemann 
4635ffd940aSRaphael Isemann Expected<std::unique_ptr<ExpressionAST>>
46494081642SFangrui Song Pattern::parseParenExpr(StringRef &Expr, std::optional<size_t> LineNumber,
4655ffd940aSRaphael Isemann                         FileCheckPatternContext *Context, const SourceMgr &SM) {
4665ffd940aSRaphael Isemann   Expr = Expr.ltrim(SpaceChars);
467586ecdf2SKazu Hirata   assert(Expr.starts_with("("));
4685ffd940aSRaphael Isemann 
4695ffd940aSRaphael Isemann   // Parse right operand.
4705ffd940aSRaphael Isemann   Expr.consume_front("(");
4715ffd940aSRaphael Isemann   Expr = Expr.ltrim(SpaceChars);
4725ffd940aSRaphael Isemann   if (Expr.empty())
4735ffd940aSRaphael Isemann     return ErrorDiagnostic::get(SM, Expr, "missing operand in expression");
4745ffd940aSRaphael Isemann 
4755ffd940aSRaphael Isemann   // Note: parseNumericOperand handles nested opening parentheses.
4765ffd940aSRaphael Isemann   Expected<std::unique_ptr<ExpressionAST>> SubExprResult = parseNumericOperand(
4775ffd940aSRaphael Isemann       Expr, AllowedOperand::Any, /*MaybeInvalidConstraint=*/false, LineNumber,
4785ffd940aSRaphael Isemann       Context, SM);
4795ffd940aSRaphael Isemann   Expr = Expr.ltrim(SpaceChars);
480586ecdf2SKazu Hirata   while (SubExprResult && !Expr.empty() && !Expr.starts_with(")")) {
4815ffd940aSRaphael Isemann     StringRef OrigExpr = Expr;
4825ffd940aSRaphael Isemann     SubExprResult = parseBinop(OrigExpr, Expr, std::move(*SubExprResult), false,
4835ffd940aSRaphael Isemann                                LineNumber, Context, SM);
4845ffd940aSRaphael Isemann     Expr = Expr.ltrim(SpaceChars);
4855ffd940aSRaphael Isemann   }
4865ffd940aSRaphael Isemann   if (!SubExprResult)
4875ffd940aSRaphael Isemann     return SubExprResult;
4885ffd940aSRaphael Isemann 
4895ffd940aSRaphael Isemann   if (!Expr.consume_front(")")) {
4905ffd940aSRaphael Isemann     return ErrorDiagnostic::get(SM, Expr,
4915ffd940aSRaphael Isemann                                 "missing ')' at end of nested expression");
4925ffd940aSRaphael Isemann   }
4935ffd940aSRaphael Isemann   return SubExprResult;
4945ffd940aSRaphael Isemann }
4955ffd940aSRaphael Isemann 
4965ffd940aSRaphael Isemann Expected<std::unique_ptr<ExpressionAST>>
4975ffd940aSRaphael Isemann Pattern::parseBinop(StringRef Expr, StringRef &RemainingExpr,
4985ffd940aSRaphael Isemann                     std::unique_ptr<ExpressionAST> LeftOp,
49994081642SFangrui Song                     bool IsLegacyLineExpr, std::optional<size_t> LineNumber,
5005ffd940aSRaphael Isemann                     FileCheckPatternContext *Context, const SourceMgr &SM) {
5015ffd940aSRaphael Isemann   RemainingExpr = RemainingExpr.ltrim(SpaceChars);
5025ffd940aSRaphael Isemann   if (RemainingExpr.empty())
5035ffd940aSRaphael Isemann     return std::move(LeftOp);
5045ffd940aSRaphael Isemann 
5055ffd940aSRaphael Isemann   // Check if this is a supported operation and select a function to perform
5065ffd940aSRaphael Isemann   // it.
5075ffd940aSRaphael Isemann   SMLoc OpLoc = SMLoc::getFromPointer(RemainingExpr.data());
5085ffd940aSRaphael Isemann   char Operator = popFront(RemainingExpr);
5095ffd940aSRaphael Isemann   binop_eval_t EvalBinop;
5105ffd940aSRaphael Isemann   switch (Operator) {
5115ffd940aSRaphael Isemann   case '+':
5120726cb00SThomas Preud'homme     EvalBinop = exprAdd;
5135ffd940aSRaphael Isemann     break;
5145ffd940aSRaphael Isemann   case '-':
5150726cb00SThomas Preud'homme     EvalBinop = exprSub;
5165ffd940aSRaphael Isemann     break;
5175ffd940aSRaphael Isemann   default:
5185ffd940aSRaphael Isemann     return ErrorDiagnostic::get(
5195ffd940aSRaphael Isemann         SM, OpLoc, Twine("unsupported operation '") + Twine(Operator) + "'");
5205ffd940aSRaphael Isemann   }
5215ffd940aSRaphael Isemann 
5225ffd940aSRaphael Isemann   // Parse right operand.
5235ffd940aSRaphael Isemann   RemainingExpr = RemainingExpr.ltrim(SpaceChars);
5245ffd940aSRaphael Isemann   if (RemainingExpr.empty())
5255ffd940aSRaphael Isemann     return ErrorDiagnostic::get(SM, RemainingExpr,
5265ffd940aSRaphael Isemann                                 "missing operand in expression");
5275ffd940aSRaphael Isemann   // The second operand in a legacy @LINE expression is always a literal.
5285ffd940aSRaphael Isemann   AllowedOperand AO =
5295ffd940aSRaphael Isemann       IsLegacyLineExpr ? AllowedOperand::LegacyLiteral : AllowedOperand::Any;
5305ffd940aSRaphael Isemann   Expected<std::unique_ptr<ExpressionAST>> RightOpResult =
5315ffd940aSRaphael Isemann       parseNumericOperand(RemainingExpr, AO, /*MaybeInvalidConstraint=*/false,
5325ffd940aSRaphael Isemann                           LineNumber, Context, SM);
5335ffd940aSRaphael Isemann   if (!RightOpResult)
5345ffd940aSRaphael Isemann     return RightOpResult;
5355ffd940aSRaphael Isemann 
5365ffd940aSRaphael Isemann   Expr = Expr.drop_back(RemainingExpr.size());
5375ffd940aSRaphael Isemann   return std::make_unique<BinaryOperation>(Expr, EvalBinop, std::move(LeftOp),
5385ffd940aSRaphael Isemann                                            std::move(*RightOpResult));
5395ffd940aSRaphael Isemann }
5405ffd940aSRaphael Isemann 
5415ffd940aSRaphael Isemann Expected<std::unique_ptr<ExpressionAST>>
5425ffd940aSRaphael Isemann Pattern::parseCallExpr(StringRef &Expr, StringRef FuncName,
54394081642SFangrui Song                        std::optional<size_t> LineNumber,
5445ffd940aSRaphael Isemann                        FileCheckPatternContext *Context, const SourceMgr &SM) {
5455ffd940aSRaphael Isemann   Expr = Expr.ltrim(SpaceChars);
546586ecdf2SKazu Hirata   assert(Expr.starts_with("("));
5475ffd940aSRaphael Isemann 
54820bdb451SBenjamin Kramer   auto OptFunc = StringSwitch<binop_eval_t>(FuncName)
5490726cb00SThomas Preud'homme                      .Case("add", exprAdd)
5500726cb00SThomas Preud'homme                      .Case("div", exprDiv)
5510726cb00SThomas Preud'homme                      .Case("max", exprMax)
5520726cb00SThomas Preud'homme                      .Case("min", exprMin)
5530726cb00SThomas Preud'homme                      .Case("mul", exprMul)
5540726cb00SThomas Preud'homme                      .Case("sub", exprSub)
55520bdb451SBenjamin Kramer                      .Default(nullptr);
5565ffd940aSRaphael Isemann 
5575ffd940aSRaphael Isemann   if (!OptFunc)
5585ffd940aSRaphael Isemann     return ErrorDiagnostic::get(
5595ffd940aSRaphael Isemann         SM, FuncName, Twine("call to undefined function '") + FuncName + "'");
5605ffd940aSRaphael Isemann 
5615ffd940aSRaphael Isemann   Expr.consume_front("(");
5625ffd940aSRaphael Isemann   Expr = Expr.ltrim(SpaceChars);
5635ffd940aSRaphael Isemann 
5645ffd940aSRaphael Isemann   // Parse call arguments, which are comma separated.
5655ffd940aSRaphael Isemann   SmallVector<std::unique_ptr<ExpressionAST>, 4> Args;
566586ecdf2SKazu Hirata   while (!Expr.empty() && !Expr.starts_with(")")) {
567586ecdf2SKazu Hirata     if (Expr.starts_with(","))
5685ffd940aSRaphael Isemann       return ErrorDiagnostic::get(SM, Expr, "missing argument");
5695ffd940aSRaphael Isemann 
5705ffd940aSRaphael Isemann     // Parse the argument, which is an arbitary expression.
5715ffd940aSRaphael Isemann     StringRef OuterBinOpExpr = Expr;
5725ffd940aSRaphael Isemann     Expected<std::unique_ptr<ExpressionAST>> Arg = parseNumericOperand(
5735ffd940aSRaphael Isemann         Expr, AllowedOperand::Any, /*MaybeInvalidConstraint=*/false, LineNumber,
5745ffd940aSRaphael Isemann         Context, SM);
5755ffd940aSRaphael Isemann     while (Arg && !Expr.empty()) {
5765ffd940aSRaphael Isemann       Expr = Expr.ltrim(SpaceChars);
5775ffd940aSRaphael Isemann       // Have we reached an argument terminator?
578586ecdf2SKazu Hirata       if (Expr.starts_with(",") || Expr.starts_with(")"))
5795ffd940aSRaphael Isemann         break;
5805ffd940aSRaphael Isemann 
5815ffd940aSRaphael Isemann       // Arg = Arg <op> <expr>
5825ffd940aSRaphael Isemann       Arg = parseBinop(OuterBinOpExpr, Expr, std::move(*Arg), false, LineNumber,
5835ffd940aSRaphael Isemann                        Context, SM);
5845ffd940aSRaphael Isemann     }
5855ffd940aSRaphael Isemann 
5865ffd940aSRaphael Isemann     // Prefer an expression error over a generic invalid argument message.
5875ffd940aSRaphael Isemann     if (!Arg)
5885ffd940aSRaphael Isemann       return Arg.takeError();
5895ffd940aSRaphael Isemann     Args.push_back(std::move(*Arg));
5905ffd940aSRaphael Isemann 
5915ffd940aSRaphael Isemann     // Have we parsed all available arguments?
5925ffd940aSRaphael Isemann     Expr = Expr.ltrim(SpaceChars);
5935ffd940aSRaphael Isemann     if (!Expr.consume_front(","))
5945ffd940aSRaphael Isemann       break;
5955ffd940aSRaphael Isemann 
5965ffd940aSRaphael Isemann     Expr = Expr.ltrim(SpaceChars);
597586ecdf2SKazu Hirata     if (Expr.starts_with(")"))
5985ffd940aSRaphael Isemann       return ErrorDiagnostic::get(SM, Expr, "missing argument");
5995ffd940aSRaphael Isemann   }
6005ffd940aSRaphael Isemann 
6015ffd940aSRaphael Isemann   if (!Expr.consume_front(")"))
6025ffd940aSRaphael Isemann     return ErrorDiagnostic::get(SM, Expr,
6035ffd940aSRaphael Isemann                                 "missing ')' at end of call expression");
6045ffd940aSRaphael Isemann 
6055ffd940aSRaphael Isemann   const unsigned NumArgs = Args.size();
6065ffd940aSRaphael Isemann   if (NumArgs == 2)
6075ffd940aSRaphael Isemann     return std::make_unique<BinaryOperation>(Expr, *OptFunc, std::move(Args[0]),
6085ffd940aSRaphael Isemann                                              std::move(Args[1]));
6095ffd940aSRaphael Isemann 
6105ffd940aSRaphael Isemann   // TODO: Support more than binop_eval_t.
6115ffd940aSRaphael Isemann   return ErrorDiagnostic::get(SM, FuncName,
6125ffd940aSRaphael Isemann                               Twine("function '") + FuncName +
6135ffd940aSRaphael Isemann                                   Twine("' takes 2 arguments but ") +
6145ffd940aSRaphael Isemann                                   Twine(NumArgs) + " given");
6155ffd940aSRaphael Isemann }
6165ffd940aSRaphael Isemann 
6175ffd940aSRaphael Isemann Expected<std::unique_ptr<Expression>> Pattern::parseNumericSubstitutionBlock(
61894081642SFangrui Song     StringRef Expr, std::optional<NumericVariable *> &DefinedNumericVariable,
61994081642SFangrui Song     bool IsLegacyLineExpr, std::optional<size_t> LineNumber,
6205ffd940aSRaphael Isemann     FileCheckPatternContext *Context, const SourceMgr &SM) {
6215ffd940aSRaphael Isemann   std::unique_ptr<ExpressionAST> ExpressionASTPointer = nullptr;
6225ffd940aSRaphael Isemann   StringRef DefExpr = StringRef();
623aadaafacSKazu Hirata   DefinedNumericVariable = std::nullopt;
6245ffd940aSRaphael Isemann   ExpressionFormat ExplicitFormat = ExpressionFormat();
6255ffd940aSRaphael Isemann   unsigned Precision = 0;
6265ffd940aSRaphael Isemann 
627d4a01549SJay Foad   // Parse format specifier (NOTE: ',' is also an argument separator).
6285ffd940aSRaphael Isemann   size_t FormatSpecEnd = Expr.find(',');
6295ffd940aSRaphael Isemann   size_t FunctionStart = Expr.find('(');
6305ffd940aSRaphael Isemann   if (FormatSpecEnd != StringRef::npos && FormatSpecEnd < FunctionStart) {
6315ffd940aSRaphael Isemann     StringRef FormatExpr = Expr.take_front(FormatSpecEnd);
6325ffd940aSRaphael Isemann     Expr = Expr.drop_front(FormatSpecEnd + 1);
6335ffd940aSRaphael Isemann     FormatExpr = FormatExpr.trim(SpaceChars);
6345ffd940aSRaphael Isemann     if (!FormatExpr.consume_front("%"))
6355ffd940aSRaphael Isemann       return ErrorDiagnostic::get(
6365ffd940aSRaphael Isemann           SM, FormatExpr,
6375ffd940aSRaphael Isemann           "invalid matching format specification in expression");
6385ffd940aSRaphael Isemann 
639f9e2a62cSThomas Preud'homme     // Parse alternate form flag.
640f9e2a62cSThomas Preud'homme     SMLoc AlternateFormFlagLoc = SMLoc::getFromPointer(FormatExpr.data());
641f9e2a62cSThomas Preud'homme     bool AlternateForm = FormatExpr.consume_front("#");
642f9e2a62cSThomas Preud'homme 
6435ffd940aSRaphael Isemann     // Parse precision.
6445ffd940aSRaphael Isemann     if (FormatExpr.consume_front(".")) {
6455ffd940aSRaphael Isemann       if (FormatExpr.consumeInteger(10, Precision))
6465ffd940aSRaphael Isemann         return ErrorDiagnostic::get(SM, FormatExpr,
6475ffd940aSRaphael Isemann                                     "invalid precision in format specifier");
6485ffd940aSRaphael Isemann     }
6495ffd940aSRaphael Isemann 
6505ffd940aSRaphael Isemann     if (!FormatExpr.empty()) {
6515ffd940aSRaphael Isemann       // Check for unknown matching format specifier and set matching format in
6525ffd940aSRaphael Isemann       // class instance representing this expression.
6535ffd940aSRaphael Isemann       SMLoc FmtLoc = SMLoc::getFromPointer(FormatExpr.data());
6545ffd940aSRaphael Isemann       switch (popFront(FormatExpr)) {
6555ffd940aSRaphael Isemann       case 'u':
6565ffd940aSRaphael Isemann         ExplicitFormat =
6575ffd940aSRaphael Isemann             ExpressionFormat(ExpressionFormat::Kind::Unsigned, Precision);
6585ffd940aSRaphael Isemann         break;
6595ffd940aSRaphael Isemann       case 'd':
6605ffd940aSRaphael Isemann         ExplicitFormat =
6615ffd940aSRaphael Isemann             ExpressionFormat(ExpressionFormat::Kind::Signed, Precision);
6625ffd940aSRaphael Isemann         break;
6635ffd940aSRaphael Isemann       case 'x':
664f9e2a62cSThomas Preud'homme         ExplicitFormat = ExpressionFormat(ExpressionFormat::Kind::HexLower,
665f9e2a62cSThomas Preud'homme                                           Precision, AlternateForm);
6665ffd940aSRaphael Isemann         break;
6675ffd940aSRaphael Isemann       case 'X':
668f9e2a62cSThomas Preud'homme         ExplicitFormat = ExpressionFormat(ExpressionFormat::Kind::HexUpper,
669f9e2a62cSThomas Preud'homme                                           Precision, AlternateForm);
6705ffd940aSRaphael Isemann         break;
6715ffd940aSRaphael Isemann       default:
6725ffd940aSRaphael Isemann         return ErrorDiagnostic::get(SM, FmtLoc,
6735ffd940aSRaphael Isemann                                     "invalid format specifier in expression");
6745ffd940aSRaphael Isemann       }
6755ffd940aSRaphael Isemann     }
6765ffd940aSRaphael Isemann 
677f9e2a62cSThomas Preud'homme     if (AlternateForm && ExplicitFormat != ExpressionFormat::Kind::HexLower &&
678f9e2a62cSThomas Preud'homme         ExplicitFormat != ExpressionFormat::Kind::HexUpper)
679f9e2a62cSThomas Preud'homme       return ErrorDiagnostic::get(
680f9e2a62cSThomas Preud'homme           SM, AlternateFormFlagLoc,
681f9e2a62cSThomas Preud'homme           "alternate form only supported for hex values");
682f9e2a62cSThomas Preud'homme 
6835ffd940aSRaphael Isemann     FormatExpr = FormatExpr.ltrim(SpaceChars);
6845ffd940aSRaphael Isemann     if (!FormatExpr.empty())
6855ffd940aSRaphael Isemann       return ErrorDiagnostic::get(
6865ffd940aSRaphael Isemann           SM, FormatExpr,
6875ffd940aSRaphael Isemann           "invalid matching format specification in expression");
6885ffd940aSRaphael Isemann   }
6895ffd940aSRaphael Isemann 
6905ffd940aSRaphael Isemann   // Save variable definition expression if any.
6915ffd940aSRaphael Isemann   size_t DefEnd = Expr.find(':');
6925ffd940aSRaphael Isemann   if (DefEnd != StringRef::npos) {
6935ffd940aSRaphael Isemann     DefExpr = Expr.substr(0, DefEnd);
6945ffd940aSRaphael Isemann     Expr = Expr.substr(DefEnd + 1);
6955ffd940aSRaphael Isemann   }
6965ffd940aSRaphael Isemann 
6975ffd940aSRaphael Isemann   // Parse matching constraint.
6985ffd940aSRaphael Isemann   Expr = Expr.ltrim(SpaceChars);
699e7d3a4f3SKazu Hirata   bool HasParsedValidConstraint = Expr.consume_front("==");
7005ffd940aSRaphael Isemann 
7015ffd940aSRaphael Isemann   // Parse the expression itself.
7025ffd940aSRaphael Isemann   Expr = Expr.ltrim(SpaceChars);
7035ffd940aSRaphael Isemann   if (Expr.empty()) {
7045ffd940aSRaphael Isemann     if (HasParsedValidConstraint)
7055ffd940aSRaphael Isemann       return ErrorDiagnostic::get(
7065ffd940aSRaphael Isemann           SM, Expr, "empty numeric expression should not have a constraint");
7075ffd940aSRaphael Isemann   } else {
7085ffd940aSRaphael Isemann     Expr = Expr.rtrim(SpaceChars);
7095ffd940aSRaphael Isemann     StringRef OuterBinOpExpr = Expr;
7105ffd940aSRaphael Isemann     // The first operand in a legacy @LINE expression is always the @LINE
7115ffd940aSRaphael Isemann     // pseudo variable.
7125ffd940aSRaphael Isemann     AllowedOperand AO =
7135ffd940aSRaphael Isemann         IsLegacyLineExpr ? AllowedOperand::LineVar : AllowedOperand::Any;
7145ffd940aSRaphael Isemann     Expected<std::unique_ptr<ExpressionAST>> ParseResult = parseNumericOperand(
7155ffd940aSRaphael Isemann         Expr, AO, !HasParsedValidConstraint, LineNumber, Context, SM);
7165ffd940aSRaphael Isemann     while (ParseResult && !Expr.empty()) {
7175ffd940aSRaphael Isemann       ParseResult = parseBinop(OuterBinOpExpr, Expr, std::move(*ParseResult),
7185ffd940aSRaphael Isemann                                IsLegacyLineExpr, LineNumber, Context, SM);
7195ffd940aSRaphael Isemann       // Legacy @LINE expressions only allow 2 operands.
7205ffd940aSRaphael Isemann       if (ParseResult && IsLegacyLineExpr && !Expr.empty())
7215ffd940aSRaphael Isemann         return ErrorDiagnostic::get(
7225ffd940aSRaphael Isemann             SM, Expr,
7235ffd940aSRaphael Isemann             "unexpected characters at end of expression '" + Expr + "'");
7245ffd940aSRaphael Isemann     }
7255ffd940aSRaphael Isemann     if (!ParseResult)
7265ffd940aSRaphael Isemann       return ParseResult.takeError();
7275ffd940aSRaphael Isemann     ExpressionASTPointer = std::move(*ParseResult);
7285ffd940aSRaphael Isemann   }
7295ffd940aSRaphael Isemann 
7305ffd940aSRaphael Isemann   // Select format of the expression, i.e. (i) its explicit format, if any,
7315ffd940aSRaphael Isemann   // otherwise (ii) its implicit format, if any, otherwise (iii) the default
7325ffd940aSRaphael Isemann   // format (unsigned). Error out in case of conflicting implicit format
7335ffd940aSRaphael Isemann   // without explicit format.
7345ffd940aSRaphael Isemann   ExpressionFormat Format;
7355ffd940aSRaphael Isemann   if (ExplicitFormat)
7365ffd940aSRaphael Isemann     Format = ExplicitFormat;
7375ffd940aSRaphael Isemann   else if (ExpressionASTPointer) {
7385ffd940aSRaphael Isemann     Expected<ExpressionFormat> ImplicitFormat =
7395ffd940aSRaphael Isemann         ExpressionASTPointer->getImplicitFormat(SM);
7405ffd940aSRaphael Isemann     if (!ImplicitFormat)
7415ffd940aSRaphael Isemann       return ImplicitFormat.takeError();
7425ffd940aSRaphael Isemann     Format = *ImplicitFormat;
7435ffd940aSRaphael Isemann   }
7445ffd940aSRaphael Isemann   if (!Format)
7455ffd940aSRaphael Isemann     Format = ExpressionFormat(ExpressionFormat::Kind::Unsigned, Precision);
7465ffd940aSRaphael Isemann 
7475ffd940aSRaphael Isemann   std::unique_ptr<Expression> ExpressionPointer =
7485ffd940aSRaphael Isemann       std::make_unique<Expression>(std::move(ExpressionASTPointer), Format);
7495ffd940aSRaphael Isemann 
7505ffd940aSRaphael Isemann   // Parse the numeric variable definition.
7515ffd940aSRaphael Isemann   if (DefEnd != StringRef::npos) {
7525ffd940aSRaphael Isemann     DefExpr = DefExpr.ltrim(SpaceChars);
7535ffd940aSRaphael Isemann     Expected<NumericVariable *> ParseResult = parseNumericVariableDefinition(
7545ffd940aSRaphael Isemann         DefExpr, Context, LineNumber, ExpressionPointer->getFormat(), SM);
7555ffd940aSRaphael Isemann 
7565ffd940aSRaphael Isemann     if (!ParseResult)
7575ffd940aSRaphael Isemann       return ParseResult.takeError();
7585ffd940aSRaphael Isemann     DefinedNumericVariable = *ParseResult;
7595ffd940aSRaphael Isemann   }
7605ffd940aSRaphael Isemann 
7615ffd940aSRaphael Isemann   return std::move(ExpressionPointer);
7625ffd940aSRaphael Isemann }
7635ffd940aSRaphael Isemann 
7645ffd940aSRaphael Isemann bool Pattern::parsePattern(StringRef PatternStr, StringRef Prefix,
7655ffd940aSRaphael Isemann                            SourceMgr &SM, const FileCheckRequest &Req) {
7665ffd940aSRaphael Isemann   bool MatchFullLinesHere = Req.MatchFullLines && CheckTy != Check::CheckNot;
7675ffd940aSRaphael Isemann   IgnoreCase = Req.IgnoreCase;
7685ffd940aSRaphael Isemann 
7695ffd940aSRaphael Isemann   PatternLoc = SMLoc::getFromPointer(PatternStr.data());
7705ffd940aSRaphael Isemann 
7715ffd940aSRaphael Isemann   if (!(Req.NoCanonicalizeWhiteSpace && Req.MatchFullLines))
7725ffd940aSRaphael Isemann     // Ignore trailing whitespace.
7733be989e8SKazu Hirata     PatternStr = PatternStr.rtrim(" \t");
7745ffd940aSRaphael Isemann 
7755ffd940aSRaphael Isemann   // Check that there is something on the line.
7765ffd940aSRaphael Isemann   if (PatternStr.empty() && CheckTy != Check::CheckEmpty) {
7775ffd940aSRaphael Isemann     SM.PrintMessage(PatternLoc, SourceMgr::DK_Error,
7785ffd940aSRaphael Isemann                     "found empty check string with prefix '" + Prefix + ":'");
7795ffd940aSRaphael Isemann     return true;
7805ffd940aSRaphael Isemann   }
7815ffd940aSRaphael Isemann 
7825ffd940aSRaphael Isemann   if (!PatternStr.empty() && CheckTy == Check::CheckEmpty) {
7835ffd940aSRaphael Isemann     SM.PrintMessage(
7845ffd940aSRaphael Isemann         PatternLoc, SourceMgr::DK_Error,
7855ffd940aSRaphael Isemann         "found non-empty check string for empty check with prefix '" + Prefix +
7865ffd940aSRaphael Isemann             ":'");
7875ffd940aSRaphael Isemann     return true;
7885ffd940aSRaphael Isemann   }
7895ffd940aSRaphael Isemann 
7905ffd940aSRaphael Isemann   if (CheckTy == Check::CheckEmpty) {
7915ffd940aSRaphael Isemann     RegExStr = "(\n$)";
7925ffd940aSRaphael Isemann     return false;
7935ffd940aSRaphael Isemann   }
7945ffd940aSRaphael Isemann 
79544f399ccSJacques Pienaar   // If literal check, set fixed string.
79644f399ccSJacques Pienaar   if (CheckTy.isLiteralMatch()) {
79744f399ccSJacques Pienaar     FixedStr = PatternStr;
79844f399ccSJacques Pienaar     return false;
79944f399ccSJacques Pienaar   }
80044f399ccSJacques Pienaar 
8015ffd940aSRaphael Isemann   // Check to see if this is a fixed string, or if it has regex pieces.
8025ffd940aSRaphael Isemann   if (!MatchFullLinesHere &&
803d14d7068SKazu Hirata       (PatternStr.size() < 2 ||
804d14d7068SKazu Hirata        (!PatternStr.contains("{{") && !PatternStr.contains("[[")))) {
8055ffd940aSRaphael Isemann     FixedStr = PatternStr;
8065ffd940aSRaphael Isemann     return false;
8075ffd940aSRaphael Isemann   }
8085ffd940aSRaphael Isemann 
8095ffd940aSRaphael Isemann   if (MatchFullLinesHere) {
8105ffd940aSRaphael Isemann     RegExStr += '^';
8115ffd940aSRaphael Isemann     if (!Req.NoCanonicalizeWhiteSpace)
8125ffd940aSRaphael Isemann       RegExStr += " *";
8135ffd940aSRaphael Isemann   }
8145ffd940aSRaphael Isemann 
8155ffd940aSRaphael Isemann   // Paren value #0 is for the fully matched string.  Any new parenthesized
8165ffd940aSRaphael Isemann   // values add from there.
8175ffd940aSRaphael Isemann   unsigned CurParen = 1;
8185ffd940aSRaphael Isemann 
8195ffd940aSRaphael Isemann   // Otherwise, there is at least one regex piece.  Build up the regex pattern
8205ffd940aSRaphael Isemann   // by escaping scary characters in fixed strings, building up one big regex.
8215ffd940aSRaphael Isemann   while (!PatternStr.empty()) {
8225ffd940aSRaphael Isemann     // RegEx matches.
823586ecdf2SKazu Hirata     if (PatternStr.starts_with("{{")) {
8245ffd940aSRaphael Isemann       // This is the start of a regex match.  Scan for the }}.
8255ffd940aSRaphael Isemann       size_t End = PatternStr.find("}}");
8265ffd940aSRaphael Isemann       if (End == StringRef::npos) {
8275ffd940aSRaphael Isemann         SM.PrintMessage(SMLoc::getFromPointer(PatternStr.data()),
8285ffd940aSRaphael Isemann                         SourceMgr::DK_Error,
8295ffd940aSRaphael Isemann                         "found start of regex string with no end '}}'");
8305ffd940aSRaphael Isemann         return true;
8315ffd940aSRaphael Isemann       }
8325ffd940aSRaphael Isemann 
8335ffd940aSRaphael Isemann       // Enclose {{}} patterns in parens just like [[]] even though we're not
8345ffd940aSRaphael Isemann       // capturing the result for any purpose.  This is required in case the
8355ffd940aSRaphael Isemann       // expression contains an alternation like: CHECK:  abc{{x|z}}def.  We
8365ffd940aSRaphael Isemann       // want this to turn into: "abc(x|z)def" not "abcx|zdef".
837a3eeef82SNikita Popov       bool HasAlternation = PatternStr.contains('|');
838a3eeef82SNikita Popov       if (HasAlternation) {
8395ffd940aSRaphael Isemann         RegExStr += '(';
8405ffd940aSRaphael Isemann         ++CurParen;
841a3eeef82SNikita Popov       }
8425ffd940aSRaphael Isemann 
8435ffd940aSRaphael Isemann       if (AddRegExToRegEx(PatternStr.substr(2, End - 2), CurParen, SM))
8445ffd940aSRaphael Isemann         return true;
845a3eeef82SNikita Popov       if (HasAlternation)
8465ffd940aSRaphael Isemann         RegExStr += ')';
8475ffd940aSRaphael Isemann 
8485ffd940aSRaphael Isemann       PatternStr = PatternStr.substr(End + 2);
8495ffd940aSRaphael Isemann       continue;
8505ffd940aSRaphael Isemann     }
8515ffd940aSRaphael Isemann 
8525ffd940aSRaphael Isemann     // String and numeric substitution blocks. Pattern substitution blocks come
8535ffd940aSRaphael Isemann     // in two forms: [[foo:.*]] and [[foo]]. The former matches .* (or some
8545ffd940aSRaphael Isemann     // other regex) and assigns it to the string variable 'foo'. The latter
8555ffd940aSRaphael Isemann     // substitutes foo's value. Numeric substitution blocks recognize the same
8565ffd940aSRaphael Isemann     // form as string ones, but start with a '#' sign after the double
8575ffd940aSRaphael Isemann     // brackets. They also accept a combined form which sets a numeric variable
8585ffd940aSRaphael Isemann     // to the evaluation of an expression. Both string and numeric variable
8595ffd940aSRaphael Isemann     // names must satisfy the regular expression "[a-zA-Z_][0-9a-zA-Z_]*" to be
860821dd3b0SJay Foad     // valid, as this helps catch some common errors. If there are extra '['s
861821dd3b0SJay Foad     // before the "[[", treat them literally.
862586ecdf2SKazu Hirata     if (PatternStr.starts_with("[[") && !PatternStr.starts_with("[[[")) {
8635ffd940aSRaphael Isemann       StringRef UnparsedPatternStr = PatternStr.substr(2);
8645ffd940aSRaphael Isemann       // Find the closing bracket pair ending the match.  End is going to be an
8655ffd940aSRaphael Isemann       // offset relative to the beginning of the match string.
8665ffd940aSRaphael Isemann       size_t End = FindRegexVarEnd(UnparsedPatternStr, SM);
8675ffd940aSRaphael Isemann       StringRef MatchStr = UnparsedPatternStr.substr(0, End);
8685ffd940aSRaphael Isemann       bool IsNumBlock = MatchStr.consume_front("#");
8695ffd940aSRaphael Isemann 
8705ffd940aSRaphael Isemann       if (End == StringRef::npos) {
8715ffd940aSRaphael Isemann         SM.PrintMessage(SMLoc::getFromPointer(PatternStr.data()),
8725ffd940aSRaphael Isemann                         SourceMgr::DK_Error,
8735ffd940aSRaphael Isemann                         "Invalid substitution block, no ]] found");
8745ffd940aSRaphael Isemann         return true;
8755ffd940aSRaphael Isemann       }
8765ffd940aSRaphael Isemann       // Strip the substitution block we are parsing. End points to the start
8775ffd940aSRaphael Isemann       // of the "]]" closing the expression so account for it in computing the
8785ffd940aSRaphael Isemann       // index of the first unparsed character.
8795ffd940aSRaphael Isemann       PatternStr = UnparsedPatternStr.substr(End + 2);
8805ffd940aSRaphael Isemann 
8815ffd940aSRaphael Isemann       bool IsDefinition = false;
8825ffd940aSRaphael Isemann       bool SubstNeeded = false;
8835ffd940aSRaphael Isemann       // Whether the substitution block is a legacy use of @LINE with string
8845ffd940aSRaphael Isemann       // substitution block syntax.
8855ffd940aSRaphael Isemann       bool IsLegacyLineExpr = false;
8865ffd940aSRaphael Isemann       StringRef DefName;
8875ffd940aSRaphael Isemann       StringRef SubstStr;
888a3d357e5SFlorian Hahn       StringRef MatchRegexp;
889a3d357e5SFlorian Hahn       std::string WildcardRegexp;
8905ffd940aSRaphael Isemann       size_t SubstInsertIdx = RegExStr.size();
8915ffd940aSRaphael Isemann 
8925ffd940aSRaphael Isemann       // Parse string variable or legacy @LINE expression.
8935ffd940aSRaphael Isemann       if (!IsNumBlock) {
894c70f3686SFangrui Song         size_t VarEndIdx = MatchStr.find(':');
8955ffd940aSRaphael Isemann         size_t SpacePos = MatchStr.substr(0, VarEndIdx).find_first_of(" \t");
8965ffd940aSRaphael Isemann         if (SpacePos != StringRef::npos) {
8975ffd940aSRaphael Isemann           SM.PrintMessage(SMLoc::getFromPointer(MatchStr.data() + SpacePos),
8985ffd940aSRaphael Isemann                           SourceMgr::DK_Error, "unexpected whitespace");
8995ffd940aSRaphael Isemann           return true;
9005ffd940aSRaphael Isemann         }
9015ffd940aSRaphael Isemann 
9025ffd940aSRaphael Isemann         // Get the name (e.g. "foo") and verify it is well formed.
9035ffd940aSRaphael Isemann         StringRef OrigMatchStr = MatchStr;
9045ffd940aSRaphael Isemann         Expected<Pattern::VariableProperties> ParseVarResult =
9055ffd940aSRaphael Isemann             parseVariable(MatchStr, SM);
9065ffd940aSRaphael Isemann         if (!ParseVarResult) {
9075ffd940aSRaphael Isemann           logAllUnhandledErrors(ParseVarResult.takeError(), errs());
9085ffd940aSRaphael Isemann           return true;
9095ffd940aSRaphael Isemann         }
9105ffd940aSRaphael Isemann         StringRef Name = ParseVarResult->Name;
9115ffd940aSRaphael Isemann         bool IsPseudo = ParseVarResult->IsPseudo;
9125ffd940aSRaphael Isemann 
9135ffd940aSRaphael Isemann         IsDefinition = (VarEndIdx != StringRef::npos);
9145ffd940aSRaphael Isemann         SubstNeeded = !IsDefinition;
9155ffd940aSRaphael Isemann         if (IsDefinition) {
9165ffd940aSRaphael Isemann           if ((IsPseudo || !MatchStr.consume_front(":"))) {
9175ffd940aSRaphael Isemann             SM.PrintMessage(SMLoc::getFromPointer(Name.data()),
9185ffd940aSRaphael Isemann                             SourceMgr::DK_Error,
9195ffd940aSRaphael Isemann                             "invalid name in string variable definition");
9205ffd940aSRaphael Isemann             return true;
9215ffd940aSRaphael Isemann           }
9225ffd940aSRaphael Isemann 
9235ffd940aSRaphael Isemann           // Detect collisions between string and numeric variables when the
9245ffd940aSRaphael Isemann           // former is created later than the latter.
925b595eb83SKazu Hirata           if (Context->GlobalNumericVariableTable.contains(Name)) {
9265ffd940aSRaphael Isemann             SM.PrintMessage(
9275ffd940aSRaphael Isemann                 SMLoc::getFromPointer(Name.data()), SourceMgr::DK_Error,
9285ffd940aSRaphael Isemann                 "numeric variable with name '" + Name + "' already exists");
9295ffd940aSRaphael Isemann             return true;
9305ffd940aSRaphael Isemann           }
9315ffd940aSRaphael Isemann           DefName = Name;
932a3d357e5SFlorian Hahn           MatchRegexp = MatchStr;
9335ffd940aSRaphael Isemann         } else {
9345ffd940aSRaphael Isemann           if (IsPseudo) {
9355ffd940aSRaphael Isemann             MatchStr = OrigMatchStr;
9365ffd940aSRaphael Isemann             IsLegacyLineExpr = IsNumBlock = true;
937058455ffSThomas Preud'homme           } else {
938058455ffSThomas Preud'homme             if (!MatchStr.empty()) {
939058455ffSThomas Preud'homme               SM.PrintMessage(SMLoc::getFromPointer(Name.data()),
940058455ffSThomas Preud'homme                               SourceMgr::DK_Error,
941058455ffSThomas Preud'homme                               "invalid name in string variable use");
942058455ffSThomas Preud'homme               return true;
943058455ffSThomas Preud'homme             }
9445ffd940aSRaphael Isemann             SubstStr = Name;
9455ffd940aSRaphael Isemann           }
9465ffd940aSRaphael Isemann         }
947058455ffSThomas Preud'homme       }
9485ffd940aSRaphael Isemann 
9495ffd940aSRaphael Isemann       // Parse numeric substitution block.
9505ffd940aSRaphael Isemann       std::unique_ptr<Expression> ExpressionPointer;
95194081642SFangrui Song       std::optional<NumericVariable *> DefinedNumericVariable;
9525ffd940aSRaphael Isemann       if (IsNumBlock) {
9535ffd940aSRaphael Isemann         Expected<std::unique_ptr<Expression>> ParseResult =
9545ffd940aSRaphael Isemann             parseNumericSubstitutionBlock(MatchStr, DefinedNumericVariable,
9555ffd940aSRaphael Isemann                                           IsLegacyLineExpr, LineNumber, Context,
9565ffd940aSRaphael Isemann                                           SM);
9575ffd940aSRaphael Isemann         if (!ParseResult) {
9585ffd940aSRaphael Isemann           logAllUnhandledErrors(ParseResult.takeError(), errs());
9595ffd940aSRaphael Isemann           return true;
9605ffd940aSRaphael Isemann         }
9615ffd940aSRaphael Isemann         ExpressionPointer = std::move(*ParseResult);
9625ffd940aSRaphael Isemann         SubstNeeded = ExpressionPointer->getAST() != nullptr;
9635ffd940aSRaphael Isemann         if (DefinedNumericVariable) {
9645ffd940aSRaphael Isemann           IsDefinition = true;
9655ffd940aSRaphael Isemann           DefName = (*DefinedNumericVariable)->getName();
9665ffd940aSRaphael Isemann         }
9675ffd940aSRaphael Isemann         if (SubstNeeded)
9685ffd940aSRaphael Isemann           SubstStr = MatchStr;
9695ffd940aSRaphael Isemann         else {
9705ffd940aSRaphael Isemann           ExpressionFormat Format = ExpressionPointer->getFormat();
971a3d357e5SFlorian Hahn           WildcardRegexp = cantFail(Format.getWildcardRegex());
972a3d357e5SFlorian Hahn           MatchRegexp = WildcardRegexp;
9735ffd940aSRaphael Isemann         }
9745ffd940aSRaphael Isemann       }
9755ffd940aSRaphael Isemann 
9765ffd940aSRaphael Isemann       // Handle variable definition: [[<def>:(...)]] and [[#(...)<def>:(...)]].
9775ffd940aSRaphael Isemann       if (IsDefinition) {
9785ffd940aSRaphael Isemann         RegExStr += '(';
9795ffd940aSRaphael Isemann         ++SubstInsertIdx;
9805ffd940aSRaphael Isemann 
9815ffd940aSRaphael Isemann         if (IsNumBlock) {
9825ffd940aSRaphael Isemann           NumericVariableMatch NumericVariableDefinition = {
9835ffd940aSRaphael Isemann               *DefinedNumericVariable, CurParen};
9845ffd940aSRaphael Isemann           NumericVariableDefs[DefName] = NumericVariableDefinition;
9855ffd940aSRaphael Isemann           // This store is done here rather than in match() to allow
9865ffd940aSRaphael Isemann           // parseNumericVariableUse() to get the pointer to the class instance
9875ffd940aSRaphael Isemann           // of the right variable definition corresponding to a given numeric
9885ffd940aSRaphael Isemann           // variable use.
9895ffd940aSRaphael Isemann           Context->GlobalNumericVariableTable[DefName] =
9905ffd940aSRaphael Isemann               *DefinedNumericVariable;
9915ffd940aSRaphael Isemann         } else {
9925ffd940aSRaphael Isemann           VariableDefs[DefName] = CurParen;
9935ffd940aSRaphael Isemann           // Mark string variable as defined to detect collisions between
9945ffd940aSRaphael Isemann           // string and numeric variables in parseNumericVariableUse() and
9955ffd940aSRaphael Isemann           // defineCmdlineVariables() when the latter is created later than the
9965ffd940aSRaphael Isemann           // former. We cannot reuse GlobalVariableTable for this by populating
9975ffd940aSRaphael Isemann           // it with an empty string since we would then lose the ability to
9985ffd940aSRaphael Isemann           // detect the use of an undefined variable in match().
9995ffd940aSRaphael Isemann           Context->DefinedVariableTable[DefName] = true;
10005ffd940aSRaphael Isemann         }
10015ffd940aSRaphael Isemann 
10025ffd940aSRaphael Isemann         ++CurParen;
10035ffd940aSRaphael Isemann       }
10045ffd940aSRaphael Isemann 
10055ffd940aSRaphael Isemann       if (!MatchRegexp.empty() && AddRegExToRegEx(MatchRegexp, CurParen, SM))
10065ffd940aSRaphael Isemann         return true;
10075ffd940aSRaphael Isemann 
10085ffd940aSRaphael Isemann       if (IsDefinition)
10095ffd940aSRaphael Isemann         RegExStr += ')';
10105ffd940aSRaphael Isemann 
10115ffd940aSRaphael Isemann       // Handle substitutions: [[foo]] and [[#<foo expr>]].
10125ffd940aSRaphael Isemann       if (SubstNeeded) {
10135ffd940aSRaphael Isemann         // Handle substitution of string variables that were defined earlier on
10145ffd940aSRaphael Isemann         // the same line by emitting a backreference. Expressions do not
10155ffd940aSRaphael Isemann         // support substituting a numeric variable defined on the same line.
10165ffd940aSRaphael Isemann         if (!IsNumBlock && VariableDefs.find(SubstStr) != VariableDefs.end()) {
10175ffd940aSRaphael Isemann           unsigned CaptureParenGroup = VariableDefs[SubstStr];
10185ffd940aSRaphael Isemann           if (CaptureParenGroup < 1 || CaptureParenGroup > 9) {
10195ffd940aSRaphael Isemann             SM.PrintMessage(SMLoc::getFromPointer(SubstStr.data()),
10205ffd940aSRaphael Isemann                             SourceMgr::DK_Error,
10215ffd940aSRaphael Isemann                             "Can't back-reference more than 9 variables");
10225ffd940aSRaphael Isemann             return true;
10235ffd940aSRaphael Isemann           }
10245ffd940aSRaphael Isemann           AddBackrefToRegEx(CaptureParenGroup);
10255ffd940aSRaphael Isemann         } else {
10265ffd940aSRaphael Isemann           // Handle substitution of string variables ([[<var>]]) defined in
10275ffd940aSRaphael Isemann           // previous CHECK patterns, and substitution of expressions.
10285ffd940aSRaphael Isemann           Substitution *Substitution =
10295ffd940aSRaphael Isemann               IsNumBlock
10305ffd940aSRaphael Isemann                   ? Context->makeNumericSubstitution(
10315ffd940aSRaphael Isemann                         SubstStr, std::move(ExpressionPointer), SubstInsertIdx)
10325ffd940aSRaphael Isemann                   : Context->makeStringSubstitution(SubstStr, SubstInsertIdx);
10335ffd940aSRaphael Isemann           Substitutions.push_back(Substitution);
10345ffd940aSRaphael Isemann         }
10355ffd940aSRaphael Isemann       }
1036821dd3b0SJay Foad 
1037821dd3b0SJay Foad       continue;
10385ffd940aSRaphael Isemann     }
10395ffd940aSRaphael Isemann 
10405ffd940aSRaphael Isemann     // Handle fixed string matches.
10415ffd940aSRaphael Isemann     // Find the end, which is the start of the next regex.
1042821dd3b0SJay Foad     size_t FixedMatchEnd =
1043821dd3b0SJay Foad         std::min(PatternStr.find("{{", 1), PatternStr.find("[[", 1));
10445ffd940aSRaphael Isemann     RegExStr += Regex::escape(PatternStr.substr(0, FixedMatchEnd));
10455ffd940aSRaphael Isemann     PatternStr = PatternStr.substr(FixedMatchEnd);
10465ffd940aSRaphael Isemann   }
10475ffd940aSRaphael Isemann 
10485ffd940aSRaphael Isemann   if (MatchFullLinesHere) {
10495ffd940aSRaphael Isemann     if (!Req.NoCanonicalizeWhiteSpace)
10505ffd940aSRaphael Isemann       RegExStr += " *";
10515ffd940aSRaphael Isemann     RegExStr += '$';
10525ffd940aSRaphael Isemann   }
10535ffd940aSRaphael Isemann 
10545ffd940aSRaphael Isemann   return false;
10555ffd940aSRaphael Isemann }
10565ffd940aSRaphael Isemann 
10575ffd940aSRaphael Isemann bool Pattern::AddRegExToRegEx(StringRef RS, unsigned &CurParen, SourceMgr &SM) {
10585ffd940aSRaphael Isemann   Regex R(RS);
10595ffd940aSRaphael Isemann   std::string Error;
10605ffd940aSRaphael Isemann   if (!R.isValid(Error)) {
10615ffd940aSRaphael Isemann     SM.PrintMessage(SMLoc::getFromPointer(RS.data()), SourceMgr::DK_Error,
10625ffd940aSRaphael Isemann                     "invalid regex: " + Error);
10635ffd940aSRaphael Isemann     return true;
10645ffd940aSRaphael Isemann   }
10655ffd940aSRaphael Isemann 
10665ffd940aSRaphael Isemann   RegExStr += RS.str();
10675ffd940aSRaphael Isemann   CurParen += R.getNumMatches();
10685ffd940aSRaphael Isemann   return false;
10695ffd940aSRaphael Isemann }
10705ffd940aSRaphael Isemann 
10715ffd940aSRaphael Isemann void Pattern::AddBackrefToRegEx(unsigned BackrefNum) {
10725ffd940aSRaphael Isemann   assert(BackrefNum >= 1 && BackrefNum <= 9 && "Invalid backref number");
10735ffd940aSRaphael Isemann   std::string Backref = std::string("\\") + std::string(1, '0' + BackrefNum);
10745ffd940aSRaphael Isemann   RegExStr += Backref;
10755ffd940aSRaphael Isemann }
10765ffd940aSRaphael Isemann 
1077dd59c132SJoel E. Denny Pattern::MatchResult Pattern::match(StringRef Buffer,
10785ffd940aSRaphael Isemann                                     const SourceMgr &SM) const {
10795ffd940aSRaphael Isemann   // If this is the EOF pattern, match it immediately.
1080dd59c132SJoel E. Denny   if (CheckTy == Check::CheckEOF)
1081dd59c132SJoel E. Denny     return MatchResult(Buffer.size(), 0, Error::success());
10825ffd940aSRaphael Isemann 
10835ffd940aSRaphael Isemann   // If this is a fixed string pattern, just match it now.
10845ffd940aSRaphael Isemann   if (!FixedStr.empty()) {
10855ffd940aSRaphael Isemann     size_t Pos =
108642f74e82SMartin Storsjö         IgnoreCase ? Buffer.find_insensitive(FixedStr) : Buffer.find(FixedStr);
10875ffd940aSRaphael Isemann     if (Pos == StringRef::npos)
10885ffd940aSRaphael Isemann       return make_error<NotFoundError>();
1089dd59c132SJoel E. Denny     return MatchResult(Pos, /*MatchLen=*/FixedStr.size(), Error::success());
10905ffd940aSRaphael Isemann   }
10915ffd940aSRaphael Isemann 
10925ffd940aSRaphael Isemann   // Regex match.
10935ffd940aSRaphael Isemann 
10945ffd940aSRaphael Isemann   // If there are substitutions, we need to create a temporary string with the
10955ffd940aSRaphael Isemann   // actual value.
10965ffd940aSRaphael Isemann   StringRef RegExToMatch = RegExStr;
10975ffd940aSRaphael Isemann   std::string TmpStr;
10985ffd940aSRaphael Isemann   if (!Substitutions.empty()) {
10995ffd940aSRaphael Isemann     TmpStr = RegExStr;
11005ffd940aSRaphael Isemann     if (LineNumber)
11010726cb00SThomas Preud'homme       Context->LineVariable->setValue(
1102e15e969aSThomas Preud'homme           APInt(sizeof(*LineNumber) * 8, *LineNumber));
11035ffd940aSRaphael Isemann 
11045ffd940aSRaphael Isemann     size_t InsertOffset = 0;
11055ffd940aSRaphael Isemann     // Substitute all string variables and expressions whose values are only
11065ffd940aSRaphael Isemann     // now known. Use of string variables defined on the same line are handled
11075ffd940aSRaphael Isemann     // by back-references.
1108fd941036SThomas Preud'homme     Error Errs = Error::success();
11095ffd940aSRaphael Isemann     for (const auto &Substitution : Substitutions) {
11105ffd940aSRaphael Isemann       // Substitute and check for failure (e.g. use of undefined variable).
11115ffd940aSRaphael Isemann       Expected<std::string> Value = Substitution->getResult();
11125ffd940aSRaphael Isemann       if (!Value) {
11135ffd940aSRaphael Isemann         // Convert to an ErrorDiagnostic to get location information. This is
1114dd59c132SJoel E. Denny         // done here rather than printMatch/printNoMatch since now we know which
11155ffd940aSRaphael Isemann         // substitution block caused the overflow.
1116fd941036SThomas Preud'homme         Errs = joinErrors(std::move(Errs),
1117fd941036SThomas Preud'homme                           handleErrors(
1118fd941036SThomas Preud'homme                               Value.takeError(),
1119fd941036SThomas Preud'homme                               [&](const OverflowError &E) {
1120fd941036SThomas Preud'homme                                 return ErrorDiagnostic::get(
1121fd941036SThomas Preud'homme                                     SM, Substitution->getFromString(),
11225ffd940aSRaphael Isemann                                     "unable to substitute variable or "
11235ffd940aSRaphael Isemann                                     "numeric expression: overflow error");
1124fd941036SThomas Preud'homme                               },
1125fd941036SThomas Preud'homme                               [&SM](const UndefVarError &E) {
1126fd941036SThomas Preud'homme                                 return ErrorDiagnostic::get(SM, E.getVarName(),
1127fd941036SThomas Preud'homme                                                             E.message());
1128fd941036SThomas Preud'homme                               }));
1129fd941036SThomas Preud'homme         continue;
11305ffd940aSRaphael Isemann       }
11315ffd940aSRaphael Isemann 
11325ffd940aSRaphael Isemann       // Plop it into the regex at the adjusted offset.
11335ffd940aSRaphael Isemann       TmpStr.insert(TmpStr.begin() + Substitution->getIndex() + InsertOffset,
11345ffd940aSRaphael Isemann                     Value->begin(), Value->end());
11355ffd940aSRaphael Isemann       InsertOffset += Value->size();
11365ffd940aSRaphael Isemann     }
1137fd941036SThomas Preud'homme     if (Errs)
1138fd941036SThomas Preud'homme       return std::move(Errs);
11395ffd940aSRaphael Isemann 
11405ffd940aSRaphael Isemann     // Match the newly constructed regex.
11415ffd940aSRaphael Isemann     RegExToMatch = TmpStr;
11425ffd940aSRaphael Isemann   }
11435ffd940aSRaphael Isemann 
11445ffd940aSRaphael Isemann   SmallVector<StringRef, 4> MatchInfo;
11455ffd940aSRaphael Isemann   unsigned int Flags = Regex::Newline;
11465ffd940aSRaphael Isemann   if (IgnoreCase)
11475ffd940aSRaphael Isemann     Flags |= Regex::IgnoreCase;
11485ffd940aSRaphael Isemann   if (!Regex(RegExToMatch, Flags).match(Buffer, &MatchInfo))
11495ffd940aSRaphael Isemann     return make_error<NotFoundError>();
11505ffd940aSRaphael Isemann 
11515ffd940aSRaphael Isemann   // Successful regex match.
11525ffd940aSRaphael Isemann   assert(!MatchInfo.empty() && "Didn't get any match");
11535ffd940aSRaphael Isemann   StringRef FullMatch = MatchInfo[0];
11545ffd940aSRaphael Isemann 
11555ffd940aSRaphael Isemann   // If this defines any string variables, remember their values.
11565ffd940aSRaphael Isemann   for (const auto &VariableDef : VariableDefs) {
11575ffd940aSRaphael Isemann     assert(VariableDef.second < MatchInfo.size() && "Internal paren error");
11585ffd940aSRaphael Isemann     Context->GlobalVariableTable[VariableDef.first] =
11595ffd940aSRaphael Isemann         MatchInfo[VariableDef.second];
11605ffd940aSRaphael Isemann   }
11615ffd940aSRaphael Isemann 
1162dd59c132SJoel E. Denny   // Like CHECK-NEXT, CHECK-EMPTY's match range is considered to start after
1163dd59c132SJoel E. Denny   // the required preceding newline, which is consumed by the pattern in the
1164dd59c132SJoel E. Denny   // case of CHECK-EMPTY but not CHECK-NEXT.
1165dd59c132SJoel E. Denny   size_t MatchStartSkip = CheckTy == Check::CheckEmpty;
1166dd59c132SJoel E. Denny   Match TheMatch;
1167dd59c132SJoel E. Denny   TheMatch.Pos = FullMatch.data() - Buffer.data() + MatchStartSkip;
1168dd59c132SJoel E. Denny   TheMatch.Len = FullMatch.size() - MatchStartSkip;
1169dd59c132SJoel E. Denny 
11705ffd940aSRaphael Isemann   // If this defines any numeric variables, remember their values.
11715ffd940aSRaphael Isemann   for (const auto &NumericVariableDef : NumericVariableDefs) {
11725ffd940aSRaphael Isemann     const NumericVariableMatch &NumericVariableMatch =
11735ffd940aSRaphael Isemann         NumericVariableDef.getValue();
11745ffd940aSRaphael Isemann     unsigned CaptureParenGroup = NumericVariableMatch.CaptureParenGroup;
11755ffd940aSRaphael Isemann     assert(CaptureParenGroup < MatchInfo.size() && "Internal paren error");
11765ffd940aSRaphael Isemann     NumericVariable *DefinedNumericVariable =
11775ffd940aSRaphael Isemann         NumericVariableMatch.DefinedNumericVariable;
11785ffd940aSRaphael Isemann 
11795ffd940aSRaphael Isemann     StringRef MatchedValue = MatchInfo[CaptureParenGroup];
11805ffd940aSRaphael Isemann     ExpressionFormat Format = DefinedNumericVariable->getImplicitFormat();
1181b743c193SThomas Preud'homme     APInt Value = Format.valueFromStringRepr(MatchedValue, SM);
1182b743c193SThomas Preud'homme     DefinedNumericVariable->setValue(Value, MatchedValue);
11835ffd940aSRaphael Isemann   }
11845ffd940aSRaphael Isemann 
1185dd59c132SJoel E. Denny   return MatchResult(TheMatch, Error::success());
11865ffd940aSRaphael Isemann }
11875ffd940aSRaphael Isemann 
11885ffd940aSRaphael Isemann unsigned Pattern::computeMatchDistance(StringRef Buffer) const {
11895ffd940aSRaphael Isemann   // Just compute the number of matching characters. For regular expressions, we
11905ffd940aSRaphael Isemann   // just compare against the regex itself and hope for the best.
11915ffd940aSRaphael Isemann   //
11925ffd940aSRaphael Isemann   // FIXME: One easy improvement here is have the regex lib generate a single
11935ffd940aSRaphael Isemann   // example regular expression which matches, and use that as the example
11945ffd940aSRaphael Isemann   // string.
11955ffd940aSRaphael Isemann   StringRef ExampleString(FixedStr);
11965ffd940aSRaphael Isemann   if (ExampleString.empty())
11975ffd940aSRaphael Isemann     ExampleString = RegExStr;
11985ffd940aSRaphael Isemann 
11995ffd940aSRaphael Isemann   // Only compare up to the first line in the buffer, or the string size.
12005ffd940aSRaphael Isemann   StringRef BufferPrefix = Buffer.substr(0, ExampleString.size());
12015ffd940aSRaphael Isemann   BufferPrefix = BufferPrefix.split('\n').first;
12025ffd940aSRaphael Isemann   return BufferPrefix.edit_distance(ExampleString);
12035ffd940aSRaphael Isemann }
12045ffd940aSRaphael Isemann 
12055ffd940aSRaphael Isemann void Pattern::printSubstitutions(const SourceMgr &SM, StringRef Buffer,
12065ffd940aSRaphael Isemann                                  SMRange Range,
12075ffd940aSRaphael Isemann                                  FileCheckDiag::MatchType MatchTy,
12085ffd940aSRaphael Isemann                                  std::vector<FileCheckDiag> *Diags) const {
12095ffd940aSRaphael Isemann   // Print what we know about substitutions.
12105ffd940aSRaphael Isemann   if (!Substitutions.empty()) {
12115ffd940aSRaphael Isemann     for (const auto &Substitution : Substitutions) {
12125ffd940aSRaphael Isemann       SmallString<256> Msg;
12135ffd940aSRaphael Isemann       raw_svector_ostream OS(Msg);
12145ffd940aSRaphael Isemann 
1215fd941036SThomas Preud'homme       Expected<std::string> MatchedValue = Substitution->getResult();
1216fd941036SThomas Preud'homme       // Substitution failures are handled in printNoMatch().
12175ffd940aSRaphael Isemann       if (!MatchedValue) {
1218fd941036SThomas Preud'homme         consumeError(MatchedValue.takeError());
1219f87b4109SJoel E. Denny         continue;
1220fd941036SThomas Preud'homme       }
1221fd941036SThomas Preud'homme 
12225ffd940aSRaphael Isemann       OS << "with \"";
12235ffd940aSRaphael Isemann       OS.write_escaped(Substitution->getFromString()) << "\" equal to \"";
12245ffd940aSRaphael Isemann       OS.write_escaped(*MatchedValue) << "\"";
12255ffd940aSRaphael Isemann 
12265ffd940aSRaphael Isemann       // We report only the start of the match/search range to suggest we are
12275ffd940aSRaphael Isemann       // reporting the substitutions as set at the start of the match/search.
12285ffd940aSRaphael Isemann       // Indicating a non-zero-length range might instead seem to imply that the
12295ffd940aSRaphael Isemann       // substitution matches or was captured from exactly that range.
12305ffd940aSRaphael Isemann       if (Diags)
12315ffd940aSRaphael Isemann         Diags->emplace_back(SM, CheckTy, getLoc(), MatchTy,
12325ffd940aSRaphael Isemann                             SMRange(Range.Start, Range.Start), OS.str());
12335ffd940aSRaphael Isemann       else
12345ffd940aSRaphael Isemann         SM.PrintMessage(Range.Start, SourceMgr::DK_Note, OS.str());
12355ffd940aSRaphael Isemann     }
12365ffd940aSRaphael Isemann   }
12375ffd940aSRaphael Isemann }
12385ffd940aSRaphael Isemann 
12395ffd940aSRaphael Isemann void Pattern::printVariableDefs(const SourceMgr &SM,
12405ffd940aSRaphael Isemann                                 FileCheckDiag::MatchType MatchTy,
12415ffd940aSRaphael Isemann                                 std::vector<FileCheckDiag> *Diags) const {
12425ffd940aSRaphael Isemann   if (VariableDefs.empty() && NumericVariableDefs.empty())
12435ffd940aSRaphael Isemann     return;
12445ffd940aSRaphael Isemann   // Build list of variable captures.
12455ffd940aSRaphael Isemann   struct VarCapture {
12465ffd940aSRaphael Isemann     StringRef Name;
12475ffd940aSRaphael Isemann     SMRange Range;
12485ffd940aSRaphael Isemann   };
12495ffd940aSRaphael Isemann   SmallVector<VarCapture, 2> VarCaptures;
12505ffd940aSRaphael Isemann   for (const auto &VariableDef : VariableDefs) {
12515ffd940aSRaphael Isemann     VarCapture VC;
12525ffd940aSRaphael Isemann     VC.Name = VariableDef.first;
12535ffd940aSRaphael Isemann     StringRef Value = Context->GlobalVariableTable[VC.Name];
12545ffd940aSRaphael Isemann     SMLoc Start = SMLoc::getFromPointer(Value.data());
12555ffd940aSRaphael Isemann     SMLoc End = SMLoc::getFromPointer(Value.data() + Value.size());
12565ffd940aSRaphael Isemann     VC.Range = SMRange(Start, End);
12575ffd940aSRaphael Isemann     VarCaptures.push_back(VC);
12585ffd940aSRaphael Isemann   }
12595ffd940aSRaphael Isemann   for (const auto &VariableDef : NumericVariableDefs) {
12605ffd940aSRaphael Isemann     VarCapture VC;
12615ffd940aSRaphael Isemann     VC.Name = VariableDef.getKey();
126294081642SFangrui Song     std::optional<StringRef> StrValue =
1263dd59c132SJoel E. Denny         VariableDef.getValue().DefinedNumericVariable->getStringValue();
1264dd59c132SJoel E. Denny     if (!StrValue)
1265dd59c132SJoel E. Denny       continue;
1266dd59c132SJoel E. Denny     SMLoc Start = SMLoc::getFromPointer(StrValue->data());
1267dd59c132SJoel E. Denny     SMLoc End = SMLoc::getFromPointer(StrValue->data() + StrValue->size());
12685ffd940aSRaphael Isemann     VC.Range = SMRange(Start, End);
12695ffd940aSRaphael Isemann     VarCaptures.push_back(VC);
12705ffd940aSRaphael Isemann   }
12715ffd940aSRaphael Isemann   // Sort variable captures by the order in which they matched the input.
12725ffd940aSRaphael Isemann   // Ranges shouldn't be overlapping, so we can just compare the start.
1273352fcfc6SKazu Hirata   llvm::sort(VarCaptures, [](const VarCapture &A, const VarCapture &B) {
12743a35bcefSDavid Spickett     if (&A == &B)
12753a35bcefSDavid Spickett       return false;
12765ffd940aSRaphael Isemann     assert(A.Range.Start != B.Range.Start &&
12775ffd940aSRaphael Isemann            "unexpected overlapping variable captures");
12785ffd940aSRaphael Isemann     return A.Range.Start.getPointer() < B.Range.Start.getPointer();
12795ffd940aSRaphael Isemann   });
12805ffd940aSRaphael Isemann   // Create notes for the sorted captures.
12815ffd940aSRaphael Isemann   for (const VarCapture &VC : VarCaptures) {
12825ffd940aSRaphael Isemann     SmallString<256> Msg;
12835ffd940aSRaphael Isemann     raw_svector_ostream OS(Msg);
12845ffd940aSRaphael Isemann     OS << "captured var \"" << VC.Name << "\"";
12855ffd940aSRaphael Isemann     if (Diags)
12865ffd940aSRaphael Isemann       Diags->emplace_back(SM, CheckTy, getLoc(), MatchTy, VC.Range, OS.str());
12875ffd940aSRaphael Isemann     else
12885ffd940aSRaphael Isemann       SM.PrintMessage(VC.Range.Start, SourceMgr::DK_Note, OS.str(), VC.Range);
12895ffd940aSRaphael Isemann   }
12905ffd940aSRaphael Isemann }
12915ffd940aSRaphael Isemann 
12925ffd940aSRaphael Isemann static SMRange ProcessMatchResult(FileCheckDiag::MatchType MatchTy,
12935ffd940aSRaphael Isemann                                   const SourceMgr &SM, SMLoc Loc,
12945ffd940aSRaphael Isemann                                   Check::FileCheckType CheckTy,
12955ffd940aSRaphael Isemann                                   StringRef Buffer, size_t Pos, size_t Len,
12965ffd940aSRaphael Isemann                                   std::vector<FileCheckDiag> *Diags,
12975ffd940aSRaphael Isemann                                   bool AdjustPrevDiags = false) {
12985ffd940aSRaphael Isemann   SMLoc Start = SMLoc::getFromPointer(Buffer.data() + Pos);
12995ffd940aSRaphael Isemann   SMLoc End = SMLoc::getFromPointer(Buffer.data() + Pos + Len);
13005ffd940aSRaphael Isemann   SMRange Range(Start, End);
13015ffd940aSRaphael Isemann   if (Diags) {
13025ffd940aSRaphael Isemann     if (AdjustPrevDiags) {
13035ffd940aSRaphael Isemann       SMLoc CheckLoc = Diags->rbegin()->CheckLoc;
13045ffd940aSRaphael Isemann       for (auto I = Diags->rbegin(), E = Diags->rend();
13055ffd940aSRaphael Isemann            I != E && I->CheckLoc == CheckLoc; ++I)
13065ffd940aSRaphael Isemann         I->MatchTy = MatchTy;
13075ffd940aSRaphael Isemann     } else
13085ffd940aSRaphael Isemann       Diags->emplace_back(SM, CheckTy, Loc, MatchTy, Range);
13095ffd940aSRaphael Isemann   }
13105ffd940aSRaphael Isemann   return Range;
13115ffd940aSRaphael Isemann }
13125ffd940aSRaphael Isemann 
13135ffd940aSRaphael Isemann void Pattern::printFuzzyMatch(const SourceMgr &SM, StringRef Buffer,
13145ffd940aSRaphael Isemann                               std::vector<FileCheckDiag> *Diags) const {
13155ffd940aSRaphael Isemann   // Attempt to find the closest/best fuzzy match.  Usually an error happens
13165ffd940aSRaphael Isemann   // because some string in the output didn't exactly match. In these cases, we
13175ffd940aSRaphael Isemann   // would like to show the user a best guess at what "should have" matched, to
13185ffd940aSRaphael Isemann   // save them having to actually check the input manually.
13195ffd940aSRaphael Isemann   size_t NumLinesForward = 0;
13205ffd940aSRaphael Isemann   size_t Best = StringRef::npos;
13215ffd940aSRaphael Isemann   double BestQuality = 0;
13225ffd940aSRaphael Isemann 
13235ffd940aSRaphael Isemann   // Use an arbitrary 4k limit on how far we will search.
13245ffd940aSRaphael Isemann   for (size_t i = 0, e = std::min(size_t(4096), Buffer.size()); i != e; ++i) {
13255ffd940aSRaphael Isemann     if (Buffer[i] == '\n')
13265ffd940aSRaphael Isemann       ++NumLinesForward;
13275ffd940aSRaphael Isemann 
13285ffd940aSRaphael Isemann     // Patterns have leading whitespace stripped, so skip whitespace when
13295ffd940aSRaphael Isemann     // looking for something which looks like a pattern.
13305ffd940aSRaphael Isemann     if (Buffer[i] == ' ' || Buffer[i] == '\t')
13315ffd940aSRaphael Isemann       continue;
13325ffd940aSRaphael Isemann 
13335ffd940aSRaphael Isemann     // Compute the "quality" of this match as an arbitrary combination of the
13345ffd940aSRaphael Isemann     // match distance and the number of lines skipped to get to this match.
13355ffd940aSRaphael Isemann     unsigned Distance = computeMatchDistance(Buffer.substr(i));
13365ffd940aSRaphael Isemann     double Quality = Distance + (NumLinesForward / 100.);
13375ffd940aSRaphael Isemann 
13385ffd940aSRaphael Isemann     if (Quality < BestQuality || Best == StringRef::npos) {
13395ffd940aSRaphael Isemann       Best = i;
13405ffd940aSRaphael Isemann       BestQuality = Quality;
13415ffd940aSRaphael Isemann     }
13425ffd940aSRaphael Isemann   }
13435ffd940aSRaphael Isemann 
13445ffd940aSRaphael Isemann   // Print the "possible intended match here" line if we found something
13455ffd940aSRaphael Isemann   // reasonable and not equal to what we showed in the "scanning from here"
13465ffd940aSRaphael Isemann   // line.
13475ffd940aSRaphael Isemann   if (Best && Best != StringRef::npos && BestQuality < 50) {
13485ffd940aSRaphael Isemann     SMRange MatchRange =
13495ffd940aSRaphael Isemann         ProcessMatchResult(FileCheckDiag::MatchFuzzy, SM, getLoc(),
13505ffd940aSRaphael Isemann                            getCheckTy(), Buffer, Best, 0, Diags);
13515ffd940aSRaphael Isemann     SM.PrintMessage(MatchRange.Start, SourceMgr::DK_Note,
13525ffd940aSRaphael Isemann                     "possible intended match here");
13535ffd940aSRaphael Isemann 
13545ffd940aSRaphael Isemann     // FIXME: If we wanted to be really friendly we would show why the match
13555ffd940aSRaphael Isemann     // failed, as it can be hard to spot simple one character differences.
13565ffd940aSRaphael Isemann   }
13575ffd940aSRaphael Isemann }
13585ffd940aSRaphael Isemann 
13595ffd940aSRaphael Isemann Expected<StringRef>
13605ffd940aSRaphael Isemann FileCheckPatternContext::getPatternVarValue(StringRef VarName) {
13615ffd940aSRaphael Isemann   auto VarIter = GlobalVariableTable.find(VarName);
13625ffd940aSRaphael Isemann   if (VarIter == GlobalVariableTable.end())
13635ffd940aSRaphael Isemann     return make_error<UndefVarError>(VarName);
13645ffd940aSRaphael Isemann 
13655ffd940aSRaphael Isemann   return VarIter->second;
13665ffd940aSRaphael Isemann }
13675ffd940aSRaphael Isemann 
13685ffd940aSRaphael Isemann template <class... Types>
13695ffd940aSRaphael Isemann NumericVariable *FileCheckPatternContext::makeNumericVariable(Types... args) {
13705ffd940aSRaphael Isemann   NumericVariables.push_back(std::make_unique<NumericVariable>(args...));
13715ffd940aSRaphael Isemann   return NumericVariables.back().get();
13725ffd940aSRaphael Isemann }
13735ffd940aSRaphael Isemann 
13745ffd940aSRaphael Isemann Substitution *
13755ffd940aSRaphael Isemann FileCheckPatternContext::makeStringSubstitution(StringRef VarName,
13765ffd940aSRaphael Isemann                                                 size_t InsertIdx) {
13775ffd940aSRaphael Isemann   Substitutions.push_back(
13785ffd940aSRaphael Isemann       std::make_unique<StringSubstitution>(this, VarName, InsertIdx));
13795ffd940aSRaphael Isemann   return Substitutions.back().get();
13805ffd940aSRaphael Isemann }
13815ffd940aSRaphael Isemann 
13825ffd940aSRaphael Isemann Substitution *FileCheckPatternContext::makeNumericSubstitution(
13835ffd940aSRaphael Isemann     StringRef ExpressionStr, std::unique_ptr<Expression> Expression,
13845ffd940aSRaphael Isemann     size_t InsertIdx) {
13855ffd940aSRaphael Isemann   Substitutions.push_back(std::make_unique<NumericSubstitution>(
13865ffd940aSRaphael Isemann       this, ExpressionStr, std::move(Expression), InsertIdx));
13875ffd940aSRaphael Isemann   return Substitutions.back().get();
13885ffd940aSRaphael Isemann }
13895ffd940aSRaphael Isemann 
13905ffd940aSRaphael Isemann size_t Pattern::FindRegexVarEnd(StringRef Str, SourceMgr &SM) {
13915ffd940aSRaphael Isemann   // Offset keeps track of the current offset within the input Str
13925ffd940aSRaphael Isemann   size_t Offset = 0;
13935ffd940aSRaphael Isemann   // [...] Nesting depth
13945ffd940aSRaphael Isemann   size_t BracketDepth = 0;
13955ffd940aSRaphael Isemann 
13965ffd940aSRaphael Isemann   while (!Str.empty()) {
1397586ecdf2SKazu Hirata     if (Str.starts_with("]]") && BracketDepth == 0)
13985ffd940aSRaphael Isemann       return Offset;
13995ffd940aSRaphael Isemann     if (Str[0] == '\\') {
14005ffd940aSRaphael Isemann       // Backslash escapes the next char within regexes, so skip them both.
14015ffd940aSRaphael Isemann       Str = Str.substr(2);
14025ffd940aSRaphael Isemann       Offset += 2;
14035ffd940aSRaphael Isemann     } else {
14045ffd940aSRaphael Isemann       switch (Str[0]) {
14055ffd940aSRaphael Isemann       default:
14065ffd940aSRaphael Isemann         break;
14075ffd940aSRaphael Isemann       case '[':
14085ffd940aSRaphael Isemann         BracketDepth++;
14095ffd940aSRaphael Isemann         break;
14105ffd940aSRaphael Isemann       case ']':
14115ffd940aSRaphael Isemann         if (BracketDepth == 0) {
14125ffd940aSRaphael Isemann           SM.PrintMessage(SMLoc::getFromPointer(Str.data()),
14135ffd940aSRaphael Isemann                           SourceMgr::DK_Error,
14145ffd940aSRaphael Isemann                           "missing closing \"]\" for regex variable");
14155ffd940aSRaphael Isemann           exit(1);
14165ffd940aSRaphael Isemann         }
14175ffd940aSRaphael Isemann         BracketDepth--;
14185ffd940aSRaphael Isemann         break;
14195ffd940aSRaphael Isemann       }
14205ffd940aSRaphael Isemann       Str = Str.substr(1);
14215ffd940aSRaphael Isemann       Offset++;
14225ffd940aSRaphael Isemann     }
14235ffd940aSRaphael Isemann   }
14245ffd940aSRaphael Isemann 
14255ffd940aSRaphael Isemann   return StringRef::npos;
14265ffd940aSRaphael Isemann }
14275ffd940aSRaphael Isemann 
14285ffd940aSRaphael Isemann StringRef FileCheck::CanonicalizeFile(MemoryBuffer &MB,
14295ffd940aSRaphael Isemann                                       SmallVectorImpl<char> &OutputBuffer) {
14305ffd940aSRaphael Isemann   OutputBuffer.reserve(MB.getBufferSize());
14315ffd940aSRaphael Isemann 
14325ffd940aSRaphael Isemann   for (const char *Ptr = MB.getBufferStart(), *End = MB.getBufferEnd();
14335ffd940aSRaphael Isemann        Ptr != End; ++Ptr) {
14345ffd940aSRaphael Isemann     // Eliminate trailing dosish \r.
14355ffd940aSRaphael Isemann     if (Ptr <= End - 2 && Ptr[0] == '\r' && Ptr[1] == '\n') {
14365ffd940aSRaphael Isemann       continue;
14375ffd940aSRaphael Isemann     }
14385ffd940aSRaphael Isemann 
14395ffd940aSRaphael Isemann     // If current char is not a horizontal whitespace or if horizontal
14405ffd940aSRaphael Isemann     // whitespace canonicalization is disabled, dump it to output as is.
14415ffd940aSRaphael Isemann     if (Req.NoCanonicalizeWhiteSpace || (*Ptr != ' ' && *Ptr != '\t')) {
14425ffd940aSRaphael Isemann       OutputBuffer.push_back(*Ptr);
14435ffd940aSRaphael Isemann       continue;
14445ffd940aSRaphael Isemann     }
14455ffd940aSRaphael Isemann 
14465ffd940aSRaphael Isemann     // Otherwise, add one space and advance over neighboring space.
14475ffd940aSRaphael Isemann     OutputBuffer.push_back(' ');
14485ffd940aSRaphael Isemann     while (Ptr + 1 != End && (Ptr[1] == ' ' || Ptr[1] == '\t'))
14495ffd940aSRaphael Isemann       ++Ptr;
14505ffd940aSRaphael Isemann   }
14515ffd940aSRaphael Isemann 
14525ffd940aSRaphael Isemann   // Add a null byte and then return all but that byte.
14535ffd940aSRaphael Isemann   OutputBuffer.push_back('\0');
14545ffd940aSRaphael Isemann   return StringRef(OutputBuffer.data(), OutputBuffer.size() - 1);
14555ffd940aSRaphael Isemann }
14565ffd940aSRaphael Isemann 
14575ffd940aSRaphael Isemann FileCheckDiag::FileCheckDiag(const SourceMgr &SM,
14585ffd940aSRaphael Isemann                              const Check::FileCheckType &CheckTy,
14595ffd940aSRaphael Isemann                              SMLoc CheckLoc, MatchType MatchTy,
14605ffd940aSRaphael Isemann                              SMRange InputRange, StringRef Note)
14615ffd940aSRaphael Isemann     : CheckTy(CheckTy), CheckLoc(CheckLoc), MatchTy(MatchTy), Note(Note) {
14625ffd940aSRaphael Isemann   auto Start = SM.getLineAndColumn(InputRange.Start);
14635ffd940aSRaphael Isemann   auto End = SM.getLineAndColumn(InputRange.End);
14645ffd940aSRaphael Isemann   InputStartLine = Start.first;
14655ffd940aSRaphael Isemann   InputStartCol = Start.second;
14665ffd940aSRaphael Isemann   InputEndLine = End.first;
14675ffd940aSRaphael Isemann   InputEndCol = End.second;
14685ffd940aSRaphael Isemann }
14695ffd940aSRaphael Isemann 
14705ffd940aSRaphael Isemann static bool IsPartOfWord(char c) {
14715ffd940aSRaphael Isemann   return (isAlnum(c) || c == '-' || c == '_');
14725ffd940aSRaphael Isemann }
14735ffd940aSRaphael Isemann 
14745ffd940aSRaphael Isemann Check::FileCheckType &Check::FileCheckType::setCount(int C) {
14755ffd940aSRaphael Isemann   assert(Count > 0 && "zero and negative counts are not supported");
14765ffd940aSRaphael Isemann   assert((C == 1 || Kind == CheckPlain) &&
14775ffd940aSRaphael Isemann          "count supported only for plain CHECK directives");
14785ffd940aSRaphael Isemann   Count = C;
14795ffd940aSRaphael Isemann   return *this;
14805ffd940aSRaphael Isemann }
14815ffd940aSRaphael Isemann 
148244f399ccSJacques Pienaar std::string Check::FileCheckType::getModifiersDescription() const {
148344f399ccSJacques Pienaar   if (Modifiers.none())
148444f399ccSJacques Pienaar     return "";
148544f399ccSJacques Pienaar   std::string Ret;
148644f399ccSJacques Pienaar   raw_string_ostream OS(Ret);
148744f399ccSJacques Pienaar   OS << '{';
148844f399ccSJacques Pienaar   if (isLiteralMatch())
148944f399ccSJacques Pienaar     OS << "LITERAL";
149044f399ccSJacques Pienaar   OS << '}';
149134855405SYoungsuk Kim   return Ret;
149244f399ccSJacques Pienaar }
149344f399ccSJacques Pienaar 
14945ffd940aSRaphael Isemann std::string Check::FileCheckType::getDescription(StringRef Prefix) const {
149544f399ccSJacques Pienaar   // Append directive modifiers.
149644f399ccSJacques Pienaar   auto WithModifiers = [this, Prefix](StringRef Str) -> std::string {
149744f399ccSJacques Pienaar     return (Prefix + Str + getModifiersDescription()).str();
149844f399ccSJacques Pienaar   };
149944f399ccSJacques Pienaar 
15005ffd940aSRaphael Isemann   switch (Kind) {
15015ffd940aSRaphael Isemann   case Check::CheckNone:
15025ffd940aSRaphael Isemann     return "invalid";
1503ad1d60c3SIvan Kosarev   case Check::CheckMisspelled:
1504ad1d60c3SIvan Kosarev     return "misspelled";
15055ffd940aSRaphael Isemann   case Check::CheckPlain:
15065ffd940aSRaphael Isemann     if (Count > 1)
150744f399ccSJacques Pienaar       return WithModifiers("-COUNT");
150844f399ccSJacques Pienaar     return WithModifiers("");
15095ffd940aSRaphael Isemann   case Check::CheckNext:
151044f399ccSJacques Pienaar     return WithModifiers("-NEXT");
15115ffd940aSRaphael Isemann   case Check::CheckSame:
151244f399ccSJacques Pienaar     return WithModifiers("-SAME");
15135ffd940aSRaphael Isemann   case Check::CheckNot:
151444f399ccSJacques Pienaar     return WithModifiers("-NOT");
15155ffd940aSRaphael Isemann   case Check::CheckDAG:
151644f399ccSJacques Pienaar     return WithModifiers("-DAG");
15175ffd940aSRaphael Isemann   case Check::CheckLabel:
151844f399ccSJacques Pienaar     return WithModifiers("-LABEL");
15195ffd940aSRaphael Isemann   case Check::CheckEmpty:
152044f399ccSJacques Pienaar     return WithModifiers("-EMPTY");
15215ffd940aSRaphael Isemann   case Check::CheckComment:
15225ffd940aSRaphael Isemann     return std::string(Prefix);
15235ffd940aSRaphael Isemann   case Check::CheckEOF:
15245ffd940aSRaphael Isemann     return "implicit EOF";
15255ffd940aSRaphael Isemann   case Check::CheckBadNot:
15265ffd940aSRaphael Isemann     return "bad NOT";
15275ffd940aSRaphael Isemann   case Check::CheckBadCount:
15285ffd940aSRaphael Isemann     return "bad COUNT";
15295ffd940aSRaphael Isemann   }
15305ffd940aSRaphael Isemann   llvm_unreachable("unknown FileCheckType");
15315ffd940aSRaphael Isemann }
15325ffd940aSRaphael Isemann 
15335ffd940aSRaphael Isemann static std::pair<Check::FileCheckType, StringRef>
1534ad1d60c3SIvan Kosarev FindCheckType(const FileCheckRequest &Req, StringRef Buffer, StringRef Prefix,
1535ad1d60c3SIvan Kosarev               bool &Misspelled) {
15365ffd940aSRaphael Isemann   if (Buffer.size() <= Prefix.size())
15375ffd940aSRaphael Isemann     return {Check::CheckNone, StringRef()};
15385ffd940aSRaphael Isemann 
153944f399ccSJacques Pienaar   StringRef Rest = Buffer.drop_front(Prefix.size());
15405ffd940aSRaphael Isemann   // Check for comment.
15415ffd940aSRaphael Isemann   if (llvm::is_contained(Req.CommentPrefixes, Prefix)) {
154244f399ccSJacques Pienaar     if (Rest.consume_front(":"))
15435ffd940aSRaphael Isemann       return {Check::CheckComment, Rest};
15445ffd940aSRaphael Isemann     // Ignore a comment prefix if it has a suffix like "-NOT".
15455ffd940aSRaphael Isemann     return {Check::CheckNone, StringRef()};
15465ffd940aSRaphael Isemann   }
15475ffd940aSRaphael Isemann 
154844f399ccSJacques Pienaar   auto ConsumeModifiers = [&](Check::FileCheckType Ret)
154944f399ccSJacques Pienaar       -> std::pair<Check::FileCheckType, StringRef> {
155044f399ccSJacques Pienaar     if (Rest.consume_front(":"))
155144f399ccSJacques Pienaar       return {Ret, Rest};
155244f399ccSJacques Pienaar     if (!Rest.consume_front("{"))
155344f399ccSJacques Pienaar       return {Check::CheckNone, StringRef()};
15545ffd940aSRaphael Isemann 
155544f399ccSJacques Pienaar     // Parse the modifiers, speparated by commas.
155644f399ccSJacques Pienaar     do {
155744f399ccSJacques Pienaar       // Allow whitespace in modifiers list.
155844f399ccSJacques Pienaar       Rest = Rest.ltrim();
155944f399ccSJacques Pienaar       if (Rest.consume_front("LITERAL"))
156044f399ccSJacques Pienaar         Ret.setLiteralMatch();
156144f399ccSJacques Pienaar       else
156244f399ccSJacques Pienaar         return {Check::CheckNone, Rest};
156344f399ccSJacques Pienaar       // Allow whitespace in modifiers list.
156444f399ccSJacques Pienaar       Rest = Rest.ltrim();
156544f399ccSJacques Pienaar     } while (Rest.consume_front(","));
156644f399ccSJacques Pienaar     if (!Rest.consume_front("}:"))
156744f399ccSJacques Pienaar       return {Check::CheckNone, Rest};
156844f399ccSJacques Pienaar     return {Ret, Rest};
156944f399ccSJacques Pienaar   };
157044f399ccSJacques Pienaar 
157144f399ccSJacques Pienaar   // Verify that the prefix is followed by directive modifiers or a colon.
157244f399ccSJacques Pienaar   if (Rest.consume_front(":"))
157344f399ccSJacques Pienaar     return {Check::CheckPlain, Rest};
157444f399ccSJacques Pienaar   if (Rest.front() == '{')
157544f399ccSJacques Pienaar     return ConsumeModifiers(Check::CheckPlain);
157644f399ccSJacques Pienaar 
1577ad1d60c3SIvan Kosarev   if (Rest.consume_front("_"))
1578ad1d60c3SIvan Kosarev     Misspelled = true;
1579ad1d60c3SIvan Kosarev   else if (!Rest.consume_front("-"))
15805ffd940aSRaphael Isemann     return {Check::CheckNone, StringRef()};
15815ffd940aSRaphael Isemann 
15825ffd940aSRaphael Isemann   if (Rest.consume_front("COUNT-")) {
15835ffd940aSRaphael Isemann     int64_t Count;
15845ffd940aSRaphael Isemann     if (Rest.consumeInteger(10, Count))
15855ffd940aSRaphael Isemann       // Error happened in parsing integer.
15865ffd940aSRaphael Isemann       return {Check::CheckBadCount, Rest};
15875ffd940aSRaphael Isemann     if (Count <= 0 || Count > INT32_MAX)
15885ffd940aSRaphael Isemann       return {Check::CheckBadCount, Rest};
158944f399ccSJacques Pienaar     if (Rest.front() != ':' && Rest.front() != '{')
15905ffd940aSRaphael Isemann       return {Check::CheckBadCount, Rest};
159144f399ccSJacques Pienaar     return ConsumeModifiers(
159244f399ccSJacques Pienaar         Check::FileCheckType(Check::CheckPlain).setCount(Count));
15935ffd940aSRaphael Isemann   }
15945ffd940aSRaphael Isemann 
15955ffd940aSRaphael Isemann   // You can't combine -NOT with another suffix.
1596586ecdf2SKazu Hirata   if (Rest.starts_with("DAG-NOT:") || Rest.starts_with("NOT-DAG:") ||
1597586ecdf2SKazu Hirata       Rest.starts_with("NEXT-NOT:") || Rest.starts_with("NOT-NEXT:") ||
1598586ecdf2SKazu Hirata       Rest.starts_with("SAME-NOT:") || Rest.starts_with("NOT-SAME:") ||
1599586ecdf2SKazu Hirata       Rest.starts_with("EMPTY-NOT:") || Rest.starts_with("NOT-EMPTY:"))
16005ffd940aSRaphael Isemann     return {Check::CheckBadNot, Rest};
16015ffd940aSRaphael Isemann 
160244f399ccSJacques Pienaar   if (Rest.consume_front("NEXT"))
160344f399ccSJacques Pienaar     return ConsumeModifiers(Check::CheckNext);
160444f399ccSJacques Pienaar 
160544f399ccSJacques Pienaar   if (Rest.consume_front("SAME"))
160644f399ccSJacques Pienaar     return ConsumeModifiers(Check::CheckSame);
160744f399ccSJacques Pienaar 
160844f399ccSJacques Pienaar   if (Rest.consume_front("NOT"))
160944f399ccSJacques Pienaar     return ConsumeModifiers(Check::CheckNot);
161044f399ccSJacques Pienaar 
161144f399ccSJacques Pienaar   if (Rest.consume_front("DAG"))
161244f399ccSJacques Pienaar     return ConsumeModifiers(Check::CheckDAG);
161344f399ccSJacques Pienaar 
161444f399ccSJacques Pienaar   if (Rest.consume_front("LABEL"))
161544f399ccSJacques Pienaar     return ConsumeModifiers(Check::CheckLabel);
161644f399ccSJacques Pienaar 
161744f399ccSJacques Pienaar   if (Rest.consume_front("EMPTY"))
161844f399ccSJacques Pienaar     return ConsumeModifiers(Check::CheckEmpty);
161944f399ccSJacques Pienaar 
16205ffd940aSRaphael Isemann   return {Check::CheckNone, Rest};
16215ffd940aSRaphael Isemann }
16225ffd940aSRaphael Isemann 
1623ad1d60c3SIvan Kosarev static std::pair<Check::FileCheckType, StringRef>
1624ad1d60c3SIvan Kosarev FindCheckType(const FileCheckRequest &Req, StringRef Buffer, StringRef Prefix) {
1625ad1d60c3SIvan Kosarev   bool Misspelled = false;
1626ad1d60c3SIvan Kosarev   auto Res = FindCheckType(Req, Buffer, Prefix, Misspelled);
1627ad1d60c3SIvan Kosarev   if (Res.first != Check::CheckNone && Misspelled)
1628ad1d60c3SIvan Kosarev     return {Check::CheckMisspelled, Res.second};
1629ad1d60c3SIvan Kosarev   return Res;
1630ad1d60c3SIvan Kosarev }
1631ad1d60c3SIvan Kosarev 
16325ffd940aSRaphael Isemann // From the given position, find the next character after the word.
16335ffd940aSRaphael Isemann static size_t SkipWord(StringRef Str, size_t Loc) {
16345ffd940aSRaphael Isemann   while (Loc < Str.size() && IsPartOfWord(Str[Loc]))
16355ffd940aSRaphael Isemann     ++Loc;
16365ffd940aSRaphael Isemann   return Loc;
16375ffd940aSRaphael Isemann }
16385ffd940aSRaphael Isemann 
1639261b4710SNikita Popov static const char *DefaultCheckPrefixes[] = {"CHECK"};
1640261b4710SNikita Popov static const char *DefaultCommentPrefixes[] = {"COM", "RUN"};
1641261b4710SNikita Popov 
1642261b4710SNikita Popov static void addDefaultPrefixes(FileCheckRequest &Req) {
1643261b4710SNikita Popov   if (Req.CheckPrefixes.empty()) {
1644261b4710SNikita Popov     for (const char *Prefix : DefaultCheckPrefixes)
1645261b4710SNikita Popov       Req.CheckPrefixes.push_back(Prefix);
1646261b4710SNikita Popov     Req.IsDefaultCheckPrefix = true;
1647261b4710SNikita Popov   }
1648261b4710SNikita Popov   if (Req.CommentPrefixes.empty())
1649261b4710SNikita Popov     for (const char *Prefix : DefaultCommentPrefixes)
1650261b4710SNikita Popov       Req.CommentPrefixes.push_back(Prefix);
1651261b4710SNikita Popov }
1652261b4710SNikita Popov 
1653261b4710SNikita Popov struct PrefixMatcher {
1654261b4710SNikita Popov   /// Prefixes and their first occurrence past the current position.
1655261b4710SNikita Popov   SmallVector<std::pair<StringRef, size_t>> Prefixes;
1656261b4710SNikita Popov   StringRef Input;
1657261b4710SNikita Popov 
1658261b4710SNikita Popov   PrefixMatcher(ArrayRef<StringRef> CheckPrefixes,
1659261b4710SNikita Popov                 ArrayRef<StringRef> CommentPrefixes, StringRef Input)
1660261b4710SNikita Popov       : Input(Input) {
1661261b4710SNikita Popov     for (StringRef Prefix : CheckPrefixes)
1662261b4710SNikita Popov       Prefixes.push_back({Prefix, Input.find(Prefix)});
1663261b4710SNikita Popov     for (StringRef Prefix : CommentPrefixes)
1664261b4710SNikita Popov       Prefixes.push_back({Prefix, Input.find(Prefix)});
1665261b4710SNikita Popov 
1666261b4710SNikita Popov     // Sort by descending length.
1667261b4710SNikita Popov     llvm::sort(Prefixes,
1668261b4710SNikita Popov                [](auto A, auto B) { return A.first.size() > B.first.size(); });
1669261b4710SNikita Popov   }
1670261b4710SNikita Popov 
1671261b4710SNikita Popov   /// Find the next match of a prefix in Buffer.
1672261b4710SNikita Popov   /// Returns empty StringRef if not found.
1673261b4710SNikita Popov   StringRef match(StringRef Buffer) {
1674261b4710SNikita Popov     assert(Buffer.data() >= Input.data() &&
1675261b4710SNikita Popov            Buffer.data() + Buffer.size() == Input.data() + Input.size() &&
1676261b4710SNikita Popov            "Buffer must be suffix of Input");
1677261b4710SNikita Popov 
1678261b4710SNikita Popov     size_t From = Buffer.data() - Input.data();
1679261b4710SNikita Popov     StringRef Match;
1680261b4710SNikita Popov     for (auto &[Prefix, Pos] : Prefixes) {
1681261b4710SNikita Popov       // If the last occurrence was before From, find the next one after From.
1682261b4710SNikita Popov       if (Pos < From)
1683261b4710SNikita Popov         Pos = Input.find(Prefix, From);
1684261b4710SNikita Popov       // Find the first prefix with the lowest position.
1685261b4710SNikita Popov       if (Pos != StringRef::npos &&
1686261b4710SNikita Popov           (Match.empty() || size_t(Match.data() - Input.data()) > Pos))
1687261b4710SNikita Popov         Match = StringRef(Input.substr(Pos, Prefix.size()));
1688261b4710SNikita Popov     }
1689261b4710SNikita Popov     return Match;
1690261b4710SNikita Popov   }
1691261b4710SNikita Popov };
1692261b4710SNikita Popov 
16935ffd940aSRaphael Isemann /// Searches the buffer for the first prefix in the prefix regular expression.
16945ffd940aSRaphael Isemann ///
16955ffd940aSRaphael Isemann /// This searches the buffer using the provided regular expression, however it
16965ffd940aSRaphael Isemann /// enforces constraints beyond that:
16975ffd940aSRaphael Isemann /// 1) The found prefix must not be a suffix of something that looks like
16985ffd940aSRaphael Isemann ///    a valid prefix.
16995ffd940aSRaphael Isemann /// 2) The found prefix must be followed by a valid check type suffix using \c
17005ffd940aSRaphael Isemann ///    FindCheckType above.
17015ffd940aSRaphael Isemann ///
17025ffd940aSRaphael Isemann /// \returns a pair of StringRefs into the Buffer, which combines:
17035ffd940aSRaphael Isemann ///   - the first match of the regular expression to satisfy these two is
17045ffd940aSRaphael Isemann ///   returned,
17055ffd940aSRaphael Isemann ///     otherwise an empty StringRef is returned to indicate failure.
17065ffd940aSRaphael Isemann ///   - buffer rewound to the location right after parsed suffix, for parsing
17075ffd940aSRaphael Isemann ///     to continue from
17085ffd940aSRaphael Isemann ///
17095ffd940aSRaphael Isemann /// If this routine returns a valid prefix, it will also shrink \p Buffer to
17105ffd940aSRaphael Isemann /// start at the beginning of the returned prefix, increment \p LineNumber for
17115ffd940aSRaphael Isemann /// each new line consumed from \p Buffer, and set \p CheckTy to the type of
17125ffd940aSRaphael Isemann /// check found by examining the suffix.
17135ffd940aSRaphael Isemann ///
17145ffd940aSRaphael Isemann /// If no valid prefix is found, the state of Buffer, LineNumber, and CheckTy
17155ffd940aSRaphael Isemann /// is unspecified.
17165ffd940aSRaphael Isemann static std::pair<StringRef, StringRef>
1717261b4710SNikita Popov FindFirstMatchingPrefix(const FileCheckRequest &Req, PrefixMatcher &Matcher,
17185ffd940aSRaphael Isemann                         StringRef &Buffer, unsigned &LineNumber,
17195ffd940aSRaphael Isemann                         Check::FileCheckType &CheckTy) {
17205ffd940aSRaphael Isemann   while (!Buffer.empty()) {
1721261b4710SNikita Popov     // Find the first (longest) prefix match.
1722261b4710SNikita Popov     StringRef Prefix = Matcher.match(Buffer);
1723261b4710SNikita Popov     if (Prefix.empty())
17245ffd940aSRaphael Isemann       // No match at all, bail.
17255ffd940aSRaphael Isemann       return {StringRef(), StringRef()};
17265ffd940aSRaphael Isemann 
17275ffd940aSRaphael Isemann     assert(Prefix.data() >= Buffer.data() &&
17285ffd940aSRaphael Isemann            Prefix.data() < Buffer.data() + Buffer.size() &&
17295ffd940aSRaphael Isemann            "Prefix doesn't start inside of buffer!");
17305ffd940aSRaphael Isemann     size_t Loc = Prefix.data() - Buffer.data();
17315ffd940aSRaphael Isemann     StringRef Skipped = Buffer.substr(0, Loc);
17325ffd940aSRaphael Isemann     Buffer = Buffer.drop_front(Loc);
17335ffd940aSRaphael Isemann     LineNumber += Skipped.count('\n');
17345ffd940aSRaphael Isemann 
17355ffd940aSRaphael Isemann     // Check that the matched prefix isn't a suffix of some other check-like
17365ffd940aSRaphael Isemann     // word.
17375ffd940aSRaphael Isemann     // FIXME: This is a very ad-hoc check. it would be better handled in some
17385ffd940aSRaphael Isemann     // other way. Among other things it seems hard to distinguish between
17395ffd940aSRaphael Isemann     // intentional and unintentional uses of this feature.
17405ffd940aSRaphael Isemann     if (Skipped.empty() || !IsPartOfWord(Skipped.back())) {
17415ffd940aSRaphael Isemann       // Now extract the type.
17425ffd940aSRaphael Isemann       StringRef AfterSuffix;
17435ffd940aSRaphael Isemann       std::tie(CheckTy, AfterSuffix) = FindCheckType(Req, Buffer, Prefix);
17445ffd940aSRaphael Isemann 
17455ffd940aSRaphael Isemann       // If we've found a valid check type for this prefix, we're done.
17465ffd940aSRaphael Isemann       if (CheckTy != Check::CheckNone)
17475ffd940aSRaphael Isemann         return {Prefix, AfterSuffix};
17485ffd940aSRaphael Isemann     }
17495ffd940aSRaphael Isemann 
17505ffd940aSRaphael Isemann     // If we didn't successfully find a prefix, we need to skip this invalid
17515ffd940aSRaphael Isemann     // prefix and continue scanning. We directly skip the prefix that was
17525ffd940aSRaphael Isemann     // matched and any additional parts of that check-like word.
17535ffd940aSRaphael Isemann     Buffer = Buffer.drop_front(SkipWord(Buffer, Prefix.size()));
17545ffd940aSRaphael Isemann   }
17555ffd940aSRaphael Isemann 
17565ffd940aSRaphael Isemann   // We ran out of buffer while skipping partial matches so give up.
17575ffd940aSRaphael Isemann   return {StringRef(), StringRef()};
17585ffd940aSRaphael Isemann }
17595ffd940aSRaphael Isemann 
17605ffd940aSRaphael Isemann void FileCheckPatternContext::createLineVariable() {
17615ffd940aSRaphael Isemann   assert(!LineVariable && "@LINE pseudo numeric variable already created");
17625ffd940aSRaphael Isemann   StringRef LineName = "@LINE";
17635ffd940aSRaphael Isemann   LineVariable = makeNumericVariable(
17645ffd940aSRaphael Isemann       LineName, ExpressionFormat(ExpressionFormat::Kind::Unsigned));
17655ffd940aSRaphael Isemann   GlobalNumericVariableTable[LineName] = LineVariable;
17665ffd940aSRaphael Isemann }
17675ffd940aSRaphael Isemann 
17685ffd940aSRaphael Isemann FileCheck::FileCheck(FileCheckRequest Req)
1769c10e8261SJay Foad     : Req(Req), PatternContext(std::make_unique<FileCheckPatternContext>()) {}
17705ffd940aSRaphael Isemann 
17715ffd940aSRaphael Isemann FileCheck::~FileCheck() = default;
17725ffd940aSRaphael Isemann 
17735ffd940aSRaphael Isemann bool FileCheck::readCheckFile(
1774261b4710SNikita Popov     SourceMgr &SM, StringRef Buffer,
17755ffd940aSRaphael Isemann     std::pair<unsigned, unsigned> *ImpPatBufferIDRange) {
17765ffd940aSRaphael Isemann   if (ImpPatBufferIDRange)
17775ffd940aSRaphael Isemann     ImpPatBufferIDRange->first = ImpPatBufferIDRange->second = 0;
17785ffd940aSRaphael Isemann 
17795ffd940aSRaphael Isemann   Error DefineError =
17805ffd940aSRaphael Isemann       PatternContext->defineCmdlineVariables(Req.GlobalDefines, SM);
17815ffd940aSRaphael Isemann   if (DefineError) {
17825ffd940aSRaphael Isemann     logAllUnhandledErrors(std::move(DefineError), errs());
17835ffd940aSRaphael Isemann     return true;
17845ffd940aSRaphael Isemann   }
17855ffd940aSRaphael Isemann 
17865ffd940aSRaphael Isemann   PatternContext->createLineVariable();
17875ffd940aSRaphael Isemann 
1788497a8604SVinayak Dev   std::vector<FileCheckString::DagNotPrefixInfo> ImplicitNegativeChecks;
17895ffd940aSRaphael Isemann   for (StringRef PatternString : Req.ImplicitCheckNot) {
17905ffd940aSRaphael Isemann     // Create a buffer with fake command line content in order to display the
17915ffd940aSRaphael Isemann     // command line option responsible for the specific implicit CHECK-NOT.
17925ffd940aSRaphael Isemann     std::string Prefix = "-implicit-check-not='";
17935ffd940aSRaphael Isemann     std::string Suffix = "'";
17945ffd940aSRaphael Isemann     std::unique_ptr<MemoryBuffer> CmdLine = MemoryBuffer::getMemBufferCopy(
17955ffd940aSRaphael Isemann         (Prefix + PatternString + Suffix).str(), "command line");
17965ffd940aSRaphael Isemann 
17975ffd940aSRaphael Isemann     StringRef PatternInBuffer =
17985ffd940aSRaphael Isemann         CmdLine->getBuffer().substr(Prefix.size(), PatternString.size());
17995ffd940aSRaphael Isemann     unsigned BufferID = SM.AddNewSourceBuffer(std::move(CmdLine), SMLoc());
18005ffd940aSRaphael Isemann     if (ImpPatBufferIDRange) {
18015ffd940aSRaphael Isemann       if (ImpPatBufferIDRange->first == ImpPatBufferIDRange->second) {
18025ffd940aSRaphael Isemann         ImpPatBufferIDRange->first = BufferID;
18035ffd940aSRaphael Isemann         ImpPatBufferIDRange->second = BufferID + 1;
18045ffd940aSRaphael Isemann       } else {
18055ffd940aSRaphael Isemann         assert(BufferID == ImpPatBufferIDRange->second &&
18065ffd940aSRaphael Isemann                "expected consecutive source buffer IDs");
18075ffd940aSRaphael Isemann         ++ImpPatBufferIDRange->second;
18085ffd940aSRaphael Isemann       }
18095ffd940aSRaphael Isemann     }
18105ffd940aSRaphael Isemann 
1811497a8604SVinayak Dev     ImplicitNegativeChecks.emplace_back(
1812497a8604SVinayak Dev         Pattern(Check::CheckNot, PatternContext.get()),
1813497a8604SVinayak Dev         StringRef("IMPLICIT-CHECK"));
1814497a8604SVinayak Dev     ImplicitNegativeChecks.back().DagNotPat.parsePattern(
1815497a8604SVinayak Dev         PatternInBuffer, "IMPLICIT-CHECK", SM, Req);
18165ffd940aSRaphael Isemann   }
18175ffd940aSRaphael Isemann 
1818497a8604SVinayak Dev   std::vector<FileCheckString::DagNotPrefixInfo> DagNotMatches =
1819497a8604SVinayak Dev       ImplicitNegativeChecks;
18205ffd940aSRaphael Isemann   // LineNumber keeps track of the line on which CheckPrefix instances are
18215ffd940aSRaphael Isemann   // found.
18225ffd940aSRaphael Isemann   unsigned LineNumber = 1;
18235ffd940aSRaphael Isemann 
1824261b4710SNikita Popov   addDefaultPrefixes(Req);
1825261b4710SNikita Popov   PrefixMatcher Matcher(Req.CheckPrefixes, Req.CommentPrefixes, Buffer);
1826871d658cSMircea Trofin   std::set<StringRef> PrefixesNotFound(Req.CheckPrefixes.begin(),
1827871d658cSMircea Trofin                                        Req.CheckPrefixes.end());
1828871d658cSMircea Trofin   const size_t DistinctPrefixes = PrefixesNotFound.size();
1829871d658cSMircea Trofin   while (true) {
18305ffd940aSRaphael Isemann     Check::FileCheckType CheckTy;
18315ffd940aSRaphael Isemann 
18325ffd940aSRaphael Isemann     // See if a prefix occurs in the memory buffer.
18335ffd940aSRaphael Isemann     StringRef UsedPrefix;
18345ffd940aSRaphael Isemann     StringRef AfterSuffix;
18355ffd940aSRaphael Isemann     std::tie(UsedPrefix, AfterSuffix) =
1836261b4710SNikita Popov         FindFirstMatchingPrefix(Req, Matcher, Buffer, LineNumber, CheckTy);
18375ffd940aSRaphael Isemann     if (UsedPrefix.empty())
18385ffd940aSRaphael Isemann       break;
18395ffd940aSRaphael Isemann     if (CheckTy != Check::CheckComment)
1840871d658cSMircea Trofin       PrefixesNotFound.erase(UsedPrefix);
18415ffd940aSRaphael Isemann 
18425ffd940aSRaphael Isemann     assert(UsedPrefix.data() == Buffer.data() &&
18435ffd940aSRaphael Isemann            "Failed to move Buffer's start forward, or pointed prefix outside "
18445ffd940aSRaphael Isemann            "of the buffer!");
18455ffd940aSRaphael Isemann     assert(AfterSuffix.data() >= Buffer.data() &&
18465ffd940aSRaphael Isemann            AfterSuffix.data() < Buffer.data() + Buffer.size() &&
18475ffd940aSRaphael Isemann            "Parsing after suffix doesn't start inside of buffer!");
18485ffd940aSRaphael Isemann 
18495ffd940aSRaphael Isemann     // Location to use for error messages.
18505ffd940aSRaphael Isemann     const char *UsedPrefixStart = UsedPrefix.data();
18515ffd940aSRaphael Isemann 
18525ffd940aSRaphael Isemann     // Skip the buffer to the end of parsed suffix (or just prefix, if no good
18535ffd940aSRaphael Isemann     // suffix was processed).
18545ffd940aSRaphael Isemann     Buffer = AfterSuffix.empty() ? Buffer.drop_front(UsedPrefix.size())
18555ffd940aSRaphael Isemann                                  : AfterSuffix;
18565ffd940aSRaphael Isemann 
1857ad1d60c3SIvan Kosarev     // Complain about misspelled directives.
1858ad1d60c3SIvan Kosarev     if (CheckTy == Check::CheckMisspelled) {
1859ad1d60c3SIvan Kosarev       StringRef UsedDirective(UsedPrefix.data(),
1860ad1d60c3SIvan Kosarev                               AfterSuffix.data() - UsedPrefix.data());
1861ad1d60c3SIvan Kosarev       SM.PrintMessage(SMLoc::getFromPointer(UsedDirective.data()),
1862ad1d60c3SIvan Kosarev                       SourceMgr::DK_Error,
1863ad1d60c3SIvan Kosarev                       "misspelled directive '" + UsedDirective + "'");
1864ad1d60c3SIvan Kosarev       return true;
1865ad1d60c3SIvan Kosarev     }
1866ad1d60c3SIvan Kosarev 
18675ffd940aSRaphael Isemann     // Complain about useful-looking but unsupported suffixes.
18685ffd940aSRaphael Isemann     if (CheckTy == Check::CheckBadNot) {
18695ffd940aSRaphael Isemann       SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), SourceMgr::DK_Error,
18705ffd940aSRaphael Isemann                       "unsupported -NOT combo on prefix '" + UsedPrefix + "'");
18715ffd940aSRaphael Isemann       return true;
18725ffd940aSRaphael Isemann     }
18735ffd940aSRaphael Isemann 
18745ffd940aSRaphael Isemann     // Complain about invalid count specification.
18755ffd940aSRaphael Isemann     if (CheckTy == Check::CheckBadCount) {
18765ffd940aSRaphael Isemann       SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), SourceMgr::DK_Error,
18775ffd940aSRaphael Isemann                       "invalid count in -COUNT specification on prefix '" +
18785ffd940aSRaphael Isemann                           UsedPrefix + "'");
18795ffd940aSRaphael Isemann       return true;
18805ffd940aSRaphael Isemann     }
18815ffd940aSRaphael Isemann 
18825ffd940aSRaphael Isemann     // Okay, we found the prefix, yay. Remember the rest of the line, but ignore
18835ffd940aSRaphael Isemann     // leading whitespace.
18845ffd940aSRaphael Isemann     if (!(Req.NoCanonicalizeWhiteSpace && Req.MatchFullLines))
18855ffd940aSRaphael Isemann       Buffer = Buffer.substr(Buffer.find_first_not_of(" \t"));
18865ffd940aSRaphael Isemann 
18875ffd940aSRaphael Isemann     // Scan ahead to the end of line.
18885ffd940aSRaphael Isemann     size_t EOL = Buffer.find_first_of("\n\r");
18895ffd940aSRaphael Isemann 
18905ffd940aSRaphael Isemann     // Remember the location of the start of the pattern, for diagnostics.
18915ffd940aSRaphael Isemann     SMLoc PatternLoc = SMLoc::getFromPointer(Buffer.data());
18925ffd940aSRaphael Isemann 
18935ffd940aSRaphael Isemann     // Extract the pattern from the buffer.
18945ffd940aSRaphael Isemann     StringRef PatternBuffer = Buffer.substr(0, EOL);
18955ffd940aSRaphael Isemann     Buffer = Buffer.substr(EOL);
18965ffd940aSRaphael Isemann 
18975ffd940aSRaphael Isemann     // If this is a comment, we're done.
18985ffd940aSRaphael Isemann     if (CheckTy == Check::CheckComment)
18995ffd940aSRaphael Isemann       continue;
19005ffd940aSRaphael Isemann 
19015ffd940aSRaphael Isemann     // Parse the pattern.
19025ffd940aSRaphael Isemann     Pattern P(CheckTy, PatternContext.get(), LineNumber);
19035ffd940aSRaphael Isemann     if (P.parsePattern(PatternBuffer, UsedPrefix, SM, Req))
19045ffd940aSRaphael Isemann       return true;
19055ffd940aSRaphael Isemann 
19065ffd940aSRaphael Isemann     // Verify that CHECK-LABEL lines do not define or use variables
19075ffd940aSRaphael Isemann     if ((CheckTy == Check::CheckLabel) && P.hasVariable()) {
19085ffd940aSRaphael Isemann       SM.PrintMessage(
19095ffd940aSRaphael Isemann           SMLoc::getFromPointer(UsedPrefixStart), SourceMgr::DK_Error,
19105ffd940aSRaphael Isemann           "found '" + UsedPrefix + "-LABEL:'"
19115ffd940aSRaphael Isemann                                    " with variable definition or use");
19125ffd940aSRaphael Isemann       return true;
19135ffd940aSRaphael Isemann     }
19145ffd940aSRaphael Isemann 
19155ffd940aSRaphael Isemann     // Verify that CHECK-NEXT/SAME/EMPTY lines have at least one CHECK line before them.
19165ffd940aSRaphael Isemann     if ((CheckTy == Check::CheckNext || CheckTy == Check::CheckSame ||
19175ffd940aSRaphael Isemann          CheckTy == Check::CheckEmpty) &&
1918c10e8261SJay Foad         CheckStrings.empty()) {
19195ffd940aSRaphael Isemann       StringRef Type = CheckTy == Check::CheckNext
19205ffd940aSRaphael Isemann                            ? "NEXT"
19215ffd940aSRaphael Isemann                            : CheckTy == Check::CheckEmpty ? "EMPTY" : "SAME";
19225ffd940aSRaphael Isemann       SM.PrintMessage(SMLoc::getFromPointer(UsedPrefixStart),
19235ffd940aSRaphael Isemann                       SourceMgr::DK_Error,
19245ffd940aSRaphael Isemann                       "found '" + UsedPrefix + "-" + Type +
19255ffd940aSRaphael Isemann                           "' without previous '" + UsedPrefix + ": line");
19265ffd940aSRaphael Isemann       return true;
19275ffd940aSRaphael Isemann     }
19285ffd940aSRaphael Isemann 
19295ffd940aSRaphael Isemann     // Handle CHECK-DAG/-NOT.
19305ffd940aSRaphael Isemann     if (CheckTy == Check::CheckDAG || CheckTy == Check::CheckNot) {
1931497a8604SVinayak Dev       DagNotMatches.emplace_back(P, UsedPrefix);
19325ffd940aSRaphael Isemann       continue;
19335ffd940aSRaphael Isemann     }
19345ffd940aSRaphael Isemann 
19355ffd940aSRaphael Isemann     // Okay, add the string we captured to the output vector and move on.
1936*d3d605b7SJay Foad     CheckStrings.emplace_back(std::move(P), UsedPrefix, PatternLoc,
1937*d3d605b7SJay Foad                               std::move(DagNotMatches));
19385ffd940aSRaphael Isemann     DagNotMatches = ImplicitNegativeChecks;
19395ffd940aSRaphael Isemann   }
19405ffd940aSRaphael Isemann 
19415ffd940aSRaphael Isemann   // When there are no used prefixes we report an error except in the case that
19425ffd940aSRaphael Isemann   // no prefix is specified explicitly but -implicit-check-not is specified.
1943871d658cSMircea Trofin   const bool NoPrefixesFound = PrefixesNotFound.size() == DistinctPrefixes;
1944871d658cSMircea Trofin   const bool SomePrefixesUnexpectedlyNotUsed =
1945871d658cSMircea Trofin       !Req.AllowUnusedPrefixes && !PrefixesNotFound.empty();
1946871d658cSMircea Trofin   if ((NoPrefixesFound || SomePrefixesUnexpectedlyNotUsed) &&
19475ffd940aSRaphael Isemann       (ImplicitNegativeChecks.empty() || !Req.IsDefaultCheckPrefix)) {
19485ffd940aSRaphael Isemann     errs() << "error: no check strings found with prefix"
1949871d658cSMircea Trofin            << (PrefixesNotFound.size() > 1 ? "es " : " ");
1950871d658cSMircea Trofin     bool First = true;
1951871d658cSMircea Trofin     for (StringRef MissingPrefix : PrefixesNotFound) {
1952871d658cSMircea Trofin       if (!First)
19535ffd940aSRaphael Isemann         errs() << ", ";
1954871d658cSMircea Trofin       errs() << "\'" << MissingPrefix << ":'";
1955871d658cSMircea Trofin       First = false;
19565ffd940aSRaphael Isemann     }
19575ffd940aSRaphael Isemann     errs() << '\n';
19585ffd940aSRaphael Isemann     return true;
19595ffd940aSRaphael Isemann   }
19605ffd940aSRaphael Isemann 
19615ffd940aSRaphael Isemann   // Add an EOF pattern for any trailing --implicit-check-not/CHECK-DAG/-NOTs,
19625ffd940aSRaphael Isemann   // and use the first prefix as a filler for the error message.
19635ffd940aSRaphael Isemann   if (!DagNotMatches.empty()) {
1964c10e8261SJay Foad     CheckStrings.emplace_back(
19655ffd940aSRaphael Isemann         Pattern(Check::CheckEOF, PatternContext.get(), LineNumber + 1),
1966*d3d605b7SJay Foad         *Req.CheckPrefixes.begin(), SMLoc::getFromPointer(Buffer.data()),
1967*d3d605b7SJay Foad         std::move(DagNotMatches));
19685ffd940aSRaphael Isemann   }
19695ffd940aSRaphael Isemann 
19705ffd940aSRaphael Isemann   return false;
19715ffd940aSRaphael Isemann }
19725ffd940aSRaphael Isemann 
1973dd59c132SJoel E. Denny /// Returns either (1) \c ErrorSuccess if there was no error or (2)
1974dd59c132SJoel E. Denny /// \c ErrorReported if an error was reported, such as an unexpected match.
1975dd59c132SJoel E. Denny static Error printMatch(bool ExpectedMatch, const SourceMgr &SM,
19765ffd940aSRaphael Isemann                         StringRef Prefix, SMLoc Loc, const Pattern &Pat,
1977dd59c132SJoel E. Denny                         int MatchedCount, StringRef Buffer,
1978dd59c132SJoel E. Denny                         Pattern::MatchResult MatchResult,
1979dd59c132SJoel E. Denny                         const FileCheckRequest &Req,
19805ffd940aSRaphael Isemann                         std::vector<FileCheckDiag> *Diags) {
1981dd59c132SJoel E. Denny   // Suppress some verbosity if there's no error.
1982dd59c132SJoel E. Denny   bool HasError = !ExpectedMatch || MatchResult.TheError;
19835ffd940aSRaphael Isemann   bool PrintDiag = true;
1984dd59c132SJoel E. Denny   if (!HasError) {
19855ffd940aSRaphael Isemann     if (!Req.Verbose)
1986dd59c132SJoel E. Denny       return ErrorReported::reportedOrSuccess(HasError);
19875ffd940aSRaphael Isemann     if (!Req.VerboseVerbose && Pat.getCheckTy() == Check::CheckEOF)
1988dd59c132SJoel E. Denny       return ErrorReported::reportedOrSuccess(HasError);
19895ffd940aSRaphael Isemann     // Due to their verbosity, we don't print verbose diagnostics here if we're
1990dd59c132SJoel E. Denny     // gathering them for Diags to be rendered elsewhere, but we always print
1991dd59c132SJoel E. Denny     // other diagnostics.
19925ffd940aSRaphael Isemann     PrintDiag = !Diags;
19935ffd940aSRaphael Isemann   }
1994dd59c132SJoel E. Denny 
1995dd59c132SJoel E. Denny   // Add "found" diagnostic, substitutions, and variable definitions to Diags.
19965ffd940aSRaphael Isemann   FileCheckDiag::MatchType MatchTy = ExpectedMatch
19975ffd940aSRaphael Isemann                                          ? FileCheckDiag::MatchFoundAndExpected
19985ffd940aSRaphael Isemann                                          : FileCheckDiag::MatchFoundButExcluded;
19995ffd940aSRaphael Isemann   SMRange MatchRange = ProcessMatchResult(MatchTy, SM, Loc, Pat.getCheckTy(),
2000dd59c132SJoel E. Denny                                           Buffer, MatchResult.TheMatch->Pos,
2001dd59c132SJoel E. Denny                                           MatchResult.TheMatch->Len, Diags);
20025ffd940aSRaphael Isemann   if (Diags) {
20035ffd940aSRaphael Isemann     Pat.printSubstitutions(SM, Buffer, MatchRange, MatchTy, Diags);
20045ffd940aSRaphael Isemann     Pat.printVariableDefs(SM, MatchTy, Diags);
20055ffd940aSRaphael Isemann   }
2006dd59c132SJoel E. Denny   if (!PrintDiag) {
2007dd59c132SJoel E. Denny     assert(!HasError && "expected to report more diagnostics for error");
2008dd59c132SJoel E. Denny     return ErrorReported::reportedOrSuccess(HasError);
2009dd59c132SJoel E. Denny   }
20105ffd940aSRaphael Isemann 
2011dd59c132SJoel E. Denny   // Print the match.
20125ffd940aSRaphael Isemann   std::string Message = formatv("{0}: {1} string found in input",
20135ffd940aSRaphael Isemann                                 Pat.getCheckTy().getDescription(Prefix),
20145ffd940aSRaphael Isemann                                 (ExpectedMatch ? "expected" : "excluded"))
20155ffd940aSRaphael Isemann                             .str();
20165ffd940aSRaphael Isemann   if (Pat.getCount() > 1)
20175ffd940aSRaphael Isemann     Message += formatv(" ({0} out of {1})", MatchedCount, Pat.getCount()).str();
20185ffd940aSRaphael Isemann   SM.PrintMessage(
20195ffd940aSRaphael Isemann       Loc, ExpectedMatch ? SourceMgr::DK_Remark : SourceMgr::DK_Error, Message);
20205ffd940aSRaphael Isemann   SM.PrintMessage(MatchRange.Start, SourceMgr::DK_Note, "found here",
20215ffd940aSRaphael Isemann                   {MatchRange});
2022dd59c132SJoel E. Denny 
2023dd59c132SJoel E. Denny   // Print additional information, which can be useful even if there are errors.
20245ffd940aSRaphael Isemann   Pat.printSubstitutions(SM, Buffer, MatchRange, MatchTy, nullptr);
20255ffd940aSRaphael Isemann   Pat.printVariableDefs(SM, MatchTy, nullptr);
2026dd59c132SJoel E. Denny 
2027dd59c132SJoel E. Denny   // Print errors and add them to Diags.  We report these errors after the match
2028dd59c132SJoel E. Denny   // itself because we found them after the match.  If we had found them before
2029dd59c132SJoel E. Denny   // the match, we'd be in printNoMatch.
2030dd59c132SJoel E. Denny   handleAllErrors(std::move(MatchResult.TheError),
2031dd59c132SJoel E. Denny                   [&](const ErrorDiagnostic &E) {
2032dd59c132SJoel E. Denny                     E.log(errs());
2033dd59c132SJoel E. Denny                     if (Diags) {
2034dd59c132SJoel E. Denny                       Diags->emplace_back(SM, Pat.getCheckTy(), Loc,
2035dd59c132SJoel E. Denny                                           FileCheckDiag::MatchFoundErrorNote,
2036dd59c132SJoel E. Denny                                           E.getRange(), E.getMessage().str());
2037dd59c132SJoel E. Denny                     }
2038dd59c132SJoel E. Denny                   });
2039dd59c132SJoel E. Denny   return ErrorReported::reportedOrSuccess(HasError);
20405ffd940aSRaphael Isemann }
20415ffd940aSRaphael Isemann 
2042dd59c132SJoel E. Denny /// Returns either (1) \c ErrorSuccess if there was no error, or (2)
2043dd59c132SJoel E. Denny /// \c ErrorReported if an error was reported, such as an expected match not
2044dd59c132SJoel E. Denny /// found.
2045dd59c132SJoel E. Denny static Error printNoMatch(bool ExpectedMatch, const SourceMgr &SM,
20465ffd940aSRaphael Isemann                           StringRef Prefix, SMLoc Loc, const Pattern &Pat,
2047dd59c132SJoel E. Denny                           int MatchedCount, StringRef Buffer, Error MatchError,
2048dd59c132SJoel E. Denny                           bool VerboseVerbose,
2049dd59c132SJoel E. Denny                           std::vector<FileCheckDiag> *Diags) {
2050dd59c132SJoel E. Denny   // Print any pattern errors, and record them to be added to Diags later.
2051dd59c132SJoel E. Denny   bool HasError = ExpectedMatch;
2052dd59c132SJoel E. Denny   bool HasPatternError = false;
20535ffd940aSRaphael Isemann   FileCheckDiag::MatchType MatchTy = ExpectedMatch
20545ffd940aSRaphael Isemann                                          ? FileCheckDiag::MatchNoneButExpected
20555ffd940aSRaphael Isemann                                          : FileCheckDiag::MatchNoneAndExcluded;
2056dd59c132SJoel E. Denny   SmallVector<std::string, 4> ErrorMsgs;
2057dd59c132SJoel E. Denny   handleAllErrors(
2058dd59c132SJoel E. Denny       std::move(MatchError),
2059dd59c132SJoel E. Denny       [&](const ErrorDiagnostic &E) {
2060dd59c132SJoel E. Denny         HasError = HasPatternError = true;
2061dd59c132SJoel E. Denny         MatchTy = FileCheckDiag::MatchNoneForInvalidPattern;
2062dd59c132SJoel E. Denny         E.log(errs());
20635ffd940aSRaphael Isemann         if (Diags)
2064dd59c132SJoel E. Denny           ErrorMsgs.push_back(E.getMessage().str());
2065dd59c132SJoel E. Denny       },
2066dd59c132SJoel E. Denny       // NotFoundError is why printNoMatch was invoked.
2067dd59c132SJoel E. Denny       [](const NotFoundError &E) {});
2068dd59c132SJoel E. Denny 
2069dd59c132SJoel E. Denny   // Suppress some verbosity if there's no error.
2070dd59c132SJoel E. Denny   bool PrintDiag = true;
2071dd59c132SJoel E. Denny   if (!HasError) {
2072dd59c132SJoel E. Denny     if (!VerboseVerbose)
2073dd59c132SJoel E. Denny       return ErrorReported::reportedOrSuccess(HasError);
2074dd59c132SJoel E. Denny     // Due to their verbosity, we don't print verbose diagnostics here if we're
2075dd59c132SJoel E. Denny     // gathering them for Diags to be rendered elsewhere, but we always print
2076dd59c132SJoel E. Denny     // other diagnostics.
2077dd59c132SJoel E. Denny     PrintDiag = !Diags;
20785ffd940aSRaphael Isemann   }
20795ffd940aSRaphael Isemann 
2080dd59c132SJoel E. Denny   // Add "not found" diagnostic, substitutions, and pattern errors to Diags.
2081dd59c132SJoel E. Denny   //
2082dd59c132SJoel E. Denny   // We handle Diags a little differently than the errors we print directly:
2083dd59c132SJoel E. Denny   // we add the "not found" diagnostic to Diags even if there are pattern
2084dd59c132SJoel E. Denny   // errors.  The reason is that we need to attach pattern errors as notes
2085dd59c132SJoel E. Denny   // somewhere in the input, and the input search range from the "not found"
2086dd59c132SJoel E. Denny   // diagnostic is all we have to anchor them.
2087dd59c132SJoel E. Denny   SMRange SearchRange = ProcessMatchResult(MatchTy, SM, Loc, Pat.getCheckTy(),
2088dd59c132SJoel E. Denny                                            Buffer, 0, Buffer.size(), Diags);
2089dd59c132SJoel E. Denny   if (Diags) {
2090dd59c132SJoel E. Denny     SMRange NoteRange = SMRange(SearchRange.Start, SearchRange.Start);
2091dd59c132SJoel E. Denny     for (StringRef ErrorMsg : ErrorMsgs)
2092dd59c132SJoel E. Denny       Diags->emplace_back(SM, Pat.getCheckTy(), Loc, MatchTy, NoteRange,
2093dd59c132SJoel E. Denny                           ErrorMsg);
2094dd59c132SJoel E. Denny     Pat.printSubstitutions(SM, Buffer, SearchRange, MatchTy, Diags);
2095dd59c132SJoel E. Denny   }
2096dd59c132SJoel E. Denny   if (!PrintDiag) {
2097dd59c132SJoel E. Denny     assert(!HasError && "expected to report more diagnostics for error");
2098dd59c132SJoel E. Denny     return ErrorReported::reportedOrSuccess(HasError);
2099dd59c132SJoel E. Denny   }
21005ffd940aSRaphael Isemann 
2101dd59c132SJoel E. Denny   // Print "not found" diagnostic, except that's implied if we already printed a
2102dd59c132SJoel E. Denny   // pattern error.
2103dd59c132SJoel E. Denny   if (!HasPatternError) {
21045ffd940aSRaphael Isemann     std::string Message = formatv("{0}: {1} string not found in input",
21055ffd940aSRaphael Isemann                                   Pat.getCheckTy().getDescription(Prefix),
21065ffd940aSRaphael Isemann                                   (ExpectedMatch ? "expected" : "excluded"))
21075ffd940aSRaphael Isemann                               .str();
21085ffd940aSRaphael Isemann     if (Pat.getCount() > 1)
2109dd59c132SJoel E. Denny       Message +=
2110dd59c132SJoel E. Denny           formatv(" ({0} out of {1})", MatchedCount, Pat.getCount()).str();
2111dd59c132SJoel E. Denny     SM.PrintMessage(Loc,
2112dd59c132SJoel E. Denny                     ExpectedMatch ? SourceMgr::DK_Error : SourceMgr::DK_Remark,
2113dd59c132SJoel E. Denny                     Message);
2114dd59c132SJoel E. Denny     SM.PrintMessage(SearchRange.Start, SourceMgr::DK_Note,
2115dd59c132SJoel E. Denny                     "scanning from here");
21165ffd940aSRaphael Isemann   }
21175ffd940aSRaphael Isemann 
2118dd59c132SJoel E. Denny   // Print additional information, which can be useful even after a pattern
2119dd59c132SJoel E. Denny   // error.
2120dd59c132SJoel E. Denny   Pat.printSubstitutions(SM, Buffer, SearchRange, MatchTy, nullptr);
2121dd59c132SJoel E. Denny   if (ExpectedMatch)
2122dd59c132SJoel E. Denny     Pat.printFuzzyMatch(SM, Buffer, Diags);
2123dd59c132SJoel E. Denny   return ErrorReported::reportedOrSuccess(HasError);
2124dd59c132SJoel E. Denny }
2125dd59c132SJoel E. Denny 
2126dd59c132SJoel E. Denny /// Returns either (1) \c ErrorSuccess if there was no error, or (2)
2127dd59c132SJoel E. Denny /// \c ErrorReported if an error was reported.
2128dd59c132SJoel E. Denny static Error reportMatchResult(bool ExpectedMatch, const SourceMgr &SM,
2129dd59c132SJoel E. Denny                                StringRef Prefix, SMLoc Loc, const Pattern &Pat,
2130dd59c132SJoel E. Denny                                int MatchedCount, StringRef Buffer,
2131dd59c132SJoel E. Denny                                Pattern::MatchResult MatchResult,
2132dd59c132SJoel E. Denny                                const FileCheckRequest &Req,
2133dd59c132SJoel E. Denny                                std::vector<FileCheckDiag> *Diags) {
2134dd59c132SJoel E. Denny   if (MatchResult.TheMatch)
2135dd59c132SJoel E. Denny     return printMatch(ExpectedMatch, SM, Prefix, Loc, Pat, MatchedCount, Buffer,
2136dd59c132SJoel E. Denny                       std::move(MatchResult), Req, Diags);
2137dd59c132SJoel E. Denny   return printNoMatch(ExpectedMatch, SM, Prefix, Loc, Pat, MatchedCount, Buffer,
2138dd59c132SJoel E. Denny                       std::move(MatchResult.TheError), Req.VerboseVerbose,
2139dd59c132SJoel E. Denny                       Diags);
21405ffd940aSRaphael Isemann }
21415ffd940aSRaphael Isemann 
21425ffd940aSRaphael Isemann /// Counts the number of newlines in the specified range.
21435ffd940aSRaphael Isemann static unsigned CountNumNewlinesBetween(StringRef Range,
21445ffd940aSRaphael Isemann                                         const char *&FirstNewLine) {
21455ffd940aSRaphael Isemann   unsigned NumNewLines = 0;
21462aed0813SKazu Hirata   while (true) {
21475ffd940aSRaphael Isemann     // Scan for newline.
21485ffd940aSRaphael Isemann     Range = Range.substr(Range.find_first_of("\n\r"));
21495ffd940aSRaphael Isemann     if (Range.empty())
21505ffd940aSRaphael Isemann       return NumNewLines;
21515ffd940aSRaphael Isemann 
21525ffd940aSRaphael Isemann     ++NumNewLines;
21535ffd940aSRaphael Isemann 
21545ffd940aSRaphael Isemann     // Handle \n\r and \r\n as a single newline.
21555ffd940aSRaphael Isemann     if (Range.size() > 1 && (Range[1] == '\n' || Range[1] == '\r') &&
21565ffd940aSRaphael Isemann         (Range[0] != Range[1]))
21575ffd940aSRaphael Isemann       Range = Range.substr(1);
21585ffd940aSRaphael Isemann     Range = Range.substr(1);
21595ffd940aSRaphael Isemann 
21605ffd940aSRaphael Isemann     if (NumNewLines == 1)
21615ffd940aSRaphael Isemann       FirstNewLine = Range.begin();
21625ffd940aSRaphael Isemann   }
21635ffd940aSRaphael Isemann }
21645ffd940aSRaphael Isemann 
21655ffd940aSRaphael Isemann size_t FileCheckString::Check(const SourceMgr &SM, StringRef Buffer,
21665ffd940aSRaphael Isemann                               bool IsLabelScanMode, size_t &MatchLen,
21675ffd940aSRaphael Isemann                               FileCheckRequest &Req,
21685ffd940aSRaphael Isemann                               std::vector<FileCheckDiag> *Diags) const {
21695ffd940aSRaphael Isemann   size_t LastPos = 0;
2170497a8604SVinayak Dev   std::vector<const DagNotPrefixInfo *> NotStrings;
21715ffd940aSRaphael Isemann 
21725ffd940aSRaphael Isemann   // IsLabelScanMode is true when we are scanning forward to find CHECK-LABEL
21735ffd940aSRaphael Isemann   // bounds; we have not processed variable definitions within the bounded block
21745ffd940aSRaphael Isemann   // yet so cannot handle any final CHECK-DAG yet; this is handled when going
21755ffd940aSRaphael Isemann   // over the block again (including the last CHECK-LABEL) in normal mode.
21765ffd940aSRaphael Isemann   if (!IsLabelScanMode) {
21775ffd940aSRaphael Isemann     // Match "dag strings" (with mixed "not strings" if any).
21785ffd940aSRaphael Isemann     LastPos = CheckDag(SM, Buffer, NotStrings, Req, Diags);
21795ffd940aSRaphael Isemann     if (LastPos == StringRef::npos)
21805ffd940aSRaphael Isemann       return StringRef::npos;
21815ffd940aSRaphael Isemann   }
21825ffd940aSRaphael Isemann 
21835ffd940aSRaphael Isemann   // Match itself from the last position after matching CHECK-DAG.
21845ffd940aSRaphael Isemann   size_t LastMatchEnd = LastPos;
21855ffd940aSRaphael Isemann   size_t FirstMatchPos = 0;
21865ffd940aSRaphael Isemann   // Go match the pattern Count times. Majority of patterns only match with
21875ffd940aSRaphael Isemann   // count 1 though.
21885ffd940aSRaphael Isemann   assert(Pat.getCount() != 0 && "pattern count can not be zero");
21895ffd940aSRaphael Isemann   for (int i = 1; i <= Pat.getCount(); i++) {
21905ffd940aSRaphael Isemann     StringRef MatchBuffer = Buffer.substr(LastMatchEnd);
21915ffd940aSRaphael Isemann     // get a match at current start point
2192dd59c132SJoel E. Denny     Pattern::MatchResult MatchResult = Pat.match(MatchBuffer, SM);
21935ffd940aSRaphael Isemann 
21945ffd940aSRaphael Isemann     // report
2195dd59c132SJoel E. Denny     if (Error Err = reportMatchResult(/*ExpectedMatch=*/true, SM, Prefix, Loc,
2196dd59c132SJoel E. Denny                                       Pat, i, MatchBuffer,
2197dd59c132SJoel E. Denny                                       std::move(MatchResult), Req, Diags)) {
2198dd59c132SJoel E. Denny       cantFail(handleErrors(std::move(Err), [&](const ErrorReported &E) {}));
21995ffd940aSRaphael Isemann       return StringRef::npos;
22005ffd940aSRaphael Isemann     }
2201dd59c132SJoel E. Denny 
2202dd59c132SJoel E. Denny     size_t MatchPos = MatchResult.TheMatch->Pos;
22035ffd940aSRaphael Isemann     if (i == 1)
22045ffd940aSRaphael Isemann       FirstMatchPos = LastPos + MatchPos;
22055ffd940aSRaphael Isemann 
22065ffd940aSRaphael Isemann     // move start point after the match
2207dd59c132SJoel E. Denny     LastMatchEnd += MatchPos + MatchResult.TheMatch->Len;
22085ffd940aSRaphael Isemann   }
22095ffd940aSRaphael Isemann   // Full match len counts from first match pos.
22105ffd940aSRaphael Isemann   MatchLen = LastMatchEnd - FirstMatchPos;
22115ffd940aSRaphael Isemann 
22125ffd940aSRaphael Isemann   // Similar to the above, in "label-scan mode" we can't yet handle CHECK-NEXT
22135ffd940aSRaphael Isemann   // or CHECK-NOT
22145ffd940aSRaphael Isemann   if (!IsLabelScanMode) {
22155ffd940aSRaphael Isemann     size_t MatchPos = FirstMatchPos - LastPos;
22165ffd940aSRaphael Isemann     StringRef MatchBuffer = Buffer.substr(LastPos);
22175ffd940aSRaphael Isemann     StringRef SkippedRegion = Buffer.substr(LastPos, MatchPos);
22185ffd940aSRaphael Isemann 
22195ffd940aSRaphael Isemann     // If this check is a "CHECK-NEXT", verify that the previous match was on
22205ffd940aSRaphael Isemann     // the previous line (i.e. that there is one newline between them).
22215ffd940aSRaphael Isemann     if (CheckNext(SM, SkippedRegion)) {
22225ffd940aSRaphael Isemann       ProcessMatchResult(FileCheckDiag::MatchFoundButWrongLine, SM, Loc,
22235ffd940aSRaphael Isemann                          Pat.getCheckTy(), MatchBuffer, MatchPos, MatchLen,
22245ffd940aSRaphael Isemann                          Diags, Req.Verbose);
22255ffd940aSRaphael Isemann       return StringRef::npos;
22265ffd940aSRaphael Isemann     }
22275ffd940aSRaphael Isemann 
22285ffd940aSRaphael Isemann     // If this check is a "CHECK-SAME", verify that the previous match was on
22295ffd940aSRaphael Isemann     // the same line (i.e. that there is no newline between them).
22305ffd940aSRaphael Isemann     if (CheckSame(SM, SkippedRegion)) {
22315ffd940aSRaphael Isemann       ProcessMatchResult(FileCheckDiag::MatchFoundButWrongLine, SM, Loc,
22325ffd940aSRaphael Isemann                          Pat.getCheckTy(), MatchBuffer, MatchPos, MatchLen,
22335ffd940aSRaphael Isemann                          Diags, Req.Verbose);
22345ffd940aSRaphael Isemann       return StringRef::npos;
22355ffd940aSRaphael Isemann     }
22365ffd940aSRaphael Isemann 
22375ffd940aSRaphael Isemann     // If this match had "not strings", verify that they don't exist in the
22385ffd940aSRaphael Isemann     // skipped region.
22395ffd940aSRaphael Isemann     if (CheckNot(SM, SkippedRegion, NotStrings, Req, Diags))
22405ffd940aSRaphael Isemann       return StringRef::npos;
22415ffd940aSRaphael Isemann   }
22425ffd940aSRaphael Isemann 
22435ffd940aSRaphael Isemann   return FirstMatchPos;
22445ffd940aSRaphael Isemann }
22455ffd940aSRaphael Isemann 
22465ffd940aSRaphael Isemann bool FileCheckString::CheckNext(const SourceMgr &SM, StringRef Buffer) const {
22475ffd940aSRaphael Isemann   if (Pat.getCheckTy() != Check::CheckNext &&
22485ffd940aSRaphael Isemann       Pat.getCheckTy() != Check::CheckEmpty)
22495ffd940aSRaphael Isemann     return false;
22505ffd940aSRaphael Isemann 
22515ffd940aSRaphael Isemann   Twine CheckName =
22525ffd940aSRaphael Isemann       Prefix +
22535ffd940aSRaphael Isemann       Twine(Pat.getCheckTy() == Check::CheckEmpty ? "-EMPTY" : "-NEXT");
22545ffd940aSRaphael Isemann 
22555ffd940aSRaphael Isemann   // Count the number of newlines between the previous match and this one.
22565ffd940aSRaphael Isemann   const char *FirstNewLine = nullptr;
22575ffd940aSRaphael Isemann   unsigned NumNewLines = CountNumNewlinesBetween(Buffer, FirstNewLine);
22585ffd940aSRaphael Isemann 
22595ffd940aSRaphael Isemann   if (NumNewLines == 0) {
22605ffd940aSRaphael Isemann     SM.PrintMessage(Loc, SourceMgr::DK_Error,
22615ffd940aSRaphael Isemann                     CheckName + ": is on the same line as previous match");
22625ffd940aSRaphael Isemann     SM.PrintMessage(SMLoc::getFromPointer(Buffer.end()), SourceMgr::DK_Note,
22635ffd940aSRaphael Isemann                     "'next' match was here");
22645ffd940aSRaphael Isemann     SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), SourceMgr::DK_Note,
22655ffd940aSRaphael Isemann                     "previous match ended here");
22665ffd940aSRaphael Isemann     return true;
22675ffd940aSRaphael Isemann   }
22685ffd940aSRaphael Isemann 
22695ffd940aSRaphael Isemann   if (NumNewLines != 1) {
22705ffd940aSRaphael Isemann     SM.PrintMessage(Loc, SourceMgr::DK_Error,
22715ffd940aSRaphael Isemann                     CheckName +
22725ffd940aSRaphael Isemann                         ": is not on the line after the previous match");
22735ffd940aSRaphael Isemann     SM.PrintMessage(SMLoc::getFromPointer(Buffer.end()), SourceMgr::DK_Note,
22745ffd940aSRaphael Isemann                     "'next' match was here");
22755ffd940aSRaphael Isemann     SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), SourceMgr::DK_Note,
22765ffd940aSRaphael Isemann                     "previous match ended here");
22775ffd940aSRaphael Isemann     SM.PrintMessage(SMLoc::getFromPointer(FirstNewLine), SourceMgr::DK_Note,
22785ffd940aSRaphael Isemann                     "non-matching line after previous match is here");
22795ffd940aSRaphael Isemann     return true;
22805ffd940aSRaphael Isemann   }
22815ffd940aSRaphael Isemann 
22825ffd940aSRaphael Isemann   return false;
22835ffd940aSRaphael Isemann }
22845ffd940aSRaphael Isemann 
22855ffd940aSRaphael Isemann bool FileCheckString::CheckSame(const SourceMgr &SM, StringRef Buffer) const {
22865ffd940aSRaphael Isemann   if (Pat.getCheckTy() != Check::CheckSame)
22875ffd940aSRaphael Isemann     return false;
22885ffd940aSRaphael Isemann 
22895ffd940aSRaphael Isemann   // Count the number of newlines between the previous match and this one.
22905ffd940aSRaphael Isemann   const char *FirstNewLine = nullptr;
22915ffd940aSRaphael Isemann   unsigned NumNewLines = CountNumNewlinesBetween(Buffer, FirstNewLine);
22925ffd940aSRaphael Isemann 
22935ffd940aSRaphael Isemann   if (NumNewLines != 0) {
22945ffd940aSRaphael Isemann     SM.PrintMessage(Loc, SourceMgr::DK_Error,
22955ffd940aSRaphael Isemann                     Prefix +
22965ffd940aSRaphael Isemann                         "-SAME: is not on the same line as the previous match");
22975ffd940aSRaphael Isemann     SM.PrintMessage(SMLoc::getFromPointer(Buffer.end()), SourceMgr::DK_Note,
22985ffd940aSRaphael Isemann                     "'next' match was here");
22995ffd940aSRaphael Isemann     SM.PrintMessage(SMLoc::getFromPointer(Buffer.data()), SourceMgr::DK_Note,
23005ffd940aSRaphael Isemann                     "previous match ended here");
23015ffd940aSRaphael Isemann     return true;
23025ffd940aSRaphael Isemann   }
23035ffd940aSRaphael Isemann 
23045ffd940aSRaphael Isemann   return false;
23055ffd940aSRaphael Isemann }
23065ffd940aSRaphael Isemann 
2307497a8604SVinayak Dev bool FileCheckString::CheckNot(
2308497a8604SVinayak Dev     const SourceMgr &SM, StringRef Buffer,
2309497a8604SVinayak Dev     const std::vector<const DagNotPrefixInfo *> &NotStrings,
2310497a8604SVinayak Dev     const FileCheckRequest &Req, std::vector<FileCheckDiag> *Diags) const {
23115ffd940aSRaphael Isemann   bool DirectiveFail = false;
2312497a8604SVinayak Dev   for (auto NotInfo : NotStrings) {
2313497a8604SVinayak Dev     assert((NotInfo->DagNotPat.getCheckTy() == Check::CheckNot) &&
2314497a8604SVinayak Dev            "Expect CHECK-NOT!");
2315497a8604SVinayak Dev     Pattern::MatchResult MatchResult = NotInfo->DagNotPat.match(Buffer, SM);
2316497a8604SVinayak Dev     if (Error Err = reportMatchResult(
2317497a8604SVinayak Dev             /*ExpectedMatch=*/false, SM, NotInfo->DagNotPrefix,
2318497a8604SVinayak Dev             NotInfo->DagNotPat.getLoc(), NotInfo->DagNotPat, 1, Buffer,
2319dd59c132SJoel E. Denny             std::move(MatchResult), Req, Diags)) {
2320dd59c132SJoel E. Denny       cantFail(handleErrors(std::move(Err), [&](const ErrorReported &E) {}));
2321dd59c132SJoel E. Denny       DirectiveFail = true;
23225ffd940aSRaphael Isemann       continue;
23235ffd940aSRaphael Isemann     }
23245ffd940aSRaphael Isemann   }
23255ffd940aSRaphael Isemann   return DirectiveFail;
23265ffd940aSRaphael Isemann }
23275ffd940aSRaphael Isemann 
2328497a8604SVinayak Dev size_t
2329497a8604SVinayak Dev FileCheckString::CheckDag(const SourceMgr &SM, StringRef Buffer,
2330497a8604SVinayak Dev                           std::vector<const DagNotPrefixInfo *> &NotStrings,
23315ffd940aSRaphael Isemann                           const FileCheckRequest &Req,
23325ffd940aSRaphael Isemann                           std::vector<FileCheckDiag> *Diags) const {
23335ffd940aSRaphael Isemann   if (DagNotStrings.empty())
23345ffd940aSRaphael Isemann     return 0;
23355ffd940aSRaphael Isemann 
23365ffd940aSRaphael Isemann   // The start of the search range.
23375ffd940aSRaphael Isemann   size_t StartPos = 0;
23385ffd940aSRaphael Isemann 
23395ffd940aSRaphael Isemann   struct MatchRange {
23405ffd940aSRaphael Isemann     size_t Pos;
23415ffd940aSRaphael Isemann     size_t End;
23425ffd940aSRaphael Isemann   };
23435ffd940aSRaphael Isemann   // A sorted list of ranges for non-overlapping CHECK-DAG matches.  Match
23445ffd940aSRaphael Isemann   // ranges are erased from this list once they are no longer in the search
23455ffd940aSRaphael Isemann   // range.
23465ffd940aSRaphael Isemann   std::list<MatchRange> MatchRanges;
23475ffd940aSRaphael Isemann 
23485ffd940aSRaphael Isemann   // We need PatItr and PatEnd later for detecting the end of a CHECK-DAG
23495ffd940aSRaphael Isemann   // group, so we don't use a range-based for loop here.
23505ffd940aSRaphael Isemann   for (auto PatItr = DagNotStrings.begin(), PatEnd = DagNotStrings.end();
23515ffd940aSRaphael Isemann        PatItr != PatEnd; ++PatItr) {
2352497a8604SVinayak Dev     const Pattern &Pat = PatItr->DagNotPat;
2353497a8604SVinayak Dev     const StringRef DNPrefix = PatItr->DagNotPrefix;
23545ffd940aSRaphael Isemann     assert((Pat.getCheckTy() == Check::CheckDAG ||
23555ffd940aSRaphael Isemann             Pat.getCheckTy() == Check::CheckNot) &&
23565ffd940aSRaphael Isemann            "Invalid CHECK-DAG or CHECK-NOT!");
23575ffd940aSRaphael Isemann 
23585ffd940aSRaphael Isemann     if (Pat.getCheckTy() == Check::CheckNot) {
2359497a8604SVinayak Dev       NotStrings.push_back(&*PatItr);
23605ffd940aSRaphael Isemann       continue;
23615ffd940aSRaphael Isemann     }
23625ffd940aSRaphael Isemann 
23635ffd940aSRaphael Isemann     assert((Pat.getCheckTy() == Check::CheckDAG) && "Expect CHECK-DAG!");
23645ffd940aSRaphael Isemann 
23655ffd940aSRaphael Isemann     // CHECK-DAG always matches from the start.
23665ffd940aSRaphael Isemann     size_t MatchLen = 0, MatchPos = StartPos;
23675ffd940aSRaphael Isemann 
23685ffd940aSRaphael Isemann     // Search for a match that doesn't overlap a previous match in this
23695ffd940aSRaphael Isemann     // CHECK-DAG group.
23705ffd940aSRaphael Isemann     for (auto MI = MatchRanges.begin(), ME = MatchRanges.end(); true; ++MI) {
23715ffd940aSRaphael Isemann       StringRef MatchBuffer = Buffer.substr(MatchPos);
2372dd59c132SJoel E. Denny       Pattern::MatchResult MatchResult = Pat.match(MatchBuffer, SM);
23735ffd940aSRaphael Isemann       // With a group of CHECK-DAGs, a single mismatching means the match on
23745ffd940aSRaphael Isemann       // that group of CHECK-DAGs fails immediately.
2375dd59c132SJoel E. Denny       if (MatchResult.TheError || Req.VerboseVerbose) {
2376497a8604SVinayak Dev         if (Error Err = reportMatchResult(/*ExpectedMatch=*/true, SM, DNPrefix,
2377dd59c132SJoel E. Denny                                           Pat.getLoc(), Pat, 1, MatchBuffer,
2378dd59c132SJoel E. Denny                                           std::move(MatchResult), Req, Diags)) {
2379dd59c132SJoel E. Denny           cantFail(
2380dd59c132SJoel E. Denny               handleErrors(std::move(Err), [&](const ErrorReported &E) {}));
23815ffd940aSRaphael Isemann           return StringRef::npos;
23825ffd940aSRaphael Isemann         }
2383dd59c132SJoel E. Denny       }
2384dd59c132SJoel E. Denny       MatchLen = MatchResult.TheMatch->Len;
2385dd59c132SJoel E. Denny       // Re-calc it as the offset relative to the start of the original
2386dd59c132SJoel E. Denny       // string.
2387dd59c132SJoel E. Denny       MatchPos += MatchResult.TheMatch->Pos;
23885ffd940aSRaphael Isemann       MatchRange M{MatchPos, MatchPos + MatchLen};
23895ffd940aSRaphael Isemann       if (Req.AllowDeprecatedDagOverlap) {
23905ffd940aSRaphael Isemann         // We don't need to track all matches in this mode, so we just maintain
23915ffd940aSRaphael Isemann         // one match range that encompasses the current CHECK-DAG group's
23925ffd940aSRaphael Isemann         // matches.
23935ffd940aSRaphael Isemann         if (MatchRanges.empty())
23945ffd940aSRaphael Isemann           MatchRanges.insert(MatchRanges.end(), M);
23955ffd940aSRaphael Isemann         else {
23965ffd940aSRaphael Isemann           auto Block = MatchRanges.begin();
23975ffd940aSRaphael Isemann           Block->Pos = std::min(Block->Pos, M.Pos);
23985ffd940aSRaphael Isemann           Block->End = std::max(Block->End, M.End);
23995ffd940aSRaphael Isemann         }
24005ffd940aSRaphael Isemann         break;
24015ffd940aSRaphael Isemann       }
24025ffd940aSRaphael Isemann       // Iterate previous matches until overlapping match or insertion point.
24035ffd940aSRaphael Isemann       bool Overlap = false;
24045ffd940aSRaphael Isemann       for (; MI != ME; ++MI) {
24055ffd940aSRaphael Isemann         if (M.Pos < MI->End) {
24065ffd940aSRaphael Isemann           // !Overlap => New match has no overlap and is before this old match.
24075ffd940aSRaphael Isemann           // Overlap => New match overlaps this old match.
24085ffd940aSRaphael Isemann           Overlap = MI->Pos < M.End;
24095ffd940aSRaphael Isemann           break;
24105ffd940aSRaphael Isemann         }
24115ffd940aSRaphael Isemann       }
24125ffd940aSRaphael Isemann       if (!Overlap) {
24135ffd940aSRaphael Isemann         // Insert non-overlapping match into list.
24145ffd940aSRaphael Isemann         MatchRanges.insert(MI, M);
24155ffd940aSRaphael Isemann         break;
24165ffd940aSRaphael Isemann       }
24175ffd940aSRaphael Isemann       if (Req.VerboseVerbose) {
24185ffd940aSRaphael Isemann         // Due to their verbosity, we don't print verbose diagnostics here if
24195ffd940aSRaphael Isemann         // we're gathering them for a different rendering, but we always print
24205ffd940aSRaphael Isemann         // other diagnostics.
24215ffd940aSRaphael Isemann         if (!Diags) {
24225ffd940aSRaphael Isemann           SMLoc OldStart = SMLoc::getFromPointer(Buffer.data() + MI->Pos);
24235ffd940aSRaphael Isemann           SMLoc OldEnd = SMLoc::getFromPointer(Buffer.data() + MI->End);
24245ffd940aSRaphael Isemann           SMRange OldRange(OldStart, OldEnd);
24255ffd940aSRaphael Isemann           SM.PrintMessage(OldStart, SourceMgr::DK_Note,
24265ffd940aSRaphael Isemann                           "match discarded, overlaps earlier DAG match here",
24275ffd940aSRaphael Isemann                           {OldRange});
24285ffd940aSRaphael Isemann         } else {
24295ffd940aSRaphael Isemann           SMLoc CheckLoc = Diags->rbegin()->CheckLoc;
24305ffd940aSRaphael Isemann           for (auto I = Diags->rbegin(), E = Diags->rend();
24315ffd940aSRaphael Isemann                I != E && I->CheckLoc == CheckLoc; ++I)
24325ffd940aSRaphael Isemann             I->MatchTy = FileCheckDiag::MatchFoundButDiscarded;
24335ffd940aSRaphael Isemann         }
24345ffd940aSRaphael Isemann       }
24355ffd940aSRaphael Isemann       MatchPos = MI->End;
24365ffd940aSRaphael Isemann     }
24375ffd940aSRaphael Isemann     if (!Req.VerboseVerbose)
2438dd59c132SJoel E. Denny       cantFail(printMatch(
2439497a8604SVinayak Dev           /*ExpectedMatch=*/true, SM, DNPrefix, Pat.getLoc(), Pat, 1, Buffer,
2440dd59c132SJoel E. Denny           Pattern::MatchResult(MatchPos, MatchLen, Error::success()), Req,
2441dd59c132SJoel E. Denny           Diags));
24425ffd940aSRaphael Isemann 
24435ffd940aSRaphael Isemann     // Handle the end of a CHECK-DAG group.
24445ffd940aSRaphael Isemann     if (std::next(PatItr) == PatEnd ||
2445497a8604SVinayak Dev         std::next(PatItr)->DagNotPat.getCheckTy() == Check::CheckNot) {
24465ffd940aSRaphael Isemann       if (!NotStrings.empty()) {
24475ffd940aSRaphael Isemann         // If there are CHECK-NOTs between two CHECK-DAGs or from CHECK to
24485ffd940aSRaphael Isemann         // CHECK-DAG, verify that there are no 'not' strings occurred in that
24495ffd940aSRaphael Isemann         // region.
24505ffd940aSRaphael Isemann         StringRef SkippedRegion =
24515ffd940aSRaphael Isemann             Buffer.slice(StartPos, MatchRanges.begin()->Pos);
24525ffd940aSRaphael Isemann         if (CheckNot(SM, SkippedRegion, NotStrings, Req, Diags))
24535ffd940aSRaphael Isemann           return StringRef::npos;
24545ffd940aSRaphael Isemann         // Clear "not strings".
24555ffd940aSRaphael Isemann         NotStrings.clear();
24565ffd940aSRaphael Isemann       }
24575ffd940aSRaphael Isemann       // All subsequent CHECK-DAGs and CHECK-NOTs should be matched from the
24585ffd940aSRaphael Isemann       // end of this CHECK-DAG group's match range.
24595ffd940aSRaphael Isemann       StartPos = MatchRanges.rbegin()->End;
24605ffd940aSRaphael Isemann       // Don't waste time checking for (impossible) overlaps before that.
24615ffd940aSRaphael Isemann       MatchRanges.clear();
24625ffd940aSRaphael Isemann     }
24635ffd940aSRaphael Isemann   }
24645ffd940aSRaphael Isemann 
24655ffd940aSRaphael Isemann   return StartPos;
24665ffd940aSRaphael Isemann }
24675ffd940aSRaphael Isemann 
24685ffd940aSRaphael Isemann static bool ValidatePrefixes(StringRef Kind, StringSet<> &UniquePrefixes,
24695ffd940aSRaphael Isemann                              ArrayRef<StringRef> SuppliedPrefixes) {
24705ffd940aSRaphael Isemann   for (StringRef Prefix : SuppliedPrefixes) {
24715ffd940aSRaphael Isemann     if (Prefix.empty()) {
24725ffd940aSRaphael Isemann       errs() << "error: supplied " << Kind << " prefix must not be the empty "
24735ffd940aSRaphael Isemann              << "string\n";
24745ffd940aSRaphael Isemann       return false;
24755ffd940aSRaphael Isemann     }
24765ffd940aSRaphael Isemann     static const Regex Validator("^[a-zA-Z0-9_-]*$");
24775ffd940aSRaphael Isemann     if (!Validator.match(Prefix)) {
24785ffd940aSRaphael Isemann       errs() << "error: supplied " << Kind << " prefix must start with a "
24795ffd940aSRaphael Isemann              << "letter and contain only alphanumeric characters, hyphens, and "
24805ffd940aSRaphael Isemann              << "underscores: '" << Prefix << "'\n";
24815ffd940aSRaphael Isemann       return false;
24825ffd940aSRaphael Isemann     }
24835ffd940aSRaphael Isemann     if (!UniquePrefixes.insert(Prefix).second) {
24845ffd940aSRaphael Isemann       errs() << "error: supplied " << Kind << " prefix must be unique among "
24855ffd940aSRaphael Isemann              << "check and comment prefixes: '" << Prefix << "'\n";
24865ffd940aSRaphael Isemann       return false;
24875ffd940aSRaphael Isemann     }
24885ffd940aSRaphael Isemann   }
24895ffd940aSRaphael Isemann   return true;
24905ffd940aSRaphael Isemann }
24915ffd940aSRaphael Isemann 
24925ffd940aSRaphael Isemann bool FileCheck::ValidateCheckPrefixes() {
24935ffd940aSRaphael Isemann   StringSet<> UniquePrefixes;
24945ffd940aSRaphael Isemann   // Add default prefixes to catch user-supplied duplicates of them below.
24955ffd940aSRaphael Isemann   if (Req.CheckPrefixes.empty()) {
24965ffd940aSRaphael Isemann     for (const char *Prefix : DefaultCheckPrefixes)
24975ffd940aSRaphael Isemann       UniquePrefixes.insert(Prefix);
24985ffd940aSRaphael Isemann   }
24995ffd940aSRaphael Isemann   if (Req.CommentPrefixes.empty()) {
25005ffd940aSRaphael Isemann     for (const char *Prefix : DefaultCommentPrefixes)
25015ffd940aSRaphael Isemann       UniquePrefixes.insert(Prefix);
25025ffd940aSRaphael Isemann   }
25035ffd940aSRaphael Isemann   // Do not validate the default prefixes, or diagnostics about duplicates might
25045ffd940aSRaphael Isemann   // incorrectly indicate that they were supplied by the user.
25055ffd940aSRaphael Isemann   if (!ValidatePrefixes("check", UniquePrefixes, Req.CheckPrefixes))
25065ffd940aSRaphael Isemann     return false;
25075ffd940aSRaphael Isemann   if (!ValidatePrefixes("comment", UniquePrefixes, Req.CommentPrefixes))
25085ffd940aSRaphael Isemann     return false;
25095ffd940aSRaphael Isemann   return true;
25105ffd940aSRaphael Isemann }
25115ffd940aSRaphael Isemann 
25125ffd940aSRaphael Isemann Error FileCheckPatternContext::defineCmdlineVariables(
25135ffd940aSRaphael Isemann     ArrayRef<StringRef> CmdlineDefines, SourceMgr &SM) {
25145ffd940aSRaphael Isemann   assert(GlobalVariableTable.empty() && GlobalNumericVariableTable.empty() &&
25155ffd940aSRaphael Isemann          "Overriding defined variable with command-line variable definitions");
25165ffd940aSRaphael Isemann 
25175ffd940aSRaphael Isemann   if (CmdlineDefines.empty())
25185ffd940aSRaphael Isemann     return Error::success();
25195ffd940aSRaphael Isemann 
25205ffd940aSRaphael Isemann   // Create a string representing the vector of command-line definitions. Each
25215ffd940aSRaphael Isemann   // definition is on its own line and prefixed with a definition number to
25225ffd940aSRaphael Isemann   // clarify which definition a given diagnostic corresponds to.
25235ffd940aSRaphael Isemann   unsigned I = 0;
25245ffd940aSRaphael Isemann   Error Errs = Error::success();
25255ffd940aSRaphael Isemann   std::string CmdlineDefsDiag;
25265ffd940aSRaphael Isemann   SmallVector<std::pair<size_t, size_t>, 4> CmdlineDefsIndices;
25275ffd940aSRaphael Isemann   for (StringRef CmdlineDef : CmdlineDefines) {
25285ffd940aSRaphael Isemann     std::string DefPrefix = ("Global define #" + Twine(++I) + ": ").str();
25295ffd940aSRaphael Isemann     size_t EqIdx = CmdlineDef.find('=');
25305ffd940aSRaphael Isemann     if (EqIdx == StringRef::npos) {
25315ffd940aSRaphael Isemann       CmdlineDefsIndices.push_back(std::make_pair(CmdlineDefsDiag.size(), 0));
25325ffd940aSRaphael Isemann       continue;
25335ffd940aSRaphael Isemann     }
25345ffd940aSRaphael Isemann     // Numeric variable definition.
25355ffd940aSRaphael Isemann     if (CmdlineDef[0] == '#') {
25365ffd940aSRaphael Isemann       // Append a copy of the command-line definition adapted to use the same
25375ffd940aSRaphael Isemann       // format as in the input file to be able to reuse
25385ffd940aSRaphael Isemann       // parseNumericSubstitutionBlock.
25395ffd940aSRaphael Isemann       CmdlineDefsDiag += (DefPrefix + CmdlineDef + " (parsed as: [[").str();
25405ffd940aSRaphael Isemann       std::string SubstitutionStr = std::string(CmdlineDef);
25415ffd940aSRaphael Isemann       SubstitutionStr[EqIdx] = ':';
25425ffd940aSRaphael Isemann       CmdlineDefsIndices.push_back(
25435ffd940aSRaphael Isemann           std::make_pair(CmdlineDefsDiag.size(), SubstitutionStr.size()));
25445ffd940aSRaphael Isemann       CmdlineDefsDiag += (SubstitutionStr + Twine("]])\n")).str();
25455ffd940aSRaphael Isemann     } else {
25465ffd940aSRaphael Isemann       CmdlineDefsDiag += DefPrefix;
25475ffd940aSRaphael Isemann       CmdlineDefsIndices.push_back(
25485ffd940aSRaphael Isemann           std::make_pair(CmdlineDefsDiag.size(), CmdlineDef.size()));
25495ffd940aSRaphael Isemann       CmdlineDefsDiag += (CmdlineDef + "\n").str();
25505ffd940aSRaphael Isemann     }
25515ffd940aSRaphael Isemann   }
25525ffd940aSRaphael Isemann 
25535ffd940aSRaphael Isemann   // Create a buffer with fake command line content in order to display
25545ffd940aSRaphael Isemann   // parsing diagnostic with location information and point to the
25555ffd940aSRaphael Isemann   // global definition with invalid syntax.
25565ffd940aSRaphael Isemann   std::unique_ptr<MemoryBuffer> CmdLineDefsDiagBuffer =
25575ffd940aSRaphael Isemann       MemoryBuffer::getMemBufferCopy(CmdlineDefsDiag, "Global defines");
25585ffd940aSRaphael Isemann   StringRef CmdlineDefsDiagRef = CmdLineDefsDiagBuffer->getBuffer();
25595ffd940aSRaphael Isemann   SM.AddNewSourceBuffer(std::move(CmdLineDefsDiagBuffer), SMLoc());
25605ffd940aSRaphael Isemann 
25615ffd940aSRaphael Isemann   for (std::pair<size_t, size_t> CmdlineDefIndices : CmdlineDefsIndices) {
25625ffd940aSRaphael Isemann     StringRef CmdlineDef = CmdlineDefsDiagRef.substr(CmdlineDefIndices.first,
25635ffd940aSRaphael Isemann                                                      CmdlineDefIndices.second);
25645ffd940aSRaphael Isemann     if (CmdlineDef.empty()) {
25655ffd940aSRaphael Isemann       Errs = joinErrors(
25665ffd940aSRaphael Isemann           std::move(Errs),
25675ffd940aSRaphael Isemann           ErrorDiagnostic::get(SM, CmdlineDef,
25685ffd940aSRaphael Isemann                                "missing equal sign in global definition"));
25695ffd940aSRaphael Isemann       continue;
25705ffd940aSRaphael Isemann     }
25715ffd940aSRaphael Isemann 
25725ffd940aSRaphael Isemann     // Numeric variable definition.
25735ffd940aSRaphael Isemann     if (CmdlineDef[0] == '#') {
25745ffd940aSRaphael Isemann       // Now parse the definition both to check that the syntax is correct and
25755ffd940aSRaphael Isemann       // to create the necessary class instance.
25765ffd940aSRaphael Isemann       StringRef CmdlineDefExpr = CmdlineDef.substr(1);
257794081642SFangrui Song       std::optional<NumericVariable *> DefinedNumericVariable;
25785ffd940aSRaphael Isemann       Expected<std::unique_ptr<Expression>> ExpressionResult =
2579aadaafacSKazu Hirata           Pattern::parseNumericSubstitutionBlock(CmdlineDefExpr,
2580aadaafacSKazu Hirata                                                  DefinedNumericVariable, false,
2581aadaafacSKazu Hirata                                                  std::nullopt, this, SM);
25825ffd940aSRaphael Isemann       if (!ExpressionResult) {
25835ffd940aSRaphael Isemann         Errs = joinErrors(std::move(Errs), ExpressionResult.takeError());
25845ffd940aSRaphael Isemann         continue;
25855ffd940aSRaphael Isemann       }
25865ffd940aSRaphael Isemann       std::unique_ptr<Expression> Expression = std::move(*ExpressionResult);
25875ffd940aSRaphael Isemann       // Now evaluate the expression whose value this variable should be set
25885ffd940aSRaphael Isemann       // to, since the expression of a command-line variable definition should
25895ffd940aSRaphael Isemann       // only use variables defined earlier on the command-line. If not, this
25905ffd940aSRaphael Isemann       // is an error and we report it.
2591e15e969aSThomas Preud'homme       Expected<APInt> Value = Expression->getAST()->eval();
25925ffd940aSRaphael Isemann       if (!Value) {
25935ffd940aSRaphael Isemann         Errs = joinErrors(std::move(Errs), Value.takeError());
25945ffd940aSRaphael Isemann         continue;
25955ffd940aSRaphael Isemann       }
25965ffd940aSRaphael Isemann 
25975ffd940aSRaphael Isemann       assert(DefinedNumericVariable && "No variable defined");
25985ffd940aSRaphael Isemann       (*DefinedNumericVariable)->setValue(*Value);
25995ffd940aSRaphael Isemann 
26005ffd940aSRaphael Isemann       // Record this variable definition.
26015ffd940aSRaphael Isemann       GlobalNumericVariableTable[(*DefinedNumericVariable)->getName()] =
26025ffd940aSRaphael Isemann           *DefinedNumericVariable;
26035ffd940aSRaphael Isemann     } else {
26045ffd940aSRaphael Isemann       // String variable definition.
26055ffd940aSRaphael Isemann       std::pair<StringRef, StringRef> CmdlineNameVal = CmdlineDef.split('=');
26065ffd940aSRaphael Isemann       StringRef CmdlineName = CmdlineNameVal.first;
26075ffd940aSRaphael Isemann       StringRef OrigCmdlineName = CmdlineName;
26085ffd940aSRaphael Isemann       Expected<Pattern::VariableProperties> ParseVarResult =
26095ffd940aSRaphael Isemann           Pattern::parseVariable(CmdlineName, SM);
26105ffd940aSRaphael Isemann       if (!ParseVarResult) {
26115ffd940aSRaphael Isemann         Errs = joinErrors(std::move(Errs), ParseVarResult.takeError());
26125ffd940aSRaphael Isemann         continue;
26135ffd940aSRaphael Isemann       }
26145ffd940aSRaphael Isemann       // Check that CmdlineName does not denote a pseudo variable is only
26155ffd940aSRaphael Isemann       // composed of the parsed numeric variable. This catches cases like
26165ffd940aSRaphael Isemann       // "FOO+2" in a "FOO+2=10" definition.
26175ffd940aSRaphael Isemann       if (ParseVarResult->IsPseudo || !CmdlineName.empty()) {
26185ffd940aSRaphael Isemann         Errs = joinErrors(std::move(Errs),
26195ffd940aSRaphael Isemann                           ErrorDiagnostic::get(
26205ffd940aSRaphael Isemann                               SM, OrigCmdlineName,
26215ffd940aSRaphael Isemann                               "invalid name in string variable definition '" +
26225ffd940aSRaphael Isemann                                   OrigCmdlineName + "'"));
26235ffd940aSRaphael Isemann         continue;
26245ffd940aSRaphael Isemann       }
26255ffd940aSRaphael Isemann       StringRef Name = ParseVarResult->Name;
26265ffd940aSRaphael Isemann 
26275ffd940aSRaphael Isemann       // Detect collisions between string and numeric variables when the former
26285ffd940aSRaphael Isemann       // is created later than the latter.
2629b595eb83SKazu Hirata       if (GlobalNumericVariableTable.contains(Name)) {
26305ffd940aSRaphael Isemann         Errs = joinErrors(std::move(Errs),
26315ffd940aSRaphael Isemann                           ErrorDiagnostic::get(SM, Name,
26325ffd940aSRaphael Isemann                                                "numeric variable with name '" +
26335ffd940aSRaphael Isemann                                                    Name + "' already exists"));
26345ffd940aSRaphael Isemann         continue;
26355ffd940aSRaphael Isemann       }
26365ffd940aSRaphael Isemann       GlobalVariableTable.insert(CmdlineNameVal);
26375ffd940aSRaphael Isemann       // Mark the string variable as defined to detect collisions between
26385ffd940aSRaphael Isemann       // string and numeric variables in defineCmdlineVariables when the latter
26395ffd940aSRaphael Isemann       // is created later than the former. We cannot reuse GlobalVariableTable
26405ffd940aSRaphael Isemann       // for this by populating it with an empty string since we would then
26415ffd940aSRaphael Isemann       // lose the ability to detect the use of an undefined variable in
26425ffd940aSRaphael Isemann       // match().
26435ffd940aSRaphael Isemann       DefinedVariableTable[Name] = true;
26445ffd940aSRaphael Isemann     }
26455ffd940aSRaphael Isemann   }
26465ffd940aSRaphael Isemann 
26475ffd940aSRaphael Isemann   return Errs;
26485ffd940aSRaphael Isemann }
26495ffd940aSRaphael Isemann 
26505ffd940aSRaphael Isemann void FileCheckPatternContext::clearLocalVars() {
26515ffd940aSRaphael Isemann   SmallVector<StringRef, 16> LocalPatternVars, LocalNumericVars;
26525ffd940aSRaphael Isemann   for (const StringMapEntry<StringRef> &Var : GlobalVariableTable)
26535ffd940aSRaphael Isemann     if (Var.first()[0] != '$')
26545ffd940aSRaphael Isemann       LocalPatternVars.push_back(Var.first());
26555ffd940aSRaphael Isemann 
26565ffd940aSRaphael Isemann   // Numeric substitution reads the value of a variable directly, not via
26575ffd940aSRaphael Isemann   // GlobalNumericVariableTable. Therefore, we clear local variables by
26585ffd940aSRaphael Isemann   // clearing their value which will lead to a numeric substitution failure. We
26595ffd940aSRaphael Isemann   // also mark the variable for removal from GlobalNumericVariableTable since
26605ffd940aSRaphael Isemann   // this is what defineCmdlineVariables checks to decide that no global
26615ffd940aSRaphael Isemann   // variable has been defined.
26625ffd940aSRaphael Isemann   for (const auto &Var : GlobalNumericVariableTable)
26635ffd940aSRaphael Isemann     if (Var.first()[0] != '$') {
26645ffd940aSRaphael Isemann       Var.getValue()->clearValue();
26655ffd940aSRaphael Isemann       LocalNumericVars.push_back(Var.first());
26665ffd940aSRaphael Isemann     }
26675ffd940aSRaphael Isemann 
26685ffd940aSRaphael Isemann   for (const auto &Var : LocalPatternVars)
26695ffd940aSRaphael Isemann     GlobalVariableTable.erase(Var);
26705ffd940aSRaphael Isemann   for (const auto &Var : LocalNumericVars)
26715ffd940aSRaphael Isemann     GlobalNumericVariableTable.erase(Var);
26725ffd940aSRaphael Isemann }
26735ffd940aSRaphael Isemann 
26745ffd940aSRaphael Isemann bool FileCheck::checkInput(SourceMgr &SM, StringRef Buffer,
26755ffd940aSRaphael Isemann                            std::vector<FileCheckDiag> *Diags) {
26765ffd940aSRaphael Isemann   bool ChecksFailed = false;
26775ffd940aSRaphael Isemann 
2678c10e8261SJay Foad   unsigned i = 0, j = 0, e = CheckStrings.size();
26795ffd940aSRaphael Isemann   while (true) {
26805ffd940aSRaphael Isemann     StringRef CheckRegion;
26815ffd940aSRaphael Isemann     if (j == e) {
26825ffd940aSRaphael Isemann       CheckRegion = Buffer;
26835ffd940aSRaphael Isemann     } else {
2684c10e8261SJay Foad       const FileCheckString &CheckLabelStr = CheckStrings[j];
26855ffd940aSRaphael Isemann       if (CheckLabelStr.Pat.getCheckTy() != Check::CheckLabel) {
26865ffd940aSRaphael Isemann         ++j;
26875ffd940aSRaphael Isemann         continue;
26885ffd940aSRaphael Isemann       }
26895ffd940aSRaphael Isemann 
26905ffd940aSRaphael Isemann       // Scan to next CHECK-LABEL match, ignoring CHECK-NOT and CHECK-DAG
26915ffd940aSRaphael Isemann       size_t MatchLabelLen = 0;
26925ffd940aSRaphael Isemann       size_t MatchLabelPos =
26935ffd940aSRaphael Isemann           CheckLabelStr.Check(SM, Buffer, true, MatchLabelLen, Req, Diags);
26945ffd940aSRaphael Isemann       if (MatchLabelPos == StringRef::npos)
26955ffd940aSRaphael Isemann         // Immediately bail if CHECK-LABEL fails, nothing else we can do.
26965ffd940aSRaphael Isemann         return false;
26975ffd940aSRaphael Isemann 
26985ffd940aSRaphael Isemann       CheckRegion = Buffer.substr(0, MatchLabelPos + MatchLabelLen);
26995ffd940aSRaphael Isemann       Buffer = Buffer.substr(MatchLabelPos + MatchLabelLen);
27005ffd940aSRaphael Isemann       ++j;
27015ffd940aSRaphael Isemann     }
27025ffd940aSRaphael Isemann 
27035ffd940aSRaphael Isemann     // Do not clear the first region as it's the one before the first
27045ffd940aSRaphael Isemann     // CHECK-LABEL and it would clear variables defined on the command-line
27055ffd940aSRaphael Isemann     // before they get used.
27065ffd940aSRaphael Isemann     if (i != 0 && Req.EnableVarScope)
27075ffd940aSRaphael Isemann       PatternContext->clearLocalVars();
27085ffd940aSRaphael Isemann 
27095ffd940aSRaphael Isemann     for (; i != j; ++i) {
2710c10e8261SJay Foad       const FileCheckString &CheckStr = CheckStrings[i];
27115ffd940aSRaphael Isemann 
27125ffd940aSRaphael Isemann       // Check each string within the scanned region, including a second check
27135ffd940aSRaphael Isemann       // of any final CHECK-LABEL (to verify CHECK-NOT and CHECK-DAG)
27145ffd940aSRaphael Isemann       size_t MatchLen = 0;
27155ffd940aSRaphael Isemann       size_t MatchPos =
27165ffd940aSRaphael Isemann           CheckStr.Check(SM, CheckRegion, false, MatchLen, Req, Diags);
27175ffd940aSRaphael Isemann 
27185ffd940aSRaphael Isemann       if (MatchPos == StringRef::npos) {
27195ffd940aSRaphael Isemann         ChecksFailed = true;
27205ffd940aSRaphael Isemann         i = j;
27215ffd940aSRaphael Isemann         break;
27225ffd940aSRaphael Isemann       }
27235ffd940aSRaphael Isemann 
27245ffd940aSRaphael Isemann       CheckRegion = CheckRegion.substr(MatchPos + MatchLen);
27255ffd940aSRaphael Isemann     }
27265ffd940aSRaphael Isemann 
27275ffd940aSRaphael Isemann     if (j == e)
27285ffd940aSRaphael Isemann       break;
27295ffd940aSRaphael Isemann   }
27305ffd940aSRaphael Isemann 
27315ffd940aSRaphael Isemann   // Success if no checks failed.
27325ffd940aSRaphael Isemann   return !ChecksFailed;
27335ffd940aSRaphael Isemann }
2734