1//===-- FileCheckImpl.h - Private FileCheck Interface ------------*- C++ -*-==//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file defines the private interfaces of FileCheck. Its purpose is to
10// allow unit testing of FileCheck and to separate the interface from the
11// implementation. It is only meant to be used by FileCheck.
12//
13//===----------------------------------------------------------------------===//
14
15#ifndef LLVM_LIB_FILECHECK_FILECHECKIMPL_H
16#define LLVM_LIB_FILECHECK_FILECHECKIMPL_H
17
#include "llvm/ADT/APInt.h"
#include "llvm/ADT/StringMap.h"
#include "llvm/ADT/StringRef.h"
#include "llvm/FileCheck/FileCheck.h"
#include "llvm/Support/Error.h"
#include "llvm/Support/SourceMgr.h"
#include <map>
#include <memory>
#include <optional>
#include <string>
#include <utility>
#include <vector>
28
29namespace llvm {
30
31//===----------------------------------------------------------------------===//
32// Numeric substitution handling code.
33//===----------------------------------------------------------------------===//
34
35/// Type representing the format an expression value should be textualized into
36/// for matching. Used to represent both explicit format specifiers as well as
37/// implicit format from using numeric variables.
38struct ExpressionFormat {
39  enum class Kind {
40    /// Denote absence of format. Used for implicit format of literals and
41    /// empty expressions.
42    NoFormat,
43    /// Value is an unsigned integer and should be printed as a decimal number.
44    Unsigned,
45    /// Value is a signed integer and should be printed as a decimal number.
46    Signed,
47    /// Value should be printed as an uppercase hex number.
48    HexUpper,
49    /// Value should be printed as a lowercase hex number.
50    HexLower
51  };
52
53private:
54  Kind Value;
55  unsigned Precision = 0;
56  /// printf-like "alternate form" selected.
57  bool AlternateForm = false;
58
59public:
60  /// Evaluates a format to true if it can be used in a match.
61  explicit operator bool() const { return Value != Kind::NoFormat; }
62
63  /// Define format equality: formats are equal if neither is NoFormat and
64  /// their kinds and precision are the same.
65  bool operator==(const ExpressionFormat &Other) const {
66    return Value != Kind::NoFormat && Value == Other.Value &&
67           Precision == Other.Precision && AlternateForm == Other.AlternateForm;
68  }
69
70  bool operator!=(const ExpressionFormat &Other) const {
71    return !(*this == Other);
72  }
73
74  bool operator==(Kind OtherValue) const { return Value == OtherValue; }
75
76  bool operator!=(Kind OtherValue) const { return !(*this == OtherValue); }
77
78  /// \returns the format specifier corresponding to this format as a string.
79  StringRef toString() const;
80
81  ExpressionFormat() : Value(Kind::NoFormat){};
82  explicit ExpressionFormat(Kind Value) : Value(Value), Precision(0){};
83  explicit ExpressionFormat(Kind Value, unsigned Precision)
84      : Value(Value), Precision(Precision){};
85  explicit ExpressionFormat(Kind Value, unsigned Precision, bool AlternateForm)
86      : Value(Value), Precision(Precision), AlternateForm(AlternateForm){};
87
88  /// \returns a wildcard regular expression string that matches any value in
89  /// the format represented by this instance and no other value, or an error
90  /// if the format is NoFormat.
91  Expected<std::string> getWildcardRegex() const;
92
93  /// \returns the string representation of \p Value in the format represented
94  /// by this instance, or an error if conversion to this format failed or the
95  /// format is NoFormat.
96  Expected<std::string> getMatchingString(APInt Value) const;
97
98  /// \returns the value corresponding to string representation \p StrVal
99  /// according to the matching format represented by this instance.
100  APInt valueFromStringRepr(StringRef StrVal, const SourceMgr &SM) const;
101};
102
103/// Class to represent an overflow error that might result when manipulating a
104/// value.
105class OverflowError : public ErrorInfo<OverflowError> {
106public:
107  static char ID;
108
109  std::error_code convertToErrorCode() const override {
110    return std::make_error_code(std::errc::value_too_large);
111  }
112
113  void log(raw_ostream &OS) const override { OS << "overflow error"; }
114};
115
116/// Performs operation and \returns its result or an error in case of failure,
117/// such as if an overflow occurs.
118Expected<APInt> exprAdd(const APInt &Lhs, const APInt &Rhs, bool &Overflow);
119Expected<APInt> exprSub(const APInt &Lhs, const APInt &Rhs, bool &Overflow);
120Expected<APInt> exprMul(const APInt &Lhs, const APInt &Rhs, bool &Overflow);
121Expected<APInt> exprDiv(const APInt &Lhs, const APInt &Rhs, bool &Overflow);
122Expected<APInt> exprMax(const APInt &Lhs, const APInt &Rhs, bool &Overflow);
123Expected<APInt> exprMin(const APInt &Lhs, const APInt &Rhs, bool &Overflow);
124
125/// Base class representing the AST of a given expression.
126class ExpressionAST {
127private:
128  StringRef ExpressionStr;
129
130public:
131  ExpressionAST(StringRef ExpressionStr) : ExpressionStr(ExpressionStr) {}
132
133  virtual ~ExpressionAST() = default;
134
135  StringRef getExpressionStr() const { return ExpressionStr; }
136
137  /// Evaluates and \returns the value of the expression represented by this
138  /// AST or an error if evaluation fails.
139  virtual Expected<APInt> eval() const = 0;
140
141  /// \returns either the implicit format of this AST, a diagnostic against
142  /// \p SM if implicit formats of the AST's components conflict, or NoFormat
143  /// if the AST has no implicit format (e.g. AST is made up of a single
144  /// literal).
145  virtual Expected<ExpressionFormat>
146  getImplicitFormat(const SourceMgr &SM) const {
147    return ExpressionFormat();
148  }
149};
150
151/// Class representing an unsigned literal in the AST of an expression.
152class ExpressionLiteral : public ExpressionAST {
153private:
154  /// Actual value of the literal.
155  APInt Value;
156
157public:
158  explicit ExpressionLiteral(StringRef ExpressionStr, APInt Val)
159      : ExpressionAST(ExpressionStr), Value(Val) {}
160
161  /// \returns the literal's value.
162  Expected<APInt> eval() const override { return Value; }
163};
164
165/// Class to represent an undefined variable error, which quotes that
166/// variable's name when printed.
167class UndefVarError : public ErrorInfo<UndefVarError> {
168private:
169  StringRef VarName;
170
171public:
172  static char ID;
173
174  UndefVarError(StringRef VarName) : VarName(VarName) {}
175
176  StringRef getVarName() const { return VarName; }
177
178  std::error_code convertToErrorCode() const override {
179    return inconvertibleErrorCode();
180  }
181
182  /// Print name of variable associated with this error.
183  void log(raw_ostream &OS) const override {
184    OS << "undefined variable: " << VarName;
185  }
186};
187
188/// Class representing an expression and its matching format.
189class Expression {
190private:
191  /// Pointer to AST of the expression.
192  std::unique_ptr<ExpressionAST> AST;
193
194  /// Format to use (e.g. hex upper case letters) when matching the value.
195  ExpressionFormat Format;
196
197public:
198  /// Generic constructor for an expression represented by the given \p AST and
199  /// whose matching format is \p Format.
200  Expression(std::unique_ptr<ExpressionAST> AST, ExpressionFormat Format)
201      : AST(std::move(AST)), Format(Format) {}
202
203  /// \returns pointer to AST of the expression. Pointer is guaranteed to be
204  /// valid as long as this object is.
205  ExpressionAST *getAST() const { return AST.get(); }
206
207  ExpressionFormat getFormat() const { return Format; }
208};
209
210/// Class representing a numeric variable and its associated current value.
211class NumericVariable {
212private:
213  /// Name of the numeric variable.
214  StringRef Name;
215
216  /// Format to use for expressions using this variable without an explicit
217  /// format.
218  ExpressionFormat ImplicitFormat;
219
220  /// Value of numeric variable, if defined, or std::nullopt otherwise.
221  std::optional<APInt> Value;
222
223  /// The input buffer's string from which Value was parsed, or std::nullopt.
224  /// See comments on getStringValue for a discussion of the std::nullopt case.
225  std::optional<StringRef> StrValue;
226
227  /// Line number where this variable is defined, or std::nullopt if defined
228  /// before input is parsed. Used to determine whether a variable is defined on
229  /// the same line as a given use.
230  std::optional<size_t> DefLineNumber;
231
232public:
233  /// Constructor for a variable \p Name with implicit format \p ImplicitFormat
234  /// defined at line \p DefLineNumber or defined before input is parsed if
235  /// \p DefLineNumber is std::nullopt.
236  explicit NumericVariable(StringRef Name, ExpressionFormat ImplicitFormat,
237                           std::optional<size_t> DefLineNumber = std::nullopt)
238      : Name(Name), ImplicitFormat(ImplicitFormat),
239        DefLineNumber(DefLineNumber) {}
240
241  /// \returns name of this numeric variable.
242  StringRef getName() const { return Name; }
243
244  /// \returns implicit format of this numeric variable.
245  ExpressionFormat getImplicitFormat() const { return ImplicitFormat; }
246
247  /// \returns this variable's value.
248  std::optional<APInt> getValue() const { return Value; }
249
250  /// \returns the input buffer's string from which this variable's value was
251  /// parsed, or std::nullopt if the value is not yet defined or was not parsed
252  /// from the input buffer.  For example, the value of @LINE is not parsed from
253  /// the input buffer, and some numeric variables are parsed from the command
254  /// line instead.
255  std::optional<StringRef> getStringValue() const { return StrValue; }
256
257  /// Sets value of this numeric variable to \p NewValue, and sets the input
258  /// buffer string from which it was parsed to \p NewStrValue.  See comments on
259  /// getStringValue for a discussion of when the latter can be std::nullopt.
260  void setValue(APInt NewValue,
261                std::optional<StringRef> NewStrValue = std::nullopt) {
262    Value = NewValue;
263    StrValue = NewStrValue;
264  }
265
266  /// Clears value of this numeric variable, regardless of whether it is
267  /// currently defined or not.
268  void clearValue() {
269    Value = std::nullopt;
270    StrValue = std::nullopt;
271  }
272
273  /// \returns the line number where this variable is defined, if any, or
274  /// std::nullopt if defined before input is parsed.
275  std::optional<size_t> getDefLineNumber() const { return DefLineNumber; }
276};
277
278/// Class representing the use of a numeric variable in the AST of an
279/// expression.
280class NumericVariableUse : public ExpressionAST {
281private:
282  /// Pointer to the class instance for the variable this use is about.
283  NumericVariable *Variable;
284
285public:
286  NumericVariableUse(StringRef Name, NumericVariable *Variable)
287      : ExpressionAST(Name), Variable(Variable) {}
288  /// \returns the value of the variable referenced by this instance.
289  Expected<APInt> eval() const override;
290
291  /// \returns implicit format of this numeric variable.
292  Expected<ExpressionFormat>
293  getImplicitFormat(const SourceMgr &SM) const override {
294    return Variable->getImplicitFormat();
295  }
296};
297
298/// Type of functions evaluating a given binary operation.
299using binop_eval_t = Expected<APInt> (*)(const APInt &, const APInt &, bool &);
300
301/// Class representing a single binary operation in the AST of an expression.
302class BinaryOperation : public ExpressionAST {
303private:
304  /// Left operand.
305  std::unique_ptr<ExpressionAST> LeftOperand;
306
307  /// Right operand.
308  std::unique_ptr<ExpressionAST> RightOperand;
309
310  /// Pointer to function that can evaluate this binary operation.
311  binop_eval_t EvalBinop;
312
313public:
314  BinaryOperation(StringRef ExpressionStr, binop_eval_t EvalBinop,
315                  std::unique_ptr<ExpressionAST> LeftOp,
316                  std::unique_ptr<ExpressionAST> RightOp)
317      : ExpressionAST(ExpressionStr), EvalBinop(EvalBinop) {
318    LeftOperand = std::move(LeftOp);
319    RightOperand = std::move(RightOp);
320  }
321
322  /// Evaluates the value of the binary operation represented by this AST,
323  /// using EvalBinop on the result of recursively evaluating the operands.
324  /// \returns the expression value or an error if an undefined numeric
325  /// variable is used in one of the operands.
326  Expected<APInt> eval() const override;
327
328  /// \returns the implicit format of this AST, if any, a diagnostic against
329  /// \p SM if the implicit formats of the AST's components conflict, or no
330  /// format if the AST has no implicit format (e.g. AST is made of a single
331  /// literal).
332  Expected<ExpressionFormat>
333  getImplicitFormat(const SourceMgr &SM) const override;
334};
335
// Forward declaration: the substitution classes below hold a pointer to the
// pattern context, which is only defined further down in this file.
class FileCheckPatternContext;
337
338/// Class representing a substitution to perform in the RegExStr string.
339class Substitution {
340protected:
341  /// Pointer to a class instance holding, among other things, the table with
342  /// the values of live string variables at the start of any given CHECK line.
343  /// Used for substituting string variables with the text they were defined
344  /// as. Expressions are linked to the numeric variables they use at
345  /// parse time and directly access the value of the numeric variable to
346  /// evaluate their value.
347  FileCheckPatternContext *Context;
348
349  /// The string that needs to be substituted for something else. For a
350  /// string variable this is its name, otherwise this is the whole expression.
351  StringRef FromStr;
352
353  // Index in RegExStr of where to do the substitution.
354  size_t InsertIdx;
355
356public:
357  Substitution(FileCheckPatternContext *Context, StringRef VarName,
358               size_t InsertIdx)
359      : Context(Context), FromStr(VarName), InsertIdx(InsertIdx) {}
360
361  virtual ~Substitution() = default;
362
363  /// \returns the string to be substituted for something else.
364  StringRef getFromString() const { return FromStr; }
365
366  /// \returns the index where the substitution is to be performed in RegExStr.
367  size_t getIndex() const { return InsertIdx; }
368
369  /// \returns a string containing the result of the substitution represented
370  /// by this class instance or an error if substitution failed.
371  virtual Expected<std::string> getResult() const = 0;
372};
373
374class StringSubstitution : public Substitution {
375public:
376  StringSubstitution(FileCheckPatternContext *Context, StringRef VarName,
377                     size_t InsertIdx)
378      : Substitution(Context, VarName, InsertIdx) {}
379
380  /// \returns the text that the string variable in this substitution matched
381  /// when defined, or an error if the variable is undefined.
382  Expected<std::string> getResult() const override;
383};
384
385class NumericSubstitution : public Substitution {
386private:
387  /// Pointer to the class representing the expression whose value is to be
388  /// substituted.
389  std::unique_ptr<Expression> ExpressionPointer;
390
391public:
392  NumericSubstitution(FileCheckPatternContext *Context, StringRef ExpressionStr,
393                      std::unique_ptr<Expression> ExpressionPointer,
394                      size_t InsertIdx)
395      : Substitution(Context, ExpressionStr, InsertIdx),
396        ExpressionPointer(std::move(ExpressionPointer)) {}
397
398  /// \returns a string containing the result of evaluating the expression in
399  /// this substitution, or an error if evaluation failed.
400  Expected<std::string> getResult() const override;
401};
402
403//===----------------------------------------------------------------------===//
404// Pattern handling code.
405//===----------------------------------------------------------------------===//
406
407/// Class holding the Pattern global state, shared by all patterns: tables
408/// holding values of variables and whether they are defined or not at any
409/// given time in the matching process.
410class FileCheckPatternContext {
411  friend class Pattern;
412
413private:
414  /// When matching a given pattern, this holds the value of all the string
415  /// variables defined in previous patterns. In a pattern, only the last
416  /// definition for a given variable is recorded in this table.
417  /// Back-references are used for uses after any the other definition.
418  StringMap<StringRef> GlobalVariableTable;
419
420  /// Map of all string variables defined so far. Used at parse time to detect
421  /// a name conflict between a numeric variable and a string variable when
422  /// the former is defined on a later line than the latter.
423  StringMap<bool> DefinedVariableTable;
424
425  /// When matching a given pattern, this holds the pointers to the classes
426  /// representing the numeric variables defined in previous patterns. When
427  /// matching a pattern all definitions for that pattern are recorded in the
428  /// NumericVariableDefs table in the Pattern instance of that pattern.
429  StringMap<NumericVariable *> GlobalNumericVariableTable;
430
431  /// Pointer to the class instance representing the @LINE pseudo variable for
432  /// easily updating its value.
433  NumericVariable *LineVariable = nullptr;
434
435  /// Vector holding pointers to all parsed numeric variables. Used to
436  /// automatically free them once they are guaranteed to no longer be used.
437  std::vector<std::unique_ptr<NumericVariable>> NumericVariables;
438
439  /// Vector holding pointers to all parsed expressions. Used to automatically
440  /// free the expressions once they are guaranteed to no longer be used.
441  std::vector<std::unique_ptr<Expression>> Expressions;
442
443  /// Vector holding pointers to all substitutions. Used to automatically free
444  /// them once they are guaranteed to no longer be used.
445  std::vector<std::unique_ptr<Substitution>> Substitutions;
446
447public:
448  /// \returns the value of string variable \p VarName or an error if no such
449  /// variable has been defined.
450  Expected<StringRef> getPatternVarValue(StringRef VarName);
451
452  /// Defines string and numeric variables from definitions given on the
453  /// command line, passed as a vector of [#]VAR=VAL strings in
454  /// \p CmdlineDefines. \returns an error list containing diagnostics against
455  /// \p SM for all definition parsing failures, if any, or Success otherwise.
456  Error defineCmdlineVariables(ArrayRef<StringRef> CmdlineDefines,
457                               SourceMgr &SM);
458
459  /// Create @LINE pseudo variable. Value is set when pattern are being
460  /// matched.
461  void createLineVariable();
462
463  /// Undefines local variables (variables whose name does not start with a '$'
464  /// sign), i.e. removes them from GlobalVariableTable and from
465  /// GlobalNumericVariableTable and also clears the value of numeric
466  /// variables.
467  void clearLocalVars();
468
469private:
470  /// Makes a new numeric variable and registers it for destruction when the
471  /// context is destroyed.
472  template <class... Types> NumericVariable *makeNumericVariable(Types... args);
473
474  /// Makes a new string substitution and registers it for destruction when the
475  /// context is destroyed.
476  Substitution *makeStringSubstitution(StringRef VarName, size_t InsertIdx);
477
478  /// Makes a new numeric substitution and registers it for destruction when
479  /// the context is destroyed.
480  Substitution *makeNumericSubstitution(StringRef ExpressionStr,
481                                        std::unique_ptr<Expression> Expression,
482                                        size_t InsertIdx);
483};
484
485/// Class to represent an error holding a diagnostic with location information
486/// used when printing it.
487class ErrorDiagnostic : public ErrorInfo<ErrorDiagnostic> {
488private:
489  SMDiagnostic Diagnostic;
490  SMRange Range;
491
492public:
493  static char ID;
494
495  ErrorDiagnostic(SMDiagnostic &&Diag, SMRange Range)
496      : Diagnostic(Diag), Range(Range) {}
497
498  std::error_code convertToErrorCode() const override {
499    return inconvertibleErrorCode();
500  }
501
502  /// Print diagnostic associated with this error when printing the error.
503  void log(raw_ostream &OS) const override { Diagnostic.print(nullptr, OS); }
504
505  StringRef getMessage() const { return Diagnostic.getMessage(); }
506  SMRange getRange() const { return Range; }
507
508  static Error get(const SourceMgr &SM, SMLoc Loc, const Twine &ErrMsg,
509                   SMRange Range = std::nullopt) {
510    return make_error<ErrorDiagnostic>(
511        SM.GetMessage(Loc, SourceMgr::DK_Error, ErrMsg), Range);
512  }
513
514  static Error get(const SourceMgr &SM, StringRef Buffer, const Twine &ErrMsg) {
515    SMLoc Start = SMLoc::getFromPointer(Buffer.data());
516    SMLoc End = SMLoc::getFromPointer(Buffer.data() + Buffer.size());
517    return get(SM, Start, ErrMsg, SMRange(Start, End));
518  }
519};
520
521class NotFoundError : public ErrorInfo<NotFoundError> {
522public:
523  static char ID;
524
525  std::error_code convertToErrorCode() const override {
526    return inconvertibleErrorCode();
527  }
528
529  /// Print diagnostic associated with this error when printing the error.
530  void log(raw_ostream &OS) const override {
531    OS << "String not found in input";
532  }
533};
534
535/// An error that has already been reported.
536///
537/// This class is designed to support a function whose callers may need to know
538/// whether the function encountered and reported an error but never need to
539/// know the nature of that error.  For example, the function has a return type
540/// of \c Error and always returns either \c ErrorReported or \c ErrorSuccess.
541/// That interface is similar to that of a function returning bool to indicate
542/// an error except, in the former case, (1) there is no confusion over polarity
543/// and (2) the caller must either check the result or explicitly ignore it with
544/// a call like \c consumeError.
545class ErrorReported final : public ErrorInfo<ErrorReported> {
546public:
547  static char ID;
548
549  std::error_code convertToErrorCode() const override {
550    return inconvertibleErrorCode();
551  }
552
553  /// Print diagnostic associated with this error when printing the error.
554  void log(raw_ostream &OS) const override {
555    OS << "error previously reported";
556  }
557
558  static inline Error reportedOrSuccess(bool HasErrorReported) {
559    if (HasErrorReported)
560      return make_error<ErrorReported>();
561    return Error::success();
562  }
563};
564
565class Pattern {
566  SMLoc PatternLoc;
567
568  /// A fixed string to match as the pattern or empty if this pattern requires
569  /// a regex match.
570  StringRef FixedStr;
571
572  /// A regex string to match as the pattern or empty if this pattern requires
573  /// a fixed string to match.
574  std::string RegExStr;
575
576  /// Entries in this vector represent a substitution of a string variable or
577  /// an expression in the RegExStr regex at match time. For example, in the
578  /// case of a CHECK directive with the pattern "foo[[bar]]baz[[#N+1]]",
579  /// RegExStr will contain "foobaz" and we'll get two entries in this vector
580  /// that tells us to insert the value of string variable "bar" at offset 3
581  /// and the value of expression "N+1" at offset 6.
582  std::vector<Substitution *> Substitutions;
583
584  /// Maps names of string variables defined in a pattern to the number of
585  /// their parenthesis group in RegExStr capturing their last definition.
586  ///
587  /// E.g. for the pattern "foo[[bar:.*]]baz([[bar]][[QUUX]][[bar:.*]])",
588  /// RegExStr will be "foo(.*)baz(\1<quux value>(.*))" where <quux value> is
589  /// the value captured for QUUX on the earlier line where it was defined, and
590  /// VariableDefs will map "bar" to the third parenthesis group which captures
591  /// the second definition of "bar".
592  ///
593  /// Note: uses std::map rather than StringMap to be able to get the key when
594  /// iterating over values.
595  std::map<StringRef, unsigned> VariableDefs;
596
597  /// Structure representing the definition of a numeric variable in a pattern.
598  /// It holds the pointer to the class instance holding the value and matching
599  /// format of the numeric variable whose value is being defined and the
600  /// number of the parenthesis group in RegExStr to capture that value.
601  struct NumericVariableMatch {
602    /// Pointer to class instance holding the value and matching format of the
603    /// numeric variable being defined.
604    NumericVariable *DefinedNumericVariable;
605
606    /// Number of the parenthesis group in RegExStr that captures the value of
607    /// this numeric variable definition.
608    unsigned CaptureParenGroup;
609  };
610
611  /// Holds the number of the parenthesis group in RegExStr and pointer to the
612  /// corresponding NumericVariable class instance of all numeric variable
613  /// definitions. Used to set the matched value of all those variables.
614  StringMap<NumericVariableMatch> NumericVariableDefs;
615
616  /// Pointer to a class instance holding the global state shared by all
617  /// patterns:
618  /// - separate tables with the values of live string and numeric variables
619  ///   respectively at the start of any given CHECK line;
620  /// - table holding whether a string variable has been defined at any given
621  ///   point during the parsing phase.
622  FileCheckPatternContext *Context;
623
624  Check::FileCheckType CheckTy;
625
626  /// Line number for this CHECK pattern or std::nullopt if it is an implicit
627  /// pattern. Used to determine whether a variable definition is made on an
628  /// earlier line to the one with this CHECK.
629  std::optional<size_t> LineNumber;
630
631  /// Ignore case while matching if set to true.
632  bool IgnoreCase = false;
633
634public:
635  Pattern(Check::FileCheckType Ty, FileCheckPatternContext *Context,
636          std::optional<size_t> Line = std::nullopt)
637      : Context(Context), CheckTy(Ty), LineNumber(Line) {}
638
639  /// \returns the location in source code.
640  SMLoc getLoc() const { return PatternLoc; }
641
642  /// \returns the pointer to the global state for all patterns in this
643  /// FileCheck instance.
644  FileCheckPatternContext *getContext() const { return Context; }
645
646  /// \returns whether \p C is a valid first character for a variable name.
647  static bool isValidVarNameStart(char C);
648
649  /// Parsing information about a variable.
650  struct VariableProperties {
651    StringRef Name;
652    bool IsPseudo;
653  };
654
  /// Parses the string at the start of \p Str for a variable name. \returns
  /// a VariableProperties structure holding the variable name and whether it
  /// is the name of a pseudo variable, or an error holding a diagnostic
  /// against \p SM if parsing fails. If parsing was successful, also strips
  /// \p Str from the variable name.
660  static Expected<VariableProperties> parseVariable(StringRef &Str,
661                                                    const SourceMgr &SM);
  /// Parses \p Expr for a numeric substitution block at line \p LineNumber,
  /// or before input is parsed if \p LineNumber is std::nullopt. Parameter
  /// \p IsLegacyLineExpr indicates whether \p Expr should be a legacy @LINE
  /// expression and \p Context points to the class instance holding the live
  /// string and numeric variables. \returns a pointer to the class instance
  /// representing the expression whose value must be substituted, or an error
  /// holding a diagnostic against \p SM if parsing fails. If parsing was
  /// successful, sets \p DefinedNumericVariable to point to the class
  /// representing the numeric variable defined in this numeric substitution
  /// block, or std::nullopt if this block does not define any variable.
672  static Expected<std::unique_ptr<Expression>> parseNumericSubstitutionBlock(
673      StringRef Expr, std::optional<NumericVariable *> &DefinedNumericVariable,
674      bool IsLegacyLineExpr, std::optional<size_t> LineNumber,
675      FileCheckPatternContext *Context, const SourceMgr &SM);
676  /// Parses the pattern in \p PatternStr and initializes this Pattern instance
677  /// accordingly.
678  ///
679  /// \p Prefix provides which prefix is being matched, \p Req describes the
680  /// global options that influence the parsing such as whitespace
681  /// canonicalization, \p SM provides the SourceMgr used for error reports.
682  /// \returns true in case of an error, false otherwise.
683  bool parsePattern(StringRef PatternStr, StringRef Prefix, SourceMgr &SM,
684                    const FileCheckRequest &Req);
685  struct Match {
686    size_t Pos;
687    size_t Len;
688  };
689  struct MatchResult {
690    std::optional<Match> TheMatch;
691    Error TheError;
692    MatchResult(size_t MatchPos, size_t MatchLen, Error E)
693        : TheMatch(Match{MatchPos, MatchLen}), TheError(std::move(E)) {}
694    MatchResult(Match M, Error E) : TheMatch(M), TheError(std::move(E)) {}
695    MatchResult(Error E) : TheError(std::move(E)) {}
696  };
697  /// Matches the pattern string against the input buffer \p Buffer.
698  ///
699  /// \returns either (1) an error resulting in no match or (2) a match possibly
700  /// with an error encountered while processing the match.
701  ///
702  /// The GlobalVariableTable StringMap in the FileCheckPatternContext class
703  /// instance provides the current values of FileCheck string variables and is
704  /// updated if this match defines new values. Likewise, the
705  /// GlobalNumericVariableTable StringMap in the same class provides the
706  /// current values of FileCheck numeric variables and is updated if this
707  /// match defines new numeric values.
708  MatchResult match(StringRef Buffer, const SourceMgr &SM) const;
709  /// Prints the value of successful substitutions.
710  void printSubstitutions(const SourceMgr &SM, StringRef Buffer,
711                          SMRange MatchRange, FileCheckDiag::MatchType MatchTy,
712                          std::vector<FileCheckDiag> *Diags) const;
713  void printFuzzyMatch(const SourceMgr &SM, StringRef Buffer,
714                       std::vector<FileCheckDiag> *Diags) const;
715
716  bool hasVariable() const {
717    return !(Substitutions.empty() && VariableDefs.empty());
718  }
719  void printVariableDefs(const SourceMgr &SM, FileCheckDiag::MatchType MatchTy,
720                         std::vector<FileCheckDiag> *Diags) const;
721
722  Check::FileCheckType getCheckTy() const { return CheckTy; }
723
724  int getCount() const { return CheckTy.getCount(); }
725
726private:
727  bool AddRegExToRegEx(StringRef RS, unsigned &CurParen, SourceMgr &SM);
728  void AddBackrefToRegEx(unsigned BackrefNum);
729  /// Computes an arbitrary estimate for the quality of matching this pattern
730  /// at the start of \p Buffer; a distance of zero should correspond to a
731  /// perfect match.
732  unsigned computeMatchDistance(StringRef Buffer) const;
733  /// Finds the closing sequence of a regex variable usage or definition.
734  ///
735  /// \p Str has to point to the beginning of the definition (right after the
736  /// opening sequence). \p SM holds the SourceMgr used for error reporting.
737  /// \returns the offset of the closing sequence within \p Str, or npos if it
738  /// was not found.
739  static size_t FindRegexVarEnd(StringRef Str, SourceMgr &SM);
740
741  /// Parses \p Expr for the name of a numeric variable to be defined at line
742  /// \p LineNumber, or before input is parsed if \p LineNumber has no value.
743  /// \returns a pointer to the class instance representing that variable,
744  /// creating it if needed, or an error holding a diagnostic against \p SM
745  /// should defining such a variable be invalid.
     /// NOTE(review): \p Context and \p ImplicitFormat are not described here;
     /// presumably \p Context holds the live string and numeric variables, as
     /// for the other parse functions of this class, and \p ImplicitFormat is
     /// the format given to the new variable -- confirm against the definition.
746  static Expected<NumericVariable *> parseNumericVariableDefinition(
747      StringRef &Expr, FileCheckPatternContext *Context,
748      std::optional<size_t> LineNumber, ExpressionFormat ImplicitFormat,
749      const SourceMgr &SM);
750  /// Parses \p Name as a (pseudo if \p IsPseudo is true) numeric variable use
751  /// at line \p LineNumber, or before input is parsed if \p LineNumber has no
752  /// value. Parameter \p Context points to the class instance holding the live
753  /// string and numeric variables. \returns a pointer to the class instance
754  /// representing that variable use if successful, or an error holding a
755  /// diagnostic against \p SM otherwise.
756  static Expected<std::unique_ptr<NumericVariableUse>> parseNumericVariableUse(
757      StringRef Name, bool IsPseudo, std::optional<size_t> LineNumber,
758      FileCheckPatternContext *Context, const SourceMgr &SM);
759  enum class AllowedOperand { LineVar, LegacyLiteral, Any };
     // AllowedOperand selects which kinds of operand parseNumericOperand()
     // accepts (its AO parameter). NOTE(review): the exact meaning of each
     // enumerator is not documented here -- confirm against the definition.
760  /// Parses \p Expr for use of a numeric operand at line \p LineNumber, or
761  /// before input is parsed if \p LineNumber has no value. Accepts literal
762  /// values, numeric variables and function calls, depending on the value of
763  /// \p AO. \p ConstraintParsed indicates whether the text being parsed could
764  /// be an invalid constraint. \p Context points to the class instance holding
765  /// the live string and numeric variables. \returns the class representing
766  /// that operand in the AST of the expression or an error holding a
767  /// diagnostic against \p SM otherwise. If \p Expr starts with a "(" this
768  /// function will attempt to parse a parenthesized expression.
     /// NOTE(review): this comment used to name the flag MaybeInvalidConstraint,
     /// which is not a parameter of this declaration; confirm that the
     /// description above matches the definition's use of \p ConstraintParsed.
769  static Expected<std::unique_ptr<ExpressionAST>>
770  parseNumericOperand(StringRef &Expr, AllowedOperand AO, bool ConstraintParsed,
771                      std::optional<size_t> LineNumber,
772                      FileCheckPatternContext *Context, const SourceMgr &SM);
773  /// Parses and updates \p RemainingExpr for a binary operation at line
774  /// \p LineNumber, or before input is parsed if \p LineNumber has no value.
775  /// The left operand of this binary operation is given in \p LeftOp and
776  /// \p Expr holds the string for the full expression, including the left
777  /// operand. Parameter \p IsLegacyLineExpr indicates whether we are parsing a
778  /// legacy @LINE expression. Parameter \p Context points to the class
779  /// instance holding the live string and numeric variables. \returns the
780  /// class representing the binary operation in the AST of the expression, or
781  /// an error holding a diagnostic against \p SM otherwise.
782  static Expected<std::unique_ptr<ExpressionAST>>
783  parseBinop(StringRef Expr, StringRef &RemainingExpr,
784             std::unique_ptr<ExpressionAST> LeftOp, bool IsLegacyLineExpr,
785             std::optional<size_t> LineNumber, FileCheckPatternContext *Context,
786             const SourceMgr &SM);
787
788  /// Parses a parenthesized expression inside \p Expr at line \p LineNumber, or
789  /// before input is parsed if \p LineNumber has no value. \p Expr must start
790  /// with a '('. Accepts both literal values and numeric variables. \p Context
791  /// points to the class instance holding the live string and numeric
792  /// variables. \returns the class representing that operand in the AST of
793  /// the expression or an error holding a diagnostic against \p SM otherwise.
794  static Expected<std::unique_ptr<ExpressionAST>>
795  parseParenExpr(StringRef &Expr, std::optional<size_t> LineNumber,
796                 FileCheckPatternContext *Context, const SourceMgr &SM);
797
798  /// Parses \p Expr for an argument list belonging to a call to function
799  /// \p FuncName at line \p LineNumber, or before input is parsed if
800  /// \p LineNumber has no value. Parameter \p Context points to the class
801  /// instance holding the live string and numeric variables. \returns the
802  /// class representing that call in the AST of the expression or an error
803  /// holding a diagnostic against \p SM otherwise.
804  /// NOTE(review): this comment used to describe a FuncLoc parameter giving
     /// the source location used for diagnostics; the declaration has no such
     /// parameter, so \p FuncName presumably provides that location -- confirm.
805  static Expected<std::unique_ptr<ExpressionAST>>
806  parseCallExpr(StringRef &Expr, StringRef FuncName,
807                std::optional<size_t> LineNumber,
808                FileCheckPatternContext *Context, const SourceMgr &SM);
809};
810
811//===----------------------------------------------------------------------===//
812// Check Strings.
813//===----------------------------------------------------------------------===//
814
815/// A check that we found in the input file.
816struct FileCheckString {
817  /// The pattern to match.
818  Pattern Pat;
819
820  /// Which prefix name this check matched.
821  StringRef Prefix;
822
823  /// The location in the match file where the check string was specified.
824  SMLoc Loc;
825
826  /// Holds the information about the DAG/NOT strings in the program, which are
827  /// not explicitly stored otherwise. This allows for better and more accurate
828  /// diagnostic messages.
829  struct DagNotPrefixInfo {
830    Pattern DagNotPat;
831    StringRef DagNotPrefix;
832
       /// Copies \p P into DagNotPat and stores \p S as DagNotPrefix.
833    DagNotPrefixInfo(const Pattern &P, StringRef S)
834        : DagNotPat(P), DagNotPrefix(S) {}
835  };
836
837  /// Holds the DAG/NOT strings occurring in the input file.
838  std::vector<DagNotPrefixInfo> DagNotStrings;
839
     /// Copies \p P into Pat and stores \p S as Prefix and \p L as Loc.
     /// DagNotStrings starts out empty.
840  FileCheckString(const Pattern &P, StringRef S, SMLoc L)
841      : Pat(P), Prefix(S), Loc(L) {}
842
843  /// Matches check string and its "not strings" and/or "dag strings".
     /// NOTE(review): the meaning of the returned size_t and of \p MatchLen is
     /// not documented here; presumably a position in \p Buffer and the length
     /// of the match -- confirm against the definition.
844  size_t Check(const SourceMgr &SM, StringRef Buffer, bool IsLabelScanMode,
845               size_t &MatchLen, FileCheckRequest &Req,
846               std::vector<FileCheckDiag> *Diags) const;
847
848  /// Verifies that there is a single line in the given \p Buffer. Errors are
849  /// reported against \p SM.
850  bool CheckNext(const SourceMgr &SM, StringRef Buffer) const;
851  /// Verifies that there is no newline in the given \p Buffer. Errors are
852  /// reported against \p SM.
853  bool CheckSame(const SourceMgr &SM, StringRef Buffer) const;
854  /// Verifies that none of the strings in \p NotStrings are found in the given
855  /// \p Buffer. Errors are reported against \p SM and diagnostics recorded in
856  /// \p Diags according to the verbosity level set in \p Req.
857  bool CheckNot(const SourceMgr &SM, StringRef Buffer,
858                const std::vector<const DagNotPrefixInfo *> &NotStrings,
859                const FileCheckRequest &Req,
860                std::vector<FileCheckDiag> *Diags) const;
861  /// Matches "dag strings" and their mixed "not strings".
     /// NOTE(review): \p NotStrings is taken by non-const reference, so it may
     /// be modified; how, and what the returned size_t means, is not documented
     /// here -- confirm against the definition.
862  size_t CheckDag(const SourceMgr &SM, StringRef Buffer,
863                  std::vector<const DagNotPrefixInfo *> &NotStrings,
864                  const FileCheckRequest &Req,
865                  std::vector<FileCheckDiag> *Diags) const;
866};
867
868} // namespace llvm
869
870#endif
871