| 1 | //===-- FileCheckImpl.h - Private FileCheck Interface ------------*- C++ -*-==// |
| 2 | // |
| 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| 4 | // See https://llvm.org/LICENSE.txt for license information. |
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| 6 | // |
| 7 | //===----------------------------------------------------------------------===// |
| 8 | // |
| 9 | // This file defines the private interfaces of FileCheck. Its purpose is to |
| 10 | // allow unit testing of FileCheck and to separate the interface from the |
| 11 | // implementation. It is only meant to be used by FileCheck. |
| 12 | // |
| 13 | //===----------------------------------------------------------------------===// |
| 14 | |
| 15 | #ifndef LLVM_LIB_FILECHECK_FILECHECKIMPL_H |
| 16 | #define LLVM_LIB_FILECHECK_FILECHECKIMPL_H |
| 17 | |
| 18 | #include "llvm/ADT/APInt.h" |
| 19 | #include "llvm/ADT/StringMap.h" |
| 20 | #include "llvm/ADT/StringRef.h" |
| 21 | #include "llvm/FileCheck/FileCheck.h" |
| 22 | #include "llvm/Support/Compiler.h" |
| 23 | #include "llvm/Support/Error.h" |
| 24 | #include "llvm/Support/SourceMgr.h" |
| 25 | #include <map> |
| 26 | #include <optional> |
| 27 | #include <string> |
| 28 | #include <vector> |
| 29 | |
| 30 | namespace llvm { |
| 31 | |
| 32 | //===----------------------------------------------------------------------===// |
| 33 | // Numeric substitution handling code. |
| 34 | //===----------------------------------------------------------------------===// |
| 35 | |
| 36 | /// Type representing the format an expression value should be textualized into |
| 37 | /// for matching. Used to represent both explicit format specifiers as well as |
| 38 | /// implicit format from using numeric variables. |
| 39 | struct ExpressionFormat { |
| 40 | enum class Kind { |
| 41 | /// Denote absence of format. Used for implicit format of literals and |
| 42 | /// empty expressions. |
| 43 | NoFormat, |
| 44 | /// Value is an unsigned integer and should be printed as a decimal number. |
| 45 | Unsigned, |
| 46 | /// Value is a signed integer and should be printed as a decimal number. |
| 47 | Signed, |
| 48 | /// Value should be printed as an uppercase hex number. |
| 49 | HexUpper, |
| 50 | /// Value should be printed as a lowercase hex number. |
| 51 | HexLower |
| 52 | }; |
| 53 | |
| 54 | private: |
| 55 | Kind Value = Kind::NoFormat; |
| 56 | unsigned Precision = 0; |
| 57 | /// printf-like "alternate form" selected. |
| 58 | bool AlternateForm = false; |
| 59 | |
| 60 | public: |
| 61 | /// Evaluates a format to true if it can be used in a match. |
| 62 | explicit operator bool() const { return Value != Kind::NoFormat; } |
| 63 | |
| 64 | /// Define format equality: formats are equal if neither is NoFormat and |
| 65 | /// their kinds and precision are the same. |
| 66 | bool operator==(const ExpressionFormat &Other) const { |
| 67 | return Value != Kind::NoFormat && Value == Other.Value && |
| 68 | Precision == Other.Precision && AlternateForm == Other.AlternateForm; |
| 69 | } |
| 70 | |
| 71 | bool operator!=(const ExpressionFormat &Other) const { |
| 72 | return !(*this == Other); |
| 73 | } |
| 74 | |
| 75 | bool operator==(Kind OtherValue) const { return Value == OtherValue; } |
| 76 | |
| 77 | bool operator!=(Kind OtherValue) const { return !(*this == OtherValue); } |
| 78 | |
| 79 | /// \returns the format specifier corresponding to this format as a string. |
| 80 | StringRef toString() const; |
| 81 | |
| 82 | ExpressionFormat() = default; |
| 83 | explicit ExpressionFormat(Kind Value) : Value(Value), Precision(0){}; |
| 84 | explicit ExpressionFormat(Kind Value, unsigned Precision) |
| 85 | : Value(Value), Precision(Precision){}; |
| 86 | explicit ExpressionFormat(Kind Value, unsigned Precision, bool AlternateForm) |
| 87 | : Value(Value), Precision(Precision), AlternateForm(AlternateForm){}; |
| 88 | |
| 89 | /// \returns a wildcard regular expression string that matches any value in |
| 90 | /// the format represented by this instance and no other value, or an error |
| 91 | /// if the format is NoFormat. |
| 92 | LLVM_ABI_FOR_TEST Expected<std::string> getWildcardRegex() const; |
| 93 | |
| 94 | /// \returns the string representation of \p Value in the format represented |
| 95 | /// by this instance, or an error if conversion to this format failed or the |
| 96 | /// format is NoFormat. |
| 97 | LLVM_ABI_FOR_TEST Expected<std::string> getMatchingString(APInt Value) const; |
| 98 | |
| 99 | /// \returns the value corresponding to string representation \p StrVal |
| 100 | /// according to the matching format represented by this instance. |
| 101 | LLVM_ABI_FOR_TEST APInt valueFromStringRepr(StringRef StrVal, |
| 102 | const SourceMgr &SM) const; |
| 103 | }; |
| 104 | |
| 105 | /// Class to represent an overflow error that might result when manipulating a |
| 106 | /// value. |
| 107 | class OverflowError : public ErrorInfo<OverflowError> { |
| 108 | public: |
| 109 | LLVM_ABI_FOR_TEST static char ID; |
| 110 | |
| 111 | std::error_code convertToErrorCode() const override { |
| 112 | return std::make_error_code(e: std::errc::value_too_large); |
| 113 | } |
| 114 | |
| 115 | void log(raw_ostream &OS) const override { OS << "overflow error" ; } |
| 116 | }; |
| 117 | |
| 118 | /// Performs operation and \returns its result or an error in case of failure, |
| 119 | /// such as if an overflow occurs. |
| 120 | LLVM_ABI_FOR_TEST Expected<APInt> exprAdd(const APInt &Lhs, const APInt &Rhs, |
| 121 | bool &Overflow); |
| 122 | LLVM_ABI_FOR_TEST Expected<APInt> exprSub(const APInt &Lhs, const APInt &Rhs, |
| 123 | bool &Overflow); |
| 124 | LLVM_ABI_FOR_TEST Expected<APInt> exprMul(const APInt &Lhs, const APInt &Rhs, |
| 125 | bool &Overflow); |
| 126 | LLVM_ABI_FOR_TEST Expected<APInt> exprDiv(const APInt &Lhs, const APInt &Rhs, |
| 127 | bool &Overflow); |
| 128 | Expected<APInt> exprMax(const APInt &Lhs, const APInt &Rhs, bool &Overflow); |
| 129 | Expected<APInt> exprMin(const APInt &Lhs, const APInt &Rhs, bool &Overflow); |
| 130 | |
| 131 | /// Base class representing the AST of a given expression. |
| 132 | class ExpressionAST { |
| 133 | private: |
| 134 | StringRef ExpressionStr; |
| 135 | |
| 136 | public: |
| 137 | ExpressionAST(StringRef ExpressionStr) : ExpressionStr(ExpressionStr) {} |
| 138 | |
| 139 | virtual ~ExpressionAST() = default; |
| 140 | |
| 141 | StringRef getExpressionStr() const { return ExpressionStr; } |
| 142 | |
| 143 | /// Evaluates and \returns the value of the expression represented by this |
| 144 | /// AST or an error if evaluation fails. |
| 145 | virtual Expected<APInt> eval() const = 0; |
| 146 | |
| 147 | /// \returns either the implicit format of this AST, a diagnostic against |
| 148 | /// \p SM if implicit formats of the AST's components conflict, or NoFormat |
| 149 | /// if the AST has no implicit format (e.g. AST is made up of a single |
| 150 | /// literal). |
| 151 | virtual Expected<ExpressionFormat> |
| 152 | getImplicitFormat(const SourceMgr &SM) const { |
| 153 | return ExpressionFormat(); |
| 154 | } |
| 155 | }; |
| 156 | |
| 157 | /// Class representing an unsigned literal in the AST of an expression. |
| 158 | class ExpressionLiteral : public ExpressionAST { |
| 159 | private: |
| 160 | /// Actual value of the literal. |
| 161 | APInt Value; |
| 162 | |
| 163 | public: |
| 164 | explicit ExpressionLiteral(StringRef ExpressionStr, APInt Val) |
| 165 | : ExpressionAST(ExpressionStr), Value(Val) {} |
| 166 | |
| 167 | /// \returns the literal's value. |
| 168 | Expected<APInt> eval() const override { return Value; } |
| 169 | }; |
| 170 | |
| 171 | /// Class to represent an undefined variable error, which quotes that |
| 172 | /// variable's name when printed. |
| 173 | class UndefVarError : public ErrorInfo<UndefVarError> { |
| 174 | private: |
| 175 | StringRef VarName; |
| 176 | |
| 177 | public: |
| 178 | LLVM_ABI_FOR_TEST static char ID; |
| 179 | |
| 180 | UndefVarError(StringRef VarName) : VarName(VarName) {} |
| 181 | |
| 182 | StringRef getVarName() const { return VarName; } |
| 183 | |
| 184 | std::error_code convertToErrorCode() const override { |
| 185 | return inconvertibleErrorCode(); |
| 186 | } |
| 187 | |
| 188 | /// Print name of variable associated with this error. |
| 189 | void log(raw_ostream &OS) const override { |
| 190 | OS << "undefined variable: " << VarName; |
| 191 | } |
| 192 | }; |
| 193 | |
| 194 | /// Class representing an expression and its matching format. |
| 195 | class Expression { |
| 196 | private: |
| 197 | /// Pointer to AST of the expression. |
| 198 | std::unique_ptr<ExpressionAST> AST; |
| 199 | |
| 200 | /// Format to use (e.g. hex upper case letters) when matching the value. |
| 201 | ExpressionFormat Format; |
| 202 | |
| 203 | public: |
| 204 | /// Generic constructor for an expression represented by the given \p AST and |
| 205 | /// whose matching format is \p Format. |
| 206 | Expression(std::unique_ptr<ExpressionAST> AST, ExpressionFormat Format) |
| 207 | : AST(std::move(AST)), Format(Format) {} |
| 208 | |
| 209 | /// \returns pointer to AST of the expression. Pointer is guaranteed to be |
| 210 | /// valid as long as this object is. |
| 211 | ExpressionAST *getAST() const { return AST.get(); } |
| 212 | |
| 213 | ExpressionFormat getFormat() const { return Format; } |
| 214 | }; |
| 215 | |
| 216 | /// Class representing a numeric variable and its associated current value. |
| 217 | class NumericVariable { |
| 218 | private: |
| 219 | /// Name of the numeric variable. |
| 220 | StringRef Name; |
| 221 | |
| 222 | /// Format to use for expressions using this variable without an explicit |
| 223 | /// format. |
| 224 | ExpressionFormat ImplicitFormat; |
| 225 | |
| 226 | /// Value of numeric variable, if defined, or std::nullopt otherwise. |
| 227 | std::optional<APInt> Value; |
| 228 | |
| 229 | /// The input buffer's string from which Value was parsed, or std::nullopt. |
| 230 | /// See comments on getStringValue for a discussion of the std::nullopt case. |
| 231 | std::optional<StringRef> StrValue; |
| 232 | |
| 233 | /// Line number where this variable is defined, or std::nullopt if defined |
| 234 | /// before input is parsed. Used to determine whether a variable is defined on |
| 235 | /// the same line as a given use. |
| 236 | std::optional<size_t> DefLineNumber; |
| 237 | |
| 238 | public: |
| 239 | /// Constructor for a variable \p Name with implicit format \p ImplicitFormat |
| 240 | /// defined at line \p DefLineNumber or defined before input is parsed if |
| 241 | /// \p DefLineNumber is std::nullopt. |
| 242 | explicit NumericVariable(StringRef Name, ExpressionFormat ImplicitFormat, |
| 243 | std::optional<size_t> DefLineNumber = std::nullopt) |
| 244 | : Name(Name), ImplicitFormat(ImplicitFormat), |
| 245 | DefLineNumber(DefLineNumber) {} |
| 246 | |
| 247 | /// \returns name of this numeric variable. |
| 248 | StringRef getName() const { return Name; } |
| 249 | |
| 250 | /// \returns implicit format of this numeric variable. |
| 251 | ExpressionFormat getImplicitFormat() const { return ImplicitFormat; } |
| 252 | |
| 253 | /// \returns this variable's value. |
| 254 | std::optional<APInt> getValue() const { return Value; } |
| 255 | |
| 256 | /// \returns the input buffer's string from which this variable's value was |
| 257 | /// parsed, or std::nullopt if the value is not yet defined or was not parsed |
| 258 | /// from the input buffer. For example, the value of @LINE is not parsed from |
| 259 | /// the input buffer, and some numeric variables are parsed from the command |
| 260 | /// line instead. |
| 261 | std::optional<StringRef> getStringValue() const { return StrValue; } |
| 262 | |
| 263 | /// Sets value of this numeric variable to \p NewValue, and sets the input |
| 264 | /// buffer string from which it was parsed to \p NewStrValue. See comments on |
| 265 | /// getStringValue for a discussion of when the latter can be std::nullopt. |
| 266 | void setValue(APInt NewValue, |
| 267 | std::optional<StringRef> NewStrValue = std::nullopt) { |
| 268 | Value = NewValue; |
| 269 | StrValue = NewStrValue; |
| 270 | } |
| 271 | |
| 272 | /// Clears value of this numeric variable, regardless of whether it is |
| 273 | /// currently defined or not. |
| 274 | void clearValue() { |
| 275 | Value = std::nullopt; |
| 276 | StrValue = std::nullopt; |
| 277 | } |
| 278 | |
| 279 | /// \returns the line number where this variable is defined, if any, or |
| 280 | /// std::nullopt if defined before input is parsed. |
| 281 | std::optional<size_t> getDefLineNumber() const { return DefLineNumber; } |
| 282 | }; |
| 283 | |
| 284 | /// Class representing the use of a numeric variable in the AST of an |
| 285 | /// expression. |
| 286 | class LLVM_ABI_FOR_TEST NumericVariableUse : public ExpressionAST { |
| 287 | private: |
| 288 | /// Pointer to the class instance for the variable this use is about. |
| 289 | NumericVariable *Variable; |
| 290 | |
| 291 | public: |
| 292 | NumericVariableUse(StringRef Name, NumericVariable *Variable) |
| 293 | : ExpressionAST(Name), Variable(Variable) {} |
| 294 | /// \returns the value of the variable referenced by this instance. |
| 295 | Expected<APInt> eval() const override; |
| 296 | |
| 297 | /// \returns implicit format of this numeric variable. |
| 298 | Expected<ExpressionFormat> |
| 299 | getImplicitFormat(const SourceMgr &SM) const override { |
| 300 | return Variable->getImplicitFormat(); |
| 301 | } |
| 302 | }; |
| 303 | |
| 304 | /// Type of functions evaluating a given binary operation. |
| 305 | using binop_eval_t = Expected<APInt> (*)(const APInt &, const APInt &, bool &); |
| 306 | |
| 307 | /// Class representing a single binary operation in the AST of an expression. |
| 308 | class LLVM_ABI_FOR_TEST BinaryOperation : public ExpressionAST { |
| 309 | private: |
| 310 | /// Left operand. |
| 311 | std::unique_ptr<ExpressionAST> LeftOperand; |
| 312 | |
| 313 | /// Right operand. |
| 314 | std::unique_ptr<ExpressionAST> RightOperand; |
| 315 | |
| 316 | /// Pointer to function that can evaluate this binary operation. |
| 317 | binop_eval_t EvalBinop; |
| 318 | |
| 319 | public: |
| 320 | BinaryOperation(StringRef ExpressionStr, binop_eval_t EvalBinop, |
| 321 | std::unique_ptr<ExpressionAST> LeftOp, |
| 322 | std::unique_ptr<ExpressionAST> RightOp) |
| 323 | : ExpressionAST(ExpressionStr), EvalBinop(EvalBinop) { |
| 324 | LeftOperand = std::move(LeftOp); |
| 325 | RightOperand = std::move(RightOp); |
| 326 | } |
| 327 | |
| 328 | /// Evaluates the value of the binary operation represented by this AST, |
| 329 | /// using EvalBinop on the result of recursively evaluating the operands. |
| 330 | /// \returns the expression value or an error if an undefined numeric |
| 331 | /// variable is used in one of the operands. |
| 332 | Expected<APInt> eval() const override; |
| 333 | |
| 334 | /// \returns the implicit format of this AST, if any, a diagnostic against |
| 335 | /// \p SM if the implicit formats of the AST's components conflict, or no |
| 336 | /// format if the AST has no implicit format (e.g. AST is made of a single |
| 337 | /// literal). |
| 338 | Expected<ExpressionFormat> |
| 339 | getImplicitFormat(const SourceMgr &SM) const override; |
| 340 | }; |
| 341 | |
| 342 | class FileCheckPatternContext; |
| 343 | |
| 344 | /// Class representing a substitution to perform in the RegExStr string. |
| 345 | class Substitution { |
| 346 | protected: |
| 347 | /// Pointer to a class instance holding, among other things, the table with |
| 348 | /// the values of live string variables at the start of any given CHECK line. |
| 349 | /// Used for substituting string variables with the text they were defined |
| 350 | /// as. Expressions are linked to the numeric variables they use at |
| 351 | /// parse time and directly access the value of the numeric variable to |
| 352 | /// evaluate their value. |
| 353 | FileCheckPatternContext *Context; |
| 354 | |
| 355 | /// The string that needs to be substituted for something else. For a |
| 356 | /// string variable this is its name, otherwise this is the whole expression. |
| 357 | StringRef FromStr; |
| 358 | |
| 359 | // Index in RegExStr of where to do the substitution. |
| 360 | size_t InsertIdx; |
| 361 | |
| 362 | public: |
| 363 | Substitution(FileCheckPatternContext *Context, StringRef VarName, |
| 364 | size_t InsertIdx) |
| 365 | : Context(Context), FromStr(VarName), InsertIdx(InsertIdx) {} |
| 366 | |
| 367 | virtual ~Substitution() = default; |
| 368 | |
| 369 | /// \returns the string to be substituted for something else. |
| 370 | StringRef getFromString() const { return FromStr; } |
| 371 | |
| 372 | /// \returns the index where the substitution is to be performed in RegExStr. |
| 373 | size_t getIndex() const { return InsertIdx; } |
| 374 | |
| 375 | /// \returns a regular expression string that matches the result of the |
| 376 | /// substitution represented by this class instance or an error if |
| 377 | /// substitution failed. |
| 378 | virtual Expected<std::string> getResultRegex() const = 0; |
| 379 | |
| 380 | /// \returns a string containing the result of the substitution represented |
| 381 | /// by this class instance in a form suitable for diagnostics, or an error if |
| 382 | /// substitution failed. |
| 383 | virtual Expected<std::string> getResultForDiagnostics() const = 0; |
| 384 | }; |
| 385 | |
| 386 | class LLVM_ABI_FOR_TEST StringSubstitution : public Substitution { |
| 387 | public: |
| 388 | StringSubstitution(FileCheckPatternContext *Context, StringRef VarName, |
| 389 | size_t InsertIdx) |
| 390 | : Substitution(Context, VarName, InsertIdx) {} |
| 391 | |
| 392 | /// \returns the text that the string variable in this substitution matched |
| 393 | /// when defined, or an error if the variable is undefined. |
| 394 | Expected<std::string> getResultRegex() const override; |
| 395 | |
| 396 | /// \returns the text that the string variable in this substitution matched |
| 397 | /// when defined, in a form suitable for diagnostics, or an error if the |
| 398 | /// variable is undefined. |
| 399 | Expected<std::string> getResultForDiagnostics() const override; |
| 400 | }; |
| 401 | |
| 402 | class LLVM_ABI_FOR_TEST NumericSubstitution : public Substitution { |
| 403 | private: |
| 404 | /// Pointer to the class representing the expression whose value is to be |
| 405 | /// substituted. |
| 406 | std::unique_ptr<Expression> ExpressionPointer; |
| 407 | |
| 408 | public: |
| 409 | NumericSubstitution(FileCheckPatternContext *Context, StringRef ExpressionStr, |
| 410 | std::unique_ptr<Expression> ExpressionPointer, |
| 411 | size_t InsertIdx) |
| 412 | : Substitution(Context, ExpressionStr, InsertIdx), |
| 413 | ExpressionPointer(std::move(ExpressionPointer)) {} |
| 414 | |
| 415 | /// \returns a string containing the result of evaluating the expression in |
| 416 | /// this substitution, or an error if evaluation failed. |
| 417 | Expected<std::string> getResultRegex() const override; |
| 418 | |
| 419 | /// \returns a string containing the result of evaluating the expression in |
| 420 | /// this substitution, in a form suitable for diagnostics, or an error if |
| 421 | /// evaluation failed. |
| 422 | Expected<std::string> getResultForDiagnostics() const override; |
| 423 | }; |
| 424 | |
| 425 | //===----------------------------------------------------------------------===// |
| 426 | // Pattern handling code. |
| 427 | //===----------------------------------------------------------------------===// |
| 428 | |
| 429 | /// Class holding the Pattern global state, shared by all patterns: tables |
| 430 | /// holding values of variables and whether they are defined or not at any |
| 431 | /// given time in the matching process. |
| 432 | class FileCheckPatternContext { |
| 433 | friend class Pattern; |
| 434 | |
| 435 | private: |
| 436 | /// When matching a given pattern, this holds the value of all the string |
| 437 | /// variables defined in previous patterns. In a pattern, only the last |
| 438 | /// definition for a given variable is recorded in this table. |
| 439 | /// Back-references are used for uses after any the other definition. |
| 440 | StringMap<StringRef> GlobalVariableTable; |
| 441 | |
| 442 | /// Map of all string variables defined so far. Used at parse time to detect |
| 443 | /// a name conflict between a numeric variable and a string variable when |
| 444 | /// the former is defined on a later line than the latter. |
| 445 | StringMap<bool> DefinedVariableTable; |
| 446 | |
| 447 | /// When matching a given pattern, this holds the pointers to the classes |
| 448 | /// representing the numeric variables defined in previous patterns. When |
| 449 | /// matching a pattern all definitions for that pattern are recorded in the |
| 450 | /// NumericVariableDefs table in the Pattern instance of that pattern. |
| 451 | StringMap<NumericVariable *> GlobalNumericVariableTable; |
| 452 | |
| 453 | /// Pointer to the class instance representing the @LINE pseudo variable for |
| 454 | /// easily updating its value. |
| 455 | NumericVariable *LineVariable = nullptr; |
| 456 | |
| 457 | /// Vector holding pointers to all parsed numeric variables. Used to |
| 458 | /// automatically free them once they are guaranteed to no longer be used. |
| 459 | std::vector<std::unique_ptr<NumericVariable>> NumericVariables; |
| 460 | |
| 461 | /// Vector holding pointers to all parsed expressions. Used to automatically |
| 462 | /// free the expressions once they are guaranteed to no longer be used. |
| 463 | std::vector<std::unique_ptr<Expression>> Expressions; |
| 464 | |
| 465 | /// Vector holding pointers to all substitutions. Used to automatically free |
| 466 | /// them once they are guaranteed to no longer be used. |
| 467 | std::vector<std::unique_ptr<Substitution>> Substitutions; |
| 468 | |
| 469 | public: |
| 470 | /// \returns the value of string variable \p VarName or an error if no such |
| 471 | /// variable has been defined. |
| 472 | LLVM_ABI_FOR_TEST Expected<StringRef> getPatternVarValue(StringRef VarName); |
| 473 | |
| 474 | /// Defines string and numeric variables from definitions given on the |
| 475 | /// command line, passed as a vector of [#]VAR=VAL strings in |
| 476 | /// \p CmdlineDefines. \returns an error list containing diagnostics against |
| 477 | /// \p SM for all definition parsing failures, if any, or Success otherwise. |
| 478 | LLVM_ABI_FOR_TEST Error |
| 479 | defineCmdlineVariables(ArrayRef<StringRef> CmdlineDefines, SourceMgr &SM); |
| 480 | |
| 481 | /// Create @LINE pseudo variable. Value is set when pattern are being |
| 482 | /// matched. |
| 483 | LLVM_ABI_FOR_TEST void createLineVariable(); |
| 484 | |
| 485 | /// Undefines local variables (variables whose name does not start with a '$' |
| 486 | /// sign), i.e. removes them from GlobalVariableTable and from |
| 487 | /// GlobalNumericVariableTable and also clears the value of numeric |
| 488 | /// variables. |
| 489 | LLVM_ABI_FOR_TEST void clearLocalVars(); |
| 490 | |
| 491 | private: |
| 492 | /// Makes a new numeric variable and registers it for destruction when the |
| 493 | /// context is destroyed. |
| 494 | template <class... Types> NumericVariable *makeNumericVariable(Types... args); |
| 495 | |
| 496 | /// Makes a new string substitution and registers it for destruction when the |
| 497 | /// context is destroyed. |
| 498 | Substitution *makeStringSubstitution(StringRef VarName, size_t InsertIdx); |
| 499 | |
| 500 | /// Makes a new numeric substitution and registers it for destruction when |
| 501 | /// the context is destroyed. |
| 502 | Substitution *makeNumericSubstitution(StringRef ExpressionStr, |
| 503 | std::unique_ptr<Expression> Expression, |
| 504 | size_t InsertIdx); |
| 505 | }; |
| 506 | |
| 507 | /// Class to represent an error holding a diagnostic with location information |
| 508 | /// used when printing it. |
| 509 | class ErrorDiagnostic : public ErrorInfo<ErrorDiagnostic> { |
| 510 | private: |
| 511 | SMDiagnostic Diagnostic; |
| 512 | SMRange Range; |
| 513 | |
| 514 | public: |
| 515 | LLVM_ABI_FOR_TEST static char ID; |
| 516 | |
| 517 | ErrorDiagnostic(SMDiagnostic &&Diag, SMRange Range) |
| 518 | : Diagnostic(Diag), Range(Range) {} |
| 519 | |
| 520 | std::error_code convertToErrorCode() const override { |
| 521 | return inconvertibleErrorCode(); |
| 522 | } |
| 523 | |
| 524 | /// Print diagnostic associated with this error when printing the error. |
| 525 | void log(raw_ostream &OS) const override { Diagnostic.print(ProgName: nullptr, S&: OS); } |
| 526 | |
| 527 | StringRef getMessage() const { return Diagnostic.getMessage(); } |
| 528 | SMRange getRange() const { return Range; } |
| 529 | |
| 530 | static Error get(const SourceMgr &SM, SMLoc Loc, const Twine &ErrMsg, |
| 531 | SMRange Range = {}) { |
| 532 | return make_error<ErrorDiagnostic>( |
| 533 | Args: SM.GetMessage(Loc, Kind: SourceMgr::DK_Error, Msg: ErrMsg), Args&: Range); |
| 534 | } |
| 535 | |
| 536 | static Error get(const SourceMgr &SM, StringRef Buffer, const Twine &ErrMsg) { |
| 537 | SMLoc Start = SMLoc::getFromPointer(Ptr: Buffer.data()); |
| 538 | SMLoc End = SMLoc::getFromPointer(Ptr: Buffer.data() + Buffer.size()); |
| 539 | return get(SM, Loc: Start, ErrMsg, Range: SMRange(Start, End)); |
| 540 | } |
| 541 | }; |
| 542 | |
| 543 | class NotFoundError : public ErrorInfo<NotFoundError> { |
| 544 | public: |
| 545 | LLVM_ABI_FOR_TEST static char ID; |
| 546 | |
| 547 | std::error_code convertToErrorCode() const override { |
| 548 | return inconvertibleErrorCode(); |
| 549 | } |
| 550 | |
| 551 | /// Print diagnostic associated with this error when printing the error. |
| 552 | void log(raw_ostream &OS) const override { |
| 553 | OS << "String not found in input" ; |
| 554 | } |
| 555 | }; |
| 556 | |
| 557 | /// An error that has already been reported. |
| 558 | /// |
| 559 | /// This class is designed to support a function whose callers may need to know |
| 560 | /// whether the function encountered and reported an error but never need to |
| 561 | /// know the nature of that error. For example, the function has a return type |
| 562 | /// of \c Error and always returns either \c ErrorReported or \c ErrorSuccess. |
| 563 | /// That interface is similar to that of a function returning bool to indicate |
| 564 | /// an error except, in the former case, (1) there is no confusion over polarity |
| 565 | /// and (2) the caller must either check the result or explicitly ignore it with |
| 566 | /// a call like \c consumeError. |
| 567 | class ErrorReported final : public ErrorInfo<ErrorReported> { |
| 568 | public: |
| 569 | static char ID; |
| 570 | |
| 571 | std::error_code convertToErrorCode() const override { |
| 572 | return inconvertibleErrorCode(); |
| 573 | } |
| 574 | |
| 575 | /// Print diagnostic associated with this error when printing the error. |
| 576 | void log(raw_ostream &OS) const override { |
| 577 | OS << "error previously reported" ; |
| 578 | } |
| 579 | |
| 580 | static inline Error reportedOrSuccess(bool HasErrorReported) { |
| 581 | if (HasErrorReported) |
| 582 | return make_error<ErrorReported>(); |
| 583 | return Error::success(); |
| 584 | } |
| 585 | }; |
| 586 | |
| 587 | class Pattern { |
| 588 | SMLoc PatternLoc; |
| 589 | |
| 590 | /// A fixed string to match as the pattern or empty if this pattern requires |
| 591 | /// a regex match. |
| 592 | StringRef FixedStr; |
| 593 | |
| 594 | /// A regex string to match as the pattern or empty if this pattern requires |
| 595 | /// a fixed string to match. |
| 596 | std::string RegExStr; |
| 597 | |
| 598 | /// Entries in this vector represent a substitution of a string variable or |
| 599 | /// an expression in the RegExStr regex at match time. For example, in the |
| 600 | /// case of a CHECK directive with the pattern "foo[[bar]]baz[[#N+1]]", |
| 601 | /// RegExStr will contain "foobaz" and we'll get two entries in this vector |
| 602 | /// that tells us to insert the value of string variable "bar" at offset 3 |
| 603 | /// and the value of expression "N+1" at offset 6. |
| 604 | std::vector<Substitution *> Substitutions; |
| 605 | |
| 606 | /// Maps names of string variables defined in a pattern to the number of |
| 607 | /// their parenthesis group in RegExStr capturing their last definition. |
| 608 | /// |
| 609 | /// E.g. for the pattern "foo[[bar:.*]]baz([[bar]][[QUUX]][[bar:.*]])", |
| 610 | /// RegExStr will be "foo(.*)baz(\1<quux value>(.*))" where <quux value> is |
| 611 | /// the value captured for QUUX on the earlier line where it was defined, and |
| 612 | /// VariableDefs will map "bar" to the third parenthesis group which captures |
| 613 | /// the second definition of "bar". |
| 614 | /// |
| 615 | /// Note: uses std::map rather than StringMap to be able to get the key when |
| 616 | /// iterating over values. |
| 617 | std::map<StringRef, unsigned> VariableDefs; |
| 618 | |
| 619 | /// Structure representing the definition of a numeric variable in a pattern. |
| 620 | /// It holds the pointer to the class instance holding the value and matching |
| 621 | /// format of the numeric variable whose value is being defined and the |
| 622 | /// number of the parenthesis group in RegExStr to capture that value. |
| 623 | struct NumericVariableMatch { |
| 624 | /// Pointer to class instance holding the value and matching format of the |
| 625 | /// numeric variable being defined. |
| 626 | NumericVariable *DefinedNumericVariable; |
| 627 | |
| 628 | /// Number of the parenthesis group in RegExStr that captures the value of |
| 629 | /// this numeric variable definition. |
| 630 | unsigned CaptureParenGroup; |
| 631 | }; |
| 632 | |
| 633 | /// Holds the number of the parenthesis group in RegExStr and pointer to the |
| 634 | /// corresponding NumericVariable class instance of all numeric variable |
| 635 | /// definitions. Used to set the matched value of all those variables. |
| 636 | StringMap<NumericVariableMatch> NumericVariableDefs; |
| 637 | |
| 638 | /// Pointer to a class instance holding the global state shared by all |
| 639 | /// patterns: |
| 640 | /// - separate tables with the values of live string and numeric variables |
| 641 | /// respectively at the start of any given CHECK line; |
| 642 | /// - table holding whether a string variable has been defined at any given |
| 643 | /// point during the parsing phase. |
| 644 | FileCheckPatternContext *Context; |
| 645 | |
| 646 | Check::FileCheckType CheckTy; |
| 647 | |
| 648 | /// Line number for this CHECK pattern or std::nullopt if it is an implicit |
| 649 | /// pattern. Used to determine whether a variable definition is made on an |
| 650 | /// earlier line to the one with this CHECK. |
| 651 | std::optional<size_t> LineNumber; |
| 652 | |
| 653 | /// Ignore case while matching if set to true. |
| 654 | bool IgnoreCase = false; |
| 655 | |
| 656 | public: |
| 657 | Pattern(Check::FileCheckType Ty, FileCheckPatternContext *Context, |
| 658 | std::optional<size_t> Line = std::nullopt) |
| 659 | : Context(Context), CheckTy(Ty), LineNumber(Line) {} |
| 660 | |
| 661 | /// \returns the location in source code. |
| 662 | SMLoc getLoc() const { return PatternLoc; } |
| 663 | |
| 664 | /// \returns the pointer to the global state for all patterns in this |
| 665 | /// FileCheck instance. |
| 666 | FileCheckPatternContext *getContext() const { return Context; } |
| 667 | |
| 668 | /// \returns whether \p C is a valid first character for a variable name. |
| 669 | LLVM_ABI_FOR_TEST static bool isValidVarNameStart(char C); |
| 670 | |
| 671 | /// Parsing information about a variable. |
| 672 | struct VariableProperties { |
| 673 | StringRef Name; |
| 674 | bool IsPseudo; |
| 675 | }; |
| 676 | |
| 677 | /// Parses the string at the start of \p Str for a variable name. \returns |
| 678 | /// a VariableProperties structure holding the variable name and whether it |
| 679 | /// is the name of a pseudo variable, or an error holding a diagnostic |
| 680 | /// against \p SM if parsing fail. If parsing was successful, also strips |
| 681 | /// \p Str from the variable name. |
| 682 | LLVM_ABI_FOR_TEST static Expected<VariableProperties> |
| 683 | parseVariable(StringRef &Str, const SourceMgr &SM); |
| 684 | /// Parses \p Expr for a numeric substitution block at line \p LineNumber, |
| 685 | /// or before input is parsed if \p LineNumber is None. Parameter |
| 686 | /// \p IsLegacyLineExpr indicates whether \p Expr should be a legacy @LINE |
| 687 | /// expression and \p Context points to the class instance holding the live |
| 688 | /// string and numeric variables. \returns a pointer to the class instance |
| 689 | /// representing the expression whose value must be substitued, or an error |
| 690 | /// holding a diagnostic against \p SM if parsing fails. If substitution was |
| 691 | /// successful, sets \p DefinedNumericVariable to point to the class |
| 692 | /// representing the numeric variable defined in this numeric substitution |
| 693 | /// block, or std::nullopt if this block does not define any variable. |
| 694 | LLVM_ABI_FOR_TEST static Expected<std::unique_ptr<Expression>> |
| 695 | parseNumericSubstitutionBlock( |
| 696 | StringRef Expr, std::optional<NumericVariable *> &DefinedNumericVariable, |
| 697 | bool IsLegacyLineExpr, std::optional<size_t> LineNumber, |
| 698 | FileCheckPatternContext *Context, const SourceMgr &SM); |
| 699 | /// Parses the pattern in \p PatternStr and initializes this Pattern instance |
| 700 | /// accordingly. |
| 701 | /// |
| 702 | /// \p Prefix provides which prefix is being matched, \p Req describes the |
| 703 | /// global options that influence the parsing such as whitespace |
| 704 | /// canonicalization, \p SM provides the SourceMgr used for error reports. |
| 705 | /// \returns true in case of an error, false otherwise. |
| 706 | LLVM_ABI_FOR_TEST bool parsePattern(StringRef PatternStr, StringRef Prefix, |
| 707 | SourceMgr &SM, |
| 708 | const FileCheckRequest &Req); |
| 709 | struct Match { |
| 710 | size_t Pos; |
| 711 | size_t Len; |
| 712 | }; |
| 713 | struct MatchResult { |
| 714 | std::optional<Match> TheMatch; |
| 715 | Error TheError; |
| 716 | MatchResult(size_t MatchPos, size_t MatchLen, Error E) |
| 717 | : TheMatch(Match{.Pos: MatchPos, .Len: MatchLen}), TheError(std::move(E)) {} |
| 718 | MatchResult(Match M, Error E) : TheMatch(M), TheError(std::move(E)) {} |
| 719 | MatchResult(Error E) : TheError(std::move(E)) {} |
| 720 | }; |
| 721 | /// Matches the pattern string against the input buffer \p Buffer. |
| 722 | /// |
| 723 | /// \returns either (1) an error resulting in no match or (2) a match possibly |
| 724 | /// with an error encountered while processing the match. |
| 725 | /// |
| 726 | /// The GlobalVariableTable StringMap in the FileCheckPatternContext class |
| 727 | /// instance provides the current values of FileCheck string variables and is |
| 728 | /// updated if this match defines new values. Likewise, the |
| 729 | /// GlobalNumericVariableTable StringMap in the same class provides the |
| 730 | /// current values of FileCheck numeric variables and is updated if this |
| 731 | /// match defines new numeric values. |
| 732 | LLVM_ABI_FOR_TEST MatchResult match(StringRef Buffer, |
| 733 | const SourceMgr &SM) const; |
| 734 | /// Prints the value of successful substitutions. |
| 735 | void printSubstitutions(const SourceMgr &SM, StringRef Buffer, |
| 736 | SMRange MatchRange, FileCheckDiag::MatchType MatchTy, |
| 737 | std::vector<FileCheckDiag> *Diags) const; |
| 738 | void printFuzzyMatch(const SourceMgr &SM, StringRef Buffer, |
| 739 | std::vector<FileCheckDiag> *Diags) const; |
| 740 | |
| 741 | bool hasVariable() const { |
| 742 | return !(Substitutions.empty() && VariableDefs.empty()); |
| 743 | } |
| 744 | LLVM_ABI_FOR_TEST void |
| 745 | printVariableDefs(const SourceMgr &SM, FileCheckDiag::MatchType MatchTy, |
| 746 | std::vector<FileCheckDiag> *Diags) const; |
| 747 | |
| 748 | Check::FileCheckType getCheckTy() const { return CheckTy; } |
| 749 | |
| 750 | int getCount() const { return CheckTy.getCount(); } |
| 751 | |
| 752 | private: |
| 753 | bool AddRegExToRegEx(StringRef RS, unsigned &CurParen, SourceMgr &SM); |
| 754 | void AddBackrefToRegEx(unsigned BackrefNum); |
| 755 | /// Computes an arbitrary estimate for the quality of matching this pattern |
| 756 | /// at the start of \p Buffer; a distance of zero should correspond to a |
| 757 | /// perfect match. |
| 758 | unsigned computeMatchDistance(StringRef Buffer) const; |
| 759 | /// Finds the closing sequence of a regex variable usage or definition. |
| 760 | /// |
| 761 | /// \p Str has to point in the beginning of the definition (right after the |
| 762 | /// opening sequence). \p SM holds the SourceMgr used for error reporting. |
| 763 | /// \returns the offset of the closing sequence within Str, or npos if it |
| 764 | /// was not found. |
| 765 | static size_t FindRegexVarEnd(StringRef Str, SourceMgr &SM); |
| 766 | |
| 767 | /// Parses \p Expr for the name of a numeric variable to be defined at line |
| 768 | /// \p LineNumber, or before input is parsed if \p LineNumber is None. |
| 769 | /// \returns a pointer to the class instance representing that variable, |
| 770 | /// creating it if needed, or an error holding a diagnostic against \p SM |
| 771 | /// should defining such a variable be invalid. |
| 772 | static Expected<NumericVariable *> parseNumericVariableDefinition( |
| 773 | StringRef &Expr, FileCheckPatternContext *Context, |
| 774 | std::optional<size_t> LineNumber, ExpressionFormat ImplicitFormat, |
| 775 | const SourceMgr &SM); |
| 776 | /// Parses \p Name as a (pseudo if \p IsPseudo is true) numeric variable use |
| 777 | /// at line \p LineNumber, or before input is parsed if \p LineNumber is |
| 778 | /// None. Parameter \p Context points to the class instance holding the live |
| 779 | /// string and numeric variables. \returns the pointer to the class instance |
| 780 | /// representing that variable if successful, or an error holding a |
| 781 | /// diagnostic against \p SM otherwise. |
| 782 | static Expected<std::unique_ptr<NumericVariableUse>> parseNumericVariableUse( |
| 783 | StringRef Name, bool IsPseudo, std::optional<size_t> LineNumber, |
| 784 | FileCheckPatternContext *Context, const SourceMgr &SM); |
| 785 | enum class AllowedOperand { LineVar, LegacyLiteral, Any }; |
| 786 | /// Parses \p Expr for use of a numeric operand at line \p LineNumber, or |
| 787 | /// before input is parsed if \p LineNumber is None. Accepts literal values, |
| 788 | /// numeric variables and function calls, depending on the value of \p AO. |
| 789 | /// \p MaybeInvalidConstraint indicates whether the text being parsed could |
| 790 | /// be an invalid constraint. \p Context points to the class instance holding |
| 791 | /// the live string and numeric variables. \returns the class representing |
| 792 | /// that operand in the AST of the expression or an error holding a |
| 793 | /// diagnostic against \p SM otherwise. If \p Expr starts with a "(" this |
| 794 | /// function will attempt to parse a parenthesized expression. |
| 795 | static Expected<std::unique_ptr<ExpressionAST>> |
| 796 | parseNumericOperand(StringRef &Expr, AllowedOperand AO, bool ConstraintParsed, |
| 797 | std::optional<size_t> LineNumber, |
| 798 | FileCheckPatternContext *Context, const SourceMgr &SM); |
| 799 | /// Parses and updates \p RemainingExpr for a binary operation at line |
| 800 | /// \p LineNumber, or before input is parsed if \p LineNumber is None. The |
| 801 | /// left operand of this binary operation is given in \p LeftOp and \p Expr |
| 802 | /// holds the string for the full expression, including the left operand. |
| 803 | /// Parameter \p IsLegacyLineExpr indicates whether we are parsing a legacy |
| 804 | /// @LINE expression. Parameter \p Context points to the class instance |
| 805 | /// holding the live string and numeric variables. \returns the class |
| 806 | /// representing the binary operation in the AST of the expression, or an |
| 807 | /// error holding a diagnostic against \p SM otherwise. |
| 808 | static Expected<std::unique_ptr<ExpressionAST>> |
| 809 | parseBinop(StringRef Expr, StringRef &RemainingExpr, |
| 810 | std::unique_ptr<ExpressionAST> LeftOp, bool IsLegacyLineExpr, |
| 811 | std::optional<size_t> LineNumber, FileCheckPatternContext *Context, |
| 812 | const SourceMgr &SM); |
| 813 | |
| 814 | /// Parses a parenthesized expression inside \p Expr at line \p LineNumber, or |
| 815 | /// before input is parsed if \p LineNumber is None. \p Expr must start with |
| 816 | /// a '('. Accepts both literal values and numeric variables. Parameter \p |
| 817 | /// Context points to the class instance holding the live string and numeric |
| 818 | /// variables. \returns the class representing that operand in the AST of the |
| 819 | /// expression or an error holding a diagnostic against \p SM otherwise. |
| 820 | static Expected<std::unique_ptr<ExpressionAST>> |
| 821 | parseParenExpr(StringRef &Expr, std::optional<size_t> LineNumber, |
| 822 | FileCheckPatternContext *Context, const SourceMgr &SM); |
| 823 | |
| 824 | /// Parses \p Expr for an argument list belonging to a call to function \p |
| 825 | /// FuncName at line \p LineNumber, or before input is parsed if \p LineNumber |
| 826 | /// is None. Parameter \p FuncLoc is the source location used for diagnostics. |
| 827 | /// Parameter \p Context points to the class instance holding the live string |
| 828 | /// and numeric variables. \returns the class representing that call in the |
| 829 | /// AST of the expression or an error holding a diagnostic against \p SM |
| 830 | /// otherwise. |
| 831 | static Expected<std::unique_ptr<ExpressionAST>> |
| 832 | parseCallExpr(StringRef &Expr, StringRef FuncName, |
| 833 | std::optional<size_t> LineNumber, |
| 834 | FileCheckPatternContext *Context, const SourceMgr &SM); |
| 835 | }; |
| 836 | |
| 837 | //===----------------------------------------------------------------------===// |
| 838 | // Check Strings. |
| 839 | //===----------------------------------------------------------------------===// |
| 840 | |
| 841 | /// A check that we found in the input file. |
| 842 | struct FileCheckString { |
| 843 | /// The pattern to match. |
| 844 | Pattern Pat; |
| 845 | |
| 846 | /// Which prefix name this check matched. |
| 847 | StringRef Prefix; |
| 848 | |
| 849 | /// The location in the match file that the check string was specified. |
| 850 | SMLoc Loc; |
| 851 | |
| 852 | /// Hold the information about the DAG/NOT strings in the program, which are |
| 853 | /// not explicitly stored otherwise. This allows for better and more accurate |
| 854 | /// diagnostic messages. |
| 855 | struct DagNotPrefixInfo { |
| 856 | Pattern DagNotPat; |
| 857 | StringRef DagNotPrefix; |
| 858 | |
| 859 | DagNotPrefixInfo(const Pattern &P, StringRef S) |
| 860 | : DagNotPat(P), DagNotPrefix(S) {} |
| 861 | }; |
| 862 | |
| 863 | /// Hold the DAG/NOT strings occurring in the input file. |
| 864 | std::vector<DagNotPrefixInfo> DagNotStrings; |
| 865 | |
| 866 | FileCheckString(Pattern &&P, StringRef S, SMLoc L, |
| 867 | std::vector<DagNotPrefixInfo> &&D) |
| 868 | : Pat(std::move(P)), Prefix(S), Loc(L), DagNotStrings(std::move(D)) {} |
| 869 | |
| 870 | /// Matches check string and its "not strings" and/or "dag strings". |
| 871 | size_t Check(const SourceMgr &SM, StringRef Buffer, bool IsLabelScanMode, |
| 872 | size_t &MatchLen, FileCheckRequest &Req, |
| 873 | std::vector<FileCheckDiag> *Diags) const; |
| 874 | |
| 875 | /// Verifies that there is a single line in the given \p Buffer. Errors are |
| 876 | /// reported against \p SM. |
| 877 | bool CheckNext(const SourceMgr &SM, StringRef Buffer) const; |
| 878 | /// Verifies that there is no newline in the given \p Buffer. Errors are |
| 879 | /// reported against \p SM. |
| 880 | bool CheckSame(const SourceMgr &SM, StringRef Buffer) const; |
| 881 | /// Verifies that none of the strings in \p NotStrings are found in the given |
| 882 | /// \p Buffer. Errors are reported against \p SM and diagnostics recorded in |
| 883 | /// \p Diags according to the verbosity level set in \p Req. |
| 884 | bool CheckNot(const SourceMgr &SM, StringRef Buffer, |
| 885 | const std::vector<const DagNotPrefixInfo *> &NotStrings, |
| 886 | const FileCheckRequest &Req, |
| 887 | std::vector<FileCheckDiag> *Diags) const; |
| 888 | /// Matches "dag strings" and their mixed "not strings". |
| 889 | size_t CheckDag(const SourceMgr &SM, StringRef Buffer, |
| 890 | std::vector<const DagNotPrefixInfo *> &NotStrings, |
| 891 | const FileCheckRequest &Req, |
| 892 | std::vector<FileCheckDiag> *Diags) const; |
| 893 | }; |
| 894 | |
| 895 | } // namespace llvm |
| 896 | |
| 897 | #endif |
| 898 | |