860 lines
35 KiB
C++
860 lines
35 KiB
C++
//===-- FileCheckImpl.h - Private FileCheck Interface ------------*- C++ -*-==//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
// This file defines the private interfaces of FileCheck. Its purpose is to
|
|
// allow unit testing of FileCheck and to separate the interface from the
|
|
// implementation. It is only meant to be used by FileCheck.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#ifndef LLVM_LIB_FILECHECK_FILECHECKIMPL_H
|
|
#define LLVM_LIB_FILECHECK_FILECHECKIMPL_H
|
|
|
|
#include "llvm/ADT/Optional.h"
|
|
#include "llvm/ADT/StringMap.h"
|
|
#include "llvm/ADT/StringRef.h"
|
|
#include "llvm/FileCheck/FileCheck.h"
|
|
#include "llvm/Support/Error.h"
|
|
#include "llvm/Support/SourceMgr.h"
|
|
#include <map>
|
|
#include <string>
|
|
#include <vector>
|
|
|
|
namespace llvm {
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// Numeric substitution handling code.
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
class ExpressionValue;
|
|
|
|
/// Type representing the format an expression value should be textualized into
|
|
/// for matching. Used to represent both explicit format specifiers as well as
|
|
/// implicit format from using numeric variables.
|
|
struct ExpressionFormat {
|
|
enum class Kind {
|
|
/// Denote absence of format. Used for implicit format of literals and
|
|
/// empty expressions.
|
|
NoFormat,
|
|
/// Value is an unsigned integer and should be printed as a decimal number.
|
|
Unsigned,
|
|
/// Value is a signed integer and should be printed as a decimal number.
|
|
Signed,
|
|
/// Value should be printed as an uppercase hex number.
|
|
HexUpper,
|
|
/// Value should be printed as a lowercase hex number.
|
|
HexLower
|
|
};
|
|
|
|
private:
|
|
Kind Value;
|
|
unsigned Precision = 0;
|
|
|
|
public:
|
|
/// Evaluates a format to true if it can be used in a match.
|
|
explicit operator bool() const { return Value != Kind::NoFormat; }
|
|
|
|
/// Define format equality: formats are equal if neither is NoFormat and
|
|
/// their kinds and precision are the same.
|
|
bool operator==(const ExpressionFormat &Other) const {
|
|
return Value != Kind::NoFormat && Value == Other.Value &&
|
|
Precision == Other.Precision;
|
|
}
|
|
|
|
bool operator!=(const ExpressionFormat &Other) const {
|
|
return !(*this == Other);
|
|
}
|
|
|
|
bool operator==(Kind OtherValue) const { return Value == OtherValue; }
|
|
|
|
bool operator!=(Kind OtherValue) const { return !(*this == OtherValue); }
|
|
|
|
/// \returns the format specifier corresponding to this format as a string.
|
|
StringRef toString() const;
|
|
|
|
ExpressionFormat() : Value(Kind::NoFormat){};
|
|
explicit ExpressionFormat(Kind Value) : Value(Value), Precision(0){};
|
|
explicit ExpressionFormat(Kind Value, unsigned Precision)
|
|
: Value(Value), Precision(Precision){};
|
|
|
|
/// \returns a wildcard regular expression string that matches any value in
|
|
/// the format represented by this instance and no other value, or an error
|
|
/// if the format is NoFormat.
|
|
Expected<std::string> getWildcardRegex() const;
|
|
|
|
/// \returns the string representation of \p Value in the format represented
|
|
/// by this instance, or an error if conversion to this format failed or the
|
|
/// format is NoFormat.
|
|
Expected<std::string> getMatchingString(ExpressionValue Value) const;
|
|
|
|
/// \returns the value corresponding to string representation \p StrVal
|
|
/// according to the matching format represented by this instance or an error
|
|
/// with diagnostic against \p SM if \p StrVal does not correspond to a valid
|
|
/// and representable value.
|
|
Expected<ExpressionValue> valueFromStringRepr(StringRef StrVal,
|
|
const SourceMgr &SM) const;
|
|
};
|
|
|
|
/// Class to represent an overflow error that might result when manipulating a
|
|
/// value.
|
|
class OverflowError : public ErrorInfo<OverflowError> {
|
|
public:
|
|
static char ID;
|
|
|
|
std::error_code convertToErrorCode() const override {
|
|
return std::make_error_code(std::errc::value_too_large);
|
|
}
|
|
|
|
void log(raw_ostream &OS) const override { OS << "overflow error"; }
|
|
};
|
|
|
|
/// Class representing a numeric value.
|
|
class ExpressionValue {
|
|
private:
|
|
uint64_t Value;
|
|
bool Negative;
|
|
|
|
public:
|
|
template <class T>
|
|
explicit ExpressionValue(T Val) : Value(Val), Negative(Val < 0) {}
|
|
|
|
bool operator==(const ExpressionValue &Other) const {
|
|
return Value == Other.Value && isNegative() == Other.isNegative();
|
|
}
|
|
|
|
bool operator!=(const ExpressionValue &Other) const {
|
|
return !(*this == Other);
|
|
}
|
|
|
|
/// Returns true if value is signed and negative, false otherwise.
|
|
bool isNegative() const {
|
|
assert((Value != 0 || !Negative) && "Unexpected negative zero!");
|
|
return Negative;
|
|
}
|
|
|
|
/// \returns the value as a signed integer or an error if the value is out of
|
|
/// range.
|
|
Expected<int64_t> getSignedValue() const;
|
|
|
|
/// \returns the value as an unsigned integer or an error if the value is out
|
|
/// of range.
|
|
Expected<uint64_t> getUnsignedValue() const;
|
|
|
|
/// \returns an unsigned ExpressionValue instance whose value is the absolute
|
|
/// value to this object's value.
|
|
ExpressionValue getAbsolute() const;
|
|
};
|
|
|
|
/// Performs operation and \returns its result or an error in case of failure,
|
|
/// such as if an overflow occurs.
|
|
Expected<ExpressionValue> operator+(const ExpressionValue &Lhs,
|
|
const ExpressionValue &Rhs);
|
|
Expected<ExpressionValue> operator-(const ExpressionValue &Lhs,
|
|
const ExpressionValue &Rhs);
|
|
Expected<ExpressionValue> operator*(const ExpressionValue &Lhs,
|
|
const ExpressionValue &Rhs);
|
|
Expected<ExpressionValue> operator/(const ExpressionValue &Lhs,
|
|
const ExpressionValue &Rhs);
|
|
Expected<ExpressionValue> max(const ExpressionValue &Lhs,
|
|
const ExpressionValue &Rhs);
|
|
Expected<ExpressionValue> min(const ExpressionValue &Lhs,
|
|
const ExpressionValue &Rhs);
|
|
|
|
/// Base class representing the AST of a given expression.
|
|
class ExpressionAST {
|
|
private:
|
|
StringRef ExpressionStr;
|
|
|
|
public:
|
|
ExpressionAST(StringRef ExpressionStr) : ExpressionStr(ExpressionStr) {}
|
|
|
|
virtual ~ExpressionAST() = default;
|
|
|
|
StringRef getExpressionStr() const { return ExpressionStr; }
|
|
|
|
/// Evaluates and \returns the value of the expression represented by this
|
|
/// AST or an error if evaluation fails.
|
|
virtual Expected<ExpressionValue> eval() const = 0;
|
|
|
|
/// \returns either the implicit format of this AST, a diagnostic against
|
|
/// \p SM if implicit formats of the AST's components conflict, or NoFormat
|
|
/// if the AST has no implicit format (e.g. AST is made up of a single
|
|
/// literal).
|
|
virtual Expected<ExpressionFormat>
|
|
getImplicitFormat(const SourceMgr &SM) const {
|
|
return ExpressionFormat();
|
|
}
|
|
};
|
|
|
|
/// Class representing an unsigned literal in the AST of an expression.
|
|
class ExpressionLiteral : public ExpressionAST {
|
|
private:
|
|
/// Actual value of the literal.
|
|
ExpressionValue Value;
|
|
|
|
public:
|
|
template <class T>
|
|
explicit ExpressionLiteral(StringRef ExpressionStr, T Val)
|
|
: ExpressionAST(ExpressionStr), Value(Val) {}
|
|
|
|
/// \returns the literal's value.
|
|
Expected<ExpressionValue> eval() const override { return Value; }
|
|
};
|
|
|
|
/// Class to represent an undefined variable error, which quotes that
|
|
/// variable's name when printed.
|
|
class UndefVarError : public ErrorInfo<UndefVarError> {
|
|
private:
|
|
StringRef VarName;
|
|
|
|
public:
|
|
static char ID;
|
|
|
|
UndefVarError(StringRef VarName) : VarName(VarName) {}
|
|
|
|
StringRef getVarName() const { return VarName; }
|
|
|
|
std::error_code convertToErrorCode() const override {
|
|
return inconvertibleErrorCode();
|
|
}
|
|
|
|
/// Print name of variable associated with this error.
|
|
void log(raw_ostream &OS) const override {
|
|
OS << "\"";
|
|
OS.write_escaped(VarName) << "\"";
|
|
}
|
|
};
|
|
|
|
/// Class representing an expression and its matching format.
|
|
class Expression {
|
|
private:
|
|
/// Pointer to AST of the expression.
|
|
std::unique_ptr<ExpressionAST> AST;
|
|
|
|
/// Format to use (e.g. hex upper case letters) when matching the value.
|
|
ExpressionFormat Format;
|
|
|
|
public:
|
|
/// Generic constructor for an expression represented by the given \p AST and
|
|
/// whose matching format is \p Format.
|
|
Expression(std::unique_ptr<ExpressionAST> AST, ExpressionFormat Format)
|
|
: AST(std::move(AST)), Format(Format) {}
|
|
|
|
/// \returns pointer to AST of the expression. Pointer is guaranteed to be
|
|
/// valid as long as this object is.
|
|
ExpressionAST *getAST() const { return AST.get(); }
|
|
|
|
ExpressionFormat getFormat() const { return Format; }
|
|
};
|
|
|
|
/// Class representing a numeric variable and its associated current value.
|
|
class NumericVariable {
|
|
private:
|
|
/// Name of the numeric variable.
|
|
StringRef Name;
|
|
|
|
/// Format to use for expressions using this variable without an explicit
|
|
/// format.
|
|
ExpressionFormat ImplicitFormat;
|
|
|
|
/// Value of numeric variable, if defined, or None otherwise.
|
|
Optional<ExpressionValue> Value;
|
|
|
|
/// The input buffer's string from which Value was parsed, or None. See
|
|
/// comments on getStringValue for a discussion of the None case.
|
|
Optional<StringRef> StrValue;
|
|
|
|
/// Line number where this variable is defined, or None if defined before
|
|
/// input is parsed. Used to determine whether a variable is defined on the
|
|
/// same line as a given use.
|
|
Optional<size_t> DefLineNumber;
|
|
|
|
public:
|
|
/// Constructor for a variable \p Name with implicit format \p ImplicitFormat
|
|
/// defined at line \p DefLineNumber or defined before input is parsed if
|
|
/// \p DefLineNumber is None.
|
|
explicit NumericVariable(StringRef Name, ExpressionFormat ImplicitFormat,
|
|
Optional<size_t> DefLineNumber = None)
|
|
: Name(Name), ImplicitFormat(ImplicitFormat),
|
|
DefLineNumber(DefLineNumber) {}
|
|
|
|
/// \returns name of this numeric variable.
|
|
StringRef getName() const { return Name; }
|
|
|
|
/// \returns implicit format of this numeric variable.
|
|
ExpressionFormat getImplicitFormat() const { return ImplicitFormat; }
|
|
|
|
/// \returns this variable's value.
|
|
Optional<ExpressionValue> getValue() const { return Value; }
|
|
|
|
/// \returns the input buffer's string from which this variable's value was
|
|
/// parsed, or None if the value is not yet defined or was not parsed from the
|
|
/// input buffer. For example, the value of @LINE is not parsed from the
|
|
/// input buffer, and some numeric variables are parsed from the command
|
|
/// line instead.
|
|
Optional<StringRef> getStringValue() const { return StrValue; }
|
|
|
|
/// Sets value of this numeric variable to \p NewValue, and sets the input
|
|
/// buffer string from which it was parsed to \p NewStrValue. See comments on
|
|
/// getStringValue for a discussion of when the latter can be None.
|
|
void setValue(ExpressionValue NewValue,
|
|
Optional<StringRef> NewStrValue = None) {
|
|
Value = NewValue;
|
|
StrValue = NewStrValue;
|
|
}
|
|
|
|
/// Clears value of this numeric variable, regardless of whether it is
|
|
/// currently defined or not.
|
|
void clearValue() {
|
|
Value = None;
|
|
StrValue = None;
|
|
}
|
|
|
|
/// \returns the line number where this variable is defined, if any, or None
|
|
/// if defined before input is parsed.
|
|
Optional<size_t> getDefLineNumber() const { return DefLineNumber; }
|
|
};
|
|
|
|
/// Class representing the use of a numeric variable in the AST of an
|
|
/// expression.
|
|
class NumericVariableUse : public ExpressionAST {
|
|
private:
|
|
/// Pointer to the class instance for the variable this use is about.
|
|
NumericVariable *Variable;
|
|
|
|
public:
|
|
NumericVariableUse(StringRef Name, NumericVariable *Variable)
|
|
: ExpressionAST(Name), Variable(Variable) {}
|
|
/// \returns the value of the variable referenced by this instance.
|
|
Expected<ExpressionValue> eval() const override;
|
|
|
|
/// \returns implicit format of this numeric variable.
|
|
Expected<ExpressionFormat>
|
|
getImplicitFormat(const SourceMgr &SM) const override {
|
|
return Variable->getImplicitFormat();
|
|
}
|
|
};
|
|
|
|
/// Type of functions evaluating a given binary operation.
|
|
using binop_eval_t = Expected<ExpressionValue> (*)(const ExpressionValue &,
|
|
const ExpressionValue &);
|
|
|
|
/// Class representing a single binary operation in the AST of an expression.
|
|
class BinaryOperation : public ExpressionAST {
|
|
private:
|
|
/// Left operand.
|
|
std::unique_ptr<ExpressionAST> LeftOperand;
|
|
|
|
/// Right operand.
|
|
std::unique_ptr<ExpressionAST> RightOperand;
|
|
|
|
/// Pointer to function that can evaluate this binary operation.
|
|
binop_eval_t EvalBinop;
|
|
|
|
public:
|
|
BinaryOperation(StringRef ExpressionStr, binop_eval_t EvalBinop,
|
|
std::unique_ptr<ExpressionAST> LeftOp,
|
|
std::unique_ptr<ExpressionAST> RightOp)
|
|
: ExpressionAST(ExpressionStr), EvalBinop(EvalBinop) {
|
|
LeftOperand = std::move(LeftOp);
|
|
RightOperand = std::move(RightOp);
|
|
}
|
|
|
|
/// Evaluates the value of the binary operation represented by this AST,
|
|
/// using EvalBinop on the result of recursively evaluating the operands.
|
|
/// \returns the expression value or an error if an undefined numeric
|
|
/// variable is used in one of the operands.
|
|
Expected<ExpressionValue> eval() const override;
|
|
|
|
/// \returns the implicit format of this AST, if any, a diagnostic against
|
|
/// \p SM if the implicit formats of the AST's components conflict, or no
|
|
/// format if the AST has no implicit format (e.g. AST is made of a single
|
|
/// literal).
|
|
Expected<ExpressionFormat>
|
|
getImplicitFormat(const SourceMgr &SM) const override;
|
|
};
|
|
|
|
class FileCheckPatternContext;
|
|
|
|
/// Class representing a substitution to perform in the RegExStr string.
|
|
class Substitution {
|
|
protected:
|
|
/// Pointer to a class instance holding, among other things, the table with
|
|
/// the values of live string variables at the start of any given CHECK line.
|
|
/// Used for substituting string variables with the text they were defined
|
|
/// as. Expressions are linked to the numeric variables they use at
|
|
/// parse time and directly access the value of the numeric variable to
|
|
/// evaluate their value.
|
|
FileCheckPatternContext *Context;
|
|
|
|
/// The string that needs to be substituted for something else. For a
|
|
/// string variable this is its name, otherwise this is the whole expression.
|
|
StringRef FromStr;
|
|
|
|
// Index in RegExStr of where to do the substitution.
|
|
size_t InsertIdx;
|
|
|
|
public:
|
|
Substitution(FileCheckPatternContext *Context, StringRef VarName,
|
|
size_t InsertIdx)
|
|
: Context(Context), FromStr(VarName), InsertIdx(InsertIdx) {}
|
|
|
|
virtual ~Substitution() = default;
|
|
|
|
/// \returns the string to be substituted for something else.
|
|
StringRef getFromString() const { return FromStr; }
|
|
|
|
/// \returns the index where the substitution is to be performed in RegExStr.
|
|
size_t getIndex() const { return InsertIdx; }
|
|
|
|
/// \returns a string containing the result of the substitution represented
|
|
/// by this class instance or an error if substitution failed.
|
|
virtual Expected<std::string> getResult() const = 0;
|
|
};
|
|
|
|
class StringSubstitution : public Substitution {
|
|
public:
|
|
StringSubstitution(FileCheckPatternContext *Context, StringRef VarName,
|
|
size_t InsertIdx)
|
|
: Substitution(Context, VarName, InsertIdx) {}
|
|
|
|
/// \returns the text that the string variable in this substitution matched
|
|
/// when defined, or an error if the variable is undefined.
|
|
Expected<std::string> getResult() const override;
|
|
};
|
|
|
|
class NumericSubstitution : public Substitution {
|
|
private:
|
|
/// Pointer to the class representing the expression whose value is to be
|
|
/// substituted.
|
|
std::unique_ptr<Expression> ExpressionPointer;
|
|
|
|
public:
|
|
NumericSubstitution(FileCheckPatternContext *Context, StringRef ExpressionStr,
|
|
std::unique_ptr<Expression> ExpressionPointer,
|
|
size_t InsertIdx)
|
|
: Substitution(Context, ExpressionStr, InsertIdx),
|
|
ExpressionPointer(std::move(ExpressionPointer)) {}
|
|
|
|
/// \returns a string containing the result of evaluating the expression in
|
|
/// this substitution, or an error if evaluation failed.
|
|
Expected<std::string> getResult() const override;
|
|
};
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// Pattern handling code.
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
/// Class holding the Pattern global state, shared by all patterns: tables
|
|
/// holding values of variables and whether they are defined or not at any
|
|
/// given time in the matching process.
|
|
class FileCheckPatternContext {
|
|
friend class Pattern;
|
|
|
|
private:
|
|
/// When matching a given pattern, this holds the value of all the string
|
|
/// variables defined in previous patterns. In a pattern, only the last
|
|
/// definition for a given variable is recorded in this table.
|
|
/// Back-references are used for uses after any the other definition.
|
|
StringMap<StringRef> GlobalVariableTable;
|
|
|
|
/// Map of all string variables defined so far. Used at parse time to detect
|
|
/// a name conflict between a numeric variable and a string variable when
|
|
/// the former is defined on a later line than the latter.
|
|
StringMap<bool> DefinedVariableTable;
|
|
|
|
/// When matching a given pattern, this holds the pointers to the classes
|
|
/// representing the numeric variables defined in previous patterns. When
|
|
/// matching a pattern all definitions for that pattern are recorded in the
|
|
/// NumericVariableDefs table in the Pattern instance of that pattern.
|
|
StringMap<NumericVariable *> GlobalNumericVariableTable;
|
|
|
|
/// Pointer to the class instance representing the @LINE pseudo variable for
|
|
/// easily updating its value.
|
|
NumericVariable *LineVariable = nullptr;
|
|
|
|
/// Vector holding pointers to all parsed numeric variables. Used to
|
|
/// automatically free them once they are guaranteed to no longer be used.
|
|
std::vector<std::unique_ptr<NumericVariable>> NumericVariables;
|
|
|
|
/// Vector holding pointers to all parsed expressions. Used to automatically
|
|
/// free the expressions once they are guaranteed to no longer be used.
|
|
std::vector<std::unique_ptr<Expression>> Expressions;
|
|
|
|
/// Vector holding pointers to all substitutions. Used to automatically free
|
|
/// them once they are guaranteed to no longer be used.
|
|
std::vector<std::unique_ptr<Substitution>> Substitutions;
|
|
|
|
public:
|
|
/// \returns the value of string variable \p VarName or an error if no such
|
|
/// variable has been defined.
|
|
Expected<StringRef> getPatternVarValue(StringRef VarName);
|
|
|
|
/// Defines string and numeric variables from definitions given on the
|
|
/// command line, passed as a vector of [#]VAR=VAL strings in
|
|
/// \p CmdlineDefines. \returns an error list containing diagnostics against
|
|
/// \p SM for all definition parsing failures, if any, or Success otherwise.
|
|
Error defineCmdlineVariables(ArrayRef<StringRef> CmdlineDefines,
|
|
SourceMgr &SM);
|
|
|
|
/// Create @LINE pseudo variable. Value is set when pattern are being
|
|
/// matched.
|
|
void createLineVariable();
|
|
|
|
/// Undefines local variables (variables whose name does not start with a '$'
|
|
/// sign), i.e. removes them from GlobalVariableTable and from
|
|
/// GlobalNumericVariableTable and also clears the value of numeric
|
|
/// variables.
|
|
void clearLocalVars();
|
|
|
|
private:
|
|
/// Makes a new numeric variable and registers it for destruction when the
|
|
/// context is destroyed.
|
|
template <class... Types> NumericVariable *makeNumericVariable(Types... args);
|
|
|
|
/// Makes a new string substitution and registers it for destruction when the
|
|
/// context is destroyed.
|
|
Substitution *makeStringSubstitution(StringRef VarName, size_t InsertIdx);
|
|
|
|
/// Makes a new numeric substitution and registers it for destruction when
|
|
/// the context is destroyed.
|
|
Substitution *makeNumericSubstitution(StringRef ExpressionStr,
|
|
std::unique_ptr<Expression> Expression,
|
|
size_t InsertIdx);
|
|
};
|
|
|
|
/// Class to represent an error holding a diagnostic with location information
|
|
/// used when printing it.
|
|
class ErrorDiagnostic : public ErrorInfo<ErrorDiagnostic> {
|
|
private:
|
|
SMDiagnostic Diagnostic;
|
|
|
|
public:
|
|
static char ID;
|
|
|
|
ErrorDiagnostic(SMDiagnostic &&Diag) : Diagnostic(Diag) {}
|
|
|
|
std::error_code convertToErrorCode() const override {
|
|
return inconvertibleErrorCode();
|
|
}
|
|
|
|
/// Print diagnostic associated with this error when printing the error.
|
|
void log(raw_ostream &OS) const override { Diagnostic.print(nullptr, OS); }
|
|
|
|
static Error get(const SourceMgr &SM, SMLoc Loc, const Twine &ErrMsg) {
|
|
return make_error<ErrorDiagnostic>(
|
|
SM.GetMessage(Loc, SourceMgr::DK_Error, ErrMsg));
|
|
}
|
|
|
|
static Error get(const SourceMgr &SM, StringRef Buffer, const Twine &ErrMsg) {
|
|
return get(SM, SMLoc::getFromPointer(Buffer.data()), ErrMsg);
|
|
}
|
|
};
|
|
|
|
class NotFoundError : public ErrorInfo<NotFoundError> {
|
|
public:
|
|
static char ID;
|
|
|
|
std::error_code convertToErrorCode() const override {
|
|
return inconvertibleErrorCode();
|
|
}
|
|
|
|
/// Print diagnostic associated with this error when printing the error.
|
|
void log(raw_ostream &OS) const override {
|
|
OS << "String not found in input";
|
|
}
|
|
};
|
|
|
|
class Pattern {
|
|
SMLoc PatternLoc;
|
|
|
|
/// A fixed string to match as the pattern or empty if this pattern requires
|
|
/// a regex match.
|
|
StringRef FixedStr;
|
|
|
|
/// A regex string to match as the pattern or empty if this pattern requires
|
|
/// a fixed string to match.
|
|
std::string RegExStr;
|
|
|
|
/// Entries in this vector represent a substitution of a string variable or
|
|
/// an expression in the RegExStr regex at match time. For example, in the
|
|
/// case of a CHECK directive with the pattern "foo[[bar]]baz[[#N+1]]",
|
|
/// RegExStr will contain "foobaz" and we'll get two entries in this vector
|
|
/// that tells us to insert the value of string variable "bar" at offset 3
|
|
/// and the value of expression "N+1" at offset 6.
|
|
std::vector<Substitution *> Substitutions;
|
|
|
|
/// Maps names of string variables defined in a pattern to the number of
|
|
/// their parenthesis group in RegExStr capturing their last definition.
|
|
///
|
|
/// E.g. for the pattern "foo[[bar:.*]]baz([[bar]][[QUUX]][[bar:.*]])",
|
|
/// RegExStr will be "foo(.*)baz(\1<quux value>(.*))" where <quux value> is
|
|
/// the value captured for QUUX on the earlier line where it was defined, and
|
|
/// VariableDefs will map "bar" to the third parenthesis group which captures
|
|
/// the second definition of "bar".
|
|
///
|
|
/// Note: uses std::map rather than StringMap to be able to get the key when
|
|
/// iterating over values.
|
|
std::map<StringRef, unsigned> VariableDefs;
|
|
|
|
/// Structure representing the definition of a numeric variable in a pattern.
|
|
/// It holds the pointer to the class instance holding the value and matching
|
|
/// format of the numeric variable whose value is being defined and the
|
|
/// number of the parenthesis group in RegExStr to capture that value.
|
|
struct NumericVariableMatch {
|
|
/// Pointer to class instance holding the value and matching format of the
|
|
/// numeric variable being defined.
|
|
NumericVariable *DefinedNumericVariable;
|
|
|
|
/// Number of the parenthesis group in RegExStr that captures the value of
|
|
/// this numeric variable definition.
|
|
unsigned CaptureParenGroup;
|
|
};
|
|
|
|
/// Holds the number of the parenthesis group in RegExStr and pointer to the
|
|
/// corresponding NumericVariable class instance of all numeric variable
|
|
/// definitions. Used to set the matched value of all those variables.
|
|
StringMap<NumericVariableMatch> NumericVariableDefs;
|
|
|
|
/// Pointer to a class instance holding the global state shared by all
|
|
/// patterns:
|
|
/// - separate tables with the values of live string and numeric variables
|
|
/// respectively at the start of any given CHECK line;
|
|
/// - table holding whether a string variable has been defined at any given
|
|
/// point during the parsing phase.
|
|
FileCheckPatternContext *Context;
|
|
|
|
Check::FileCheckType CheckTy;
|
|
|
|
/// Line number for this CHECK pattern or None if it is an implicit pattern.
|
|
/// Used to determine whether a variable definition is made on an earlier
|
|
/// line to the one with this CHECK.
|
|
Optional<size_t> LineNumber;
|
|
|
|
/// Ignore case while matching if set to true.
|
|
bool IgnoreCase = false;
|
|
|
|
public:
|
|
Pattern(Check::FileCheckType Ty, FileCheckPatternContext *Context,
|
|
Optional<size_t> Line = None)
|
|
: Context(Context), CheckTy(Ty), LineNumber(Line) {}
|
|
|
|
/// \returns the location in source code.
|
|
SMLoc getLoc() const { return PatternLoc; }
|
|
|
|
/// \returns the pointer to the global state for all patterns in this
|
|
/// FileCheck instance.
|
|
FileCheckPatternContext *getContext() const { return Context; }
|
|
|
|
/// \returns whether \p C is a valid first character for a variable name.
|
|
static bool isValidVarNameStart(char C);
|
|
|
|
/// Parsing information about a variable.
|
|
struct VariableProperties {
|
|
StringRef Name;
|
|
bool IsPseudo;
|
|
};
|
|
|
|
/// Parses the string at the start of \p Str for a variable name. \returns
|
|
/// a VariableProperties structure holding the variable name and whether it
|
|
/// is the name of a pseudo variable, or an error holding a diagnostic
|
|
/// against \p SM if parsing fail. If parsing was successful, also strips
|
|
/// \p Str from the variable name.
|
|
static Expected<VariableProperties> parseVariable(StringRef &Str,
|
|
const SourceMgr &SM);
|
|
/// Parses \p Expr for a numeric substitution block at line \p LineNumber,
|
|
/// or before input is parsed if \p LineNumber is None. Parameter
|
|
/// \p IsLegacyLineExpr indicates whether \p Expr should be a legacy @LINE
|
|
/// expression and \p Context points to the class instance holding the live
|
|
/// string and numeric variables. \returns a pointer to the class instance
|
|
/// representing the expression whose value must be substitued, or an error
|
|
/// holding a diagnostic against \p SM if parsing fails. If substitution was
|
|
/// successful, sets \p DefinedNumericVariable to point to the class
|
|
/// representing the numeric variable defined in this numeric substitution
|
|
/// block, or None if this block does not define any variable.
|
|
static Expected<std::unique_ptr<Expression>> parseNumericSubstitutionBlock(
|
|
StringRef Expr, Optional<NumericVariable *> &DefinedNumericVariable,
|
|
bool IsLegacyLineExpr, Optional<size_t> LineNumber,
|
|
FileCheckPatternContext *Context, const SourceMgr &SM);
|
|
/// Parses the pattern in \p PatternStr and initializes this Pattern instance
|
|
/// accordingly.
|
|
///
|
|
/// \p Prefix provides which prefix is being matched, \p Req describes the
|
|
/// global options that influence the parsing such as whitespace
|
|
/// canonicalization, \p SM provides the SourceMgr used for error reports.
|
|
/// \returns true in case of an error, false otherwise.
|
|
bool parsePattern(StringRef PatternStr, StringRef Prefix, SourceMgr &SM,
|
|
const FileCheckRequest &Req);
|
|
/// Matches the pattern string against the input buffer \p Buffer
|
|
///
|
|
/// \returns the position that is matched or an error indicating why matching
|
|
/// failed. If there is a match, updates \p MatchLen with the size of the
|
|
/// matched string.
|
|
///
|
|
/// The GlobalVariableTable StringMap in the FileCheckPatternContext class
|
|
/// instance provides the current values of FileCheck string variables and is
|
|
/// updated if this match defines new values. Likewise, the
|
|
/// GlobalNumericVariableTable StringMap in the same class provides the
|
|
/// current values of FileCheck numeric variables and is updated if this
|
|
/// match defines new numeric values.
|
|
Expected<size_t> match(StringRef Buffer, size_t &MatchLen,
|
|
const SourceMgr &SM) const;
|
|
/// Prints the value of successful substitutions or the name of the undefined
|
|
/// string or numeric variables preventing a successful substitution.
|
|
void printSubstitutions(const SourceMgr &SM, StringRef Buffer,
|
|
SMRange MatchRange, FileCheckDiag::MatchType MatchTy,
|
|
std::vector<FileCheckDiag> *Diags) const;
|
|
void printFuzzyMatch(const SourceMgr &SM, StringRef Buffer,
|
|
std::vector<FileCheckDiag> *Diags) const;
|
|
|
|
bool hasVariable() const {
|
|
return !(Substitutions.empty() && VariableDefs.empty());
|
|
}
|
|
void printVariableDefs(const SourceMgr &SM, FileCheckDiag::MatchType MatchTy,
|
|
std::vector<FileCheckDiag> *Diags) const;
|
|
|
|
Check::FileCheckType getCheckTy() const { return CheckTy; }
|
|
|
|
int getCount() const { return CheckTy.getCount(); }
|
|
|
|
private:
|
|
bool AddRegExToRegEx(StringRef RS, unsigned &CurParen, SourceMgr &SM);
|
|
void AddBackrefToRegEx(unsigned BackrefNum);
|
|
/// Computes an arbitrary estimate for the quality of matching this pattern
|
|
/// at the start of \p Buffer; a distance of zero should correspond to a
|
|
/// perfect match.
|
|
unsigned computeMatchDistance(StringRef Buffer) const;
|
|
/// Finds the closing sequence of a regex variable usage or definition.
|
|
///
|
|
/// \p Str has to point in the beginning of the definition (right after the
|
|
/// opening sequence). \p SM holds the SourceMgr used for error reporting.
|
|
/// \returns the offset of the closing sequence within Str, or npos if it
|
|
/// was not found.
|
|
static size_t FindRegexVarEnd(StringRef Str, SourceMgr &SM);
|
|
|
|
/// Parses \p Expr for the name of a numeric variable to be defined at line
|
|
/// \p LineNumber, or before input is parsed if \p LineNumber is None.
|
|
/// \returns a pointer to the class instance representing that variable,
|
|
/// creating it if needed, or an error holding a diagnostic against \p SM
|
|
/// should defining such a variable be invalid.
|
|
static Expected<NumericVariable *> parseNumericVariableDefinition(
|
|
StringRef &Expr, FileCheckPatternContext *Context,
|
|
Optional<size_t> LineNumber, ExpressionFormat ImplicitFormat,
|
|
const SourceMgr &SM);
|
|
/// Parses \p Name as a (pseudo if \p IsPseudo is true) numeric variable use
|
|
/// at line \p LineNumber, or before input is parsed if \p LineNumber is
|
|
/// None. Parameter \p Context points to the class instance holding the live
|
|
/// string and numeric variables. \returns the pointer to the class instance
|
|
/// representing that variable if successful, or an error holding a
|
|
/// diagnostic against \p SM otherwise.
|
|
static Expected<std::unique_ptr<NumericVariableUse>> parseNumericVariableUse(
|
|
StringRef Name, bool IsPseudo, Optional<size_t> LineNumber,
|
|
FileCheckPatternContext *Context, const SourceMgr &SM);
|
|
enum class AllowedOperand { LineVar, LegacyLiteral, Any };
|
|
/// Parses \p Expr for use of a numeric operand at line \p LineNumber, or
|
|
/// before input is parsed if \p LineNumber is None. Accepts literal values,
|
|
/// numeric variables and function calls, depending on the value of \p AO.
|
|
/// \p MaybeInvalidConstraint indicates whether the text being parsed could
|
|
/// be an invalid constraint. \p Context points to the class instance holding
|
|
/// the live string and numeric variables. \returns the class representing
|
|
/// that operand in the AST of the expression or an error holding a
|
|
/// diagnostic against \p SM otherwise. If \p Expr starts with a "(" this
|
|
/// function will attempt to parse a parenthesized expression.
|
|
static Expected<std::unique_ptr<ExpressionAST>>
|
|
parseNumericOperand(StringRef &Expr, AllowedOperand AO, bool ConstraintParsed,
|
|
Optional<size_t> LineNumber,
|
|
FileCheckPatternContext *Context, const SourceMgr &SM);
|
|
/// Parses and updates \p RemainingExpr for a binary operation at line
|
|
/// \p LineNumber, or before input is parsed if \p LineNumber is None. The
|
|
/// left operand of this binary operation is given in \p LeftOp and \p Expr
|
|
/// holds the string for the full expression, including the left operand.
|
|
/// Parameter \p IsLegacyLineExpr indicates whether we are parsing a legacy
|
|
/// @LINE expression. Parameter \p Context points to the class instance
|
|
/// holding the live string and numeric variables. \returns the class
|
|
/// representing the binary operation in the AST of the expression, or an
|
|
/// error holding a diagnostic against \p SM otherwise.
|
|
static Expected<std::unique_ptr<ExpressionAST>>
|
|
parseBinop(StringRef Expr, StringRef &RemainingExpr,
|
|
std::unique_ptr<ExpressionAST> LeftOp, bool IsLegacyLineExpr,
|
|
Optional<size_t> LineNumber, FileCheckPatternContext *Context,
|
|
const SourceMgr &SM);
|
|
|
|
/// Parses a parenthesized expression inside \p Expr at line \p LineNumber, or
|
|
/// before input is parsed if \p LineNumber is None. \p Expr must start with
|
|
/// a '('. Accepts both literal values and numeric variables. Parameter \p
|
|
/// Context points to the class instance holding the live string and numeric
|
|
/// variables. \returns the class representing that operand in the AST of the
|
|
/// expression or an error holding a diagnostic against \p SM otherwise.
|
|
static Expected<std::unique_ptr<ExpressionAST>>
|
|
parseParenExpr(StringRef &Expr, Optional<size_t> LineNumber,
|
|
FileCheckPatternContext *Context, const SourceMgr &SM);
|
|
|
|
/// Parses \p Expr for an argument list belonging to a call to function \p
|
|
/// FuncName at line \p LineNumber, or before input is parsed if \p LineNumber
|
|
/// is None. Parameter \p FuncLoc is the source location used for diagnostics.
|
|
/// Parameter \p Context points to the class instance holding the live string
|
|
/// and numeric variables. \returns the class representing that call in the
|
|
/// AST of the expression or an error holding a diagnostic against \p SM
|
|
/// otherwise.
|
|
static Expected<std::unique_ptr<ExpressionAST>>
|
|
parseCallExpr(StringRef &Expr, StringRef FuncName,
|
|
Optional<size_t> LineNumber, FileCheckPatternContext *Context,
|
|
const SourceMgr &SM);
|
|
};
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// Check Strings.
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
/// A check that we found in the input file.
|
|
struct FileCheckString {
|
|
/// The pattern to match.
|
|
Pattern Pat;
|
|
|
|
/// Which prefix name this check matched.
|
|
StringRef Prefix;
|
|
|
|
/// The location in the match file that the check string was specified.
|
|
SMLoc Loc;
|
|
|
|
/// All of the strings that are disallowed from occurring between this match
|
|
/// string and the previous one (or start of file).
|
|
std::vector<Pattern> DagNotStrings;
|
|
|
|
FileCheckString(const Pattern &P, StringRef S, SMLoc L)
|
|
: Pat(P), Prefix(S), Loc(L) {}
|
|
|
|
/// Matches check string and its "not strings" and/or "dag strings".
|
|
size_t Check(const SourceMgr &SM, StringRef Buffer, bool IsLabelScanMode,
|
|
size_t &MatchLen, FileCheckRequest &Req,
|
|
std::vector<FileCheckDiag> *Diags) const;
|
|
|
|
/// Verifies that there is a single line in the given \p Buffer. Errors are
|
|
/// reported against \p SM.
|
|
bool CheckNext(const SourceMgr &SM, StringRef Buffer) const;
|
|
/// Verifies that there is no newline in the given \p Buffer. Errors are
|
|
/// reported against \p SM.
|
|
bool CheckSame(const SourceMgr &SM, StringRef Buffer) const;
|
|
/// Verifies that none of the strings in \p NotStrings are found in the given
|
|
/// \p Buffer. Errors are reported against \p SM and diagnostics recorded in
|
|
/// \p Diags according to the verbosity level set in \p Req.
|
|
bool CheckNot(const SourceMgr &SM, StringRef Buffer,
|
|
const std::vector<const Pattern *> &NotStrings,
|
|
const FileCheckRequest &Req,
|
|
std::vector<FileCheckDiag> *Diags) const;
|
|
/// Matches "dag strings" and their mixed "not strings".
|
|
size_t CheckDag(const SourceMgr &SM, StringRef Buffer,
|
|
std::vector<const Pattern *> &NotStrings,
|
|
const FileCheckRequest &Req,
|
|
std::vector<FileCheckDiag> *Diags) const;
|
|
};
|
|
|
|
} // namespace llvm
|
|
|
|
#endif
|