159 lines
6.0 KiB
C++
159 lines
6.0 KiB
C++
//===-- SpecialCaseList.h - special case list for sanitizers ----*- C++ -*-===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
// This is a utility class used to parse user-provided text files with
|
|
// "special case lists" for code sanitizers. Such files are used to
|
|
// define an "ABI list" for DataFlowSanitizer and allow/exclusion lists for
|
|
// sanitizers like AddressSanitizer or UndefinedBehaviorSanitizer.
|
|
//
|
|
// Empty lines and lines starting with "#" are ignored. Sections are defined
|
|
// using a '[section_name]' header and can be used to specify sanitizers the
|
|
// entries below it apply to. Section names are regular expressions, and
|
|
// entries without a section header match all sections (e.g. an '[*]' header
|
|
// is assumed.)
|
|
// The remaining lines should have the form:
|
|
// prefix:wildcard_expression[=category]
|
|
// If category is not specified, it is assumed to be empty string.
|
|
// Definitions of "prefix" and "category" are sanitizer-specific. For example,
|
|
// sanitizer exclusion support prefixes "src", "fun" and "global".
|
|
// Wildcard expressions define, respectively, source files, functions or
|
|
// globals which shouldn't be instrumented.
|
|
// Examples of categories:
|
|
// "functional": used in DFSan to list functions with pure functional
|
|
// semantics.
|
|
// "init": used in ASan exclusion list to disable initialization-order bugs
|
|
// detection for certain globals or source files.
|
|
// Full special case list file example:
|
|
// ---
|
|
// [address]
|
|
// # Excluded items:
|
|
// fun:*_ZN4base6subtle*
|
|
// global:*global_with_bad_access_or_initialization*
|
|
// global:*global_with_initialization_issues*=init
|
|
// type:*Namespace::ClassName*=init
|
|
// src:file_with_tricky_code.cc
|
|
// src:ignore-global-initializers-issues.cc=init
|
|
//
|
|
// [dataflow]
|
|
// # Functions with pure functional semantics:
|
|
// fun:cos=functional
|
|
// fun:sin=functional
|
|
// ---
|
|
// Note that the wild card is in fact an llvm::Regex, but * is automatically
|
|
// replaced with .*
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#ifndef LLVM_SUPPORT_SPECIALCASELIST_H
|
|
#define LLVM_SUPPORT_SPECIALCASELIST_H
|
|
|
|
#include "llvm/ADT/StringMap.h"
|
|
#include "llvm/Support/Regex.h"
|
|
#include "llvm/Support/TrigramIndex.h"
|
|
#include <memory>
|
|
#include <string>
|
|
#include <vector>
|
|
|
|
namespace llvm {
|
|
class MemoryBuffer;
|
|
class StringRef;
|
|
|
|
namespace vfs {
|
|
class FileSystem;
|
|
}
|
|
|
|
class SpecialCaseList {
|
|
public:
|
|
/// Parses the special case list entries from files. On failure, returns
|
|
/// 0 and writes an error message to string.
|
|
static std::unique_ptr<SpecialCaseList>
|
|
create(const std::vector<std::string> &Paths, llvm::vfs::FileSystem &FS,
|
|
std::string &Error);
|
|
/// Parses the special case list from a memory buffer. On failure, returns
|
|
/// 0 and writes an error message to string.
|
|
static std::unique_ptr<SpecialCaseList> create(const MemoryBuffer *MB,
|
|
std::string &Error);
|
|
/// Parses the special case list entries from files. On failure, reports a
|
|
/// fatal error.
|
|
static std::unique_ptr<SpecialCaseList>
|
|
createOrDie(const std::vector<std::string> &Paths, llvm::vfs::FileSystem &FS);
|
|
|
|
~SpecialCaseList();
|
|
|
|
/// Returns true, if special case list contains a line
|
|
/// \code
|
|
/// @Prefix:<E>=@Category
|
|
/// \endcode
|
|
/// where @Query satisfies wildcard expression <E> in a given @Section.
|
|
bool inSection(StringRef Section, StringRef Prefix, StringRef Query,
|
|
StringRef Category = StringRef()) const;
|
|
|
|
/// Returns the line number corresponding to the special case list entry if
|
|
/// the special case list contains a line
|
|
/// \code
|
|
/// @Prefix:<E>=@Category
|
|
/// \endcode
|
|
/// where @Query satisfies wildcard expression <E> in a given @Section.
|
|
/// Returns zero if there is no exclusion entry corresponding to this
|
|
/// expression.
|
|
unsigned inSectionBlame(StringRef Section, StringRef Prefix, StringRef Query,
|
|
StringRef Category = StringRef()) const;
|
|
|
|
protected:
|
|
// Implementations of the create*() functions that can also be used by derived
|
|
// classes.
|
|
bool createInternal(const std::vector<std::string> &Paths,
|
|
vfs::FileSystem &VFS, std::string &Error);
|
|
bool createInternal(const MemoryBuffer *MB, std::string &Error);
|
|
|
|
SpecialCaseList() = default;
|
|
SpecialCaseList(SpecialCaseList const &) = delete;
|
|
SpecialCaseList &operator=(SpecialCaseList const &) = delete;
|
|
|
|
/// Represents a set of regular expressions. Regular expressions which are
|
|
/// "literal" (i.e. no regex metacharacters) are stored in Strings. The
|
|
/// reason for doing so is efficiency; StringMap is much faster at matching
|
|
/// literal strings than Regex.
|
|
class Matcher {
|
|
public:
|
|
bool insert(std::string Regexp, unsigned LineNumber, std::string &REError);
|
|
// Returns the line number in the source file that this query matches to.
|
|
// Returns zero if no match is found.
|
|
unsigned match(StringRef Query) const;
|
|
|
|
private:
|
|
StringMap<unsigned> Strings;
|
|
TrigramIndex Trigrams;
|
|
std::vector<std::pair<std::unique_ptr<Regex>, unsigned>> RegExes;
|
|
};
|
|
|
|
using SectionEntries = StringMap<StringMap<Matcher>>;
|
|
|
|
struct Section {
|
|
Section(std::unique_ptr<Matcher> M) : SectionMatcher(std::move(M)){};
|
|
|
|
std::unique_ptr<Matcher> SectionMatcher;
|
|
SectionEntries Entries;
|
|
};
|
|
|
|
std::vector<Section> Sections;
|
|
|
|
/// Parses just-constructed SpecialCaseList entries from a memory buffer.
|
|
bool parse(const MemoryBuffer *MB, StringMap<size_t> &SectionsMap,
|
|
std::string &Error);
|
|
|
|
// Helper method for derived classes to search by Prefix, Query, and Category
|
|
// once they have already resolved a section entry.
|
|
unsigned inSectionBlame(const SectionEntries &Entries, StringRef Prefix,
|
|
StringRef Query, StringRef Category) const;
|
|
};
|
|
|
|
} // namespace llvm
|
|
|
|
#endif // LLVM_SUPPORT_SPECIALCASELIST_H
|
|
|