LLVM 17.0.0git
SpecialCaseList.h
Go to the documentation of this file.
1//===-- SpecialCaseList.h - special case list for sanitizers ----*- C++ -*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//===----------------------------------------------------------------------===//
7//
8// This is a utility class used to parse user-provided text files with
9// "special case lists" for code sanitizers. Such files are used to
10// define an "ABI list" for DataFlowSanitizer and allow/exclusion lists for
11// sanitizers like AddressSanitizer or UndefinedBehaviorSanitizer.
12//
13// Empty lines and lines starting with "#" are ignored. Sections are defined
14// using a '[section_name]' header and can be used to specify sanitizers the
15// entries below it apply to. Section names are regular expressions, and
16// entries without a section header match all sections (i.e. an implicit '[*]'
17// header is assumed).
18// The remaining lines should have the form:
19// prefix:wildcard_expression[=category]
20// If category is not specified, it is assumed to be empty string.
21// Definitions of "prefix" and "category" are sanitizer-specific. For example,
22// sanitizer exclusion lists support the prefixes "src", "mainfile", "fun" and
23// "global". Wildcard expressions define, respectively, source files, main
24// files, functions or globals which shouldn't be instrumented.
25// Examples of categories:
26// "functional": used in DFSan to list functions with pure functional
27// semantics.
28// "init": used in ASan exclusion list to disable initialization-order bugs
29// detection for certain globals or source files.
30// Full special case list file example:
31// ---
32// [address]
33// # Excluded items:
34// fun:*_ZN4base6subtle*
35// global:*global_with_bad_access_or_initialization*
36// global:*global_with_initialization_issues*=init
37// type:*Namespace::ClassName*=init
38// src:file_with_tricky_code.cc
39// src:ignore-global-initializers-issues.cc=init
40// mainfile:main_file.cc
41//
42// [dataflow]
43// # Functions with pure functional semantics:
44// fun:cos=functional
45// fun:sin=functional
46// ---
47// Note that the wild card is in fact an llvm::Regex, but * is automatically
48// replaced with .*
49//
50//===----------------------------------------------------------------------===//
51
52#ifndef LLVM_SUPPORT_SPECIALCASELIST_H
53#define LLVM_SUPPORT_SPECIALCASELIST_H
54
55#include "llvm/ADT/StringMap.h"
56#include "llvm/Support/Regex.h"
58#include <memory>
59#include <string>
60#include <vector>
61
62namespace llvm {
63class MemoryBuffer;
64class StringRef;
65
66namespace vfs {
67class FileSystem;
68}
69
71public:
72 /// Parses the special case list entries from files. On failure, returns
73 /// nullptr and writes an error message to \p Error.
74 static std::unique_ptr<SpecialCaseList>
75 create(const std::vector<std::string> &Paths, llvm::vfs::FileSystem &FS,
76 std::string &Error);
77 /// Parses the special case list from a memory buffer. On failure, returns
78 /// nullptr and writes an error message to \p Error.
79 static std::unique_ptr<SpecialCaseList> create(const MemoryBuffer *MB,
80 std::string &Error);
81 /// Parses the special case list entries from files. On failure, reports a
82 /// fatal error; unlike create(), it takes no error-message out-parameter.
83 static std::unique_ptr<SpecialCaseList>
84 createOrDie(const std::vector<std::string> &Paths, llvm::vfs::FileSystem &FS);
85
87
88 /// Returns true if the special case list contains a line
89 /// \code
90 /// @Prefix:<E>=@Category
91 /// \endcode
92 /// where @Query satisfies the wildcard expression <E> in a given @Section.
93 bool inSection(StringRef Section, StringRef Prefix, StringRef Query,
94 StringRef Category = StringRef()) const;
95
96 /// Returns the line number of the matching special case list entry if
97 /// the special case list contains a line
98 /// \code
99 /// @Prefix:<E>=@Category
100 /// \endcode
101 /// where @Query satisfies the wildcard expression <E> in a given @Section.
102 /// Returns zero if there is no exclusion entry corresponding to this
103 /// expression.
104 unsigned inSectionBlame(StringRef Section, StringRef Prefix, StringRef Query,
105 StringRef Category = StringRef()) const;
106
107protected:
108 // Implementations of the create*() functions that can also be used by derived
109 // classes. NOTE(review): the bool result presumably reports success -- confirm.
110 bool createInternal(const std::vector<std::string> &Paths,
111 vfs::FileSystem &VFS, std::string &Error);
112 bool createInternal(const MemoryBuffer *MB, std::string &Error);
113
114 SpecialCaseList() = default; // Protected: only this class and derived classes may construct.
117
118 /// Represents a set of regular expressions. Regular expressions which are
119 /// "literal" (i.e. contain no regex metacharacters) are stored in Strings. The
120 /// reason for doing so is efficiency; StringMap is much faster at matching
121 /// literal strings than Regex.
122 class Matcher {
123 public:
    // Adds Regexp to this set together with its LineNumber.
    // NOTE(review): presumably returns false and fills REError when Regexp is
    // not a valid regular expression -- confirm against the implementation.
124 bool insert(std::string Regexp, unsigned LineNumber, std::string &REError);
125 // Returns the line number in the source file that this query matches to.
126 // Returns zero if no match is found.
127 unsigned match(StringRef Query) const;
128
129 private:
130 StringMap<unsigned> Strings; // Literal expressions (see the class comment).
131 TrigramIndex Trigrams;
    // Compiled expressions, each paired with an unsigned that is presumably the
    // line number passed to insert() -- confirm.
132 std::vector<std::pair<std::unique_ptr<Regex>, unsigned>> RegExes;
133 };
134
136
137 struct Section {
    // Takes ownership of M, which becomes this section's SectionMatcher.
138 Section(std::unique_ptr<Matcher> M) : SectionMatcher(std::move(M)){};
139
    // NOTE(review): presumably matches the '[section_name]' header expression
    // that selects this section -- confirm against the parser.
140 std::unique_ptr<Matcher> SectionMatcher;
142 };
143
144 std::vector<Section> Sections;
145
146 /// Parses just-constructed SpecialCaseList entries from a memory buffer.
    /// NOTE(review): SectionsMap presumably maps a section name to its index in
    /// Sections, and the bool result presumably reports success with details
    /// written to Error -- confirm against the implementation.
147 bool parse(const MemoryBuffer *MB, StringMap<size_t> &SectionsMap,
148 std::string &Error);
149
150 // Helper method for derived classes to search by Prefix, Query, and Category
151 // once they have already resolved a section entry.
    // NOTE(review): the result presumably has the same meaning as the public
    // inSectionBlame overload (matching line number, or zero) -- confirm.
152 unsigned inSectionBlame(const SectionEntries &Entries, StringRef Prefix,
153 StringRef Query, StringRef Category) const;
154};
155
156} // namespace llvm
157
158#endif // LLVM_SUPPORT_SPECIALCASELIST_H
159
This file defines the StringMap class.
@ Paths
Definition: TextStubV5.cpp:120
Lightweight error class with error context and mandatory checking.
Definition: Error.h:156
This interface provides simple read-only access to a block of memory, and provides simple methods for...
Definition: MemoryBuffer.h:51
Represents a set of regular expressions.
bool insert(std::string Regexp, unsigned LineNumber, std::string &REError)
unsigned match(StringRef Query) const
SpecialCaseList & operator=(SpecialCaseList const &)=delete
SpecialCaseList(SpecialCaseList const &)=delete
std::vector< Section > Sections
bool createInternal(const std::vector< std::string > &Paths, vfs::FileSystem &VFS, std::string &Error)
static std::unique_ptr< SpecialCaseList > createOrDie(const std::vector< std::string > &Paths, llvm::vfs::FileSystem &FS)
Parses the special case list entries from files.
static std::unique_ptr< SpecialCaseList > create(const std::vector< std::string > &Paths, llvm::vfs::FileSystem &FS, std::string &Error)
Parses the special case list entries from files.
unsigned inSectionBlame(StringRef Section, StringRef Prefix, StringRef Query, StringRef Category=StringRef()) const
Returns the line number corresponding to the special case list entry if the special case list contain...
bool inSection(StringRef Section, StringRef Prefix, StringRef Query, StringRef Category=StringRef()) const
Returns true, if special case list contains a line.
StringMap - This is an unconventional map that is specialized for handling keys that are "strings",...
Definition: StringMap.h:111
StringRef - Represent a constant reference to a string, i.e.
Definition: StringRef.h:50
The virtual file system interface.
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18
OutputIt move(R &&Range, OutputIt Out)
Provide wrappers to std::move which take ranges instead of having to pass begin/end explicitly.
Definition: STLExtras.h:1946
Definition: BitVector.h:858
Section(std::unique_ptr< Matcher > M)
std::unique_ptr< Matcher > SectionMatcher
Definition: regcomp.c:192