Details | Last modification | View Log | RSS feed
Rev | Author | Line No. | Line |
---|---|---|---|
14 | pmbaty | 1 | //===-- SpecialCaseList.h - special case list for sanitizers ----*- C++ -*-===// |
2 | // |
||
3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
||
4 | // See https://llvm.org/LICENSE.txt for license information. |
||
5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
||
6 | //===----------------------------------------------------------------------===// |
||
7 | // |
||
8 | // This is a utility class used to parse user-provided text files with |
||
9 | // "special case lists" for code sanitizers. Such files are used to |
||
10 | // define an "ABI list" for DataFlowSanitizer and allow/exclusion lists for |
||
11 | // sanitizers like AddressSanitizer or UndefinedBehaviorSanitizer. |
||
12 | // |
||
13 | // Empty lines and lines starting with "#" are ignored. Sections are defined |
||
14 | // using a '[section_name]' header and can be used to specify sanitizers the |
||
15 | // entries below it apply to. Section names are regular expressions, and |
||
16 | // entries without a section header match all sections (i.e. a '[*]' header |
||
17 | // is assumed). |
||
18 | // The remaining lines should have the form: |
||
19 | // prefix:wildcard_expression[=category] |
||
20 | // If category is not specified, it is assumed to be the empty string. |
||
21 | // Definitions of "prefix" and "category" are sanitizer-specific. For example, |
||
22 | // sanitizer exclusion lists support the prefixes "src", "mainfile", "fun" and |
||
23 | // "global". Wildcard expressions define, respectively, source files, main |
||
24 | // files, functions or globals which shouldn't be instrumented. |
||
25 | // Examples of categories: |
||
26 | // "functional": used in DFSan to list functions with pure functional |
||
27 | // semantics. |
||
28 | // "init": used in ASan exclusion list to disable initialization-order bug |
||
29 | // detection for certain globals or source files. |
||
30 | // Full special case list file example: |
||
31 | // --- |
||
32 | // [address] |
||
33 | // # Excluded items: |
||
34 | // fun:*_ZN4base6subtle* |
||
35 | // global:*global_with_bad_access_or_initialization* |
||
36 | // global:*global_with_initialization_issues*=init |
||
37 | // type:*Namespace::ClassName*=init |
||
38 | // src:file_with_tricky_code.cc |
||
39 | // src:ignore-global-initializers-issues.cc=init |
||
40 | // mainfile:main_file.cc |
||
41 | // |
||
42 | // [dataflow] |
||
43 | // # Functions with pure functional semantics: |
||
44 | // fun:cos=functional |
||
45 | // fun:sin=functional |
||
46 | // --- |
||
47 | // Note that the wildcard is in fact an llvm::Regex, but * is automatically |
||
48 | // replaced with .* |
||
49 | // |
||
50 | //===----------------------------------------------------------------------===// |
||
51 | |||
52 | #ifndef LLVM_SUPPORT_SPECIALCASELIST_H |
||
53 | #define LLVM_SUPPORT_SPECIALCASELIST_H |
||
54 | |||
55 | #include "llvm/ADT/StringMap.h" |
||
56 | #include "llvm/Support/Regex.h" |
||
57 | #include "llvm/Support/TrigramIndex.h" |
||
58 | #include <memory> |
||
59 | #include <string> |
||
60 | #include <vector> |
||
61 | |||
62 | namespace llvm { |
||
63 | class MemoryBuffer; |
||
64 | class StringRef; |
||
65 | |||
66 | namespace vfs { |
||
67 | class FileSystem; |
||
68 | } |
||
69 | |||
70 | class SpecialCaseList { |
||
71 | public: |
||
72 | /// Parses the special case list entries from files. On failure, returns |
||
73 | /// a null pointer and writes an error message to Error. |
||
74 | static std::unique_ptr<SpecialCaseList> |
||
75 | create(const std::vector<std::string> &Paths, llvm::vfs::FileSystem &FS, |
||
76 | std::string &Error); |
||
77 | /// Parses the special case list from a memory buffer. On failure, returns |
||
78 | /// a null pointer and writes an error message to Error. |
||
79 | static std::unique_ptr<SpecialCaseList> create(const MemoryBuffer *MB, |
||
80 | std::string &Error); |
||
81 | /// Parses the special case list entries from files. On failure, reports a |
||
82 | /// fatal error. |
||
83 | static std::unique_ptr<SpecialCaseList> |
||
84 | createOrDie(const std::vector<std::string> &Paths, llvm::vfs::FileSystem &FS); |
||
85 | |||
86 | ~SpecialCaseList(); |
||
87 | |||
88 | /// Returns true if the special case list contains a line |
||
89 | /// \code |
||
90 | /// @Prefix:<E>=@Category |
||
91 | /// \endcode |
||
92 | /// where @Query satisfies the wildcard expression <E> in the given @Section. |
||
93 | bool inSection(StringRef Section, StringRef Prefix, StringRef Query, |
||
94 | StringRef Category = StringRef()) const; |
||
95 | |||
96 | /// Returns the line number corresponding to the special case list entry if |
||
97 | /// the special case list contains a line |
||
98 | /// \code |
||
99 | /// @Prefix:<E>=@Category |
||
100 | /// \endcode |
||
101 | /// where @Query satisfies the wildcard expression <E> in the given @Section. |
||
102 | /// Returns zero if there is no exclusion entry corresponding to this |
||
103 | /// expression. |
||
104 | unsigned inSectionBlame(StringRef Section, StringRef Prefix, StringRef Query, |
||
105 | StringRef Category = StringRef()) const; |
||
106 | |||
107 | protected: |
||
108 | // Implementations of the create*() functions that can also be used by derived |
||
109 | // classes. |
||
110 | bool createInternal(const std::vector<std::string> &Paths, |
||
111 | vfs::FileSystem &VFS, std::string &Error); |
||
112 | bool createInternal(const MemoryBuffer *MB, std::string &Error); |
||
113 | |||
114 | SpecialCaseList() = default; |
||
115 | SpecialCaseList(SpecialCaseList const &) = delete; |
||
116 | SpecialCaseList &operator=(SpecialCaseList const &) = delete; |
||
117 | |||
118 | /// Represents a set of regular expressions. Regular expressions which are |
||
119 | /// "literal" (i.e. no regex metacharacters) are stored in Strings. The |
||
120 | /// reason for doing so is efficiency; StringMap is much faster at matching |
||
121 | /// literal strings than Regex. |
||
122 | class Matcher { |
||
123 | public: |
||
124 | bool insert(std::string Regexp, unsigned LineNumber, std::string &REError); |
||
125 | // Returns the line number in the source file of the entry this query matches. |
||
126 | // Returns zero if no match is found. |
||
127 | unsigned match(StringRef Query) const; |
||
128 | |||
129 | private: |
||
130 | StringMap<unsigned> Strings; |
||
131 | TrigramIndex Trigrams; |
||
132 | std::vector<std::pair<std::unique_ptr<Regex>, unsigned>> RegExes; |
||
133 | }; |
||
134 | |||
135 | using SectionEntries = StringMap<StringMap<Matcher>>; |
||
136 | |||
137 | struct Section { |
||
138 | Section(std::unique_ptr<Matcher> M) : SectionMatcher(std::move(M)){}; |
||
139 | |||
140 | std::unique_ptr<Matcher> SectionMatcher; |
||
141 | SectionEntries Entries; |
||
142 | }; |
||
143 | |||
144 | std::vector<Section> Sections; |
||
145 | |||
146 | /// Parses just-constructed SpecialCaseList entries from a memory buffer. |
||
147 | bool parse(const MemoryBuffer *MB, StringMap<size_t> &SectionsMap, |
||
148 | std::string &Error); |
||
149 | |||
150 | // Helper method for derived classes to search by Prefix, Query, and Category |
||
151 | // once they have already resolved a section entry. |
||
152 | unsigned inSectionBlame(const SectionEntries &Entries, StringRef Prefix, |
||
153 | StringRef Query, StringRef Category) const; |
||
154 | }; |
||
155 | |||
156 | } // namespace llvm |
||
157 | |||
158 | #endif // LLVM_SUPPORT_SPECIALCASELIST_H |
||
159 |