1 | //===- Bitcode/Writer/ValueEnumerator.h - Number values ---------*- C++ -*-===// |
2 | // |
3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
4 | // See https://llvm.org/LICENSE.txt for license information. |
5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
6 | // |
7 | //===----------------------------------------------------------------------===// |
8 | // |
9 | // This class gives values and types Unique ID's. |
10 | // |
11 | //===----------------------------------------------------------------------===// |
12 | |
13 | #ifndef LLVM_LIB_BITCODE_WRITER_VALUEENUMERATOR_H |
14 | #define LLVM_LIB_BITCODE_WRITER_VALUEENUMERATOR_H |
15 | |
16 | #include "llvm/ADT/ArrayRef.h" |
17 | #include "llvm/ADT/DenseMap.h" |
18 | #include "llvm/ADT/UniqueVector.h" |
19 | #include "llvm/IR/Attributes.h" |
20 | #include "llvm/IR/UseListOrder.h" |
21 | #include <cassert> |
22 | #include <cstdint> |
23 | #include <utility> |
24 | #include <vector> |
25 | |
26 | namespace llvm { |
27 | |
28 | class BasicBlock; |
29 | class Comdat; |
30 | class DIArgList; |
31 | class Function; |
32 | class Instruction; |
33 | class LocalAsMetadata; |
34 | class MDNode; |
35 | class Metadata; |
36 | class Module; |
37 | class NamedMDNode; |
38 | class raw_ostream; |
39 | class Type; |
40 | class Value; |
41 | class ValueSymbolTable; |
42 | |
43 | class ValueEnumerator { |
44 | public: |
45 | using TypeList = std::vector<Type *>; |
46 | |
47 | // For each value, we remember its Value* and occurrence frequency. |
48 | using ValueList = std::vector<std::pair<const Value *, unsigned>>; |
49 | |
50 | /// Attribute groups as encoded in bitcode are almost AttributeSets, but they |
51 | /// include the AttributeList index, so we have to track that in our map. |
52 | using IndexAndAttrSet = std::pair<unsigned, AttributeSet>; |
53 | |
54 | UseListOrderStack UseListOrders; |
55 | |
56 | private: |
57 | using TypeMapType = DenseMap<Type *, unsigned>; |
58 | TypeMapType TypeMap; |
59 | TypeList Types; |
60 | |
61 | using ValueMapType = DenseMap<const Value *, unsigned>; |
62 | ValueMapType ValueMap; |
63 | ValueList Values; |
64 | |
65 | using ComdatSetType = UniqueVector<const Comdat *>; |
66 | ComdatSetType Comdats; |
67 | |
68 | std::vector<const Metadata *> MDs; |
69 | std::vector<const Metadata *> FunctionMDs; |
70 | |
71 | /// Index of information about a piece of metadata. |
72 | struct MDIndex { |
73 | unsigned F = 0; ///< The ID of the function for this metadata, if any. |
74 | unsigned ID = 0; ///< The implicit ID of this metadata in bitcode. |
75 | |
76 | MDIndex() = default; |
77 | explicit MDIndex(unsigned F) : F(F) {} |
78 | |
79 | /// Check if this has a function tag, and it's different from NewF. |
80 | bool hasDifferentFunction(unsigned NewF) const { return F && F != NewF; } |
81 | |
82 | /// Fetch the MD this references out of the given metadata array. |
83 | const Metadata *get(ArrayRef<const Metadata *> MDs) const { |
84 | assert(ID && "Expected non-zero ID" ); |
85 | assert(ID <= MDs.size() && "Expected valid ID" ); |
86 | return MDs[ID - 1]; |
87 | } |
88 | }; |
89 | |
90 | using MetadataMapType = DenseMap<const Metadata *, MDIndex>; |
91 | MetadataMapType MetadataMap; |
92 | |
93 | /// Range of metadata IDs, as a half-open range. |
94 | struct MDRange { |
95 | unsigned First = 0; |
96 | unsigned Last = 0; |
97 | |
98 | /// Number of strings in the prefix of the metadata range. |
99 | unsigned NumStrings = 0; |
100 | |
101 | MDRange() = default; |
102 | explicit MDRange(unsigned First) : First(First) {} |
103 | }; |
104 | SmallDenseMap<unsigned, MDRange, 1> FunctionMDInfo; |
105 | |
106 | bool ShouldPreserveUseListOrder; |
107 | |
108 | using AttributeGroupMapType = DenseMap<IndexAndAttrSet, unsigned>; |
109 | AttributeGroupMapType AttributeGroupMap; |
110 | std::vector<IndexAndAttrSet> AttributeGroups; |
111 | |
112 | using AttributeListMapType = DenseMap<AttributeList, unsigned>; |
113 | AttributeListMapType AttributeListMap; |
114 | std::vector<AttributeList> AttributeLists; |
115 | |
116 | /// GlobalBasicBlockIDs - This map memoizes the basic block ID's referenced by |
117 | /// the "getGlobalBasicBlockID" method. |
118 | mutable DenseMap<const BasicBlock*, unsigned> GlobalBasicBlockIDs; |
119 | |
120 | using InstructionMapType = DenseMap<const Instruction *, unsigned>; |
121 | InstructionMapType InstructionMap; |
122 | unsigned InstructionCount; |
123 | |
124 | /// BasicBlocks - This contains all the basic blocks for the currently |
125 | /// incorporated function. Their reverse mapping is stored in ValueMap. |
126 | std::vector<const BasicBlock*> BasicBlocks; |
127 | |
128 | /// When a function is incorporated, this is the size of the Values list |
129 | /// before incorporation. |
130 | unsigned NumModuleValues; |
131 | |
132 | /// When a function is incorporated, this is the size of the Metadatas list |
133 | /// before incorporation. |
134 | unsigned NumModuleMDs = 0; |
135 | unsigned NumMDStrings = 0; |
136 | |
137 | unsigned FirstFuncConstantID; |
138 | unsigned FirstInstID; |
139 | |
140 | public: |
141 | ValueEnumerator(const Module &M, bool ShouldPreserveUseListOrder); |
142 | ValueEnumerator(const ValueEnumerator &) = delete; |
143 | ValueEnumerator &operator=(const ValueEnumerator &) = delete; |
144 | |
145 | void dump() const; |
146 | void print(raw_ostream &OS, const ValueMapType &Map, const char *Name) const; |
147 | void print(raw_ostream &OS, const MetadataMapType &Map, |
148 | const char *Name) const; |
149 | |
150 | unsigned getValueID(const Value *V) const; |
151 | |
152 | unsigned getMetadataID(const Metadata *MD) const { |
153 | auto ID = getMetadataOrNullID(MD); |
154 | assert(ID != 0 && "Metadata not in slotcalculator!" ); |
155 | return ID - 1; |
156 | } |
157 | |
158 | unsigned getMetadataOrNullID(const Metadata *MD) const { |
159 | return MetadataMap.lookup(Val: MD).ID; |
160 | } |
161 | |
162 | unsigned numMDs() const { return MDs.size(); } |
163 | |
164 | bool shouldPreserveUseListOrder() const { return ShouldPreserveUseListOrder; } |
165 | |
166 | unsigned getTypeID(Type *T) const { |
167 | TypeMapType::const_iterator I = TypeMap.find(Val: T); |
168 | assert(I != TypeMap.end() && "Type not in ValueEnumerator!" ); |
169 | return I->second-1; |
170 | } |
171 | |
172 | unsigned getInstructionID(const Instruction *I) const; |
173 | void setInstructionID(const Instruction *I); |
174 | |
175 | unsigned getAttributeListID(AttributeList PAL) const { |
176 | if (PAL.isEmpty()) return 0; // Null maps to zero. |
177 | AttributeListMapType::const_iterator I = AttributeListMap.find(Val: PAL); |
178 | assert(I != AttributeListMap.end() && "Attribute not in ValueEnumerator!" ); |
179 | return I->second; |
180 | } |
181 | |
182 | unsigned getAttributeGroupID(IndexAndAttrSet Group) const { |
183 | if (!Group.second.hasAttributes()) |
184 | return 0; // Null maps to zero. |
185 | AttributeGroupMapType::const_iterator I = AttributeGroupMap.find(Val: Group); |
186 | assert(I != AttributeGroupMap.end() && "Attribute not in ValueEnumerator!" ); |
187 | return I->second; |
188 | } |
189 | |
190 | /// getFunctionConstantRange - Return the range of values that corresponds to |
191 | /// function-local constants. |
192 | void getFunctionConstantRange(unsigned &Start, unsigned &End) const { |
193 | Start = FirstFuncConstantID; |
194 | End = FirstInstID; |
195 | } |
196 | |
197 | const ValueList &getValues() const { return Values; } |
198 | |
199 | /// Check whether the current block has any metadata to emit. |
200 | bool hasMDs() const { return NumModuleMDs < MDs.size(); } |
201 | |
202 | /// Get the MDString metadata for this block. |
203 | ArrayRef<const Metadata *> getMDStrings() const { |
204 | return ArrayRef(MDs).slice(N: NumModuleMDs, M: NumMDStrings); |
205 | } |
206 | |
207 | /// Get the non-MDString metadata for this block. |
208 | ArrayRef<const Metadata *> getNonMDStrings() const { |
209 | return ArrayRef(MDs).slice(N: NumModuleMDs).slice(N: NumMDStrings); |
210 | } |
211 | |
212 | const TypeList &getTypes() const { return Types; } |
213 | |
214 | const std::vector<const BasicBlock*> &getBasicBlocks() const { |
215 | return BasicBlocks; |
216 | } |
217 | |
218 | const std::vector<AttributeList> &getAttributeLists() const { return AttributeLists; } |
219 | |
220 | const std::vector<IndexAndAttrSet> &getAttributeGroups() const { |
221 | return AttributeGroups; |
222 | } |
223 | |
224 | const ComdatSetType &getComdats() const { return Comdats; } |
225 | unsigned getComdatID(const Comdat *C) const; |
226 | |
227 | /// getGlobalBasicBlockID - This returns the function-specific ID for the |
228 | /// specified basic block. This is relatively expensive information, so it |
229 | /// should only be used by rare constructs such as address-of-label. |
230 | unsigned getGlobalBasicBlockID(const BasicBlock *BB) const; |
231 | |
232 | /// incorporateFunction/purgeFunction - If you'd like to deal with a function, |
233 | /// use these two methods to get its data into the ValueEnumerator! |
234 | void incorporateFunction(const Function &F); |
235 | |
236 | void purgeFunction(); |
237 | uint64_t computeBitsRequiredForTypeIndices() const; |
238 | |
239 | private: |
240 | void OptimizeConstants(unsigned CstStart, unsigned CstEnd); |
241 | |
242 | /// Reorder the reachable metadata. |
243 | /// |
244 | /// This is not just an optimization, but is mandatory for emitting MDString |
245 | /// correctly. |
246 | void organizeMetadata(); |
247 | |
248 | /// Drop the function tag from the transitive operands of the given node. |
249 | void dropFunctionFromMetadata(MetadataMapType::value_type &FirstMD); |
250 | |
251 | /// Incorporate the function metadata. |
252 | /// |
253 | /// This should be called before enumerating LocalAsMetadata for the |
254 | /// function. |
255 | void incorporateFunctionMetadata(const Function &F); |
256 | |
257 | /// Enumerate a single instance of metadata with the given function tag. |
258 | /// |
259 | /// If \c MD has already been enumerated, check that \c F matches its |
260 | /// function tag. If not, call \a dropFunctionFromMetadata(). |
261 | /// |
262 | /// Otherwise, mark \c MD as visited. Assign it an ID, or just return it if |
263 | /// it's an \a MDNode. |
264 | const MDNode *enumerateMetadataImpl(unsigned F, const Metadata *MD); |
265 | |
266 | unsigned getMetadataFunctionID(const Function *F) const; |
267 | |
268 | /// Enumerate reachable metadata in (almost) post-order. |
269 | /// |
270 | /// Enumerate all the metadata reachable from MD. We want to minimize the |
271 | /// cost of reading bitcode records, and so the primary consideration is that |
272 | /// operands of uniqued nodes are resolved before the nodes are read. This |
273 | /// avoids re-uniquing them on the context and factors away RAUW support. |
274 | /// |
275 | /// This algorithm guarantees that subgraphs of uniqued nodes are in |
276 | /// post-order. Distinct subgraphs reachable only from a single uniqued node |
277 | /// will be in post-order. |
278 | /// |
279 | /// \note The relative order of a distinct and uniqued node is irrelevant. |
280 | /// \a organizeMetadata() will later partition distinct nodes ahead of |
281 | /// uniqued ones. |
282 | ///{ |
283 | void EnumerateMetadata(const Function *F, const Metadata *MD); |
284 | void EnumerateMetadata(unsigned F, const Metadata *MD); |
285 | ///} |
286 | |
287 | void EnumerateFunctionLocalMetadata(const Function &F, |
288 | const LocalAsMetadata *Local); |
289 | void EnumerateFunctionLocalMetadata(unsigned F, const LocalAsMetadata *Local); |
290 | void EnumerateFunctionLocalListMetadata(const Function &F, |
291 | const DIArgList *ArgList); |
292 | void EnumerateFunctionLocalListMetadata(unsigned F, const DIArgList *Arglist); |
293 | void EnumerateNamedMDNode(const NamedMDNode *NMD); |
294 | void EnumerateValue(const Value *V); |
295 | void EnumerateType(Type *T); |
296 | void EnumerateOperandType(const Value *V); |
297 | void EnumerateAttributes(AttributeList PAL); |
298 | |
299 | void EnumerateValueSymbolTable(const ValueSymbolTable &ST); |
300 | void EnumerateNamedMetadata(const Module &M); |
301 | }; |
302 | |
303 | } // end namespace llvm |
304 | |
305 | #endif // LLVM_LIB_BITCODE_WRITER_VALUEENUMERATOR_H |
306 | |