1 //===- Bitcode/Writer/ValueEnumerator.h - Number values ---------*- C++ -*-===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This class gives values and types Unique ID's.
11 //
12 //===----------------------------------------------------------------------===//
13 
14 #ifndef LLVM_LIB_BITCODE_WRITER_VALUEENUMERATOR_H
15 #define LLVM_LIB_BITCODE_WRITER_VALUEENUMERATOR_H
16 
17 #include "llvm/ADT/ArrayRef.h"
18 #include "llvm/ADT/DenseMap.h"
19 #include "llvm/ADT/UniqueVector.h"
20 #include "llvm/IR/Attributes.h"
21 #include "llvm/IR/Metadata.h"
22 #include "llvm/IR/Type.h"
23 #include "llvm/IR/UseListOrder.h"
24 #include <cassert>
25 #include <cstdint>
26 #include <utility>
27 #include <vector>
28 
29 namespace llvm {
30 
31 class BasicBlock;
32 class Comdat;
33 class Function;
34 class Instruction;
35 class LocalAsMetadata;
36 class MDNode;
37 class Metadata;
38 class Module;
39 class NamedMDNode;
40 class raw_ostream;
41 class Type;
42 class Value;
43 class ValueSymbolTable;
44 
45 class ValueEnumerator {
46 public:
47   using TypeList = std::vector<Type *>;
48 
49   // For each value, we remember its Value* and occurrence frequency.
50   using ValueList = std::vector<std::pair<const Value *, unsigned>>;
51 
52   /// Attribute groups as encoded in bitcode are almost AttributeSets, but they
53   /// include the AttributeList index, so we have to track that in our map.
54   using IndexAndAttrSet = std::pair<unsigned, AttributeSet>;
55 
56   UseListOrderStack UseListOrders;
57 
58 private:
59   using TypeMapType = DenseMap<Type *, unsigned>;
60   TypeMapType TypeMap;
61   TypeList Types;
62 
63   using ValueMapType = DenseMap<const Value *, unsigned>;
64   ValueMapType ValueMap;
65   ValueList Values;
66 
67   using ComdatSetType = UniqueVector<const Comdat *>;
68   ComdatSetType Comdats;
69 
70   std::vector<const Metadata *> MDs;
71   std::vector<const Metadata *> FunctionMDs;
72 
73   /// Index of information about a piece of metadata.
74   struct MDIndex {
75     unsigned F = 0;  ///< The ID of the function for this metadata, if any.
76     unsigned ID = 0; ///< The implicit ID of this metadata in bitcode.
77 
78     MDIndex() = default;
MDIndexMDIndex79     explicit MDIndex(unsigned F) : F(F) {}
80 
81     /// Check if this has a function tag, and it's different from NewF.
hasDifferentFunctionMDIndex82     bool hasDifferentFunction(unsigned NewF) const { return F && F != NewF; }
83 
84     /// Fetch the MD this references out of the given metadata array.
getMDIndex85     const Metadata *get(ArrayRef<const Metadata *> MDs) const {
86       assert(ID && "Expected non-zero ID");
87       assert(ID <= MDs.size() && "Expected valid ID");
88       return MDs[ID - 1];
89     }
90   };
91 
92   using MetadataMapType = DenseMap<const Metadata *, MDIndex>;
93   MetadataMapType MetadataMap;
94 
95   /// Range of metadata IDs, as a half-open range.
96   struct MDRange {
97     unsigned First = 0;
98     unsigned Last = 0;
99 
100     /// Number of strings in the prefix of the metadata range.
101     unsigned NumStrings = 0;
102 
103     MDRange() = default;
MDRangeMDRange104     explicit MDRange(unsigned First) : First(First) {}
105   };
106   SmallDenseMap<unsigned, MDRange, 1> FunctionMDInfo;
107 
108   bool ShouldPreserveUseListOrder;
109 
110   using AttributeGroupMapType = DenseMap<IndexAndAttrSet, unsigned>;
111   AttributeGroupMapType AttributeGroupMap;
112   std::vector<IndexAndAttrSet> AttributeGroups;
113 
114   using AttributeListMapType = DenseMap<AttributeList, unsigned>;
115   AttributeListMapType AttributeListMap;
116   std::vector<AttributeList> AttributeLists;
117 
118   /// GlobalBasicBlockIDs - This map memoizes the basic block ID's referenced by
119   /// the "getGlobalBasicBlockID" method.
120   mutable DenseMap<const BasicBlock*, unsigned> GlobalBasicBlockIDs;
121 
122   using InstructionMapType = DenseMap<const Instruction *, unsigned>;
123   InstructionMapType InstructionMap;
124   unsigned InstructionCount;
125 
126   /// BasicBlocks - This contains all the basic blocks for the currently
127   /// incorporated function.  Their reverse mapping is stored in ValueMap.
128   std::vector<const BasicBlock*> BasicBlocks;
129 
130   /// When a function is incorporated, this is the size of the Values list
131   /// before incorporation.
132   unsigned NumModuleValues;
133 
134   /// When a function is incorporated, this is the size of the Metadatas list
135   /// before incorporation.
136   unsigned NumModuleMDs = 0;
137   unsigned NumMDStrings = 0;
138 
139   unsigned FirstFuncConstantID;
140   unsigned FirstInstID;
141 
142 public:
143   ValueEnumerator(const Module &M, bool ShouldPreserveUseListOrder);
144   ValueEnumerator(const ValueEnumerator &) = delete;
145   ValueEnumerator &operator=(const ValueEnumerator &) = delete;
146 
147   void dump() const;
148   void print(raw_ostream &OS, const ValueMapType &Map, const char *Name) const;
149   void print(raw_ostream &OS, const MetadataMapType &Map,
150              const char *Name) const;
151 
152   unsigned getValueID(const Value *V) const;
153 
getMetadataID(const Metadata * MD)154   unsigned getMetadataID(const Metadata *MD) const {
155     auto ID = getMetadataOrNullID(MD);
156     assert(ID != 0 && "Metadata not in slotcalculator!");
157     return ID - 1;
158   }
159 
getMetadataOrNullID(const Metadata * MD)160   unsigned getMetadataOrNullID(const Metadata *MD) const {
161     return MetadataMap.lookup(MD).ID;
162   }
163 
numMDs()164   unsigned numMDs() const { return MDs.size(); }
165 
shouldPreserveUseListOrder()166   bool shouldPreserveUseListOrder() const { return ShouldPreserveUseListOrder; }
167 
getTypeID(Type * T)168   unsigned getTypeID(Type *T) const {
169     TypeMapType::const_iterator I = TypeMap.find(T);
170     assert(I != TypeMap.end() && "Type not in ValueEnumerator!");
171     return I->second-1;
172   }
173 
174   unsigned getInstructionID(const Instruction *I) const;
175   void setInstructionID(const Instruction *I);
176 
getAttributeListID(AttributeList PAL)177   unsigned getAttributeListID(AttributeList PAL) const {
178     if (PAL.isEmpty()) return 0;  // Null maps to zero.
179     AttributeListMapType::const_iterator I = AttributeListMap.find(PAL);
180     assert(I != AttributeListMap.end() && "Attribute not in ValueEnumerator!");
181     return I->second;
182   }
183 
getAttributeGroupID(IndexAndAttrSet Group)184   unsigned getAttributeGroupID(IndexAndAttrSet Group) const {
185     if (!Group.second.hasAttributes())
186       return 0; // Null maps to zero.
187     AttributeGroupMapType::const_iterator I = AttributeGroupMap.find(Group);
188     assert(I != AttributeGroupMap.end() && "Attribute not in ValueEnumerator!");
189     return I->second;
190   }
191 
192   /// getFunctionConstantRange - Return the range of values that corresponds to
193   /// function-local constants.
getFunctionConstantRange(unsigned & Start,unsigned & End)194   void getFunctionConstantRange(unsigned &Start, unsigned &End) const {
195     Start = FirstFuncConstantID;
196     End = FirstInstID;
197   }
198 
getValues()199   const ValueList &getValues() const { return Values; }
200 
201   /// Check whether the current block has any metadata to emit.
hasMDs()202   bool hasMDs() const { return NumModuleMDs < MDs.size(); }
203 
204   /// Get the MDString metadata for this block.
getMDStrings()205   ArrayRef<const Metadata *> getMDStrings() const {
206     return makeArrayRef(MDs).slice(NumModuleMDs, NumMDStrings);
207   }
208 
209   /// Get the non-MDString metadata for this block.
getNonMDStrings()210   ArrayRef<const Metadata *> getNonMDStrings() const {
211     return makeArrayRef(MDs).slice(NumModuleMDs).slice(NumMDStrings);
212   }
213 
getTypes()214   const TypeList &getTypes() const { return Types; }
215 
getBasicBlocks()216   const std::vector<const BasicBlock*> &getBasicBlocks() const {
217     return BasicBlocks;
218   }
219 
getAttributeLists()220   const std::vector<AttributeList> &getAttributeLists() const { return AttributeLists; }
221 
getAttributeGroups()222   const std::vector<IndexAndAttrSet> &getAttributeGroups() const {
223     return AttributeGroups;
224   }
225 
getComdats()226   const ComdatSetType &getComdats() const { return Comdats; }
227   unsigned getComdatID(const Comdat *C) const;
228 
229   /// getGlobalBasicBlockID - This returns the function-specific ID for the
230   /// specified basic block.  This is relatively expensive information, so it
231   /// should only be used by rare constructs such as address-of-label.
232   unsigned getGlobalBasicBlockID(const BasicBlock *BB) const;
233 
234   /// incorporateFunction/purgeFunction - If you'd like to deal with a function,
235   /// use these two methods to get its data into the ValueEnumerator!
236   void incorporateFunction(const Function &F);
237 
238   void purgeFunction();
239   uint64_t computeBitsRequiredForTypeIndicies() const;
240 
241 private:
242   void OptimizeConstants(unsigned CstStart, unsigned CstEnd);
243 
244   /// Reorder the reachable metadata.
245   ///
246   /// This is not just an optimization, but is mandatory for emitting MDString
247   /// correctly.
248   void organizeMetadata();
249 
250   /// Drop the function tag from the transitive operands of the given node.
251   void dropFunctionFromMetadata(MetadataMapType::value_type &FirstMD);
252 
253   /// Incorporate the function metadata.
254   ///
255   /// This should be called before enumerating LocalAsMetadata for the
256   /// function.
257   void incorporateFunctionMetadata(const Function &F);
258 
259   /// Enumerate a single instance of metadata with the given function tag.
260   ///
261   /// If \c MD has already been enumerated, check that \c F matches its
262   /// function tag.  If not, call \a dropFunctionFromMetadata().
263   ///
264   /// Otherwise, mark \c MD as visited.  Assign it an ID, or just return it if
265   /// it's an \a MDNode.
266   const MDNode *enumerateMetadataImpl(unsigned F, const Metadata *MD);
267 
268   unsigned getMetadataFunctionID(const Function *F) const;
269 
270   /// Enumerate reachable metadata in (almost) post-order.
271   ///
272   /// Enumerate all the metadata reachable from MD.  We want to minimize the
273   /// cost of reading bitcode records, and so the primary consideration is that
274   /// operands of uniqued nodes are resolved before the nodes are read.  This
275   /// avoids re-uniquing them on the context and factors away RAUW support.
276   ///
277   /// This algorithm guarantees that subgraphs of uniqued nodes are in
278   /// post-order.  Distinct subgraphs reachable only from a single uniqued node
279   /// will be in post-order.
280   ///
281   /// \note The relative order of a distinct and uniqued node is irrelevant.
282   /// \a organizeMetadata() will later partition distinct nodes ahead of
283   /// uniqued ones.
284   ///{
285   void EnumerateMetadata(const Function *F, const Metadata *MD);
286   void EnumerateMetadata(unsigned F, const Metadata *MD);
287   ///}
288 
289   void EnumerateFunctionLocalMetadata(const Function &F,
290                                       const LocalAsMetadata *Local);
291   void EnumerateFunctionLocalMetadata(unsigned F, const LocalAsMetadata *Local);
292   void EnumerateNamedMDNode(const NamedMDNode *NMD);
293   void EnumerateValue(const Value *V);
294   void EnumerateType(Type *T);
295   void EnumerateOperandType(const Value *V);
296   void EnumerateAttributes(AttributeList PAL);
297 
298   void EnumerateValueSymbolTable(const ValueSymbolTable &ST);
299   void EnumerateNamedMetadata(const Module &M);
300 };
301 
302 } // end namespace llvm
303 
304 #endif // LLVM_LIB_BITCODE_WRITER_VALUEENUMERATOR_H
305