xref: /openbsd-src/gnu/llvm/llvm/lib/Bitcode/Writer/ValueEnumerator.h (revision d415bd752c734aee168c4ee86ff32e8cc249eb16)
109467b48Spatrick //===- Bitcode/Writer/ValueEnumerator.h - Number values ---------*- C++ -*-===//
209467b48Spatrick //
309467b48Spatrick // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
409467b48Spatrick // See https://llvm.org/LICENSE.txt for license information.
509467b48Spatrick // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
609467b48Spatrick //
709467b48Spatrick //===----------------------------------------------------------------------===//
809467b48Spatrick //
909467b48Spatrick // This class gives values and types Unique ID's.
1009467b48Spatrick //
1109467b48Spatrick //===----------------------------------------------------------------------===//
1209467b48Spatrick 
1309467b48Spatrick #ifndef LLVM_LIB_BITCODE_WRITER_VALUEENUMERATOR_H
1409467b48Spatrick #define LLVM_LIB_BITCODE_WRITER_VALUEENUMERATOR_H
1509467b48Spatrick 
1609467b48Spatrick #include "llvm/ADT/ArrayRef.h"
1709467b48Spatrick #include "llvm/ADT/DenseMap.h"
1809467b48Spatrick #include "llvm/ADT/UniqueVector.h"
1909467b48Spatrick #include "llvm/IR/Attributes.h"
2009467b48Spatrick #include "llvm/IR/UseListOrder.h"
2109467b48Spatrick #include <cassert>
2209467b48Spatrick #include <cstdint>
2309467b48Spatrick #include <utility>
2409467b48Spatrick #include <vector>
2509467b48Spatrick 
2609467b48Spatrick namespace llvm {
2709467b48Spatrick 
2809467b48Spatrick class BasicBlock;
2909467b48Spatrick class Comdat;
3073471bf0Spatrick class DIArgList;
3109467b48Spatrick class Function;
3209467b48Spatrick class Instruction;
3309467b48Spatrick class LocalAsMetadata;
3409467b48Spatrick class MDNode;
3509467b48Spatrick class Metadata;
3609467b48Spatrick class Module;
3709467b48Spatrick class NamedMDNode;
3809467b48Spatrick class raw_ostream;
3909467b48Spatrick class Type;
4009467b48Spatrick class Value;
4109467b48Spatrick class ValueSymbolTable;
4209467b48Spatrick 
4309467b48Spatrick class ValueEnumerator {
4409467b48Spatrick public:
4509467b48Spatrick   using TypeList = std::vector<Type *>;
4609467b48Spatrick 
4709467b48Spatrick   // For each value, we remember its Value* and occurrence frequency.
4809467b48Spatrick   using ValueList = std::vector<std::pair<const Value *, unsigned>>;
4909467b48Spatrick 
5009467b48Spatrick   /// Attribute groups as encoded in bitcode are almost AttributeSets, but they
5109467b48Spatrick   /// include the AttributeList index, so we have to track that in our map.
5209467b48Spatrick   using IndexAndAttrSet = std::pair<unsigned, AttributeSet>;
5309467b48Spatrick 
5409467b48Spatrick   UseListOrderStack UseListOrders;
5509467b48Spatrick 
5609467b48Spatrick private:
5709467b48Spatrick   using TypeMapType = DenseMap<Type *, unsigned>;
5809467b48Spatrick   TypeMapType TypeMap;
5909467b48Spatrick   TypeList Types;
6009467b48Spatrick 
6109467b48Spatrick   using ValueMapType = DenseMap<const Value *, unsigned>;
6209467b48Spatrick   ValueMapType ValueMap;
6309467b48Spatrick   ValueList Values;
6409467b48Spatrick 
6509467b48Spatrick   using ComdatSetType = UniqueVector<const Comdat *>;
6609467b48Spatrick   ComdatSetType Comdats;
6709467b48Spatrick 
6809467b48Spatrick   std::vector<const Metadata *> MDs;
6909467b48Spatrick   std::vector<const Metadata *> FunctionMDs;
7009467b48Spatrick 
7109467b48Spatrick   /// Index of information about a piece of metadata.
7209467b48Spatrick   struct MDIndex {
7309467b48Spatrick     unsigned F = 0;  ///< The ID of the function for this metadata, if any.
7409467b48Spatrick     unsigned ID = 0; ///< The implicit ID of this metadata in bitcode.
7509467b48Spatrick 
7609467b48Spatrick     MDIndex() = default;
MDIndexMDIndex7709467b48Spatrick     explicit MDIndex(unsigned F) : F(F) {}
7809467b48Spatrick 
7909467b48Spatrick     /// Check if this has a function tag, and it's different from NewF.
hasDifferentFunctionMDIndex8009467b48Spatrick     bool hasDifferentFunction(unsigned NewF) const { return F && F != NewF; }
8109467b48Spatrick 
8209467b48Spatrick     /// Fetch the MD this references out of the given metadata array.
getMDIndex8309467b48Spatrick     const Metadata *get(ArrayRef<const Metadata *> MDs) const {
8409467b48Spatrick       assert(ID && "Expected non-zero ID");
8509467b48Spatrick       assert(ID <= MDs.size() && "Expected valid ID");
8609467b48Spatrick       return MDs[ID - 1];
8709467b48Spatrick     }
8809467b48Spatrick   };
8909467b48Spatrick 
9009467b48Spatrick   using MetadataMapType = DenseMap<const Metadata *, MDIndex>;
9109467b48Spatrick   MetadataMapType MetadataMap;
9209467b48Spatrick 
9309467b48Spatrick   /// Range of metadata IDs, as a half-open range.
9409467b48Spatrick   struct MDRange {
9509467b48Spatrick     unsigned First = 0;
9609467b48Spatrick     unsigned Last = 0;
9709467b48Spatrick 
9809467b48Spatrick     /// Number of strings in the prefix of the metadata range.
9909467b48Spatrick     unsigned NumStrings = 0;
10009467b48Spatrick 
10109467b48Spatrick     MDRange() = default;
MDRangeMDRange10209467b48Spatrick     explicit MDRange(unsigned First) : First(First) {}
10309467b48Spatrick   };
10409467b48Spatrick   SmallDenseMap<unsigned, MDRange, 1> FunctionMDInfo;
10509467b48Spatrick 
10609467b48Spatrick   bool ShouldPreserveUseListOrder;
10709467b48Spatrick 
10809467b48Spatrick   using AttributeGroupMapType = DenseMap<IndexAndAttrSet, unsigned>;
10909467b48Spatrick   AttributeGroupMapType AttributeGroupMap;
11009467b48Spatrick   std::vector<IndexAndAttrSet> AttributeGroups;
11109467b48Spatrick 
11209467b48Spatrick   using AttributeListMapType = DenseMap<AttributeList, unsigned>;
11309467b48Spatrick   AttributeListMapType AttributeListMap;
11409467b48Spatrick   std::vector<AttributeList> AttributeLists;
11509467b48Spatrick 
11609467b48Spatrick   /// GlobalBasicBlockIDs - This map memoizes the basic block ID's referenced by
11709467b48Spatrick   /// the "getGlobalBasicBlockID" method.
11809467b48Spatrick   mutable DenseMap<const BasicBlock*, unsigned> GlobalBasicBlockIDs;
11909467b48Spatrick 
12009467b48Spatrick   using InstructionMapType = DenseMap<const Instruction *, unsigned>;
12109467b48Spatrick   InstructionMapType InstructionMap;
12209467b48Spatrick   unsigned InstructionCount;
12309467b48Spatrick 
12409467b48Spatrick   /// BasicBlocks - This contains all the basic blocks for the currently
12509467b48Spatrick   /// incorporated function.  Their reverse mapping is stored in ValueMap.
12609467b48Spatrick   std::vector<const BasicBlock*> BasicBlocks;
12709467b48Spatrick 
12809467b48Spatrick   /// When a function is incorporated, this is the size of the Values list
12909467b48Spatrick   /// before incorporation.
13009467b48Spatrick   unsigned NumModuleValues;
13109467b48Spatrick 
13209467b48Spatrick   /// When a function is incorporated, this is the size of the Metadatas list
13309467b48Spatrick   /// before incorporation.
13409467b48Spatrick   unsigned NumModuleMDs = 0;
13509467b48Spatrick   unsigned NumMDStrings = 0;
13609467b48Spatrick 
13709467b48Spatrick   unsigned FirstFuncConstantID;
13809467b48Spatrick   unsigned FirstInstID;
13909467b48Spatrick 
14009467b48Spatrick public:
14109467b48Spatrick   ValueEnumerator(const Module &M, bool ShouldPreserveUseListOrder);
14209467b48Spatrick   ValueEnumerator(const ValueEnumerator &) = delete;
14309467b48Spatrick   ValueEnumerator &operator=(const ValueEnumerator &) = delete;
14409467b48Spatrick 
14509467b48Spatrick   void dump() const;
14609467b48Spatrick   void print(raw_ostream &OS, const ValueMapType &Map, const char *Name) const;
14709467b48Spatrick   void print(raw_ostream &OS, const MetadataMapType &Map,
14809467b48Spatrick              const char *Name) const;
14909467b48Spatrick 
15009467b48Spatrick   unsigned getValueID(const Value *V) const;
15109467b48Spatrick 
getMetadataID(const Metadata * MD)15209467b48Spatrick   unsigned getMetadataID(const Metadata *MD) const {
15309467b48Spatrick     auto ID = getMetadataOrNullID(MD);
15409467b48Spatrick     assert(ID != 0 && "Metadata not in slotcalculator!");
15509467b48Spatrick     return ID - 1;
15609467b48Spatrick   }
15709467b48Spatrick 
getMetadataOrNullID(const Metadata * MD)15809467b48Spatrick   unsigned getMetadataOrNullID(const Metadata *MD) const {
15909467b48Spatrick     return MetadataMap.lookup(MD).ID;
16009467b48Spatrick   }
16109467b48Spatrick 
numMDs()16209467b48Spatrick   unsigned numMDs() const { return MDs.size(); }
16309467b48Spatrick 
shouldPreserveUseListOrder()16409467b48Spatrick   bool shouldPreserveUseListOrder() const { return ShouldPreserveUseListOrder; }
16509467b48Spatrick 
getTypeID(Type * T)16609467b48Spatrick   unsigned getTypeID(Type *T) const {
16709467b48Spatrick     TypeMapType::const_iterator I = TypeMap.find(T);
16809467b48Spatrick     assert(I != TypeMap.end() && "Type not in ValueEnumerator!");
16909467b48Spatrick     return I->second-1;
17009467b48Spatrick   }
17109467b48Spatrick 
17209467b48Spatrick   unsigned getInstructionID(const Instruction *I) const;
17309467b48Spatrick   void setInstructionID(const Instruction *I);
17409467b48Spatrick 
getAttributeListID(AttributeList PAL)17509467b48Spatrick   unsigned getAttributeListID(AttributeList PAL) const {
17609467b48Spatrick     if (PAL.isEmpty()) return 0;  // Null maps to zero.
17709467b48Spatrick     AttributeListMapType::const_iterator I = AttributeListMap.find(PAL);
17809467b48Spatrick     assert(I != AttributeListMap.end() && "Attribute not in ValueEnumerator!");
17909467b48Spatrick     return I->second;
18009467b48Spatrick   }
18109467b48Spatrick 
getAttributeGroupID(IndexAndAttrSet Group)18209467b48Spatrick   unsigned getAttributeGroupID(IndexAndAttrSet Group) const {
18309467b48Spatrick     if (!Group.second.hasAttributes())
18409467b48Spatrick       return 0; // Null maps to zero.
18509467b48Spatrick     AttributeGroupMapType::const_iterator I = AttributeGroupMap.find(Group);
18609467b48Spatrick     assert(I != AttributeGroupMap.end() && "Attribute not in ValueEnumerator!");
18709467b48Spatrick     return I->second;
18809467b48Spatrick   }
18909467b48Spatrick 
19009467b48Spatrick   /// getFunctionConstantRange - Return the range of values that corresponds to
19109467b48Spatrick   /// function-local constants.
getFunctionConstantRange(unsigned & Start,unsigned & End)19209467b48Spatrick   void getFunctionConstantRange(unsigned &Start, unsigned &End) const {
19309467b48Spatrick     Start = FirstFuncConstantID;
19409467b48Spatrick     End = FirstInstID;
19509467b48Spatrick   }
19609467b48Spatrick 
getValues()19709467b48Spatrick   const ValueList &getValues() const { return Values; }
19809467b48Spatrick 
19909467b48Spatrick   /// Check whether the current block has any metadata to emit.
hasMDs()20009467b48Spatrick   bool hasMDs() const { return NumModuleMDs < MDs.size(); }
20109467b48Spatrick 
20209467b48Spatrick   /// Get the MDString metadata for this block.
getMDStrings()20309467b48Spatrick   ArrayRef<const Metadata *> getMDStrings() const {
204*d415bd75Srobert     return ArrayRef(MDs).slice(NumModuleMDs, NumMDStrings);
20509467b48Spatrick   }
20609467b48Spatrick 
20709467b48Spatrick   /// Get the non-MDString metadata for this block.
getNonMDStrings()20809467b48Spatrick   ArrayRef<const Metadata *> getNonMDStrings() const {
209*d415bd75Srobert     return ArrayRef(MDs).slice(NumModuleMDs).slice(NumMDStrings);
21009467b48Spatrick   }
21109467b48Spatrick 
getTypes()21209467b48Spatrick   const TypeList &getTypes() const { return Types; }
21309467b48Spatrick 
getBasicBlocks()21409467b48Spatrick   const std::vector<const BasicBlock*> &getBasicBlocks() const {
21509467b48Spatrick     return BasicBlocks;
21609467b48Spatrick   }
21709467b48Spatrick 
getAttributeLists()21809467b48Spatrick   const std::vector<AttributeList> &getAttributeLists() const { return AttributeLists; }
21909467b48Spatrick 
getAttributeGroups()22009467b48Spatrick   const std::vector<IndexAndAttrSet> &getAttributeGroups() const {
22109467b48Spatrick     return AttributeGroups;
22209467b48Spatrick   }
22309467b48Spatrick 
getComdats()22409467b48Spatrick   const ComdatSetType &getComdats() const { return Comdats; }
22509467b48Spatrick   unsigned getComdatID(const Comdat *C) const;
22609467b48Spatrick 
22709467b48Spatrick   /// getGlobalBasicBlockID - This returns the function-specific ID for the
22809467b48Spatrick   /// specified basic block.  This is relatively expensive information, so it
22909467b48Spatrick   /// should only be used by rare constructs such as address-of-label.
23009467b48Spatrick   unsigned getGlobalBasicBlockID(const BasicBlock *BB) const;
23109467b48Spatrick 
23209467b48Spatrick   /// incorporateFunction/purgeFunction - If you'd like to deal with a function,
23309467b48Spatrick   /// use these two methods to get its data into the ValueEnumerator!
23409467b48Spatrick   void incorporateFunction(const Function &F);
23509467b48Spatrick 
23609467b48Spatrick   void purgeFunction();
23709467b48Spatrick   uint64_t computeBitsRequiredForTypeIndicies() const;
23809467b48Spatrick 
23909467b48Spatrick private:
24009467b48Spatrick   void OptimizeConstants(unsigned CstStart, unsigned CstEnd);
24109467b48Spatrick 
24209467b48Spatrick   /// Reorder the reachable metadata.
24309467b48Spatrick   ///
24409467b48Spatrick   /// This is not just an optimization, but is mandatory for emitting MDString
24509467b48Spatrick   /// correctly.
24609467b48Spatrick   void organizeMetadata();
24709467b48Spatrick 
24809467b48Spatrick   /// Drop the function tag from the transitive operands of the given node.
24909467b48Spatrick   void dropFunctionFromMetadata(MetadataMapType::value_type &FirstMD);
25009467b48Spatrick 
25109467b48Spatrick   /// Incorporate the function metadata.
25209467b48Spatrick   ///
25309467b48Spatrick   /// This should be called before enumerating LocalAsMetadata for the
25409467b48Spatrick   /// function.
25509467b48Spatrick   void incorporateFunctionMetadata(const Function &F);
25609467b48Spatrick 
25709467b48Spatrick   /// Enumerate a single instance of metadata with the given function tag.
25809467b48Spatrick   ///
25909467b48Spatrick   /// If \c MD has already been enumerated, check that \c F matches its
26009467b48Spatrick   /// function tag.  If not, call \a dropFunctionFromMetadata().
26109467b48Spatrick   ///
26209467b48Spatrick   /// Otherwise, mark \c MD as visited.  Assign it an ID, or just return it if
26309467b48Spatrick   /// it's an \a MDNode.
26409467b48Spatrick   const MDNode *enumerateMetadataImpl(unsigned F, const Metadata *MD);
26509467b48Spatrick 
26609467b48Spatrick   unsigned getMetadataFunctionID(const Function *F) const;
26709467b48Spatrick 
26809467b48Spatrick   /// Enumerate reachable metadata in (almost) post-order.
26909467b48Spatrick   ///
27009467b48Spatrick   /// Enumerate all the metadata reachable from MD.  We want to minimize the
27109467b48Spatrick   /// cost of reading bitcode records, and so the primary consideration is that
27209467b48Spatrick   /// operands of uniqued nodes are resolved before the nodes are read.  This
27309467b48Spatrick   /// avoids re-uniquing them on the context and factors away RAUW support.
27409467b48Spatrick   ///
27509467b48Spatrick   /// This algorithm guarantees that subgraphs of uniqued nodes are in
27609467b48Spatrick   /// post-order.  Distinct subgraphs reachable only from a single uniqued node
27709467b48Spatrick   /// will be in post-order.
27809467b48Spatrick   ///
27909467b48Spatrick   /// \note The relative order of a distinct and uniqued node is irrelevant.
28009467b48Spatrick   /// \a organizeMetadata() will later partition distinct nodes ahead of
28109467b48Spatrick   /// uniqued ones.
28209467b48Spatrick   ///{
28309467b48Spatrick   void EnumerateMetadata(const Function *F, const Metadata *MD);
28409467b48Spatrick   void EnumerateMetadata(unsigned F, const Metadata *MD);
28509467b48Spatrick   ///}
28609467b48Spatrick 
28709467b48Spatrick   void EnumerateFunctionLocalMetadata(const Function &F,
28809467b48Spatrick                                       const LocalAsMetadata *Local);
28909467b48Spatrick   void EnumerateFunctionLocalMetadata(unsigned F, const LocalAsMetadata *Local);
29073471bf0Spatrick   void EnumerateFunctionLocalListMetadata(const Function &F,
29173471bf0Spatrick                                           const DIArgList *ArgList);
29273471bf0Spatrick   void EnumerateFunctionLocalListMetadata(unsigned F, const DIArgList *Arglist);
29309467b48Spatrick   void EnumerateNamedMDNode(const NamedMDNode *NMD);
29409467b48Spatrick   void EnumerateValue(const Value *V);
29509467b48Spatrick   void EnumerateType(Type *T);
29609467b48Spatrick   void EnumerateOperandType(const Value *V);
29709467b48Spatrick   void EnumerateAttributes(AttributeList PAL);
29809467b48Spatrick 
29909467b48Spatrick   void EnumerateValueSymbolTable(const ValueSymbolTable &ST);
30009467b48Spatrick   void EnumerateNamedMetadata(const Module &M);
30109467b48Spatrick };
30209467b48Spatrick 
30309467b48Spatrick } // end namespace llvm
30409467b48Spatrick 
30509467b48Spatrick #endif // LLVM_LIB_BITCODE_WRITER_VALUEENUMERATOR_H
306