109467b48Spatrick //===- Bitcode/Writer/ValueEnumerator.h - Number values ---------*- C++ -*-===// 209467b48Spatrick // 309467b48Spatrick // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 409467b48Spatrick // See https://llvm.org/LICENSE.txt for license information. 509467b48Spatrick // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 609467b48Spatrick // 709467b48Spatrick //===----------------------------------------------------------------------===// 809467b48Spatrick // 909467b48Spatrick // This class gives values and types Unique ID's. 1009467b48Spatrick // 1109467b48Spatrick //===----------------------------------------------------------------------===// 1209467b48Spatrick 1309467b48Spatrick #ifndef LLVM_LIB_BITCODE_WRITER_VALUEENUMERATOR_H 1409467b48Spatrick #define LLVM_LIB_BITCODE_WRITER_VALUEENUMERATOR_H 1509467b48Spatrick 1609467b48Spatrick #include "llvm/ADT/ArrayRef.h" 1709467b48Spatrick #include "llvm/ADT/DenseMap.h" 1809467b48Spatrick #include "llvm/ADT/UniqueVector.h" 1909467b48Spatrick #include "llvm/IR/Attributes.h" 2009467b48Spatrick #include "llvm/IR/UseListOrder.h" 2109467b48Spatrick #include <cassert> 2209467b48Spatrick #include <cstdint> 2309467b48Spatrick #include <utility> 2409467b48Spatrick #include <vector> 2509467b48Spatrick 2609467b48Spatrick namespace llvm { 2709467b48Spatrick 2809467b48Spatrick class BasicBlock; 2909467b48Spatrick class Comdat; 3073471bf0Spatrick class DIArgList; 3109467b48Spatrick class Function; 3209467b48Spatrick class Instruction; 3309467b48Spatrick class LocalAsMetadata; 3409467b48Spatrick class MDNode; 3509467b48Spatrick class Metadata; 3609467b48Spatrick class Module; 3709467b48Spatrick class NamedMDNode; 3809467b48Spatrick class raw_ostream; 3909467b48Spatrick class Type; 4009467b48Spatrick class Value; 4109467b48Spatrick class ValueSymbolTable; 4209467b48Spatrick 4309467b48Spatrick class ValueEnumerator { 4409467b48Spatrick public: 4509467b48Spatrick using TypeList = std::vector<Type *>; 4609467b48Spatrick 4709467b48Spatrick // For each value, we remember its Value* and occurrence frequency. 4809467b48Spatrick using ValueList = std::vector<std::pair<const Value *, unsigned>>; 4909467b48Spatrick 5009467b48Spatrick /// Attribute groups as encoded in bitcode are almost AttributeSets, but they 5109467b48Spatrick /// include the AttributeList index, so we have to track that in our map. 5209467b48Spatrick using IndexAndAttrSet = std::pair<unsigned, AttributeSet>; 5309467b48Spatrick 5409467b48Spatrick UseListOrderStack UseListOrders; 5509467b48Spatrick 5609467b48Spatrick private: 5709467b48Spatrick using TypeMapType = DenseMap<Type *, unsigned>; 5809467b48Spatrick TypeMapType TypeMap; 5909467b48Spatrick TypeList Types; 6009467b48Spatrick 6109467b48Spatrick using ValueMapType = DenseMap<const Value *, unsigned>; 6209467b48Spatrick ValueMapType ValueMap; 6309467b48Spatrick ValueList Values; 6409467b48Spatrick 6509467b48Spatrick using ComdatSetType = UniqueVector<const Comdat *>; 6609467b48Spatrick ComdatSetType Comdats; 6709467b48Spatrick 6809467b48Spatrick std::vector<const Metadata *> MDs; 6909467b48Spatrick std::vector<const Metadata *> FunctionMDs; 7009467b48Spatrick 7109467b48Spatrick /// Index of information about a piece of metadata. 7209467b48Spatrick struct MDIndex { 7309467b48Spatrick unsigned F = 0; ///< The ID of the function for this metadata, if any. 7409467b48Spatrick unsigned ID = 0; ///< The implicit ID of this metadata in bitcode. 7509467b48Spatrick 7609467b48Spatrick MDIndex() = default; MDIndexMDIndex7709467b48Spatrick explicit MDIndex(unsigned F) : F(F) {} 7809467b48Spatrick 7909467b48Spatrick /// Check if this has a function tag, and it's different from NewF. hasDifferentFunctionMDIndex8009467b48Spatrick bool hasDifferentFunction(unsigned NewF) const { return F && F != NewF; } 8109467b48Spatrick 8209467b48Spatrick /// Fetch the MD this references out of the given metadata array. getMDIndex8309467b48Spatrick const Metadata *get(ArrayRef<const Metadata *> MDs) const { 8409467b48Spatrick assert(ID && "Expected non-zero ID"); 8509467b48Spatrick assert(ID <= MDs.size() && "Expected valid ID"); 8609467b48Spatrick return MDs[ID - 1]; 8709467b48Spatrick } 8809467b48Spatrick }; 8909467b48Spatrick 9009467b48Spatrick using MetadataMapType = DenseMap<const Metadata *, MDIndex>; 9109467b48Spatrick MetadataMapType MetadataMap; 9209467b48Spatrick 9309467b48Spatrick /// Range of metadata IDs, as a half-open range. 9409467b48Spatrick struct MDRange { 9509467b48Spatrick unsigned First = 0; 9609467b48Spatrick unsigned Last = 0; 9709467b48Spatrick 9809467b48Spatrick /// Number of strings in the prefix of the metadata range. 9909467b48Spatrick unsigned NumStrings = 0; 10009467b48Spatrick 10109467b48Spatrick MDRange() = default; MDRangeMDRange10209467b48Spatrick explicit MDRange(unsigned First) : First(First) {} 10309467b48Spatrick }; 10409467b48Spatrick SmallDenseMap<unsigned, MDRange, 1> FunctionMDInfo; 10509467b48Spatrick 10609467b48Spatrick bool ShouldPreserveUseListOrder; 10709467b48Spatrick 10809467b48Spatrick using AttributeGroupMapType = DenseMap<IndexAndAttrSet, unsigned>; 10909467b48Spatrick AttributeGroupMapType AttributeGroupMap; 11009467b48Spatrick std::vector<IndexAndAttrSet> AttributeGroups; 11109467b48Spatrick 11209467b48Spatrick using AttributeListMapType = DenseMap<AttributeList, unsigned>; 11309467b48Spatrick AttributeListMapType AttributeListMap; 11409467b48Spatrick std::vector<AttributeList> AttributeLists; 11509467b48Spatrick 11609467b48Spatrick /// GlobalBasicBlockIDs - This map memoizes the basic block ID's referenced by 11709467b48Spatrick /// the "getGlobalBasicBlockID" method. 11809467b48Spatrick mutable DenseMap<const BasicBlock*, unsigned> GlobalBasicBlockIDs; 11909467b48Spatrick 12009467b48Spatrick using InstructionMapType = DenseMap<const Instruction *, unsigned>; 12109467b48Spatrick InstructionMapType InstructionMap; 12209467b48Spatrick unsigned InstructionCount; 12309467b48Spatrick 12409467b48Spatrick /// BasicBlocks - This contains all the basic blocks for the currently 12509467b48Spatrick /// incorporated function. Their reverse mapping is stored in ValueMap. 12609467b48Spatrick std::vector<const BasicBlock*> BasicBlocks; 12709467b48Spatrick 12809467b48Spatrick /// When a function is incorporated, this is the size of the Values list 12909467b48Spatrick /// before incorporation. 13009467b48Spatrick unsigned NumModuleValues; 13109467b48Spatrick 13209467b48Spatrick /// When a function is incorporated, this is the size of the Metadatas list 13309467b48Spatrick /// before incorporation. 13409467b48Spatrick unsigned NumModuleMDs = 0; 13509467b48Spatrick unsigned NumMDStrings = 0; 13609467b48Spatrick 13709467b48Spatrick unsigned FirstFuncConstantID; 13809467b48Spatrick unsigned FirstInstID; 13909467b48Spatrick 14009467b48Spatrick public: 14109467b48Spatrick ValueEnumerator(const Module &M, bool ShouldPreserveUseListOrder); 14209467b48Spatrick ValueEnumerator(const ValueEnumerator &) = delete; 14309467b48Spatrick ValueEnumerator &operator=(const ValueEnumerator &) = delete; 14409467b48Spatrick 14509467b48Spatrick void dump() const; 14609467b48Spatrick void print(raw_ostream &OS, const ValueMapType &Map, const char *Name) const; 14709467b48Spatrick void print(raw_ostream &OS, const MetadataMapType &Map, 14809467b48Spatrick const char *Name) const; 14909467b48Spatrick 15009467b48Spatrick unsigned getValueID(const Value *V) const; 15109467b48Spatrick getMetadataID(const Metadata * MD)15209467b48Spatrick unsigned getMetadataID(const Metadata *MD) const { 15309467b48Spatrick auto ID = getMetadataOrNullID(MD); 15409467b48Spatrick assert(ID != 0 && "Metadata not in slotcalculator!"); 15509467b48Spatrick return ID - 1; 15609467b48Spatrick } 15709467b48Spatrick getMetadataOrNullID(const Metadata * MD)15809467b48Spatrick unsigned getMetadataOrNullID(const Metadata *MD) const { 15909467b48Spatrick return MetadataMap.lookup(MD).ID; 16009467b48Spatrick } 16109467b48Spatrick numMDs()16209467b48Spatrick unsigned numMDs() const { return MDs.size(); } 16309467b48Spatrick shouldPreserveUseListOrder()16409467b48Spatrick bool shouldPreserveUseListOrder() const { return ShouldPreserveUseListOrder; } 16509467b48Spatrick getTypeID(Type * T)16609467b48Spatrick unsigned getTypeID(Type *T) const { 16709467b48Spatrick TypeMapType::const_iterator I = TypeMap.find(T); 16809467b48Spatrick assert(I != TypeMap.end() && "Type not in ValueEnumerator!"); 16909467b48Spatrick return I->second-1; 17009467b48Spatrick } 17109467b48Spatrick 17209467b48Spatrick unsigned getInstructionID(const Instruction *I) const; 17309467b48Spatrick void setInstructionID(const Instruction *I); 17409467b48Spatrick getAttributeListID(AttributeList PAL)17509467b48Spatrick unsigned getAttributeListID(AttributeList PAL) const { 17609467b48Spatrick if (PAL.isEmpty()) return 0; // Null maps to zero. 17709467b48Spatrick AttributeListMapType::const_iterator I = AttributeListMap.find(PAL); 17809467b48Spatrick assert(I != AttributeListMap.end() && "Attribute not in ValueEnumerator!"); 17909467b48Spatrick return I->second; 18009467b48Spatrick } 18109467b48Spatrick getAttributeGroupID(IndexAndAttrSet Group)18209467b48Spatrick unsigned getAttributeGroupID(IndexAndAttrSet Group) const { 18309467b48Spatrick if (!Group.second.hasAttributes()) 18409467b48Spatrick return 0; // Null maps to zero. 18509467b48Spatrick AttributeGroupMapType::const_iterator I = AttributeGroupMap.find(Group); 18609467b48Spatrick assert(I != AttributeGroupMap.end() && "Attribute not in ValueEnumerator!"); 18709467b48Spatrick return I->second; 18809467b48Spatrick } 18909467b48Spatrick 19009467b48Spatrick /// getFunctionConstantRange - Return the range of values that corresponds to 19109467b48Spatrick /// function-local constants. getFunctionConstantRange(unsigned & Start,unsigned & End)19209467b48Spatrick void getFunctionConstantRange(unsigned &Start, unsigned &End) const { 19309467b48Spatrick Start = FirstFuncConstantID; 19409467b48Spatrick End = FirstInstID; 19509467b48Spatrick } 19609467b48Spatrick getValues()19709467b48Spatrick const ValueList &getValues() const { return Values; } 19809467b48Spatrick 19909467b48Spatrick /// Check whether the current block has any metadata to emit. hasMDs()20009467b48Spatrick bool hasMDs() const { return NumModuleMDs < MDs.size(); } 20109467b48Spatrick 20209467b48Spatrick /// Get the MDString metadata for this block. getMDStrings()20309467b48Spatrick ArrayRef<const Metadata *> getMDStrings() const { 204*d415bd75Srobert return ArrayRef(MDs).slice(NumModuleMDs, NumMDStrings); 20509467b48Spatrick } 20609467b48Spatrick 20709467b48Spatrick /// Get the non-MDString metadata for this block. getNonMDStrings()20809467b48Spatrick ArrayRef<const Metadata *> getNonMDStrings() const { 209*d415bd75Srobert return ArrayRef(MDs).slice(NumModuleMDs).slice(NumMDStrings); 21009467b48Spatrick } 21109467b48Spatrick getTypes()21209467b48Spatrick const TypeList &getTypes() const { return Types; } 21309467b48Spatrick getBasicBlocks()21409467b48Spatrick const std::vector<const BasicBlock*> &getBasicBlocks() const { 21509467b48Spatrick return BasicBlocks; 21609467b48Spatrick } 21709467b48Spatrick getAttributeLists()21809467b48Spatrick const std::vector<AttributeList> &getAttributeLists() const { return AttributeLists; } 21909467b48Spatrick getAttributeGroups()22009467b48Spatrick const std::vector<IndexAndAttrSet> &getAttributeGroups() const { 22109467b48Spatrick return AttributeGroups; 22209467b48Spatrick } 22309467b48Spatrick getComdats()22409467b48Spatrick const ComdatSetType &getComdats() const { return Comdats; } 22509467b48Spatrick unsigned getComdatID(const Comdat *C) const; 22609467b48Spatrick 22709467b48Spatrick /// getGlobalBasicBlockID - This returns the function-specific ID for the 22809467b48Spatrick /// specified basic block. This is relatively expensive information, so it 22909467b48Spatrick /// should only be used by rare constructs such as address-of-label. 23009467b48Spatrick unsigned getGlobalBasicBlockID(const BasicBlock *BB) const; 23109467b48Spatrick 23209467b48Spatrick /// incorporateFunction/purgeFunction - If you'd like to deal with a function, 23309467b48Spatrick /// use these two methods to get its data into the ValueEnumerator! 23409467b48Spatrick void incorporateFunction(const Function &F); 23509467b48Spatrick 23609467b48Spatrick void purgeFunction(); 23709467b48Spatrick uint64_t computeBitsRequiredForTypeIndicies() const; 23809467b48Spatrick 23909467b48Spatrick private: 24009467b48Spatrick void OptimizeConstants(unsigned CstStart, unsigned CstEnd); 24109467b48Spatrick 24209467b48Spatrick /// Reorder the reachable metadata. 24309467b48Spatrick /// 24409467b48Spatrick /// This is not just an optimization, but is mandatory for emitting MDString 24509467b48Spatrick /// correctly. 24609467b48Spatrick void organizeMetadata(); 24709467b48Spatrick 24809467b48Spatrick /// Drop the function tag from the transitive operands of the given node. 24909467b48Spatrick void dropFunctionFromMetadata(MetadataMapType::value_type &FirstMD); 25009467b48Spatrick 25109467b48Spatrick /// Incorporate the function metadata. 25209467b48Spatrick /// 25309467b48Spatrick /// This should be called before enumerating LocalAsMetadata for the 25409467b48Spatrick /// function. 25509467b48Spatrick void incorporateFunctionMetadata(const Function &F); 25609467b48Spatrick 25709467b48Spatrick /// Enumerate a single instance of metadata with the given function tag. 25809467b48Spatrick /// 25909467b48Spatrick /// If \c MD has already been enumerated, check that \c F matches its 26009467b48Spatrick /// function tag. If not, call \a dropFunctionFromMetadata(). 26109467b48Spatrick /// 26209467b48Spatrick /// Otherwise, mark \c MD as visited. Assign it an ID, or just return it if 26309467b48Spatrick /// it's an \a MDNode. 26409467b48Spatrick const MDNode *enumerateMetadataImpl(unsigned F, const Metadata *MD); 26509467b48Spatrick 26609467b48Spatrick unsigned getMetadataFunctionID(const Function *F) const; 26709467b48Spatrick 26809467b48Spatrick /// Enumerate reachable metadata in (almost) post-order. 26909467b48Spatrick /// 27009467b48Spatrick /// Enumerate all the metadata reachable from MD. We want to minimize the 27109467b48Spatrick /// cost of reading bitcode records, and so the primary consideration is that 27209467b48Spatrick /// operands of uniqued nodes are resolved before the nodes are read. This 27309467b48Spatrick /// avoids re-uniquing them on the context and factors away RAUW support. 27409467b48Spatrick /// 27509467b48Spatrick /// This algorithm guarantees that subgraphs of uniqued nodes are in 27609467b48Spatrick /// post-order. Distinct subgraphs reachable only from a single uniqued node 27709467b48Spatrick /// will be in post-order. 27809467b48Spatrick /// 27909467b48Spatrick /// \note The relative order of a distinct and uniqued node is irrelevant. 28009467b48Spatrick /// \a organizeMetadata() will later partition distinct nodes ahead of 28109467b48Spatrick /// uniqued ones. 28209467b48Spatrick ///{ 28309467b48Spatrick void EnumerateMetadata(const Function *F, const Metadata *MD); 28409467b48Spatrick void EnumerateMetadata(unsigned F, const Metadata *MD); 28509467b48Spatrick ///} 28609467b48Spatrick 28709467b48Spatrick void EnumerateFunctionLocalMetadata(const Function &F, 28809467b48Spatrick const LocalAsMetadata *Local); 28909467b48Spatrick void EnumerateFunctionLocalMetadata(unsigned F, const LocalAsMetadata *Local); 29073471bf0Spatrick void EnumerateFunctionLocalListMetadata(const Function &F, 29173471bf0Spatrick const DIArgList *ArgList); 29273471bf0Spatrick void EnumerateFunctionLocalListMetadata(unsigned F, const DIArgList *Arglist); 29309467b48Spatrick void EnumerateNamedMDNode(const NamedMDNode *NMD); 29409467b48Spatrick void EnumerateValue(const Value *V); 29509467b48Spatrick void EnumerateType(Type *T); 29609467b48Spatrick void EnumerateOperandType(const Value *V); 29709467b48Spatrick void EnumerateAttributes(AttributeList PAL); 29809467b48Spatrick 29909467b48Spatrick void EnumerateValueSymbolTable(const ValueSymbolTable &ST); 30009467b48Spatrick void EnumerateNamedMetadata(const Module &M); 30109467b48Spatrick }; 30209467b48Spatrick 30309467b48Spatrick } // end namespace llvm 30409467b48Spatrick 30509467b48Spatrick #endif // LLVM_LIB_BITCODE_WRITER_VALUEENUMERATOR_H 306