xref: /llvm-project/llvm/lib/Object/IRObjectFile.cpp (revision ec7e29e9419b083b5e3f9d0873ce8b35849a8cf8)
1 //===- IRObjectFile.cpp - IR object file implementation ---------*- C++ -*-===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // Part of the IRObjectFile class implementation.
11 //
12 //===----------------------------------------------------------------------===//
13 
14 #include "llvm/Object/IRObjectFile.h"
15 #include "RecordStreamer.h"
16 #include "llvm/ADT/STLExtras.h"
17 #include "llvm/Bitcode/ReaderWriter.h"
18 #include "llvm/IR/GVMaterializer.h"
19 #include "llvm/IR/LLVMContext.h"
20 #include "llvm/IR/Mangler.h"
21 #include "llvm/IR/Module.h"
22 #include "llvm/MC/MCAsmInfo.h"
23 #include "llvm/MC/MCContext.h"
24 #include "llvm/MC/MCInstrInfo.h"
25 #include "llvm/MC/MCObjectFileInfo.h"
26 #include "llvm/MC/MCParser/MCAsmParser.h"
27 #include "llvm/MC/MCParser/MCTargetAsmParser.h"
28 #include "llvm/MC/MCRegisterInfo.h"
29 #include "llvm/MC/MCSubtargetInfo.h"
30 #include "llvm/Object/ObjectFile.h"
31 #include "llvm/Support/MemoryBuffer.h"
32 #include "llvm/Support/SourceMgr.h"
33 #include "llvm/Support/TargetRegistry.h"
34 #include "llvm/Support/raw_ostream.h"
35 using namespace llvm;
36 using namespace object;
37 
38 IRObjectFile::IRObjectFile(MemoryBufferRef Object, std::unique_ptr<Module> Mod)
39     : SymbolicFile(Binary::ID_IR, Object), M(std::move(Mod)) {
40   Mang.reset(new Mangler());
41   CollectAsmUndefinedRefs(
42       Triple(M->getTargetTriple()), M->getModuleInlineAsm(),
43       [this](StringRef Name, BasicSymbolRef::Flags Flags) {
44         AsmSymbols.push_back(
45             std::make_pair<std::string, uint32_t>(Name, std::move(Flags)));
46       });
47 }
48 
49 // Parse inline ASM and collect the list of symbols that are not defined in
50 // the current module. This is inspired from IRObjectFile.
51 void IRObjectFile::CollectAsmUndefinedRefs(
52     const Triple &TT, StringRef InlineAsm,
53     const std::function<void(StringRef, BasicSymbolRef::Flags)> &
54         AsmUndefinedRefs) {
55   if (InlineAsm.empty())
56     return;
57 
58   std::string Err;
59   const Target *T = TargetRegistry::lookupTarget(TT.str(), Err);
60   if (!T)
61     return;
62 
63   std::unique_ptr<MCRegisterInfo> MRI(T->createMCRegInfo(TT.str()));
64   if (!MRI)
65     return;
66 
67   std::unique_ptr<MCAsmInfo> MAI(T->createMCAsmInfo(*MRI, TT.str()));
68   if (!MAI)
69     return;
70 
71   std::unique_ptr<MCSubtargetInfo> STI(
72       T->createMCSubtargetInfo(TT.str(), "", ""));
73   if (!STI)
74     return;
75 
76   std::unique_ptr<MCInstrInfo> MCII(T->createMCInstrInfo());
77   if (!MCII)
78     return;
79 
80   MCObjectFileInfo MOFI;
81   MCContext MCCtx(MAI.get(), MRI.get(), &MOFI);
82   MOFI.InitMCObjectFileInfo(TT, /*PIC*/ false, CodeModel::Default, MCCtx);
83   std::unique_ptr<RecordStreamer> Streamer(new RecordStreamer(MCCtx));
84   T->createNullTargetStreamer(*Streamer);
85 
86   std::unique_ptr<MemoryBuffer> Buffer(MemoryBuffer::getMemBuffer(InlineAsm));
87   SourceMgr SrcMgr;
88   SrcMgr.AddNewSourceBuffer(std::move(Buffer), SMLoc());
89   std::unique_ptr<MCAsmParser> Parser(
90       createMCAsmParser(SrcMgr, MCCtx, *Streamer, *MAI));
91 
92   MCTargetOptions MCOptions;
93   std::unique_ptr<MCTargetAsmParser> TAP(
94       T->createMCAsmParser(*STI, *Parser, *MCII, MCOptions));
95   if (!TAP)
96     return;
97 
98   Parser->setTargetParser(*TAP);
99   if (Parser->Run(false))
100     return;
101 
102   for (auto &KV : *Streamer) {
103     StringRef Key = KV.first();
104     RecordStreamer::State Value = KV.second;
105     uint32_t Res = BasicSymbolRef::SF_None;
106     switch (Value) {
107     case RecordStreamer::NeverSeen:
108       llvm_unreachable("foo");
109     case RecordStreamer::DefinedGlobal:
110       Res |= BasicSymbolRef::SF_Global;
111       break;
112     case RecordStreamer::Defined:
113       break;
114     case RecordStreamer::Global:
115     case RecordStreamer::Used:
116       Res |= BasicSymbolRef::SF_Undefined;
117       Res |= BasicSymbolRef::SF_Global;
118       break;
119     case RecordStreamer::GlobalWeak:
120       Res |= BasicSymbolRef::SF_Weak;
121       Res |= BasicSymbolRef::SF_Global;
122     }
123     AsmUndefinedRefs(Key, BasicSymbolRef::Flags(Res));
124   }
125 }
126 
127 IRObjectFile::~IRObjectFile() {
128  }
129 
130 static GlobalValue *getGV(DataRefImpl &Symb) {
131   if ((Symb.p & 3) == 3)
132     return nullptr;
133 
134   return reinterpret_cast<GlobalValue*>(Symb.p & ~uintptr_t(3));
135 }
136 
137 static uintptr_t skipEmpty(Module::const_alias_iterator I, const Module &M) {
138   if (I == M.alias_end())
139     return 3;
140   const GlobalValue *GV = &*I;
141   return reinterpret_cast<uintptr_t>(GV) | 2;
142 }
143 
144 static uintptr_t skipEmpty(Module::const_global_iterator I, const Module &M) {
145   if (I == M.global_end())
146     return skipEmpty(M.alias_begin(), M);
147   const GlobalValue *GV = &*I;
148   return reinterpret_cast<uintptr_t>(GV) | 1;
149 }
150 
151 static uintptr_t skipEmpty(Module::const_iterator I, const Module &M) {
152   if (I == M.end())
153     return skipEmpty(M.global_begin(), M);
154   const GlobalValue *GV = &*I;
155   return reinterpret_cast<uintptr_t>(GV) | 0;
156 }
157 
158 static unsigned getAsmSymIndex(DataRefImpl Symb) {
159   assert((Symb.p & uintptr_t(3)) == 3);
160   uintptr_t Index = Symb.p & ~uintptr_t(3);
161   Index >>= 2;
162   return Index;
163 }
164 
165 void IRObjectFile::moveSymbolNext(DataRefImpl &Symb) const {
166   const GlobalValue *GV = getGV(Symb);
167   uintptr_t Res;
168 
169   switch (Symb.p & 3) {
170   case 0: {
171     Module::const_iterator Iter(static_cast<const Function*>(GV));
172     ++Iter;
173     Res = skipEmpty(Iter, *M);
174     break;
175   }
176   case 1: {
177     Module::const_global_iterator Iter(static_cast<const GlobalVariable*>(GV));
178     ++Iter;
179     Res = skipEmpty(Iter, *M);
180     break;
181   }
182   case 2: {
183     Module::const_alias_iterator Iter(static_cast<const GlobalAlias*>(GV));
184     ++Iter;
185     Res = skipEmpty(Iter, *M);
186     break;
187   }
188   case 3: {
189     unsigned Index = getAsmSymIndex(Symb);
190     assert(Index < AsmSymbols.size());
191     ++Index;
192     Res = (Index << 2) | 3;
193     break;
194   }
195   default:
196     llvm_unreachable("unreachable case");
197   }
198 
199   Symb.p = Res;
200 }
201 
202 std::error_code IRObjectFile::printSymbolName(raw_ostream &OS,
203                                               DataRefImpl Symb) const {
204   const GlobalValue *GV = getGV(Symb);
205   if (!GV) {
206     unsigned Index = getAsmSymIndex(Symb);
207     assert(Index <= AsmSymbols.size());
208     OS << AsmSymbols[Index].first;
209     return std::error_code();
210   }
211 
212   if (GV->hasDLLImportStorageClass())
213     OS << "__imp_";
214 
215   if (Mang)
216     Mang->getNameWithPrefix(OS, GV, false);
217   else
218     OS << GV->getName();
219 
220   return std::error_code();
221 }
222 
223 uint32_t IRObjectFile::getSymbolFlags(DataRefImpl Symb) const {
224   const GlobalValue *GV = getGV(Symb);
225 
226   if (!GV) {
227     unsigned Index = getAsmSymIndex(Symb);
228     assert(Index <= AsmSymbols.size());
229     return AsmSymbols[Index].second;
230   }
231 
232   uint32_t Res = BasicSymbolRef::SF_None;
233   if (GV->isDeclarationForLinker())
234     Res |= BasicSymbolRef::SF_Undefined;
235   else if (GV->hasHiddenVisibility() && !GV->hasLocalLinkage())
236     Res |= BasicSymbolRef::SF_Hidden;
237   if (const GlobalVariable *GVar = dyn_cast<GlobalVariable>(GV)) {
238     if (GVar->isConstant())
239       Res |= BasicSymbolRef::SF_Const;
240   }
241   if (GV->hasPrivateLinkage())
242     Res |= BasicSymbolRef::SF_FormatSpecific;
243   if (!GV->hasLocalLinkage())
244     Res |= BasicSymbolRef::SF_Global;
245   if (GV->hasCommonLinkage())
246     Res |= BasicSymbolRef::SF_Common;
247   if (GV->hasLinkOnceLinkage() || GV->hasWeakLinkage() ||
248       GV->hasExternalWeakLinkage())
249     Res |= BasicSymbolRef::SF_Weak;
250 
251   if (GV->getName().startswith("llvm."))
252     Res |= BasicSymbolRef::SF_FormatSpecific;
253   else if (auto *Var = dyn_cast<GlobalVariable>(GV)) {
254     if (Var->getSection() == "llvm.metadata")
255       Res |= BasicSymbolRef::SF_FormatSpecific;
256   }
257 
258   return Res;
259 }
260 
261 GlobalValue *IRObjectFile::getSymbolGV(DataRefImpl Symb) { return getGV(Symb); }
262 
263 std::unique_ptr<Module> IRObjectFile::takeModule() { return std::move(M); }
264 
265 basic_symbol_iterator IRObjectFile::symbol_begin_impl() const {
266   Module::const_iterator I = M->begin();
267   DataRefImpl Ret;
268   Ret.p = skipEmpty(I, *M);
269   return basic_symbol_iterator(BasicSymbolRef(Ret, this));
270 }
271 
272 basic_symbol_iterator IRObjectFile::symbol_end_impl() const {
273   DataRefImpl Ret;
274   uint64_t NumAsm = AsmSymbols.size();
275   NumAsm <<= 2;
276   Ret.p = 3 | NumAsm;
277   return basic_symbol_iterator(BasicSymbolRef(Ret, this));
278 }
279 
280 ErrorOr<MemoryBufferRef> IRObjectFile::findBitcodeInObject(const ObjectFile &Obj) {
281   for (const SectionRef &Sec : Obj.sections()) {
282     if (Sec.isBitcode()) {
283       StringRef SecContents;
284       if (std::error_code EC = Sec.getContents(SecContents))
285         return EC;
286       return MemoryBufferRef(SecContents, Obj.getFileName());
287     }
288   }
289 
290   return object_error::bitcode_section_not_found;
291 }
292 
293 ErrorOr<MemoryBufferRef> IRObjectFile::findBitcodeInMemBuffer(MemoryBufferRef Object) {
294   sys::fs::file_magic Type = sys::fs::identify_magic(Object.getBuffer());
295   switch (Type) {
296   case sys::fs::file_magic::bitcode:
297     return Object;
298   case sys::fs::file_magic::elf_relocatable:
299   case sys::fs::file_magic::macho_object:
300   case sys::fs::file_magic::coff_object: {
301     Expected<std::unique_ptr<ObjectFile>> ObjFile =
302         ObjectFile::createObjectFile(Object, Type);
303     if (!ObjFile)
304       return errorToErrorCode(ObjFile.takeError());
305     return findBitcodeInObject(*ObjFile->get());
306   }
307   default:
308     return object_error::invalid_file_type;
309   }
310 }
311 
312 ErrorOr<std::unique_ptr<IRObjectFile>>
313 llvm::object::IRObjectFile::create(MemoryBufferRef Object,
314                                    LLVMContext &Context) {
315   ErrorOr<MemoryBufferRef> BCOrErr = findBitcodeInMemBuffer(Object);
316   if (!BCOrErr)
317     return BCOrErr.getError();
318 
319   std::unique_ptr<MemoryBuffer> Buff =
320       MemoryBuffer::getMemBuffer(BCOrErr.get(), false);
321 
322   ErrorOr<std::unique_ptr<Module>> MOrErr =
323       getLazyBitcodeModule(std::move(Buff), Context,
324                            /*ShouldLazyLoadMetadata*/ true);
325   if (std::error_code EC = MOrErr.getError())
326     return EC;
327 
328   std::unique_ptr<Module> &M = MOrErr.get();
329   return llvm::make_unique<IRObjectFile>(Object, std::move(M));
330 }
331