//===-- ObjectContainerMachOFileset.cpp -----------------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
8*f6aab3d8Srobert 
9*f6aab3d8Srobert #include "ObjectContainerMachOFileset.h"
10*f6aab3d8Srobert #include "lldb/Core/Module.h"
11*f6aab3d8Srobert #include "lldb/Core/ModuleSpec.h"
12*f6aab3d8Srobert #include "lldb/Core/PluginManager.h"
13*f6aab3d8Srobert #include "lldb/Symbol/ObjectFile.h"
14*f6aab3d8Srobert #include "lldb/Target/Target.h"
15*f6aab3d8Srobert #include "lldb/Utility/ArchSpec.h"
16*f6aab3d8Srobert #include "lldb/Utility/DataBuffer.h"
17*f6aab3d8Srobert #include "lldb/Utility/Stream.h"
18*f6aab3d8Srobert #include <optional>
19*f6aab3d8Srobert 
20*f6aab3d8Srobert using namespace lldb;
21*f6aab3d8Srobert using namespace lldb_private;
22*f6aab3d8Srobert using namespace llvm::MachO;
23*f6aab3d8Srobert 
// Plugin definition hook for ObjectContainerMachOFileset.
LLDB_PLUGIN_DEFINE(ObjectContainerMachOFileset)
25*f6aab3d8Srobert 
26*f6aab3d8Srobert void ObjectContainerMachOFileset::Initialize() {
27*f6aab3d8Srobert   PluginManager::RegisterPlugin(GetPluginNameStatic(),
28*f6aab3d8Srobert                                 GetPluginDescriptionStatic(), CreateInstance,
29*f6aab3d8Srobert                                 GetModuleSpecifications, CreateMemoryInstance);
30*f6aab3d8Srobert }
31*f6aab3d8Srobert 
Terminate()32*f6aab3d8Srobert void ObjectContainerMachOFileset::Terminate() {
33*f6aab3d8Srobert   PluginManager::UnregisterPlugin(CreateInstance);
34*f6aab3d8Srobert }
35*f6aab3d8Srobert 
ObjectContainerMachOFileset(const lldb::ModuleSP & module_sp,lldb::DataBufferSP & data_sp,lldb::offset_t data_offset,const lldb_private::FileSpec * file,lldb::offset_t offset,lldb::offset_t length)36*f6aab3d8Srobert ObjectContainerMachOFileset::ObjectContainerMachOFileset(
37*f6aab3d8Srobert     const lldb::ModuleSP &module_sp, lldb::DataBufferSP &data_sp,
38*f6aab3d8Srobert     lldb::offset_t data_offset, const lldb_private::FileSpec *file,
39*f6aab3d8Srobert     lldb::offset_t offset, lldb::offset_t length)
40*f6aab3d8Srobert     : ObjectContainer(module_sp, file, offset, length, data_sp, data_offset),
41*f6aab3d8Srobert       m_memory_addr(LLDB_INVALID_ADDRESS) {}
42*f6aab3d8Srobert 
ObjectContainerMachOFileset(const lldb::ModuleSP & module_sp,lldb::WritableDataBufferSP data_sp,const lldb::ProcessSP & process_sp,lldb::addr_t header_addr)43*f6aab3d8Srobert ObjectContainerMachOFileset::ObjectContainerMachOFileset(
44*f6aab3d8Srobert     const lldb::ModuleSP &module_sp, lldb::WritableDataBufferSP data_sp,
45*f6aab3d8Srobert     const lldb::ProcessSP &process_sp, lldb::addr_t header_addr)
46*f6aab3d8Srobert     : ObjectContainer(module_sp, nullptr, 0, data_sp->GetByteSize(), data_sp,
47*f6aab3d8Srobert                       0),
48*f6aab3d8Srobert       m_process_wp(process_sp), m_memory_addr(header_addr) {}
49*f6aab3d8Srobert 
CreateInstance(const lldb::ModuleSP & module_sp,DataBufferSP & data_sp,lldb::offset_t data_offset,const FileSpec * file,lldb::offset_t file_offset,lldb::offset_t length)50*f6aab3d8Srobert ObjectContainer *ObjectContainerMachOFileset::CreateInstance(
51*f6aab3d8Srobert     const lldb::ModuleSP &module_sp, DataBufferSP &data_sp,
52*f6aab3d8Srobert     lldb::offset_t data_offset, const FileSpec *file,
53*f6aab3d8Srobert     lldb::offset_t file_offset, lldb::offset_t length) {
54*f6aab3d8Srobert   if (!data_sp)
55*f6aab3d8Srobert     return {};
56*f6aab3d8Srobert 
57*f6aab3d8Srobert   DataExtractor data;
58*f6aab3d8Srobert   data.SetData(data_sp, data_offset, length);
59*f6aab3d8Srobert   if (!MagicBytesMatch(data))
60*f6aab3d8Srobert     return {};
61*f6aab3d8Srobert 
62*f6aab3d8Srobert   auto container_up = std::make_unique<ObjectContainerMachOFileset>(
63*f6aab3d8Srobert       module_sp, data_sp, data_offset, file, file_offset, length);
64*f6aab3d8Srobert   if (!container_up->ParseHeader())
65*f6aab3d8Srobert     return {};
66*f6aab3d8Srobert 
67*f6aab3d8Srobert   return container_up.release();
68*f6aab3d8Srobert }
69*f6aab3d8Srobert 
CreateMemoryInstance(const lldb::ModuleSP & module_sp,lldb::WritableDataBufferSP data_sp,const lldb::ProcessSP & process_sp,lldb::addr_t header_addr)70*f6aab3d8Srobert ObjectContainer *ObjectContainerMachOFileset::CreateMemoryInstance(
71*f6aab3d8Srobert     const lldb::ModuleSP &module_sp, lldb::WritableDataBufferSP data_sp,
72*f6aab3d8Srobert     const lldb::ProcessSP &process_sp, lldb::addr_t header_addr) {
73*f6aab3d8Srobert   if (!MagicBytesMatch(data_sp, 0, data_sp->GetByteSize()))
74*f6aab3d8Srobert     return {};
75*f6aab3d8Srobert 
76*f6aab3d8Srobert   auto container_up = std::make_unique<ObjectContainerMachOFileset>(
77*f6aab3d8Srobert       module_sp, data_sp, process_sp, header_addr);
78*f6aab3d8Srobert   if (!container_up->ParseHeader())
79*f6aab3d8Srobert     return {};
80*f6aab3d8Srobert 
81*f6aab3d8Srobert   return container_up.release();
82*f6aab3d8Srobert }
83*f6aab3d8Srobert 
84*f6aab3d8Srobert ObjectContainerMachOFileset::~ObjectContainerMachOFileset() = default;
85*f6aab3d8Srobert 
MachHeaderSizeFromMagic(uint32_t magic)86*f6aab3d8Srobert static uint32_t MachHeaderSizeFromMagic(uint32_t magic) {
87*f6aab3d8Srobert   switch (magic) {
88*f6aab3d8Srobert   case MH_MAGIC:
89*f6aab3d8Srobert   case MH_CIGAM:
90*f6aab3d8Srobert     return sizeof(struct mach_header);
91*f6aab3d8Srobert   case MH_MAGIC_64:
92*f6aab3d8Srobert   case MH_CIGAM_64:
93*f6aab3d8Srobert     return sizeof(struct mach_header_64);
94*f6aab3d8Srobert   default:
95*f6aab3d8Srobert     return 0;
96*f6aab3d8Srobert   }
97*f6aab3d8Srobert }
98*f6aab3d8Srobert 
ParseMachOHeader(DataExtractor & data)99*f6aab3d8Srobert static std::optional<mach_header> ParseMachOHeader(DataExtractor &data) {
100*f6aab3d8Srobert   lldb::offset_t offset = 0;
101*f6aab3d8Srobert   mach_header header;
102*f6aab3d8Srobert   header.magic = data.GetU32(&offset);
103*f6aab3d8Srobert   switch (header.magic) {
104*f6aab3d8Srobert   case MH_MAGIC:
105*f6aab3d8Srobert     data.SetByteOrder(endian::InlHostByteOrder());
106*f6aab3d8Srobert     data.SetAddressByteSize(4);
107*f6aab3d8Srobert     break;
108*f6aab3d8Srobert   case MH_MAGIC_64:
109*f6aab3d8Srobert     data.SetByteOrder(endian::InlHostByteOrder());
110*f6aab3d8Srobert     data.SetAddressByteSize(8);
111*f6aab3d8Srobert     break;
112*f6aab3d8Srobert   case MH_CIGAM:
113*f6aab3d8Srobert     data.SetByteOrder(endian::InlHostByteOrder() == eByteOrderBig
114*f6aab3d8Srobert                           ? eByteOrderLittle
115*f6aab3d8Srobert                           : eByteOrderBig);
116*f6aab3d8Srobert     data.SetAddressByteSize(4);
117*f6aab3d8Srobert     break;
118*f6aab3d8Srobert   case MH_CIGAM_64:
119*f6aab3d8Srobert     data.SetByteOrder(endian::InlHostByteOrder() == eByteOrderBig
120*f6aab3d8Srobert                           ? eByteOrderLittle
121*f6aab3d8Srobert                           : eByteOrderBig);
122*f6aab3d8Srobert     data.SetAddressByteSize(8);
123*f6aab3d8Srobert     break;
124*f6aab3d8Srobert   default:
125*f6aab3d8Srobert     return {};
126*f6aab3d8Srobert   }
127*f6aab3d8Srobert 
128*f6aab3d8Srobert   header.cputype = data.GetU32(&offset);
129*f6aab3d8Srobert   header.cpusubtype = data.GetU32(&offset);
130*f6aab3d8Srobert   header.filetype = data.GetU32(&offset);
131*f6aab3d8Srobert   header.ncmds = data.GetU32(&offset);
132*f6aab3d8Srobert   header.sizeofcmds = data.GetU32(&offset);
133*f6aab3d8Srobert   return header;
134*f6aab3d8Srobert }
135*f6aab3d8Srobert 
136*f6aab3d8Srobert static bool
ParseFileset(DataExtractor & data,mach_header header,std::vector<ObjectContainerMachOFileset::Entry> & entries,std::optional<lldb::addr_t> load_addr=std::nullopt)137*f6aab3d8Srobert ParseFileset(DataExtractor &data, mach_header header,
138*f6aab3d8Srobert              std::vector<ObjectContainerMachOFileset::Entry> &entries,
139*f6aab3d8Srobert              std::optional<lldb::addr_t> load_addr = std::nullopt) {
140*f6aab3d8Srobert   lldb::offset_t offset = MachHeaderSizeFromMagic(header.magic);
141*f6aab3d8Srobert   lldb::offset_t slide = 0;
142*f6aab3d8Srobert   for (uint32_t i = 0; i < header.ncmds; ++i) {
143*f6aab3d8Srobert     const lldb::offset_t load_cmd_offset = offset;
144*f6aab3d8Srobert     load_command lc = {};
145*f6aab3d8Srobert     if (data.GetU32(&offset, &lc.cmd, 2) == nullptr)
146*f6aab3d8Srobert       break;
147*f6aab3d8Srobert 
148*f6aab3d8Srobert     // If we know the load address we can compute the slide.
149*f6aab3d8Srobert     if (load_addr) {
150*f6aab3d8Srobert       if (lc.cmd == llvm::MachO::LC_SEGMENT_64) {
151*f6aab3d8Srobert         segment_command_64 segment;
152*f6aab3d8Srobert         data.CopyData(load_cmd_offset, sizeof(segment_command_64), &segment);
153*f6aab3d8Srobert         if (llvm::StringRef(segment.segname) == "__TEXT")
154*f6aab3d8Srobert           slide = *load_addr - segment.vmaddr;
155*f6aab3d8Srobert       }
156*f6aab3d8Srobert     }
157*f6aab3d8Srobert 
158*f6aab3d8Srobert     if (lc.cmd == LC_FILESET_ENTRY) {
159*f6aab3d8Srobert       fileset_entry_command entry;
160*f6aab3d8Srobert       data.CopyData(load_cmd_offset, sizeof(fileset_entry_command), &entry);
161*f6aab3d8Srobert       lldb::offset_t entry_id_offset = load_cmd_offset + entry.entry_id;
162*f6aab3d8Srobert       const char *id = data.GetCStr(&entry_id_offset);
163*f6aab3d8Srobert       entries.emplace_back(entry.vmaddr + slide, entry.fileoff,
164*f6aab3d8Srobert                            std::string(id));
165*f6aab3d8Srobert     }
166*f6aab3d8Srobert 
167*f6aab3d8Srobert     offset = load_cmd_offset + lc.cmdsize;
168*f6aab3d8Srobert   }
169*f6aab3d8Srobert 
170*f6aab3d8Srobert   return true;
171*f6aab3d8Srobert }
172*f6aab3d8Srobert 
ParseHeader(DataExtractor & data,const lldb_private::FileSpec & file,lldb::offset_t file_offset,std::vector<Entry> & entries)173*f6aab3d8Srobert bool ObjectContainerMachOFileset::ParseHeader(
174*f6aab3d8Srobert     DataExtractor &data, const lldb_private::FileSpec &file,
175*f6aab3d8Srobert     lldb::offset_t file_offset, std::vector<Entry> &entries) {
176*f6aab3d8Srobert   std::optional<mach_header> header = ParseMachOHeader(data);
177*f6aab3d8Srobert 
178*f6aab3d8Srobert   if (!header)
179*f6aab3d8Srobert     return false;
180*f6aab3d8Srobert 
181*f6aab3d8Srobert   const size_t header_size = MachHeaderSizeFromMagic(header->magic);
182*f6aab3d8Srobert   const size_t header_and_lc_size = header_size + header->sizeofcmds;
183*f6aab3d8Srobert 
184*f6aab3d8Srobert   if (data.GetByteSize() < header_and_lc_size) {
185*f6aab3d8Srobert     DataBufferSP data_sp =
186*f6aab3d8Srobert         ObjectFile::MapFileData(file, header_and_lc_size, file_offset);
187*f6aab3d8Srobert     data.SetData(data_sp);
188*f6aab3d8Srobert   }
189*f6aab3d8Srobert 
190*f6aab3d8Srobert   return ParseFileset(data, *header, entries);
191*f6aab3d8Srobert }
192*f6aab3d8Srobert 
ParseHeader()193*f6aab3d8Srobert bool ObjectContainerMachOFileset::ParseHeader() {
194*f6aab3d8Srobert   ModuleSP module_sp(GetModule());
195*f6aab3d8Srobert   if (!module_sp)
196*f6aab3d8Srobert     return false;
197*f6aab3d8Srobert 
198*f6aab3d8Srobert   std::lock_guard<std::recursive_mutex> guard(module_sp->GetMutex());
199*f6aab3d8Srobert 
200*f6aab3d8Srobert   std::optional<mach_header> header = ParseMachOHeader(m_data);
201*f6aab3d8Srobert   if (!header)
202*f6aab3d8Srobert     return false;
203*f6aab3d8Srobert 
204*f6aab3d8Srobert   const size_t header_size = MachHeaderSizeFromMagic(header->magic);
205*f6aab3d8Srobert   const size_t header_and_lc_size = header_size + header->sizeofcmds;
206*f6aab3d8Srobert 
207*f6aab3d8Srobert   if (m_data.GetByteSize() < header_and_lc_size) {
208*f6aab3d8Srobert     ProcessSP process_sp(m_process_wp.lock());
209*f6aab3d8Srobert     DataBufferSP data_sp =
210*f6aab3d8Srobert         process_sp
211*f6aab3d8Srobert             ? ObjectFile::ReadMemory(process_sp, m_memory_addr,
212*f6aab3d8Srobert                                      header_and_lc_size)
213*f6aab3d8Srobert             : ObjectFile::MapFileData(m_file, header_and_lc_size, m_offset);
214*f6aab3d8Srobert     m_data.SetData(data_sp);
215*f6aab3d8Srobert   }
216*f6aab3d8Srobert 
217*f6aab3d8Srobert   return ParseFileset(m_data, *header, m_entries, m_memory_addr);
218*f6aab3d8Srobert }
219*f6aab3d8Srobert 
GetModuleSpecifications(const lldb_private::FileSpec & file,lldb::DataBufferSP & data_sp,lldb::offset_t data_offset,lldb::offset_t file_offset,lldb::offset_t file_size,lldb_private::ModuleSpecList & specs)220*f6aab3d8Srobert size_t ObjectContainerMachOFileset::GetModuleSpecifications(
221*f6aab3d8Srobert     const lldb_private::FileSpec &file, lldb::DataBufferSP &data_sp,
222*f6aab3d8Srobert     lldb::offset_t data_offset, lldb::offset_t file_offset,
223*f6aab3d8Srobert     lldb::offset_t file_size, lldb_private::ModuleSpecList &specs) {
224*f6aab3d8Srobert   const size_t initial_count = specs.GetSize();
225*f6aab3d8Srobert 
226*f6aab3d8Srobert   DataExtractor data;
227*f6aab3d8Srobert   data.SetData(data_sp, data_offset, data_sp->GetByteSize());
228*f6aab3d8Srobert 
229*f6aab3d8Srobert   if (MagicBytesMatch(data)) {
230*f6aab3d8Srobert     std::vector<Entry> entries;
231*f6aab3d8Srobert     if (ParseHeader(data, file, file_offset, entries)) {
232*f6aab3d8Srobert       for (const Entry &entry : entries) {
233*f6aab3d8Srobert         const lldb::offset_t entry_offset = entry.fileoff + file_offset;
234*f6aab3d8Srobert         if (ObjectFile::GetModuleSpecifications(
235*f6aab3d8Srobert                 file, entry_offset, file_size - entry_offset, specs)) {
236*f6aab3d8Srobert           ModuleSpec &spec = specs.GetModuleSpecRefAtIndex(specs.GetSize() - 1);
237*f6aab3d8Srobert           spec.GetObjectName() = ConstString(entry.id);
238*f6aab3d8Srobert         }
239*f6aab3d8Srobert       }
240*f6aab3d8Srobert     }
241*f6aab3d8Srobert   }
242*f6aab3d8Srobert   return specs.GetSize() - initial_count;
243*f6aab3d8Srobert }
244*f6aab3d8Srobert 
MagicBytesMatch(DataBufferSP data_sp,lldb::addr_t data_offset,lldb::addr_t data_length)245*f6aab3d8Srobert bool ObjectContainerMachOFileset::MagicBytesMatch(DataBufferSP data_sp,
246*f6aab3d8Srobert                                                   lldb::addr_t data_offset,
247*f6aab3d8Srobert                                                   lldb::addr_t data_length) {
248*f6aab3d8Srobert   DataExtractor data;
249*f6aab3d8Srobert   data.SetData(data_sp, data_offset, data_length);
250*f6aab3d8Srobert   return MagicBytesMatch(data);
251*f6aab3d8Srobert }
252*f6aab3d8Srobert 
MagicBytesMatch(const DataExtractor & data)253*f6aab3d8Srobert bool ObjectContainerMachOFileset::MagicBytesMatch(const DataExtractor &data) {
254*f6aab3d8Srobert   lldb::offset_t offset = 0;
255*f6aab3d8Srobert   uint32_t magic = data.GetU32(&offset);
256*f6aab3d8Srobert   switch (magic) {
257*f6aab3d8Srobert   case MH_MAGIC:
258*f6aab3d8Srobert   case MH_CIGAM:
259*f6aab3d8Srobert   case MH_MAGIC_64:
260*f6aab3d8Srobert   case MH_CIGAM_64:
261*f6aab3d8Srobert     break;
262*f6aab3d8Srobert   default:
263*f6aab3d8Srobert     return false;
264*f6aab3d8Srobert   }
265*f6aab3d8Srobert   offset += 4; // cputype
266*f6aab3d8Srobert   offset += 4; // cpusubtype
267*f6aab3d8Srobert   uint32_t filetype = data.GetU32(&offset);
268*f6aab3d8Srobert   return filetype == MH_FILESET;
269*f6aab3d8Srobert }
270*f6aab3d8Srobert 
271*f6aab3d8Srobert ObjectFileSP
GetObjectFile(const lldb_private::FileSpec * file)272*f6aab3d8Srobert ObjectContainerMachOFileset::GetObjectFile(const lldb_private::FileSpec *file) {
273*f6aab3d8Srobert   ModuleSP module_sp(GetModule());
274*f6aab3d8Srobert   if (!module_sp)
275*f6aab3d8Srobert     return {};
276*f6aab3d8Srobert 
277*f6aab3d8Srobert   ConstString object_name = module_sp->GetObjectName();
278*f6aab3d8Srobert   if (!object_name)
279*f6aab3d8Srobert     return {};
280*f6aab3d8Srobert 
281*f6aab3d8Srobert   Entry *entry = FindEntry(object_name.GetCString());
282*f6aab3d8Srobert   if (!entry)
283*f6aab3d8Srobert     return {};
284*f6aab3d8Srobert 
285*f6aab3d8Srobert   DataBufferSP data_sp;
286*f6aab3d8Srobert   lldb::offset_t data_offset = 0;
287*f6aab3d8Srobert   return ObjectFile::FindPlugin(module_sp, file, m_offset + entry->fileoff,
288*f6aab3d8Srobert                                 m_data.GetByteSize() - entry->fileoff, data_sp,
289*f6aab3d8Srobert                                 data_offset);
290*f6aab3d8Srobert }
291*f6aab3d8Srobert 
292*f6aab3d8Srobert ObjectContainerMachOFileset::Entry *
FindEntry(llvm::StringRef id)293*f6aab3d8Srobert ObjectContainerMachOFileset::FindEntry(llvm::StringRef id) {
294*f6aab3d8Srobert   for (Entry &entry : m_entries) {
295*f6aab3d8Srobert     if (entry.id == id)
296*f6aab3d8Srobert       return &entry;
297*f6aab3d8Srobert   }
298*f6aab3d8Srobert   return nullptr;
299*f6aab3d8Srobert }
300