xref: /netbsd-src/external/gpl3/gdb/dist/gdb/solib-darwin.c (revision 82d56013d7b633d116a93943de88e08335357a7c)
1 /* Handle Darwin shared libraries for GDB, the GNU Debugger.
2 
3    Copyright (C) 2009-2020 Free Software Foundation, Inc.
4 
5    This file is part of GDB.
6 
7    This program is free software; you can redistribute it and/or modify
8    it under the terms of the GNU General Public License as published by
9    the Free Software Foundation; either version 3 of the License, or
10    (at your option) any later version.
11 
12    This program is distributed in the hope that it will be useful,
13    but WITHOUT ANY WARRANTY; without even the implied warranty of
14    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
15    GNU General Public License for more details.
16 
17    You should have received a copy of the GNU General Public License
18    along with this program.  If not, see <http://www.gnu.org/licenses/>.  */
19 
20 #include "defs.h"
21 
22 #include "symtab.h"
23 #include "bfd.h"
24 #include "symfile.h"
25 #include "objfiles.h"
26 #include "gdbcore.h"
27 #include "target.h"
28 #include "inferior.h"
29 #include "regcache.h"
30 #include "gdbthread.h"
31 #include "gdb_bfd.h"
32 
33 #include "solist.h"
34 #include "solib.h"
35 #include "solib-svr4.h"
36 
37 #include "bfd-target.h"
38 #include "elf-bfd.h"
39 #include "exec.h"
40 #include "auxv.h"
41 #include "mach-o.h"
42 #include "mach-o/external.h"
43 
44 struct gdb_dyld_image_info
45 {
46   /* Base address (which corresponds to the Mach-O header).  */
47   CORE_ADDR mach_header;
48   /* Image file path.  */
49   CORE_ADDR file_path;
50   /* st.m_time of image file.  */
51   unsigned long mtime;
52 };
53 
54 /* Content of inferior dyld_all_image_infos structure.
55    See /usr/include/mach-o/dyld_images.h for the documentation.  */
56 struct gdb_dyld_all_image_infos
57 {
58   /* Version (1).  */
59   unsigned int version;
60   /* Number of images.  */
61   unsigned int count;
62   /* Image description.  */
63   CORE_ADDR info;
64   /* Notifier (function called when a library is added or removed).  */
65   CORE_ADDR notifier;
66 };
67 
/* Inclusive range of dyld_all_image_infos versions this file accepts;
   see darwin_dyld_version_ok.  */
#define DYLD_VERSION_MIN 1
#define DYLD_VERSION_MAX 15
71 
72 /* Per PSPACE specific data.  */
73 struct darwin_info
74 {
75   /* Address of structure dyld_all_image_infos in inferior.  */
76   CORE_ADDR all_image_addr = 0;
77 
78   /* Gdb copy of dyld_all_info_infos.  */
79   struct gdb_dyld_all_image_infos all_image {};
80 };
81 
82 /* Per-program-space data key.  */
83 static program_space_key<darwin_info> solib_darwin_pspace_data;
84 
85 /* Get the current darwin data.  If none is found yet, add it now.  This
86    function always returns a valid object.  */
87 
88 static struct darwin_info *
89 get_darwin_info (void)
90 {
91   struct darwin_info *info;
92 
93   info = solib_darwin_pspace_data.get (current_program_space);
94   if (info != NULL)
95     return info;
96 
97   return solib_darwin_pspace_data.emplace (current_program_space);
98 }
99 
100 /* Return non-zero if the version in dyld_all_image is known.  */
101 
102 static int
103 darwin_dyld_version_ok (const struct darwin_info *info)
104 {
105   return info->all_image.version >= DYLD_VERSION_MIN
106     && info->all_image.version <= DYLD_VERSION_MAX;
107 }
108 
109 /* Read dyld_all_image from inferior.  */
110 
111 static void
112 darwin_load_image_infos (struct darwin_info *info)
113 {
114   gdb_byte buf[24];
115   enum bfd_endian byte_order = gdbarch_byte_order (target_gdbarch ());
116   struct type *ptr_type = builtin_type (target_gdbarch ())->builtin_data_ptr;
117   int len;
118 
119   /* If the structure address is not known, don't continue.  */
120   if (info->all_image_addr == 0)
121     return;
122 
123   /* The structure has 4 fields: version (4 bytes), count (4 bytes),
124      info (pointer) and notifier (pointer).  */
125   len = 4 + 4 + 2 * TYPE_LENGTH (ptr_type);
126   gdb_assert (len <= sizeof (buf));
127   memset (&info->all_image, 0, sizeof (info->all_image));
128 
129   /* Read structure raw bytes from target.  */
130   if (target_read_memory (info->all_image_addr, buf, len))
131     return;
132 
133   /* Extract the fields.  */
134   info->all_image.version = extract_unsigned_integer (buf, 4, byte_order);
135   if (!darwin_dyld_version_ok (info))
136     return;
137 
138   info->all_image.count = extract_unsigned_integer (buf + 4, 4, byte_order);
139   info->all_image.info = extract_typed_address (buf + 8, ptr_type);
140   info->all_image.notifier = extract_typed_address
141     (buf + 8 + TYPE_LENGTH (ptr_type), ptr_type);
142 }
143 
144 /* Link map info to include in an allocated so_list entry.  */
145 
146 struct lm_info_darwin : public lm_info_base
147 {
148   /* The target location of lm.  */
149   CORE_ADDR lm_addr = 0;
150 };
151 
152 /* Lookup the value for a specific symbol.  */
153 
154 static CORE_ADDR
155 lookup_symbol_from_bfd (bfd *abfd, const char *symname)
156 {
157   long storage_needed;
158   asymbol **symbol_table;
159   unsigned int number_of_symbols;
160   unsigned int i;
161   CORE_ADDR symaddr = 0;
162 
163   storage_needed = bfd_get_symtab_upper_bound (abfd);
164 
165   if (storage_needed <= 0)
166     return 0;
167 
168   symbol_table = (asymbol **) xmalloc (storage_needed);
169   number_of_symbols = bfd_canonicalize_symtab (abfd, symbol_table);
170 
171   for (i = 0; i < number_of_symbols; i++)
172     {
173       asymbol *sym = symbol_table[i];
174 
175       if (strcmp (sym->name, symname) == 0
176 	  && (sym->section->flags & (SEC_CODE | SEC_DATA)) != 0)
177 	{
178 	  /* BFD symbols are section relative.  */
179 	  symaddr = sym->value + sym->section->vma;
180 	  break;
181 	}
182     }
183   xfree (symbol_table);
184 
185   return symaddr;
186 }
187 
188 /* Return program interpreter string.  */
189 
190 static char *
191 find_program_interpreter (void)
192 {
193   char *buf = NULL;
194 
195   /* If we have an exec_bfd, get the interpreter from the load commands.  */
196   if (exec_bfd)
197     {
198       bfd_mach_o_load_command *cmd;
199 
200       if (bfd_mach_o_lookup_command (exec_bfd,
201                                      BFD_MACH_O_LC_LOAD_DYLINKER, &cmd) == 1)
202         return cmd->command.dylinker.name_str;
203     }
204 
205   /* If we didn't find it, read from memory.
206      FIXME: todo.  */
207   return buf;
208 }
209 
/* Placeholder for the open_symbol_file_object solib operation: it
   ignores FROM_TTY and always returns 0.

   Finding the main symbol file here does not look feasible, because the
   interpreter name is needed and that name is only known from the
   executable file.  Note that darwin-nat.c implements
   pid_to_exec_file.  */

static int
open_symbol_file_object (int from_tty)
{
  return 0;
}
219 
220 /* Build a list of currently loaded shared objects.  See solib-svr4.c.  */
221 
222 static struct so_list *
223 darwin_current_sos (void)
224 {
225   struct type *ptr_type = builtin_type (target_gdbarch ())->builtin_data_ptr;
226   enum bfd_endian byte_order = type_byte_order (ptr_type);
227   int ptr_len = TYPE_LENGTH (ptr_type);
228   unsigned int image_info_size;
229   struct so_list *head = NULL;
230   struct so_list *tail = NULL;
231   int i;
232   struct darwin_info *info = get_darwin_info ();
233 
234   /* Be sure image infos are loaded.  */
235   darwin_load_image_infos (info);
236 
237   if (!darwin_dyld_version_ok (info))
238     return NULL;
239 
240   image_info_size = ptr_len * 3;
241 
242   /* Read infos for each solib.
243      The first entry was rumored to be the executable itself, but this is not
244      true when a large number of shared libraries are used (table expanded ?).
245      We now check all entries, but discard executable images.  */
246   for (i = 0; i < info->all_image.count; i++)
247     {
248       CORE_ADDR iinfo = info->all_image.info + i * image_info_size;
249       gdb_byte buf[image_info_size];
250       CORE_ADDR load_addr;
251       CORE_ADDR path_addr;
252       struct mach_o_header_external hdr;
253       unsigned long hdr_val;
254 
255       /* Read image info from inferior.  */
256       if (target_read_memory (iinfo, buf, image_info_size))
257 	break;
258 
259       load_addr = extract_typed_address (buf, ptr_type);
260       path_addr = extract_typed_address (buf + ptr_len, ptr_type);
261 
262       /* Read Mach-O header from memory.  */
263       if (target_read_memory (load_addr, (gdb_byte *) &hdr, sizeof (hdr) - 4))
264 	break;
265       /* Discard wrong magic numbers.  Shouldn't happen.  */
266       hdr_val = extract_unsigned_integer
267         (hdr.magic, sizeof (hdr.magic), byte_order);
268       if (hdr_val != BFD_MACH_O_MH_MAGIC && hdr_val != BFD_MACH_O_MH_MAGIC_64)
269         continue;
270       /* Discard executable.  Should happen only once.  */
271       hdr_val = extract_unsigned_integer
272         (hdr.filetype, sizeof (hdr.filetype), byte_order);
273       if (hdr_val == BFD_MACH_O_MH_EXECUTE)
274         continue;
275 
276       gdb::unique_xmalloc_ptr<char> file_path
277 	= target_read_string (path_addr, SO_NAME_MAX_PATH_SIZE - 1);
278       if (file_path == nullptr)
279 	break;
280 
281       /* Create and fill the new so_list element.  */
282       gdb::unique_xmalloc_ptr<struct so_list> newobj (XCNEW (struct so_list));
283 
284       lm_info_darwin *li = new lm_info_darwin;
285       newobj->lm_info = li;
286 
287       strncpy (newobj->so_name, file_path.get (), SO_NAME_MAX_PATH_SIZE - 1);
288       newobj->so_name[SO_NAME_MAX_PATH_SIZE - 1] = '\0';
289       strcpy (newobj->so_original_name, newobj->so_name);
290       li->lm_addr = load_addr;
291 
292       if (head == NULL)
293 	head = newobj.get ();
294       else
295 	tail->next = newobj.get ();
296       tail = newobj.release ();
297     }
298 
299   return head;
300 }
301 
302 /* Check LOAD_ADDR points to a Mach-O executable header.  Return LOAD_ADDR
303    in case of success, 0 in case of failure.  */
304 
305 static CORE_ADDR
306 darwin_validate_exec_header (CORE_ADDR load_addr)
307 {
308   enum bfd_endian byte_order = gdbarch_byte_order (target_gdbarch ());
309   struct mach_o_header_external hdr;
310   unsigned long hdr_val;
311 
312   /* Read Mach-O header from memory.  */
313   if (target_read_memory (load_addr, (gdb_byte *) &hdr, sizeof (hdr) - 4))
314     return 0;
315 
316   /* Discard wrong magic numbers.  Shouldn't happen.  */
317   hdr_val = extract_unsigned_integer
318     (hdr.magic, sizeof (hdr.magic), byte_order);
319   if (hdr_val != BFD_MACH_O_MH_MAGIC && hdr_val != BFD_MACH_O_MH_MAGIC_64)
320     return 0;
321 
322   /* Check executable.  */
323   hdr_val = extract_unsigned_integer
324     (hdr.filetype, sizeof (hdr.filetype), byte_order);
325   if (hdr_val == BFD_MACH_O_MH_EXECUTE)
326     return load_addr;
327 
328   return 0;
329 }
330 
331 /* Get the load address of the executable using dyld list of images.
332    We assume that the dyld info are correct (which is wrong if the target
333    is stopped at the first instruction).  */
334 
335 static CORE_ADDR
336 darwin_read_exec_load_addr_from_dyld (struct darwin_info *info)
337 {
338   struct type *ptr_type = builtin_type (target_gdbarch ())->builtin_data_ptr;
339   int ptr_len = TYPE_LENGTH (ptr_type);
340   unsigned int image_info_size = ptr_len * 3;
341   int i;
342 
343   /* Read infos for each solib.  One of them should be the executable.  */
344   for (i = 0; i < info->all_image.count; i++)
345     {
346       CORE_ADDR iinfo = info->all_image.info + i * image_info_size;
347       gdb_byte buf[image_info_size];
348       CORE_ADDR load_addr;
349 
350       /* Read image info from inferior.  */
351       if (target_read_memory (iinfo, buf, image_info_size))
352 	break;
353 
354       load_addr = extract_typed_address (buf, ptr_type);
355       if (darwin_validate_exec_header (load_addr) == load_addr)
356 	return load_addr;
357     }
358 
359   return 0;
360 }
361 
362 /* Get the load address of the executable when the PC is at the dyld
363    entry point using parameter passed by the kernel (at SP). */
364 
365 static CORE_ADDR
366 darwin_read_exec_load_addr_at_init (struct darwin_info *info)
367 {
368   struct gdbarch *gdbarch = target_gdbarch ();
369   enum bfd_endian byte_order = gdbarch_byte_order (gdbarch);
370   int addr_size = gdbarch_addr_bit (gdbarch) / 8;
371   ULONGEST load_ptr_addr;
372   ULONGEST load_addr;
373   gdb_byte buf[8];
374 
375   /* Get SP.  */
376   if (regcache_cooked_read_unsigned (get_current_regcache (),
377 				     gdbarch_sp_regnum (gdbarch),
378 				     &load_ptr_addr) != REG_VALID)
379     return 0;
380 
381   /* Read value at SP (image load address).  */
382   if (target_read_memory (load_ptr_addr, buf, addr_size))
383     return 0;
384 
385   load_addr = extract_unsigned_integer (buf, addr_size, byte_order);
386 
387   return darwin_validate_exec_header (load_addr);
388 }
389 
390 /* Return 1 if PC lies in the dynamic symbol resolution code of the
391    run time loader.  */
392 
393 static int
394 darwin_in_dynsym_resolve_code (CORE_ADDR pc)
395 {
396   return 0;
397 }
398 
399 /* A wrapper for bfd_mach_o_fat_extract that handles reference
400    counting properly.  This will either return NULL, or return a new
401    reference to a BFD.  */
402 
403 static gdb_bfd_ref_ptr
404 gdb_bfd_mach_o_fat_extract (bfd *abfd, bfd_format format,
405 			    const bfd_arch_info_type *arch)
406 {
407   bfd *result = bfd_mach_o_fat_extract (abfd, format, arch);
408 
409   if (result == NULL)
410     return NULL;
411 
412   if (result == abfd)
413     gdb_bfd_ref (result);
414   else
415     gdb_bfd_mark_parent (result, abfd);
416 
417   return gdb_bfd_ref_ptr (result);
418 }
419 
420 /* Return the BFD for the program interpreter.  */
421 
422 static gdb_bfd_ref_ptr
423 darwin_get_dyld_bfd ()
424 {
425   char *interp_name;
426 
427   /* This method doesn't work with an attached process.  */
428   if (current_inferior ()->attach_flag)
429     return NULL;
430 
431   /* Find the program interpreter.  */
432   interp_name = find_program_interpreter ();
433   if (!interp_name)
434     return NULL;
435 
436   /* Create a bfd for the interpreter.  */
437   gdb_bfd_ref_ptr dyld_bfd (gdb_bfd_open (interp_name, gnutarget));
438   if (dyld_bfd != NULL)
439     {
440       gdb_bfd_ref_ptr sub
441 	(gdb_bfd_mach_o_fat_extract (dyld_bfd.get (), bfd_object,
442 				     gdbarch_bfd_arch_info (target_gdbarch ())));
443       dyld_bfd = sub;
444     }
445   return dyld_bfd;
446 }
447 
448 /* Extract dyld_all_image_addr when the process was just created, assuming the
449    current PC is at the entry of the dynamic linker.  */
450 
451 static void
452 darwin_solib_get_all_image_info_addr_at_init (struct darwin_info *info)
453 {
454   CORE_ADDR load_addr = 0;
455   gdb_bfd_ref_ptr dyld_bfd = darwin_get_dyld_bfd ();
456 
457   if (dyld_bfd == NULL)
458     return;
459 
460   /* We find the dynamic linker's base address by examining
461      the current pc (which should point at the entry point for the
462      dynamic linker) and subtracting the offset of the entry point.  */
463   load_addr = (regcache_read_pc (get_current_regcache ())
464                - bfd_get_start_address (dyld_bfd.get ()));
465 
466   /* Now try to set a breakpoint in the dynamic linker.  */
467   info->all_image_addr =
468     lookup_symbol_from_bfd (dyld_bfd.get (), "_dyld_all_image_infos");
469 
470   if (info->all_image_addr == 0)
471     return;
472 
473   info->all_image_addr += load_addr;
474 }
475 
476 /* Extract dyld_all_image_addr reading it from
477    TARGET_OBJECT_DARWIN_DYLD_INFO.  */
478 
479 static void
480 darwin_solib_read_all_image_info_addr (struct darwin_info *info)
481 {
482   gdb_byte buf[8];
483   LONGEST len;
484   struct type *ptr_type = builtin_type (target_gdbarch ())->builtin_data_ptr;
485 
486   /* Sanity check.  */
487   if (TYPE_LENGTH (ptr_type) > sizeof (buf))
488     return;
489 
490   len = target_read (current_top_target (), TARGET_OBJECT_DARWIN_DYLD_INFO,
491 		     NULL, buf, 0, TYPE_LENGTH (ptr_type));
492   if (len <= 0)
493     return;
494 
495   /* The use of BIG endian is intended, as BUF is a raw stream of bytes.  This
496       makes the support of remote protocol easier.  */
497   info->all_image_addr = extract_unsigned_integer (buf, len, BFD_ENDIAN_BIG);
498 }
499 
500 /* Shared library startup support.  See documentation in solib-svr4.c.  */
501 
502 static void
503 darwin_solib_create_inferior_hook (int from_tty)
504 {
505   struct darwin_info *info = get_darwin_info ();
506   CORE_ADDR load_addr;
507 
508   info->all_image_addr = 0;
509 
510   darwin_solib_read_all_image_info_addr (info);
511 
512   if (info->all_image_addr == 0)
513     darwin_solib_get_all_image_info_addr_at_init (info);
514 
515   if (info->all_image_addr == 0)
516     return;
517 
518   darwin_load_image_infos (info);
519 
520   if (!darwin_dyld_version_ok (info))
521     {
522       warning (_("unhandled dyld version (%d)"), info->all_image.version);
523       return;
524     }
525 
526   if (info->all_image.count != 0)
527     {
528       /* Possible relocate the main executable (PIE).  */
529       load_addr = darwin_read_exec_load_addr_from_dyld (info);
530     }
531   else
532     {
533       /* Possible issue:
534 	 Do not break on the notifier if dyld is not initialized (deduced from
535 	 count == 0).  In that case, dyld hasn't relocated itself and the
536 	 notifier may point to a wrong address.  */
537 
538       load_addr = darwin_read_exec_load_addr_at_init (info);
539     }
540 
541   if (load_addr != 0 && symfile_objfile != NULL)
542     {
543       CORE_ADDR vmaddr;
544 
545       /* Find the base address of the executable.  */
546       vmaddr = bfd_mach_o_get_base_address (exec_bfd);
547 
548       /* Relocate.  */
549       if (vmaddr != load_addr)
550 	objfile_rebase (symfile_objfile, load_addr - vmaddr);
551     }
552 
553   /* Set solib notifier (to reload list of shared libraries).  */
554   CORE_ADDR notifier = info->all_image.notifier;
555 
556   if (info->all_image.count == 0)
557     {
558       /* Dyld hasn't yet relocated itself, so the notifier address may
559 	 be incorrect (as it has to be relocated).  */
560       CORE_ADDR start = bfd_get_start_address (exec_bfd);
561       if (start == 0)
562 	notifier = 0;
563       else
564         {
565           gdb_bfd_ref_ptr dyld_bfd = darwin_get_dyld_bfd ();
566           if (dyld_bfd != NULL)
567             {
568               CORE_ADDR dyld_bfd_start_address;
569               CORE_ADDR dyld_relocated_base_address;
570               CORE_ADDR pc;
571 
572               dyld_bfd_start_address = bfd_get_start_address (dyld_bfd.get());
573 
574               /* We find the dynamic linker's base address by examining
575                  the current pc (which should point at the entry point
576                  for the dynamic linker) and subtracting the offset of
577                  the entry point.  */
578 
579               pc = regcache_read_pc (get_current_regcache ());
580               dyld_relocated_base_address = pc - dyld_bfd_start_address;
581 
582               /* We get the proper notifier relocated address by
583                  adding the dyld relocated base address to the current
584                  notifier offset value.  */
585 
586               notifier += dyld_relocated_base_address;
587             }
588         }
589     }
590 
591   /* Add the breakpoint which is hit by dyld when the list of solib is
592      modified.  */
593   if (notifier != 0)
594     create_solib_event_breakpoint (target_gdbarch (), notifier);
595 }
596 
597 static void
598 darwin_clear_solib (void)
599 {
600   struct darwin_info *info = get_darwin_info ();
601 
602   info->all_image_addr = 0;
603   info->all_image.version = 0;
604 }
605 
606 static void
607 darwin_free_so (struct so_list *so)
608 {
609   lm_info_darwin *li = (lm_info_darwin *) so->lm_info;
610 
611   delete li;
612 }
613 
614 /* The section table is built from bfd sections using bfd VMAs.
615    Relocate these VMAs according to solib info.  */
616 
617 static void
618 darwin_relocate_section_addresses (struct so_list *so,
619 				   struct target_section *sec)
620 {
621   lm_info_darwin *li = (lm_info_darwin *) so->lm_info;
622 
623   sec->addr += li->lm_addr;
624   sec->endaddr += li->lm_addr;
625 
626   /* Best effort to set addr_high/addr_low.  This is used only by
627      'info sharedlibary'.  */
628   if (so->addr_high == 0)
629     {
630       so->addr_low = sec->addr;
631       so->addr_high = sec->endaddr;
632     }
633   if (sec->endaddr > so->addr_high)
634     so->addr_high = sec->endaddr;
635   if (sec->addr < so->addr_low)
636     so->addr_low = sec->addr;
637 }
638 
639 static gdb_bfd_ref_ptr
640 darwin_bfd_open (const char *pathname)
641 {
642   int found_file;
643 
644   /* Search for shared library file.  */
645   gdb::unique_xmalloc_ptr<char> found_pathname
646     = solib_find (pathname, &found_file);
647   if (found_pathname == NULL)
648     perror_with_name (pathname);
649 
650   /* Open bfd for shared library.  */
651   gdb_bfd_ref_ptr abfd (solib_bfd_fopen (found_pathname.get (), found_file));
652 
653   gdb_bfd_ref_ptr res
654     (gdb_bfd_mach_o_fat_extract (abfd.get (), bfd_object,
655 				 gdbarch_bfd_arch_info (target_gdbarch ())));
656   if (res == NULL)
657     error (_("`%s': not a shared-library: %s"),
658 	   bfd_get_filename (abfd.get ()), bfd_errmsg (bfd_get_error ()));
659 
660   /* The current filename for fat-binary BFDs is a name generated
661      by BFD, usually a string containing the name of the architecture.
662      Reset its value to the actual filename.  */
663   bfd_set_filename (res.get (), pathname);
664 
665   return res;
666 }
667 
668 struct target_so_ops darwin_so_ops;
669 
670 void _initialize_darwin_solib ();
671 void
672 _initialize_darwin_solib ()
673 {
674   darwin_so_ops.relocate_section_addresses = darwin_relocate_section_addresses;
675   darwin_so_ops.free_so = darwin_free_so;
676   darwin_so_ops.clear_solib = darwin_clear_solib;
677   darwin_so_ops.solib_create_inferior_hook = darwin_solib_create_inferior_hook;
678   darwin_so_ops.current_sos = darwin_current_sos;
679   darwin_so_ops.open_symbol_file_object = open_symbol_file_object;
680   darwin_so_ops.in_dynsym_resolve_code = darwin_in_dynsym_resolve_code;
681   darwin_so_ops.bfd_open = darwin_bfd_open;
682 }
683