xref: /openbsd-src/gnu/usr.bin/binutils/gdb/coff-pe-read.c (revision b725ae7711052a2233e31a66fefb8a752c388d7a)
/* Read the export table symbols from a portable executable and
   convert to internal format, for GDB. Used as a last resort if no
   debugging symbols recognized.

   Copyright 2003 Free Software Foundation, Inc.

   This file is part of GDB.

   This program is free software; you can redistribute it and/or modify
   it under the terms of the GNU General Public License as published by
   the Free Software Foundation; either version 2 of the License, or
   (at your option) any later version.

   This program is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License for more details.

   You should have received a copy of the GNU General Public License
   along with this program; if not, write to the Free Software
   Foundation, Inc., 59 Temple Place - Suite 330,
   Boston, MA 02111-1307, USA.

   Contributed by Raoul M. Gough (RaoulGough@yahoo.co.uk). */
25*b725ae77Skettenis 
26*b725ae77Skettenis #include "coff-pe-read.h"
27*b725ae77Skettenis 
28*b725ae77Skettenis #include "bfd.h"
29*b725ae77Skettenis 
30*b725ae77Skettenis #include "defs.h"
31*b725ae77Skettenis #include "gdbtypes.h"
32*b725ae77Skettenis 
33*b725ae77Skettenis #include "symtab.h"
34*b725ae77Skettenis #include "symfile.h"
35*b725ae77Skettenis #include "objfiles.h"
36*b725ae77Skettenis 
37*b725ae77Skettenis /* Internal section information */
38*b725ae77Skettenis 
39*b725ae77Skettenis struct read_pe_section_data
40*b725ae77Skettenis {
41*b725ae77Skettenis   CORE_ADDR vma_offset;		/* Offset to loaded address of section. */
42*b725ae77Skettenis   unsigned long rva_start;	/* Start offset within the pe. */
43*b725ae77Skettenis   unsigned long rva_end;	/* End offset within the pe. */
44*b725ae77Skettenis   enum minimal_symbol_type ms_type;	/* Type to assign symbols in section. */
45*b725ae77Skettenis };
46*b725ae77Skettenis 
/* Indices into the section table kept by read_pe_exported_syms, which
   holds text, data and bss in that order.  */

#define PE_SECTION_INDEX_TEXT     0
#define PE_SECTION_INDEX_DATA     1
#define PE_SECTION_INDEX_BSS      2
#define PE_SECTION_TABLE_SIZE     3
#define PE_SECTION_INDEX_INVALID -1

/* Get the index of the named section in our own array, which contains
   text, data and bss in that order.  SECTION_NAME must be a
   NUL-terminated string.  Return PE_SECTION_INDEX_INVALID if passed
   an unrecognised section name.  */

static int
read_pe_section_index (const char *section_name)
{
  if (strcmp (section_name, ".text") == 0)
    return PE_SECTION_INDEX_TEXT;

  if (strcmp (section_name, ".data") == 0)
    return PE_SECTION_INDEX_DATA;

  if (strcmp (section_name, ".bss") == 0)
    return PE_SECTION_INDEX_BSS;

  return PE_SECTION_INDEX_INVALID;
}
80*b725ae77Skettenis 
81*b725ae77Skettenis /* Record the virtual memory address of a section. */
82*b725ae77Skettenis 
83*b725ae77Skettenis static void
get_section_vmas(bfd * abfd,asection * sectp,void * context)84*b725ae77Skettenis get_section_vmas (bfd *abfd, asection *sectp, void *context)
85*b725ae77Skettenis {
86*b725ae77Skettenis   struct read_pe_section_data *sections = context;
87*b725ae77Skettenis   int sectix = read_pe_section_index (sectp->name);
88*b725ae77Skettenis 
89*b725ae77Skettenis   if (sectix != PE_SECTION_INDEX_INVALID)
90*b725ae77Skettenis     {
91*b725ae77Skettenis       /* Data within the section start at rva_start in the pe and at
92*b725ae77Skettenis          bfd_get_section_vma() within memory. Store the offset. */
93*b725ae77Skettenis 
94*b725ae77Skettenis       sections[sectix].vma_offset
95*b725ae77Skettenis 	= bfd_get_section_vma (abfd, sectp) - sections[sectix].rva_start;
96*b725ae77Skettenis     }
97*b725ae77Skettenis }
98*b725ae77Skettenis 
99*b725ae77Skettenis /* Create a minimal symbol entry for an exported symbol. */
100*b725ae77Skettenis 
101*b725ae77Skettenis static void
add_pe_exported_sym(char * sym_name,unsigned long func_rva,const struct read_pe_section_data * section_data,const char * dll_name,struct objfile * objfile)102*b725ae77Skettenis add_pe_exported_sym (char *sym_name,
103*b725ae77Skettenis 		     unsigned long func_rva,
104*b725ae77Skettenis 		     const struct read_pe_section_data *section_data,
105*b725ae77Skettenis 		     const char *dll_name, struct objfile *objfile)
106*b725ae77Skettenis {
107*b725ae77Skettenis   /* Add the stored offset to get the loaded address of the symbol. */
108*b725ae77Skettenis 
109*b725ae77Skettenis   CORE_ADDR vma = func_rva + section_data->vma_offset;
110*b725ae77Skettenis 
111*b725ae77Skettenis   char *qualified_name = 0;
112*b725ae77Skettenis   int dll_name_len = strlen (dll_name);
113*b725ae77Skettenis   int count;
114*b725ae77Skettenis 
115*b725ae77Skettenis   /* Generate a (hopefully unique) qualified name using the first part
116*b725ae77Skettenis      of the dll name, e.g. KERNEL32!AddAtomA. This matches the style
117*b725ae77Skettenis      used by windbg from the "Microsoft Debugging Tools for Windows". */
118*b725ae77Skettenis 
119*b725ae77Skettenis   qualified_name = xmalloc (dll_name_len + strlen (sym_name) + 2);
120*b725ae77Skettenis 
121*b725ae77Skettenis   strncpy (qualified_name, dll_name, dll_name_len);
122*b725ae77Skettenis   qualified_name[dll_name_len] = '!';
123*b725ae77Skettenis   strcpy (qualified_name + dll_name_len + 1, sym_name);
124*b725ae77Skettenis 
125*b725ae77Skettenis   prim_record_minimal_symbol (qualified_name,
126*b725ae77Skettenis 			      vma, section_data->ms_type, objfile);
127*b725ae77Skettenis 
128*b725ae77Skettenis   xfree (qualified_name);
129*b725ae77Skettenis 
130*b725ae77Skettenis   /* Enter the plain name as well, which might not be unique. */
131*b725ae77Skettenis   prim_record_minimal_symbol (sym_name, vma, section_data->ms_type, objfile);
132*b725ae77Skettenis }
133*b725ae77Skettenis 
/* Truncate DLL_NAME in place at the first dot character.  A name
   without a dot is left untouched (nothing is written to it).  */

static void
read_pe_truncate_name (char *dll_name)
{
  char *cursor = dll_name;

  /* Stop at the first dot or at the end of the string.  */
  while (*cursor != '\0' && *cursor != '.')
    {
      ++cursor;
    }

  if (*cursor == '.')
    {
      *cursor = '\0';
    }
}
151*b725ae77Skettenis }
152*b725ae77Skettenis 
153*b725ae77Skettenis /* Low-level support functions, direct from the ld module pe-dll.c. */
154*b725ae77Skettenis static unsigned int
pe_get16(bfd * abfd,int where)155*b725ae77Skettenis pe_get16 (bfd *abfd, int where)
156*b725ae77Skettenis {
157*b725ae77Skettenis   unsigned char b[2];
158*b725ae77Skettenis 
159*b725ae77Skettenis   bfd_seek (abfd, (file_ptr) where, SEEK_SET);
160*b725ae77Skettenis   bfd_bread (b, (bfd_size_type) 2, abfd);
161*b725ae77Skettenis   return b[0] + (b[1] << 8);
162*b725ae77Skettenis }
163*b725ae77Skettenis 
164*b725ae77Skettenis static unsigned int
pe_get32(bfd * abfd,int where)165*b725ae77Skettenis pe_get32 (bfd *abfd, int where)
166*b725ae77Skettenis {
167*b725ae77Skettenis   unsigned char b[4];
168*b725ae77Skettenis 
169*b725ae77Skettenis   bfd_seek (abfd, (file_ptr) where, SEEK_SET);
170*b725ae77Skettenis   bfd_bread (b, (bfd_size_type) 4, abfd);
171*b725ae77Skettenis   return b[0] + (b[1] << 8) + (b[2] << 16) + (b[3] << 24);
172*b725ae77Skettenis }
173*b725ae77Skettenis 
174*b725ae77Skettenis static unsigned int
pe_as32(void * ptr)175*b725ae77Skettenis pe_as32 (void *ptr)
176*b725ae77Skettenis {
177*b725ae77Skettenis   unsigned char *b = ptr;
178*b725ae77Skettenis 
179*b725ae77Skettenis   return b[0] + (b[1] << 8) + (b[2] << 16) + (b[3] << 24);
180*b725ae77Skettenis }
181*b725ae77Skettenis 
182*b725ae77Skettenis /* Read the (non-debug) export symbol table from a portable
183*b725ae77Skettenis    executable. Code originally lifted from the ld function
184*b725ae77Skettenis    pe_implied_import_dll in pe-dll.c. */
185*b725ae77Skettenis 
186*b725ae77Skettenis void
read_pe_exported_syms(struct objfile * objfile)187*b725ae77Skettenis read_pe_exported_syms (struct objfile *objfile)
188*b725ae77Skettenis {
189*b725ae77Skettenis   bfd *dll = objfile->obfd;
190*b725ae77Skettenis   unsigned long pe_header_offset, opthdr_ofs, num_entries, i;
191*b725ae77Skettenis   unsigned long export_rva, export_size, nsections, secptr, expptr;
192*b725ae77Skettenis   unsigned long exp_funcbase;
193*b725ae77Skettenis   unsigned char *expdata, *erva;
194*b725ae77Skettenis   unsigned long name_rvas, ordinals, nexp, ordbase;
195*b725ae77Skettenis   char *dll_name;
196*b725ae77Skettenis 
197*b725ae77Skettenis   /* Array elements are for text, data and bss in that order
198*b725ae77Skettenis      Initialization with start_rva > end_rva guarantees that
199*b725ae77Skettenis      unused sections won't be matched. */
200*b725ae77Skettenis   struct read_pe_section_data section_data[PE_SECTION_TABLE_SIZE]
201*b725ae77Skettenis     = { {0, 1, 0, mst_text},
202*b725ae77Skettenis   {0, 1, 0, mst_data},
203*b725ae77Skettenis   {0, 1, 0, mst_bss}
204*b725ae77Skettenis   };
205*b725ae77Skettenis 
206*b725ae77Skettenis   struct cleanup *back_to = 0;
207*b725ae77Skettenis 
208*b725ae77Skettenis   char const *target = bfd_get_target (objfile->obfd);
209*b725ae77Skettenis 
210*b725ae77Skettenis   if ((strcmp (target, "pe-i386") != 0) && (strcmp (target, "pei-i386") != 0))
211*b725ae77Skettenis     {
212*b725ae77Skettenis       /* This is not an i386 format file. Abort now, because the code
213*b725ae77Skettenis          is untested on anything else. *FIXME* test on further
214*b725ae77Skettenis          architectures and loosen or remove this test. */
215*b725ae77Skettenis       return;
216*b725ae77Skettenis     }
217*b725ae77Skettenis 
218*b725ae77Skettenis   /* Get pe_header, optional header and numbers of export entries.  */
219*b725ae77Skettenis   pe_header_offset = pe_get32 (dll, 0x3c);
220*b725ae77Skettenis   opthdr_ofs = pe_header_offset + 4 + 20;
221*b725ae77Skettenis   num_entries = pe_get32 (dll, opthdr_ofs + 92);
222*b725ae77Skettenis 
223*b725ae77Skettenis   if (num_entries < 1)		/* No exports.  */
224*b725ae77Skettenis     {
225*b725ae77Skettenis       return;
226*b725ae77Skettenis     }
227*b725ae77Skettenis 
228*b725ae77Skettenis   export_rva = pe_get32 (dll, opthdr_ofs + 96);
229*b725ae77Skettenis   export_size = pe_get32 (dll, opthdr_ofs + 100);
230*b725ae77Skettenis   nsections = pe_get16 (dll, pe_header_offset + 4 + 2);
231*b725ae77Skettenis   secptr = (pe_header_offset + 4 + 20 +
232*b725ae77Skettenis 	    pe_get16 (dll, pe_header_offset + 4 + 16));
233*b725ae77Skettenis   expptr = 0;
234*b725ae77Skettenis 
235*b725ae77Skettenis   /* Get the rva and size of the export section.  */
236*b725ae77Skettenis   for (i = 0; i < nsections; i++)
237*b725ae77Skettenis     {
238*b725ae77Skettenis       char sname[8];
239*b725ae77Skettenis       unsigned long secptr1 = secptr + 40 * i;
240*b725ae77Skettenis       unsigned long vaddr = pe_get32 (dll, secptr1 + 12);
241*b725ae77Skettenis       unsigned long vsize = pe_get32 (dll, secptr1 + 16);
242*b725ae77Skettenis       unsigned long fptr = pe_get32 (dll, secptr1 + 20);
243*b725ae77Skettenis 
244*b725ae77Skettenis       bfd_seek (dll, (file_ptr) secptr1, SEEK_SET);
245*b725ae77Skettenis       bfd_bread (sname, (bfd_size_type) 8, dll);
246*b725ae77Skettenis 
247*b725ae77Skettenis       if (vaddr <= export_rva && vaddr + vsize > export_rva)
248*b725ae77Skettenis 	{
249*b725ae77Skettenis 	  expptr = fptr + (export_rva - vaddr);
250*b725ae77Skettenis 	  if (export_rva + export_size > vaddr + vsize)
251*b725ae77Skettenis 	    export_size = vsize - (export_rva - vaddr);
252*b725ae77Skettenis 	  break;
253*b725ae77Skettenis 	}
254*b725ae77Skettenis     }
255*b725ae77Skettenis 
256*b725ae77Skettenis   if (export_size == 0)
257*b725ae77Skettenis     {
258*b725ae77Skettenis       /* Empty export table. */
259*b725ae77Skettenis       return;
260*b725ae77Skettenis     }
261*b725ae77Skettenis 
262*b725ae77Skettenis   /* Scan sections and store the base and size of the relevant sections. */
263*b725ae77Skettenis   for (i = 0; i < nsections; i++)
264*b725ae77Skettenis     {
265*b725ae77Skettenis       unsigned long secptr1 = secptr + 40 * i;
266*b725ae77Skettenis       unsigned long vsize = pe_get32 (dll, secptr1 + 8);
267*b725ae77Skettenis       unsigned long vaddr = pe_get32 (dll, secptr1 + 12);
268*b725ae77Skettenis       unsigned long flags = pe_get32 (dll, secptr1 + 36);
269*b725ae77Skettenis       char sec_name[9];
270*b725ae77Skettenis       int sectix;
271*b725ae77Skettenis 
272*b725ae77Skettenis       sec_name[8] = '\0';
273*b725ae77Skettenis       bfd_seek (dll, (file_ptr) secptr1 + 0, SEEK_SET);
274*b725ae77Skettenis       bfd_bread (sec_name, (bfd_size_type) 8, dll);
275*b725ae77Skettenis 
276*b725ae77Skettenis       sectix = read_pe_section_index (sec_name);
277*b725ae77Skettenis 
278*b725ae77Skettenis       if (sectix != PE_SECTION_INDEX_INVALID)
279*b725ae77Skettenis 	{
280*b725ae77Skettenis 	  section_data[sectix].rva_start = vaddr;
281*b725ae77Skettenis 	  section_data[sectix].rva_end = vaddr + vsize;
282*b725ae77Skettenis 	}
283*b725ae77Skettenis     }
284*b725ae77Skettenis 
285*b725ae77Skettenis   expdata = (unsigned char *) xmalloc (export_size);
286*b725ae77Skettenis   back_to = make_cleanup (xfree, expdata);
287*b725ae77Skettenis 
288*b725ae77Skettenis   bfd_seek (dll, (file_ptr) expptr, SEEK_SET);
289*b725ae77Skettenis   bfd_bread (expdata, (bfd_size_type) export_size, dll);
290*b725ae77Skettenis   erva = expdata - export_rva;
291*b725ae77Skettenis 
292*b725ae77Skettenis   nexp = pe_as32 (expdata + 24);
293*b725ae77Skettenis   name_rvas = pe_as32 (expdata + 32);
294*b725ae77Skettenis   ordinals = pe_as32 (expdata + 36);
295*b725ae77Skettenis   ordbase = pe_as32 (expdata + 16);
296*b725ae77Skettenis   exp_funcbase = pe_as32 (expdata + 28);
297*b725ae77Skettenis 
298*b725ae77Skettenis   /* Use internal dll name instead of full pathname. */
299*b725ae77Skettenis   dll_name = pe_as32 (expdata + 12) + erva;
300*b725ae77Skettenis 
301*b725ae77Skettenis   bfd_map_over_sections (dll, get_section_vmas, section_data);
302*b725ae77Skettenis 
303*b725ae77Skettenis   /* Adjust the vma_offsets in case this PE got relocated. This
304*b725ae77Skettenis      assumes that *all* sections share the same relocation offset
305*b725ae77Skettenis      as the text section. */
306*b725ae77Skettenis   for (i = 0; i < PE_SECTION_TABLE_SIZE; i++)
307*b725ae77Skettenis     {
308*b725ae77Skettenis       section_data[i].vma_offset
309*b725ae77Skettenis 	+= ANOFFSET (objfile->section_offsets, SECT_OFF_TEXT (objfile));
310*b725ae77Skettenis     }
311*b725ae77Skettenis 
312*b725ae77Skettenis   printf_filtered ("Minimal symbols from %s...", dll_name);
313*b725ae77Skettenis   wrap_here ("");
314*b725ae77Skettenis 
315*b725ae77Skettenis   /* Truncate name at first dot. Should maybe also convert to all
316*b725ae77Skettenis      lower case for convenience on Windows. */
317*b725ae77Skettenis   read_pe_truncate_name (dll_name);
318*b725ae77Skettenis 
319*b725ae77Skettenis   /* Iterate through the list of symbols.  */
320*b725ae77Skettenis   for (i = 0; i < nexp; i++)
321*b725ae77Skettenis     {
322*b725ae77Skettenis       /* Pointer to the names vector.  */
323*b725ae77Skettenis       unsigned long name_rva = pe_as32 (erva + name_rvas + i * 4);
324*b725ae77Skettenis 
325*b725ae77Skettenis       /* Pointer to the function address vector.  */
326*b725ae77Skettenis       unsigned long func_rva = pe_as32 (erva + exp_funcbase + i * 4);
327*b725ae77Skettenis 
328*b725ae77Skettenis       /* Find this symbol's section in our own array. */
329*b725ae77Skettenis       int sectix = 0;
330*b725ae77Skettenis 
331*b725ae77Skettenis       for (sectix = 0; sectix < PE_SECTION_TABLE_SIZE; ++sectix)
332*b725ae77Skettenis 	{
333*b725ae77Skettenis 	  if ((func_rva >= section_data[sectix].rva_start)
334*b725ae77Skettenis 	      && (func_rva < section_data[sectix].rva_end))
335*b725ae77Skettenis 	    {
336*b725ae77Skettenis 	      add_pe_exported_sym (erva + name_rva,
337*b725ae77Skettenis 				   func_rva,
338*b725ae77Skettenis 				   section_data + sectix, dll_name, objfile);
339*b725ae77Skettenis 	      break;
340*b725ae77Skettenis 	    }
341*b725ae77Skettenis 	}
342*b725ae77Skettenis     }
343*b725ae77Skettenis 
344*b725ae77Skettenis   /* discard expdata. */
345*b725ae77Skettenis   do_cleanups (back_to);
346*b725ae77Skettenis }
347