1*a9fa9459Szrj // reduced_debug_output.cc -- output reduced debugging information to save space
2*a9fa9459Szrj
3*a9fa9459Szrj // Copyright (C) 2008-2016 Free Software Foundation, Inc.
4*a9fa9459Szrj // Written by Caleb Howe <cshowe@google.com>.
5*a9fa9459Szrj
6*a9fa9459Szrj // This file is part of gold.
7*a9fa9459Szrj
8*a9fa9459Szrj // This program is free software; you can redistribute it and/or modify
9*a9fa9459Szrj // it under the terms of the GNU General Public License as published by
10*a9fa9459Szrj // the Free Software Foundation; either version 3 of the License, or
11*a9fa9459Szrj // (at your option) any later version.
12*a9fa9459Szrj
13*a9fa9459Szrj // This program is distributed in the hope that it will be useful,
14*a9fa9459Szrj // but WITHOUT ANY WARRANTY; without even the implied warranty of
15*a9fa9459Szrj // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16*a9fa9459Szrj // GNU General Public License for more details.
17*a9fa9459Szrj
18*a9fa9459Szrj // You should have received a copy of the GNU General Public License
19*a9fa9459Szrj // along with this program; if not, write to the Free Software
20*a9fa9459Szrj // Foundation, Inc., 51 Franklin Street - Fifth Floor, Boston,
21*a9fa9459Szrj // MA 02110-1301, USA.
22*a9fa9459Szrj
23*a9fa9459Szrj #include "gold.h"
24*a9fa9459Szrj
25*a9fa9459Szrj #include "parameters.h"
26*a9fa9459Szrj #include "options.h"
27*a9fa9459Szrj #include "dwarf.h"
28*a9fa9459Szrj #include "dwarf_reader.h"
29*a9fa9459Szrj #include "reduced_debug_output.h"
30*a9fa9459Szrj #include "int_encoding.h"
31*a9fa9459Szrj
32*a9fa9459Szrj #include <vector>
33*a9fa9459Szrj
34*a9fa9459Szrj namespace gold
35*a9fa9459Szrj {
36*a9fa9459Szrj
37*a9fa9459Szrj // Given a pointer to the beginning of a die and the beginning of the associated
38*a9fa9459Szrj // abbreviation fills in die_end with the end of the information entry. If
39*a9fa9459Szrj // successful returns true. Get_die_end also takes a pointer to the end of the
40*a9fa9459Szrj // buffer containing the die. If die_end would be beyond the end of the
41*a9fa9459Szrj // buffer, or if an unsupported dwarf form is encountered returns false.
42*a9fa9459Szrj bool
get_die_end(unsigned char * die,unsigned char * abbrev,unsigned char ** die_end,unsigned char * buffer_end,int address_size,bool is64)43*a9fa9459Szrj Output_reduced_debug_info_section::get_die_end(
44*a9fa9459Szrj unsigned char* die, unsigned char* abbrev, unsigned char** die_end,
45*a9fa9459Szrj unsigned char* buffer_end, int address_size, bool is64)
46*a9fa9459Szrj {
47*a9fa9459Szrj size_t LEB_size;
48*a9fa9459Szrj uint64_t LEB_decoded;
49*a9fa9459Szrj for(;;)
50*a9fa9459Szrj {
51*a9fa9459Szrj uint64_t attribute = read_unsigned_LEB_128(abbrev, &LEB_size);
52*a9fa9459Szrj abbrev += LEB_size;
53*a9fa9459Szrj elfcpp::DW_FORM form =
54*a9fa9459Szrj static_cast<elfcpp::DW_FORM>(read_unsigned_LEB_128(abbrev,
55*a9fa9459Szrj &LEB_size));
56*a9fa9459Szrj abbrev += LEB_size;
57*a9fa9459Szrj if (!(attribute || form))
58*a9fa9459Szrj break;
59*a9fa9459Szrj if (die >= buffer_end)
60*a9fa9459Szrj return false;
61*a9fa9459Szrj switch(form)
62*a9fa9459Szrj {
63*a9fa9459Szrj case elfcpp::DW_FORM_flag_present:
64*a9fa9459Szrj break;
65*a9fa9459Szrj case elfcpp::DW_FORM_strp:
66*a9fa9459Szrj case elfcpp::DW_FORM_sec_offset:
67*a9fa9459Szrj die += is64 ? 8 : 4;
68*a9fa9459Szrj break;
69*a9fa9459Szrj case elfcpp::DW_FORM_addr:
70*a9fa9459Szrj case elfcpp::DW_FORM_ref_addr:
71*a9fa9459Szrj die += address_size;
72*a9fa9459Szrj break;
73*a9fa9459Szrj case elfcpp::DW_FORM_block1:
74*a9fa9459Szrj die += *die;
75*a9fa9459Szrj die += 1;
76*a9fa9459Szrj break;
77*a9fa9459Szrj case elfcpp::DW_FORM_block2:
78*a9fa9459Szrj {
79*a9fa9459Szrj uint16_t block_size;
80*a9fa9459Szrj block_size = read_from_pointer<16>(&die);
81*a9fa9459Szrj die += block_size;
82*a9fa9459Szrj break;
83*a9fa9459Szrj }
84*a9fa9459Szrj case elfcpp::DW_FORM_block4:
85*a9fa9459Szrj {
86*a9fa9459Szrj uint32_t block_size;
87*a9fa9459Szrj block_size = read_from_pointer<32>(&die);
88*a9fa9459Szrj die += block_size;
89*a9fa9459Szrj break;
90*a9fa9459Szrj }
91*a9fa9459Szrj case elfcpp::DW_FORM_block:
92*a9fa9459Szrj case elfcpp::DW_FORM_exprloc:
93*a9fa9459Szrj LEB_decoded = read_unsigned_LEB_128(die, &LEB_size);
94*a9fa9459Szrj die += (LEB_decoded + LEB_size);
95*a9fa9459Szrj break;
96*a9fa9459Szrj case elfcpp::DW_FORM_data1:
97*a9fa9459Szrj case elfcpp::DW_FORM_ref1:
98*a9fa9459Szrj case elfcpp::DW_FORM_flag:
99*a9fa9459Szrj die += 1;
100*a9fa9459Szrj break;
101*a9fa9459Szrj case elfcpp::DW_FORM_data2:
102*a9fa9459Szrj case elfcpp::DW_FORM_ref2:
103*a9fa9459Szrj die += 2;
104*a9fa9459Szrj break;
105*a9fa9459Szrj case elfcpp::DW_FORM_data4:
106*a9fa9459Szrj case elfcpp::DW_FORM_ref4:
107*a9fa9459Szrj die += 4;
108*a9fa9459Szrj break;
109*a9fa9459Szrj case elfcpp::DW_FORM_data8:
110*a9fa9459Szrj case elfcpp::DW_FORM_ref8:
111*a9fa9459Szrj case elfcpp::DW_FORM_ref_sig8:
112*a9fa9459Szrj die += 8;
113*a9fa9459Szrj break;
114*a9fa9459Szrj case elfcpp::DW_FORM_ref_udata:
115*a9fa9459Szrj case elfcpp::DW_FORM_udata:
116*a9fa9459Szrj read_unsigned_LEB_128(die, &LEB_size);
117*a9fa9459Szrj die += LEB_size;
118*a9fa9459Szrj break;
119*a9fa9459Szrj case elfcpp::DW_FORM_sdata:
120*a9fa9459Szrj read_signed_LEB_128(die, &LEB_size);
121*a9fa9459Szrj die += LEB_size;
122*a9fa9459Szrj break;
123*a9fa9459Szrj case elfcpp::DW_FORM_string:
124*a9fa9459Szrj {
125*a9fa9459Szrj size_t length = strlen(reinterpret_cast<char*>(die));
126*a9fa9459Szrj die += length + 1;
127*a9fa9459Szrj break;
128*a9fa9459Szrj }
129*a9fa9459Szrj case elfcpp::DW_FORM_indirect:
130*a9fa9459Szrj case elfcpp::DW_FORM_GNU_addr_index:
131*a9fa9459Szrj case elfcpp::DW_FORM_GNU_str_index:
132*a9fa9459Szrj default:
133*a9fa9459Szrj return false;
134*a9fa9459Szrj }
135*a9fa9459Szrj }
136*a9fa9459Szrj *die_end = die;
137*a9fa9459Szrj return true;
138*a9fa9459Szrj }
139*a9fa9459Szrj
140*a9fa9459Szrj void
set_final_data_size()141*a9fa9459Szrj Output_reduced_debug_abbrev_section::set_final_data_size()
142*a9fa9459Szrj {
143*a9fa9459Szrj if (this->sized_ || this->failed_)
144*a9fa9459Szrj return;
145*a9fa9459Szrj
146*a9fa9459Szrj uint64_t abbrev_number;
147*a9fa9459Szrj size_t LEB_size;
148*a9fa9459Szrj unsigned char* abbrev_data = this->postprocessing_buffer();
149*a9fa9459Szrj unsigned char* abbrev_end = this->postprocessing_buffer() +
150*a9fa9459Szrj this->postprocessing_buffer_size();
151*a9fa9459Szrj this->write_to_postprocessing_buffer();
152*a9fa9459Szrj while(abbrev_data < abbrev_end)
153*a9fa9459Szrj {
154*a9fa9459Szrj uint64_t abbrev_offset = abbrev_data - this->postprocessing_buffer();
155*a9fa9459Szrj while((abbrev_number = read_unsigned_LEB_128(abbrev_data, &LEB_size)))
156*a9fa9459Szrj {
157*a9fa9459Szrj if (abbrev_data >= abbrev_end)
158*a9fa9459Szrj {
159*a9fa9459Szrj failed("Debug abbreviations extend beyond .debug_abbrev "
160*a9fa9459Szrj "section; failed to reduce debug abbreviations");
161*a9fa9459Szrj return;
162*a9fa9459Szrj }
163*a9fa9459Szrj abbrev_data += LEB_size;
164*a9fa9459Szrj
165*a9fa9459Szrj // Together with the abbreviation number these fields make up
166*a9fa9459Szrj // the header for each abbreviation.
167*a9fa9459Szrj uint64_t abbrev_type = read_unsigned_LEB_128(abbrev_data, &LEB_size);
168*a9fa9459Szrj abbrev_data += LEB_size;
169*a9fa9459Szrj
170*a9fa9459Szrj // This would ordinarily be the has_children field of the
171*a9fa9459Szrj // abbreviation. But it's going to be false after reducing the
172*a9fa9459Szrj // information, so there's no point in storing it.
173*a9fa9459Szrj abbrev_data++;
174*a9fa9459Szrj
175*a9fa9459Szrj // Read to the end of the current abbreviation.
176*a9fa9459Szrj // This is indicated by two zero unsigned LEBs in a row. We don't
177*a9fa9459Szrj // need to parse the data yet, so we just scan through the data
178*a9fa9459Szrj // looking for two consecutive 0 bytes indicating the end of the
179*a9fa9459Szrj // abbreviation.
180*a9fa9459Szrj unsigned char* current_abbrev;
181*a9fa9459Szrj for (current_abbrev = abbrev_data;
182*a9fa9459Szrj current_abbrev[0] || current_abbrev[1];
183*a9fa9459Szrj current_abbrev++)
184*a9fa9459Szrj {
185*a9fa9459Szrj if (current_abbrev >= abbrev_end)
186*a9fa9459Szrj {
187*a9fa9459Szrj this->failed(_("Debug abbreviations extend beyond "
188*a9fa9459Szrj ".debug_abbrev section; failed to reduce "
189*a9fa9459Szrj "debug abbreviations"));
190*a9fa9459Szrj return;
191*a9fa9459Szrj }
192*a9fa9459Szrj }
193*a9fa9459Szrj // Account for the two nulls and advance to the start of the
194*a9fa9459Szrj // next abbreviation.
195*a9fa9459Szrj current_abbrev += 2;
196*a9fa9459Szrj
197*a9fa9459Szrj // We're eliminating every entry except for compile units, so we
198*a9fa9459Szrj // only need to store abbreviations that describe them
199*a9fa9459Szrj if (abbrev_type == elfcpp::DW_TAG_compile_unit)
200*a9fa9459Szrj {
201*a9fa9459Szrj write_unsigned_LEB_128(&this->data_, ++this->abbrev_count_);
202*a9fa9459Szrj write_unsigned_LEB_128(&this->data_, abbrev_type);
203*a9fa9459Szrj // has_children is false for all entries
204*a9fa9459Szrj this->data_.push_back(0);
205*a9fa9459Szrj this->abbrev_mapping_[std::make_pair(abbrev_offset,
206*a9fa9459Szrj abbrev_number)] =
207*a9fa9459Szrj std::make_pair(abbrev_count_, this->data_.size());
208*a9fa9459Szrj this->data_.insert(this->data_.end(), abbrev_data,
209*a9fa9459Szrj current_abbrev);
210*a9fa9459Szrj }
211*a9fa9459Szrj abbrev_data = current_abbrev;
212*a9fa9459Szrj }
213*a9fa9459Szrj gold_assert(LEB_size == 1);
214*a9fa9459Szrj abbrev_data += LEB_size;
215*a9fa9459Szrj }
216*a9fa9459Szrj // Null terminate the list of abbreviations
217*a9fa9459Szrj this->data_.push_back(0);
218*a9fa9459Szrj this->set_data_size(data_.size());
219*a9fa9459Szrj this->sized_ = true;
220*a9fa9459Szrj }
221*a9fa9459Szrj
222*a9fa9459Szrj void
do_write(Output_file * of)223*a9fa9459Szrj Output_reduced_debug_abbrev_section::do_write(Output_file* of)
224*a9fa9459Szrj {
225*a9fa9459Szrj off_t offset = this->offset();
226*a9fa9459Szrj off_t data_size = this->data_size();
227*a9fa9459Szrj unsigned char* view = of->get_output_view(offset, data_size);
228*a9fa9459Szrj if (this->failed_)
229*a9fa9459Szrj memcpy(view, this->postprocessing_buffer(),
230*a9fa9459Szrj this->postprocessing_buffer_size());
231*a9fa9459Szrj else
232*a9fa9459Szrj memcpy(view, &this->data_.front(), data_size);
233*a9fa9459Szrj of->write_output_view(offset, data_size, view);
234*a9fa9459Szrj }
235*a9fa9459Szrj
236*a9fa9459Szrj // Locates the abbreviation with abbreviation_number abbrev_number in the
237*a9fa9459Szrj // abbreviation table at offset abbrev_offset. abbrev_number is updated with
238*a9fa9459Szrj // its new abbreviation number and a pointer to the beginning of the
239*a9fa9459Szrj // abbreviation is returned.
240*a9fa9459Szrj unsigned char*
get_new_abbrev(uint64_t * abbrev_number,uint64_t abbrev_offset)241*a9fa9459Szrj Output_reduced_debug_abbrev_section::get_new_abbrev(
242*a9fa9459Szrj uint64_t* abbrev_number, uint64_t abbrev_offset)
243*a9fa9459Szrj {
244*a9fa9459Szrj set_final_data_size();
245*a9fa9459Szrj std::pair<uint64_t, uint64_t> abbrev_info =
246*a9fa9459Szrj this->abbrev_mapping_[std::make_pair(abbrev_offset, *abbrev_number)];
247*a9fa9459Szrj *abbrev_number = abbrev_info.first;
248*a9fa9459Szrj return &this->data_[abbrev_info.second];
249*a9fa9459Szrj }
250*a9fa9459Szrj
set_final_data_size()251*a9fa9459Szrj void Output_reduced_debug_info_section::set_final_data_size()
252*a9fa9459Szrj {
253*a9fa9459Szrj if (this->failed_)
254*a9fa9459Szrj return;
255*a9fa9459Szrj unsigned char* debug_info = this->postprocessing_buffer();
256*a9fa9459Szrj unsigned char* debug_info_end = (this->postprocessing_buffer()
257*a9fa9459Szrj + this->postprocessing_buffer_size());
258*a9fa9459Szrj unsigned char* next_compile_unit;
259*a9fa9459Szrj this->write_to_postprocessing_buffer();
260*a9fa9459Szrj
261*a9fa9459Szrj while (debug_info < debug_info_end)
262*a9fa9459Szrj {
263*a9fa9459Szrj uint32_t compile_unit_start = read_from_pointer<32>(&debug_info);
264*a9fa9459Szrj // The first 4 bytes of each compile unit determine whether or
265*a9fa9459Szrj // not we're using dwarf32 or dwarf64. This is not necessarily
266*a9fa9459Szrj // related to whether the binary is 32 or 64 bits.
267*a9fa9459Szrj if (compile_unit_start == 0xFFFFFFFF)
268*a9fa9459Szrj {
269*a9fa9459Szrj // Technically the size can be up to 96 bits. Rather than handle
270*a9fa9459Szrj // 96/128 bit integers we just truncate the size at 64 bits.
271*a9fa9459Szrj if (0 != read_from_pointer<32>(&debug_info))
272*a9fa9459Szrj {
273*a9fa9459Szrj this->failed(_("Extremely large compile unit in debug info; "
274*a9fa9459Szrj "failed to reduce debug info"));
275*a9fa9459Szrj return;
276*a9fa9459Szrj }
277*a9fa9459Szrj const int dwarf64_header_size = sizeof(uint64_t) + sizeof(uint16_t) +
278*a9fa9459Szrj sizeof(uint64_t) + sizeof(uint8_t);
279*a9fa9459Szrj if (debug_info + dwarf64_header_size >= debug_info_end)
280*a9fa9459Szrj {
281*a9fa9459Szrj this->failed(_("Debug info extends beyond .debug_info section;"
282*a9fa9459Szrj "failed to reduce debug info"));
283*a9fa9459Szrj return;
284*a9fa9459Szrj }
285*a9fa9459Szrj
286*a9fa9459Szrj uint64_t compile_unit_size = read_from_pointer<64>(&debug_info);
287*a9fa9459Szrj next_compile_unit = debug_info + compile_unit_size;
288*a9fa9459Szrj uint16_t version = read_from_pointer<16>(&debug_info);
289*a9fa9459Szrj uint64_t abbrev_offset = read_from_pointer<64>(&debug_info);
290*a9fa9459Szrj uint8_t address_size = read_from_pointer<8>(&debug_info);
291*a9fa9459Szrj size_t LEB_size;
292*a9fa9459Szrj uint64_t abbreviation_number = read_unsigned_LEB_128(debug_info,
293*a9fa9459Szrj &LEB_size);
294*a9fa9459Szrj debug_info += LEB_size;
295*a9fa9459Szrj unsigned char* die_abbrev = this->associated_abbrev_->get_new_abbrev(
296*a9fa9459Szrj &abbreviation_number, abbrev_offset);
297*a9fa9459Szrj unsigned char* die_end;
298*a9fa9459Szrj if (!this->get_die_end(debug_info, die_abbrev, &die_end,
299*a9fa9459Szrj debug_info_end, address_size, true))
300*a9fa9459Szrj {
301*a9fa9459Szrj this->failed(_("Invalid DIE in debug info; "
302*a9fa9459Szrj "failed to reduce debug info"));
303*a9fa9459Szrj return;
304*a9fa9459Szrj }
305*a9fa9459Szrj
306*a9fa9459Szrj insert_into_vector<32>(&this->data_, 0xFFFFFFFF);
307*a9fa9459Szrj insert_into_vector<32>(&this->data_, 0);
308*a9fa9459Szrj insert_into_vector<64>(
309*a9fa9459Szrj &this->data_,
310*a9fa9459Szrj (11 + get_length_as_unsigned_LEB_128(abbreviation_number)
311*a9fa9459Szrj + die_end - debug_info));
312*a9fa9459Szrj insert_into_vector<16>(&this->data_, version);
313*a9fa9459Szrj insert_into_vector<64>(&this->data_, 0);
314*a9fa9459Szrj insert_into_vector<8>(&this->data_, address_size);
315*a9fa9459Szrj write_unsigned_LEB_128(&this->data_, abbreviation_number);
316*a9fa9459Szrj this->data_.insert(this->data_.end(), debug_info, die_end);
317*a9fa9459Szrj }
318*a9fa9459Szrj else
319*a9fa9459Szrj {
320*a9fa9459Szrj const int dwarf32_header_size =
321*a9fa9459Szrj sizeof(uint16_t) + sizeof(uint32_t) + sizeof(uint8_t);
322*a9fa9459Szrj if (debug_info + dwarf32_header_size >= debug_info_end)
323*a9fa9459Szrj {
324*a9fa9459Szrj this->failed(_("Debug info extends beyond .debug_info section; "
325*a9fa9459Szrj "failed to reduce debug info"));
326*a9fa9459Szrj return;
327*a9fa9459Szrj }
328*a9fa9459Szrj uint32_t compile_unit_size = compile_unit_start;
329*a9fa9459Szrj next_compile_unit = debug_info + compile_unit_size;
330*a9fa9459Szrj uint16_t version = read_from_pointer<16>(&debug_info);
331*a9fa9459Szrj uint32_t abbrev_offset = read_from_pointer<32>(&debug_info);
332*a9fa9459Szrj uint8_t address_size = read_from_pointer<8>(&debug_info);
333*a9fa9459Szrj size_t LEB_size;
334*a9fa9459Szrj uint64_t abbreviation_number = read_unsigned_LEB_128(debug_info,
335*a9fa9459Szrj &LEB_size);
336*a9fa9459Szrj debug_info += LEB_size;
337*a9fa9459Szrj unsigned char* die_abbrev = this->associated_abbrev_->get_new_abbrev(
338*a9fa9459Szrj &abbreviation_number, abbrev_offset);
339*a9fa9459Szrj unsigned char* die_end;
340*a9fa9459Szrj if (!this->get_die_end(debug_info, die_abbrev, &die_end,
341*a9fa9459Szrj debug_info_end, address_size, false))
342*a9fa9459Szrj {
343*a9fa9459Szrj this->failed(_("Invalid DIE in debug info; "
344*a9fa9459Szrj "failed to reduce debug info"));
345*a9fa9459Szrj return;
346*a9fa9459Szrj }
347*a9fa9459Szrj
348*a9fa9459Szrj insert_into_vector<32>(
349*a9fa9459Szrj &this->data_,
350*a9fa9459Szrj (7 + get_length_as_unsigned_LEB_128(abbreviation_number)
351*a9fa9459Szrj + die_end - debug_info));
352*a9fa9459Szrj insert_into_vector<16>(&this->data_, version);
353*a9fa9459Szrj insert_into_vector<32>(&this->data_, 0);
354*a9fa9459Szrj insert_into_vector<8>(&this->data_, address_size);
355*a9fa9459Szrj write_unsigned_LEB_128(&this->data_, abbreviation_number);
356*a9fa9459Szrj this->data_.insert(this->data_.end(), debug_info, die_end);
357*a9fa9459Szrj }
358*a9fa9459Szrj debug_info = next_compile_unit;
359*a9fa9459Szrj }
360*a9fa9459Szrj this->set_data_size(data_.size());
361*a9fa9459Szrj }
362*a9fa9459Szrj
do_write(Output_file * of)363*a9fa9459Szrj void Output_reduced_debug_info_section::do_write(Output_file* of)
364*a9fa9459Szrj {
365*a9fa9459Szrj off_t offset = this->offset();
366*a9fa9459Szrj off_t data_size = this->data_size();
367*a9fa9459Szrj unsigned char* view = of->get_output_view(offset, data_size);
368*a9fa9459Szrj if (this->failed_)
369*a9fa9459Szrj memcpy(view, this->postprocessing_buffer(),
370*a9fa9459Szrj this->postprocessing_buffer_size());
371*a9fa9459Szrj else
372*a9fa9459Szrj memcpy(view, &this->data_.front(), data_size);
373*a9fa9459Szrj of->write_output_view(offset, data_size, view);
374*a9fa9459Szrj }
375*a9fa9459Szrj
376*a9fa9459Szrj } // End namespace gold.
377