// reduced_debug_output.cc -- output reduced debugging information to save space // Copyright (C) 2008-2021 Free Software Foundation, Inc. // Written by Caleb Howe <cshowe@google.com>. // This file is part of gold. // This program is free software; you can redistribute it and/or modify // it under the terms of the GNU General Public License as published by // the Free Software Foundation; either version 3 of the License, or // (at your option) any later version. // This program is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU General Public License for more details. // You should have received a copy of the GNU General Public License // along with this program; if not, write to the Free Software // Foundation, Inc., 51 Franklin Street - Fifth Floor, Boston, // MA 02110-1301, USA. #include "gold.h" #include "parameters.h" #include "options.h" #include "dwarf.h" #include "dwarf_reader.h" #include "reduced_debug_output.h" #include "int_encoding.h" #include <vector> namespace gold { // Given a pointer to the beginning of a die and the beginning of the associated // abbreviation fills in die_end with the end of the information entry. If // successful returns true. Get_die_end also takes a pointer to the end of the // buffer containing the die. If die_end would be beyond the end of the // buffer, or if an unsupported dwarf form is encountered returns false. bool Output_reduced_debug_info_section::get_die_end( unsigned char* die, unsigned char* abbrev, unsigned char** die_end, unsigned char* buffer_end, int address_size, bool is64) { size_t LEB_size; uint64_t LEB_decoded; for(;;) { uint64_t attribute = read_unsigned_LEB_128(abbrev, &LEB_size); abbrev += LEB_size; elfcpp::DW_FORM form = static_cast<elfcpp::DW_FORM>(read_unsigned_LEB_128(abbrev, &LEB_size)); abbrev += LEB_size; if (!(attribute || form)) break; if (die >= buffer_end) return false; switch(form) { case elfcpp::DW_FORM_flag_present: break; case elfcpp::DW_FORM_strp: case elfcpp::DW_FORM_sec_offset: die += is64 ? 8 : 4; break; case elfcpp::DW_FORM_addr: case elfcpp::DW_FORM_ref_addr: die += address_size; break; case elfcpp::DW_FORM_block1: die += *die; die += 1; break; case elfcpp::DW_FORM_block2: { uint16_t block_size; block_size = read_from_pointer<16>(&die); die += block_size; break; } case elfcpp::DW_FORM_block4: { uint32_t block_size; block_size = read_from_pointer<32>(&die); die += block_size; break; } case elfcpp::DW_FORM_block: case elfcpp::DW_FORM_exprloc: LEB_decoded = read_unsigned_LEB_128(die, &LEB_size); die += (LEB_decoded + LEB_size); break; case elfcpp::DW_FORM_data1: case elfcpp::DW_FORM_ref1: case elfcpp::DW_FORM_flag: die += 1; break; case elfcpp::DW_FORM_data2: case elfcpp::DW_FORM_ref2: die += 2; break; case elfcpp::DW_FORM_data4: case elfcpp::DW_FORM_ref4: die += 4; break; case elfcpp::DW_FORM_data8: case elfcpp::DW_FORM_ref8: case elfcpp::DW_FORM_ref_sig8: die += 8; break; case elfcpp::DW_FORM_ref_udata: case elfcpp::DW_FORM_udata: read_unsigned_LEB_128(die, &LEB_size); die += LEB_size; break; case elfcpp::DW_FORM_sdata: read_signed_LEB_128(die, &LEB_size); die += LEB_size; break; case elfcpp::DW_FORM_string: { size_t length = strlen(reinterpret_cast<char*>(die)); die += length + 1; break; } case elfcpp::DW_FORM_indirect: case elfcpp::DW_FORM_GNU_addr_index: case elfcpp::DW_FORM_GNU_str_index: default: return false; } } *die_end = die; return true; } void Output_reduced_debug_abbrev_section::set_final_data_size() { if (this->sized_ || this->failed_) return; uint64_t abbrev_number; size_t LEB_size; unsigned char* abbrev_data = this->postprocessing_buffer(); unsigned char* abbrev_end = this->postprocessing_buffer() + this->postprocessing_buffer_size(); this->write_to_postprocessing_buffer(); while(abbrev_data < abbrev_end) { uint64_t abbrev_offset = abbrev_data - this->postprocessing_buffer(); while((abbrev_number = read_unsigned_LEB_128(abbrev_data, &LEB_size))) { if (abbrev_data >= abbrev_end) { failed("Debug abbreviations extend beyond .debug_abbrev " "section; failed to reduce debug abbreviations"); return; } abbrev_data += LEB_size; // Together with the abbreviation number these fields make up // the header for each abbreviation. uint64_t abbrev_type = read_unsigned_LEB_128(abbrev_data, &LEB_size); abbrev_data += LEB_size; // This would ordinarily be the has_children field of the // abbreviation. But it's going to be false after reducing the // information, so there's no point in storing it. abbrev_data++; // Read to the end of the current abbreviation. // This is indicated by two zero unsigned LEBs in a row. We don't // need to parse the data yet, so we just scan through the data // looking for two consecutive 0 bytes indicating the end of the // abbreviation. unsigned char* current_abbrev; for (current_abbrev = abbrev_data; current_abbrev[0] || current_abbrev[1]; current_abbrev++) { if (current_abbrev >= abbrev_end) { this->failed(_("Debug abbreviations extend beyond " ".debug_abbrev section; failed to reduce " "debug abbreviations")); return; } } // Account for the two nulls and advance to the start of the // next abbreviation. current_abbrev += 2; // We're eliminating every entry except for compile units, so we // only need to store abbreviations that describe them if (abbrev_type == elfcpp::DW_TAG_compile_unit) { write_unsigned_LEB_128(&this->data_, ++this->abbrev_count_); write_unsigned_LEB_128(&this->data_, abbrev_type); // has_children is false for all entries this->data_.push_back(0); this->abbrev_mapping_[std::make_pair(abbrev_offset, abbrev_number)] = std::make_pair(abbrev_count_, this->data_.size()); this->data_.insert(this->data_.end(), abbrev_data, current_abbrev); } abbrev_data = current_abbrev; } gold_assert(LEB_size == 1); abbrev_data += LEB_size; } // Null terminate the list of abbreviations this->data_.push_back(0); this->set_data_size(data_.size()); this->sized_ = true; } void Output_reduced_debug_abbrev_section::do_write(Output_file* of) { off_t offset = this->offset(); off_t data_size = this->data_size(); unsigned char* view = of->get_output_view(offset, data_size); if (this->failed_) memcpy(view, this->postprocessing_buffer(), this->postprocessing_buffer_size()); else memcpy(view, &this->data_.front(), data_size); of->write_output_view(offset, data_size, view); } // Locates the abbreviation with abbreviation_number abbrev_number in the // abbreviation table at offset abbrev_offset. abbrev_number is updated with // its new abbreviation number and a pointer to the beginning of the // abbreviation is returned. unsigned char* Output_reduced_debug_abbrev_section::get_new_abbrev( uint64_t* abbrev_number, uint64_t abbrev_offset) { set_final_data_size(); std::pair<uint64_t, uint64_t> abbrev_info = this->abbrev_mapping_[std::make_pair(abbrev_offset, *abbrev_number)]; *abbrev_number = abbrev_info.first; return &this->data_[abbrev_info.second]; } void Output_reduced_debug_info_section::set_final_data_size() { if (this->failed_) return; unsigned char* debug_info = this->postprocessing_buffer(); unsigned char* debug_info_end = (this->postprocessing_buffer() + this->postprocessing_buffer_size()); unsigned char* next_compile_unit; this->write_to_postprocessing_buffer(); while (debug_info < debug_info_end) { uint32_t compile_unit_start = read_from_pointer<32>(&debug_info); // The first 4 bytes of each compile unit determine whether or // not we're using dwarf32 or dwarf64. This is not necessarily // related to whether the binary is 32 or 64 bits. if (compile_unit_start == 0xFFFFFFFF) { // Technically the size can be up to 96 bits. Rather than handle // 96/128 bit integers we just truncate the size at 64 bits. if (0 != read_from_pointer<32>(&debug_info)) { this->failed(_("Extremely large compile unit in debug info; " "failed to reduce debug info")); return; } const int dwarf64_header_size = sizeof(uint64_t) + sizeof(uint16_t) + sizeof(uint64_t) + sizeof(uint8_t); if (debug_info + dwarf64_header_size >= debug_info_end) { this->failed(_("Debug info extends beyond .debug_info section;" "failed to reduce debug info")); return; } uint64_t compile_unit_size = read_from_pointer<64>(&debug_info); next_compile_unit = debug_info + compile_unit_size; uint16_t version = read_from_pointer<16>(&debug_info); uint64_t abbrev_offset = read_from_pointer<64>(&debug_info); uint8_t address_size = read_from_pointer<8>(&debug_info); size_t LEB_size; uint64_t abbreviation_number = read_unsigned_LEB_128(debug_info, &LEB_size); debug_info += LEB_size; unsigned char* die_abbrev = this->associated_abbrev_->get_new_abbrev( &abbreviation_number, abbrev_offset); unsigned char* die_end; if (!this->get_die_end(debug_info, die_abbrev, &die_end, debug_info_end, address_size, true)) { this->failed(_("Invalid DIE in debug info; " "failed to reduce debug info")); return; } insert_into_vector<32>(&this->data_, 0xFFFFFFFF); insert_into_vector<32>(&this->data_, 0); insert_into_vector<64>( &this->data_, (11 + get_length_as_unsigned_LEB_128(abbreviation_number) + die_end - debug_info)); insert_into_vector<16>(&this->data_, version); insert_into_vector<64>(&this->data_, 0); insert_into_vector<8>(&this->data_, address_size); write_unsigned_LEB_128(&this->data_, abbreviation_number); this->data_.insert(this->data_.end(), debug_info, die_end); } else { const int dwarf32_header_size = sizeof(uint16_t) + sizeof(uint32_t) + sizeof(uint8_t); if (debug_info + dwarf32_header_size >= debug_info_end) { this->failed(_("Debug info extends beyond .debug_info section; " "failed to reduce debug info")); return; } uint32_t compile_unit_size = compile_unit_start; next_compile_unit = debug_info + compile_unit_size; uint16_t version = read_from_pointer<16>(&debug_info); uint32_t abbrev_offset = read_from_pointer<32>(&debug_info); uint8_t address_size = read_from_pointer<8>(&debug_info); size_t LEB_size; uint64_t abbreviation_number = read_unsigned_LEB_128(debug_info, &LEB_size); debug_info += LEB_size; unsigned char* die_abbrev = this->associated_abbrev_->get_new_abbrev( &abbreviation_number, abbrev_offset); unsigned char* die_end; if (!this->get_die_end(debug_info, die_abbrev, &die_end, debug_info_end, address_size, false)) { this->failed(_("Invalid DIE in debug info; " "failed to reduce debug info")); return; } insert_into_vector<32>( &this->data_, (7 + get_length_as_unsigned_LEB_128(abbreviation_number) + die_end - debug_info)); insert_into_vector<16>(&this->data_, version); insert_into_vector<32>(&this->data_, 0); insert_into_vector<8>(&this->data_, address_size); write_unsigned_LEB_128(&this->data_, abbreviation_number); this->data_.insert(this->data_.end(), debug_info, die_end); } debug_info = next_compile_unit; } this->set_data_size(data_.size()); } void Output_reduced_debug_info_section::do_write(Output_file* of) { off_t offset = this->offset(); off_t data_size = this->data_size(); unsigned char* view = of->get_output_view(offset, data_size); if (this->failed_) memcpy(view, this->postprocessing_buffer(), this->postprocessing_buffer_size()); else memcpy(view, &this->data_.front(), data_size); of->write_output_view(offset, data_size, view); } } // End namespace gold.