| // reduced_debug_output.cc -- output reduced debugging information to save space |
| |
| // Copyright (C) 2008-2024 Free Software Foundation, Inc. |
| // Written by Caleb Howe <cshowe@google.com>. |
| |
| // This file is part of gold. |
| |
| // This program is free software; you can redistribute it and/or modify |
| // it under the terms of the GNU General Public License as published by |
| // the Free Software Foundation; either version 3 of the License, or |
| // (at your option) any later version. |
| |
| // This program is distributed in the hope that it will be useful, |
| // but WITHOUT ANY WARRANTY; without even the implied warranty of |
| // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
| // GNU General Public License for more details. |
| |
| // You should have received a copy of the GNU General Public License |
| // along with this program; if not, write to the Free Software |
| // Foundation, Inc., 51 Franklin Street - Fifth Floor, Boston, |
| // MA 02110-1301, USA. |
| |
| #include "gold.h" |
| |
| #include "parameters.h" |
| #include "options.h" |
| #include "dwarf.h" |
| #include "dwarf_reader.h" |
| #include "reduced_debug_output.h" |
| #include "int_encoding.h" |
| |
| #include <vector> |
| |
| namespace gold |
| { |
| |
| // Given a pointer to the beginning of a die and the beginning of the associated |
| // abbreviation fills in die_end with the end of the information entry. If |
| // successful returns true. Get_die_end also takes a pointer to the end of the |
| // buffer containing the die. If die_end would be beyond the end of the |
| // buffer, or if an unsupported dwarf form is encountered returns false. |
| bool |
| Output_reduced_debug_info_section::get_die_end( |
| unsigned char* die, unsigned char* abbrev, unsigned char** die_end, |
| unsigned char* buffer_end, int address_size, bool is64) |
| { |
| size_t LEB_size; |
| uint64_t LEB_decoded; |
| for(;;) |
| { |
| uint64_t attribute = read_unsigned_LEB_128(abbrev, &LEB_size); |
| abbrev += LEB_size; |
| elfcpp::DW_FORM form = |
| static_cast<elfcpp::DW_FORM>(read_unsigned_LEB_128(abbrev, |
| &LEB_size)); |
| abbrev += LEB_size; |
| if (!(attribute || form)) |
| break; |
| if (die >= buffer_end) |
| return false; |
| switch(form) |
| { |
| case elfcpp::DW_FORM_flag_present: |
| break; |
| case elfcpp::DW_FORM_strp: |
| case elfcpp::DW_FORM_sec_offset: |
| die += is64 ? 8 : 4; |
| break; |
| case elfcpp::DW_FORM_addr: |
| case elfcpp::DW_FORM_ref_addr: |
| die += address_size; |
| break; |
| case elfcpp::DW_FORM_block1: |
| die += *die; |
| die += 1; |
| break; |
| case elfcpp::DW_FORM_block2: |
| { |
| uint16_t block_size; |
| block_size = read_from_pointer<16>(&die); |
| die += block_size; |
| break; |
| } |
| case elfcpp::DW_FORM_block4: |
| { |
| uint32_t block_size; |
| block_size = read_from_pointer<32>(&die); |
| die += block_size; |
| break; |
| } |
| case elfcpp::DW_FORM_block: |
| case elfcpp::DW_FORM_exprloc: |
| LEB_decoded = read_unsigned_LEB_128(die, &LEB_size); |
| die += (LEB_decoded + LEB_size); |
| break; |
| case elfcpp::DW_FORM_data1: |
| case elfcpp::DW_FORM_ref1: |
| case elfcpp::DW_FORM_flag: |
| die += 1; |
| break; |
| case elfcpp::DW_FORM_data2: |
| case elfcpp::DW_FORM_ref2: |
| die += 2; |
| break; |
| case elfcpp::DW_FORM_data4: |
| case elfcpp::DW_FORM_ref4: |
| die += 4; |
| break; |
| case elfcpp::DW_FORM_data8: |
| case elfcpp::DW_FORM_ref8: |
| case elfcpp::DW_FORM_ref_sig8: |
| die += 8; |
| break; |
| case elfcpp::DW_FORM_ref_udata: |
| case elfcpp::DW_FORM_udata: |
| read_unsigned_LEB_128(die, &LEB_size); |
| die += LEB_size; |
| break; |
| case elfcpp::DW_FORM_sdata: |
| read_signed_LEB_128(die, &LEB_size); |
| die += LEB_size; |
| break; |
| case elfcpp::DW_FORM_string: |
| { |
| size_t length = strlen(reinterpret_cast<char*>(die)); |
| die += length + 1; |
| break; |
| } |
| case elfcpp::DW_FORM_indirect: |
| case elfcpp::DW_FORM_GNU_addr_index: |
| case elfcpp::DW_FORM_GNU_str_index: |
| default: |
| return false; |
| } |
| } |
| *die_end = die; |
| return true; |
| } |
| |
| void |
| Output_reduced_debug_abbrev_section::set_final_data_size() |
| { |
| if (this->sized_ || this->failed_) |
| return; |
| |
| uint64_t abbrev_number; |
| size_t LEB_size; |
| unsigned char* abbrev_data = this->postprocessing_buffer(); |
| unsigned char* abbrev_end = this->postprocessing_buffer() + |
| this->postprocessing_buffer_size(); |
| this->write_to_postprocessing_buffer(); |
| while(abbrev_data < abbrev_end) |
| { |
| uint64_t abbrev_offset = abbrev_data - this->postprocessing_buffer(); |
| while((abbrev_number = read_unsigned_LEB_128(abbrev_data, &LEB_size))) |
| { |
| if (abbrev_data >= abbrev_end) |
| { |
| failed("Debug abbreviations extend beyond .debug_abbrev " |
| "section; failed to reduce debug abbreviations"); |
| return; |
| } |
| abbrev_data += LEB_size; |
| |
| // Together with the abbreviation number these fields make up |
| // the header for each abbreviation. |
| uint64_t abbrev_type = read_unsigned_LEB_128(abbrev_data, &LEB_size); |
| abbrev_data += LEB_size; |
| |
| // This would ordinarily be the has_children field of the |
| // abbreviation. But it's going to be false after reducing the |
| // information, so there's no point in storing it. |
| abbrev_data++; |
| |
| // Read to the end of the current abbreviation. |
| // This is indicated by two zero unsigned LEBs in a row. We don't |
| // need to parse the data yet, so we just scan through the data |
| // looking for two consecutive 0 bytes indicating the end of the |
| // abbreviation. |
| unsigned char* current_abbrev; |
| for (current_abbrev = abbrev_data; |
| current_abbrev[0] || current_abbrev[1]; |
| current_abbrev++) |
| { |
| if (current_abbrev >= abbrev_end) |
| { |
| this->failed(_("Debug abbreviations extend beyond " |
| ".debug_abbrev section; failed to reduce " |
| "debug abbreviations")); |
| return; |
| } |
| } |
| // Account for the two nulls and advance to the start of the |
| // next abbreviation. |
| current_abbrev += 2; |
| |
| // We're eliminating every entry except for compile units, so we |
| // only need to store abbreviations that describe them |
| if (abbrev_type == elfcpp::DW_TAG_compile_unit) |
| { |
| write_unsigned_LEB_128(&this->data_, ++this->abbrev_count_); |
| write_unsigned_LEB_128(&this->data_, abbrev_type); |
| // has_children is false for all entries |
| this->data_.push_back(0); |
| this->abbrev_mapping_[std::make_pair(abbrev_offset, |
| abbrev_number)] = |
| std::make_pair(abbrev_count_, this->data_.size()); |
| this->data_.insert(this->data_.end(), abbrev_data, |
| current_abbrev); |
| } |
| abbrev_data = current_abbrev; |
| } |
| gold_assert(LEB_size == 1); |
| abbrev_data += LEB_size; |
| } |
| // Null terminate the list of abbreviations |
| this->data_.push_back(0); |
| this->set_data_size(data_.size()); |
| this->sized_ = true; |
| } |
| |
| void |
| Output_reduced_debug_abbrev_section::do_write(Output_file* of) |
| { |
| off_t offset = this->offset(); |
| off_t data_size = this->data_size(); |
| unsigned char* view = of->get_output_view(offset, data_size); |
| if (this->failed_) |
| memcpy(view, this->postprocessing_buffer(), |
| this->postprocessing_buffer_size()); |
| else |
| memcpy(view, &this->data_.front(), data_size); |
| of->write_output_view(offset, data_size, view); |
| } |
| |
| // Locates the abbreviation with abbreviation_number abbrev_number in the |
| // abbreviation table at offset abbrev_offset. abbrev_number is updated with |
| // its new abbreviation number and a pointer to the beginning of the |
| // abbreviation is returned. |
| unsigned char* |
| Output_reduced_debug_abbrev_section::get_new_abbrev( |
| uint64_t* abbrev_number, uint64_t abbrev_offset) |
| { |
| set_final_data_size(); |
| std::pair<uint64_t, uint64_t> abbrev_info = |
| this->abbrev_mapping_[std::make_pair(abbrev_offset, *abbrev_number)]; |
| *abbrev_number = abbrev_info.first; |
| return &this->data_[abbrev_info.second]; |
| } |
| |
| void Output_reduced_debug_info_section::set_final_data_size() |
| { |
| if (this->failed_) |
| return; |
| unsigned char* debug_info = this->postprocessing_buffer(); |
| unsigned char* debug_info_end = (this->postprocessing_buffer() |
| + this->postprocessing_buffer_size()); |
| unsigned char* next_compile_unit; |
| this->write_to_postprocessing_buffer(); |
| |
| while (debug_info < debug_info_end) |
| { |
| uint32_t compile_unit_start = read_from_pointer<32>(&debug_info); |
| // The first 4 bytes of each compile unit determine whether or |
| // not we're using dwarf32 or dwarf64. This is not necessarily |
| // related to whether the binary is 32 or 64 bits. |
| if (compile_unit_start == 0xFFFFFFFF) |
| { |
| // Technically the size can be up to 96 bits. Rather than handle |
| // 96/128 bit integers we just truncate the size at 64 bits. |
| if (0 != read_from_pointer<32>(&debug_info)) |
| { |
| this->failed(_("Extremely large compile unit in debug info; " |
| "failed to reduce debug info")); |
| return; |
| } |
| const int dwarf64_header_size = sizeof(uint64_t) + sizeof(uint16_t) + |
| sizeof(uint64_t) + sizeof(uint8_t); |
| if (debug_info + dwarf64_header_size >= debug_info_end) |
| { |
| this->failed(_("Debug info extends beyond .debug_info section;" |
| "failed to reduce debug info")); |
| return; |
| } |
| |
| uint64_t compile_unit_size = read_from_pointer<64>(&debug_info); |
| next_compile_unit = debug_info + compile_unit_size; |
| uint16_t version = read_from_pointer<16>(&debug_info); |
| uint64_t abbrev_offset = read_from_pointer<64>(&debug_info); |
| uint8_t address_size = read_from_pointer<8>(&debug_info); |
| size_t LEB_size; |
| uint64_t abbreviation_number = read_unsigned_LEB_128(debug_info, |
| &LEB_size); |
| debug_info += LEB_size; |
| unsigned char* die_abbrev = this->associated_abbrev_->get_new_abbrev( |
| &abbreviation_number, abbrev_offset); |
| unsigned char* die_end; |
| if (!this->get_die_end(debug_info, die_abbrev, &die_end, |
| debug_info_end, address_size, true)) |
| { |
| this->failed(_("Invalid DIE in debug info; " |
| "failed to reduce debug info")); |
| return; |
| } |
| |
| insert_into_vector<32>(&this->data_, 0xFFFFFFFF); |
| insert_into_vector<32>(&this->data_, 0); |
| insert_into_vector<64>( |
| &this->data_, |
| (11 + get_length_as_unsigned_LEB_128(abbreviation_number) |
| + die_end - debug_info)); |
| insert_into_vector<16>(&this->data_, version); |
| insert_into_vector<64>(&this->data_, 0); |
| insert_into_vector<8>(&this->data_, address_size); |
| write_unsigned_LEB_128(&this->data_, abbreviation_number); |
| this->data_.insert(this->data_.end(), debug_info, die_end); |
| } |
| else |
| { |
| const int dwarf32_header_size = |
| sizeof(uint16_t) + sizeof(uint32_t) + sizeof(uint8_t); |
| if (debug_info + dwarf32_header_size >= debug_info_end) |
| { |
| this->failed(_("Debug info extends beyond .debug_info section; " |
| "failed to reduce debug info")); |
| return; |
| } |
| uint32_t compile_unit_size = compile_unit_start; |
| next_compile_unit = debug_info + compile_unit_size; |
| uint16_t version = read_from_pointer<16>(&debug_info); |
| uint32_t abbrev_offset = read_from_pointer<32>(&debug_info); |
| uint8_t address_size = read_from_pointer<8>(&debug_info); |
| size_t LEB_size; |
| uint64_t abbreviation_number = read_unsigned_LEB_128(debug_info, |
| &LEB_size); |
| debug_info += LEB_size; |
| unsigned char* die_abbrev = this->associated_abbrev_->get_new_abbrev( |
| &abbreviation_number, abbrev_offset); |
| unsigned char* die_end; |
| if (!this->get_die_end(debug_info, die_abbrev, &die_end, |
| debug_info_end, address_size, false)) |
| { |
| this->failed(_("Invalid DIE in debug info; " |
| "failed to reduce debug info")); |
| return; |
| } |
| |
| insert_into_vector<32>( |
| &this->data_, |
| (7 + get_length_as_unsigned_LEB_128(abbreviation_number) |
| + die_end - debug_info)); |
| insert_into_vector<16>(&this->data_, version); |
| insert_into_vector<32>(&this->data_, 0); |
| insert_into_vector<8>(&this->data_, address_size); |
| write_unsigned_LEB_128(&this->data_, abbreviation_number); |
| this->data_.insert(this->data_.end(), debug_info, die_end); |
| } |
| debug_info = next_compile_unit; |
| } |
| this->set_data_size(data_.size()); |
| } |
| |
| void Output_reduced_debug_info_section::do_write(Output_file* of) |
| { |
| off_t offset = this->offset(); |
| off_t data_size = this->data_size(); |
| unsigned char* view = of->get_output_view(offset, data_size); |
| if (this->failed_) |
| memcpy(view, this->postprocessing_buffer(), |
| this->postprocessing_buffer_size()); |
| else |
| memcpy(view, &this->data_.front(), data_size); |
| of->write_output_view(offset, data_size, view); |
| } |
| |
| } // End namespace gold. |