|  | // merge.h -- handle section merging for gold  -*- C++ -*- | 
|  |  | 
|  | // Copyright (C) 2006-2023 Free Software Foundation, Inc. | 
|  | // Written by Ian Lance Taylor <iant@google.com>. | 
|  |  | 
|  | // This file is part of gold. | 
|  |  | 
|  | // This program is free software; you can redistribute it and/or modify | 
|  | // it under the terms of the GNU General Public License as published by | 
|  | // the Free Software Foundation; either version 3 of the License, or | 
|  | // (at your option) any later version. | 
|  |  | 
|  | // This program is distributed in the hope that it will be useful, | 
|  | // but WITHOUT ANY WARRANTY; without even the implied warranty of | 
|  | // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the | 
|  | // GNU General Public License for more details. | 
|  |  | 
|  | // You should have received a copy of the GNU General Public License | 
|  | // along with this program; if not, write to the Free Software | 
|  | // Foundation, Inc., 51 Franklin Street - Fifth Floor, Boston, | 
|  | // MA 02110-1301, USA. | 
|  |  | 
|  | #ifndef GOLD_MERGE_H | 
|  | #define GOLD_MERGE_H | 
|  |  | 
|  | #include <climits> | 
|  | #include <map> | 
|  | #include <vector> | 
|  |  | 
|  | #include "stringpool.h" | 
|  | #include "output.h" | 
|  |  | 
|  | namespace gold | 
|  | { | 
|  |  | 
|  | // For each object with merge sections, we store an Object_merge_map. | 
|  | // This is used to map locations in input sections to a merged output | 
|  | // section.  The output section itself is not recorded here--it can be | 
|  | // found in the output_sections_ field of the Object. | 
|  |  | 
|  | class Object_merge_map | 
|  | { | 
|  | public: | 
|  | Object_merge_map() | 
|  | : section_merge_maps_() | 
|  | { } | 
|  |  | 
|  | ~Object_merge_map(); | 
|  |  | 
|  | // Add a mapping for MERGE_MAP, for the bytes from OFFSET to OFFSET | 
|  | // + LENGTH in the input section SHNDX to OUTPUT_OFFSET in the | 
|  | // output section.  An OUTPUT_OFFSET of -1 means that the bytes are | 
|  | // discarded.  OUTPUT_OFFSET is relative to the start of the merged | 
|  | // data in the output section. | 
|  | void | 
|  | add_mapping(const Output_section_data*, unsigned int shndx, | 
|  | section_offset_type offset, section_size_type length, | 
|  | section_offset_type output_offset); | 
|  |  | 
|  | // Get the output offset for an input address.  MERGE_MAP is the map | 
|  | // we are looking for, or NULL if we don't care.  The input address | 
|  | // is at offset OFFSET in section SHNDX.  This sets *OUTPUT_OFFSET | 
|  | // to the offset in the output section; this will be -1 if the bytes | 
|  | // are not being copied to the output.  This returns true if the | 
|  | // mapping is known, false otherwise.  *OUTPUT_OFFSET is relative to | 
|  | // the start of the merged data in the output section. | 
|  | bool | 
|  | get_output_offset(unsigned int shndx, | 
|  | section_offset_type offset, | 
|  | section_offset_type* output_offset); | 
|  |  | 
|  | const Output_section_data* | 
|  | find_merge_section(unsigned int shndx) const; | 
|  |  | 
|  | // Initialize an mapping from input offsets to output addresses for | 
|  | // section SHNDX.  STARTING_ADDRESS is the output address of the | 
|  | // merged section. | 
|  | template<int size> | 
|  | void | 
|  | initialize_input_to_output_map( | 
|  | unsigned int shndx, | 
|  | typename elfcpp::Elf_types<size>::Elf_Addr starting_address, | 
|  | Unordered_map<section_offset_type, | 
|  | typename elfcpp::Elf_types<size>::Elf_Addr>*); | 
|  |  | 
|  | // Map input section offsets to a length and an output section | 
|  | // offset.  An output section offset of -1 means that this part of | 
|  | // the input section is being discarded. | 
|  | struct Input_merge_entry | 
|  | { | 
|  | // The offset in the input section. | 
|  | section_offset_type input_offset; | 
|  | // The length. | 
|  | section_size_type length; | 
|  | // The offset in the output section. | 
|  | section_offset_type output_offset; | 
|  | }; | 
|  |  | 
|  | // A list of entries for a particular input section. | 
|  | struct Input_merge_map | 
|  | { | 
|  | void add_mapping(section_offset_type input_offset, section_size_type length, | 
|  | section_offset_type output_offset); | 
|  |  | 
|  | typedef std::vector<Input_merge_entry> Entries; | 
|  |  | 
|  | // We store these with the Relobj, and we look them up by input | 
|  | // section.  It is possible to have two different merge maps | 
|  | // associated with a single output section.  For example, this | 
|  | // happens routinely with .rodata, when merged string constants | 
|  | // and merged fixed size constants are both put into .rodata.  The | 
|  | // output offset that we store is not the offset from the start of | 
|  | // the output section; it is the offset from the start of the | 
|  | // merged data in the output section.  That means that the caller | 
|  | // is going to add the offset of the merged data within the output | 
|  | // section, which means that the caller needs to know which set of | 
|  | // merged data it found the entry in.  So it's not enough to find | 
|  | // this data based on the input section and the output section; we | 
|  | // also have to find it based on a set of merged data in the | 
|  | // output section.  In order to verify that we are looking at the | 
|  | // right data, we store a pointer to the Merge_map here, and we | 
|  | // pass in a pointer when looking at the data.  If we are asked to | 
|  | // look up information for a different Merge_map, we report that | 
|  | // we don't have it, rather than trying a lookup and returning an | 
|  | // answer which will receive the wrong offset. | 
|  | const Output_section_data* output_data; | 
|  | // The list of mappings. | 
|  | Entries entries; | 
|  | // Whether the ENTRIES field is sorted by input_offset. | 
|  | bool sorted; | 
|  |  | 
|  | Input_merge_map() | 
|  | : output_data(NULL), entries(), sorted(true) | 
|  | { } | 
|  | }; | 
|  |  | 
|  | // Get or make the Input_merge_map to use for the section SHNDX | 
|  | // with MERGE_MAP. | 
|  | Input_merge_map* | 
|  | get_or_make_input_merge_map(const Output_section_data* merge_map, | 
|  | unsigned int shndx); | 
|  |  | 
|  | private: | 
|  | // A less-than comparison routine for Input_merge_entry. | 
|  | struct Input_merge_compare | 
|  | { | 
|  | bool | 
|  | operator()(const Input_merge_entry& i1, const Input_merge_entry& i2) const | 
|  | { return i1.input_offset < i2.input_offset; } | 
|  | }; | 
|  |  | 
|  | // Map input section indices to merge maps. | 
|  | typedef std::vector<std::pair<unsigned int, Input_merge_map*> > | 
|  | Section_merge_maps; | 
|  |  | 
|  | // Return a pointer to the Input_merge_map to use for the input | 
|  | // section SHNDX, or NULL. | 
|  | const Input_merge_map* | 
|  | get_input_merge_map(unsigned int shndx) const; | 
|  |  | 
|  | Input_merge_map * | 
|  | get_input_merge_map(unsigned int shndx) { | 
|  | return const_cast<Input_merge_map *>(static_cast<const Object_merge_map *>( | 
|  | this)->get_input_merge_map(shndx)); | 
|  | } | 
|  |  | 
|  | Section_merge_maps section_merge_maps_; | 
|  | }; | 
|  |  | 
|  | // A general class for SHF_MERGE data, to hold functions shared by | 
|  | // fixed-size constant data and string data. | 
|  |  | 
|  | class Output_merge_base : public Output_section_data | 
|  | { | 
|  | public: | 
|  | Output_merge_base(uint64_t entsize, uint64_t addralign) | 
|  | : Output_section_data(addralign), entsize_(entsize), | 
|  | keeps_input_sections_(false), first_relobj_(NULL), first_shndx_(-1), | 
|  | input_sections_() | 
|  | { } | 
|  |  | 
|  | // Return the entry size. | 
|  | uint64_t | 
|  | entsize() const | 
|  | { return this->entsize_; } | 
|  |  | 
|  | // Whether this is a merge string section.  This is only true of | 
|  | // Output_merge_string. | 
|  | bool | 
|  | is_string() | 
|  | { return this->do_is_string(); } | 
|  |  | 
|  | // Whether this keeps input sections. | 
|  | bool | 
|  | keeps_input_sections() const | 
|  | { return this->keeps_input_sections_; } | 
|  |  | 
|  | // Set the keeps-input-sections flag.  This is virtual so that sub-classes | 
|  | // can perform additional checks. | 
|  | void | 
|  | set_keeps_input_sections() | 
|  | { this->do_set_keeps_input_sections(); } | 
|  |  | 
|  | // Return the object of the first merged input section.  This used | 
|  | // for script processing.  This is NULL if merge section is empty. | 
|  | Relobj* | 
|  | first_relobj() const | 
|  | { return this->first_relobj_; } | 
|  |  | 
|  | // Return the section index of the first merged input section.  This | 
|  | // is used for script processing.  This is valid only if merge section | 
|  | // is not valid. | 
|  | unsigned int | 
|  | first_shndx() const | 
|  | { | 
|  | gold_assert(this->first_relobj_ != NULL); | 
|  | return this->first_shndx_; | 
|  | } | 
|  |  | 
|  | // Set of merged input sections. | 
|  | typedef Unordered_set<Section_id, Section_id_hash> Input_sections; | 
|  |  | 
|  | // Beginning of merged input sections. | 
|  | Input_sections::const_iterator | 
|  | input_sections_begin() const | 
|  | { | 
|  | gold_assert(this->keeps_input_sections_); | 
|  | return this->input_sections_.begin(); | 
|  | } | 
|  |  | 
|  | // Beginning of merged input sections. | 
|  | Input_sections::const_iterator | 
|  | input_sections_end() const | 
|  | { | 
|  | gold_assert(this->keeps_input_sections_); | 
|  | return this->input_sections_.end(); | 
|  | } | 
|  |  | 
|  | protected: | 
|  | // Return the output offset for an input offset. | 
|  | bool | 
|  | do_output_offset(const Relobj* object, unsigned int shndx, | 
|  | section_offset_type offset, | 
|  | section_offset_type* poutput) const; | 
|  |  | 
|  | // This may be overridden by the child class. | 
|  | virtual bool | 
|  | do_is_string() | 
|  | { return false; } | 
|  |  | 
|  | // This may be overridden by the child class. | 
|  | virtual void | 
|  | do_set_keeps_input_sections() | 
|  | { this->keeps_input_sections_ = true; } | 
|  |  | 
|  | // Record the merged input section for script processing. | 
|  | void | 
|  | record_input_section(Relobj* relobj, unsigned int shndx); | 
|  |  | 
|  | private: | 
|  | // The entry size.  For fixed-size constants, this is the size of | 
|  | // the constants.  For strings, this is the size of a character. | 
|  | uint64_t entsize_; | 
|  | // Whether we keep input sections. | 
|  | bool keeps_input_sections_; | 
|  | // Object of the first merged input section.  We use this for script | 
|  | // processing. | 
|  | Relobj* first_relobj_; | 
|  | // Section index of the first merged input section. | 
|  | unsigned int first_shndx_; | 
|  | // Input sections.  We only keep them is keeps_input_sections_ is true. | 
|  | Input_sections input_sections_; | 
|  | }; | 
|  |  | 
|  | // Handle SHF_MERGE sections with fixed-size constant data. | 
|  |  | 
|  | class Output_merge_data : public Output_merge_base | 
|  | { | 
|  | public: | 
|  | Output_merge_data(uint64_t entsize, uint64_t addralign) | 
|  | : Output_merge_base(entsize, addralign), p_(NULL), len_(0), alc_(0), | 
|  | input_count_(0), | 
|  | hashtable_(128, Merge_data_hash(this), Merge_data_eq(this)) | 
|  | { } | 
|  |  | 
|  | protected: | 
|  | // Add an input section. | 
|  | bool | 
|  | do_add_input_section(Relobj* object, unsigned int shndx); | 
|  |  | 
|  | // Set the final data size. | 
|  | void | 
|  | set_final_data_size(); | 
|  |  | 
|  | // Write the data to the file. | 
|  | void | 
|  | do_write(Output_file*); | 
|  |  | 
|  | // Write the data to a buffer. | 
|  | void | 
|  | do_write_to_buffer(unsigned char*); | 
|  |  | 
|  | // Write to a map file. | 
|  | void | 
|  | do_print_to_mapfile(Mapfile* mapfile) const | 
|  | { mapfile->print_output_data(this, _("** merge constants")); } | 
|  |  | 
|  | // Print merge stats to stderr. | 
|  | void | 
|  | do_print_merge_stats(const char* section_name); | 
|  |  | 
|  | // Set keeps-input-sections flag. | 
|  | void | 
|  | do_set_keeps_input_sections() | 
|  | { | 
|  | gold_assert(this->input_count_ == 0); | 
|  | Output_merge_base::do_set_keeps_input_sections(); | 
|  | } | 
|  |  | 
|  | private: | 
|  | // We build a hash table of the fixed-size constants.  Each constant | 
|  | // is stored as a pointer into the section data we are accumulating. | 
|  |  | 
|  | // A key in the hash table.  This is an offset in the section | 
|  | // contents we are building. | 
|  | typedef section_offset_type Merge_data_key; | 
|  |  | 
|  | // Compute the hash code.  To do this we need a pointer back to the | 
|  | // object holding the data. | 
|  | class Merge_data_hash | 
|  | { | 
|  | public: | 
|  | Merge_data_hash(const Output_merge_data* pomd) | 
|  | : pomd_(pomd) | 
|  | { } | 
|  |  | 
|  | size_t | 
|  | operator()(Merge_data_key) const; | 
|  |  | 
|  | private: | 
|  | const Output_merge_data* pomd_; | 
|  | }; | 
|  |  | 
|  | friend class Merge_data_hash; | 
|  |  | 
|  | // Compare two entries in the hash table for equality.  To do this | 
|  | // we need a pointer back to the object holding the data.  Note that | 
|  | // we now have a pointer to the object stored in two places in the | 
|  | // hash table.  Fixing this would require specializing the hash | 
|  | // table, which would be hard to do portably. | 
|  | class Merge_data_eq | 
|  | { | 
|  | public: | 
|  | Merge_data_eq(const Output_merge_data* pomd) | 
|  | : pomd_(pomd) | 
|  | { } | 
|  |  | 
|  | bool | 
|  | operator()(Merge_data_key k1, Merge_data_key k2) const; | 
|  |  | 
|  | private: | 
|  | const Output_merge_data* pomd_; | 
|  | }; | 
|  |  | 
|  | friend class Merge_data_eq; | 
|  |  | 
|  | // The type of the hash table. | 
|  | typedef Unordered_set<Merge_data_key, Merge_data_hash, Merge_data_eq> | 
|  | Merge_data_hashtable; | 
|  |  | 
|  | // Given a hash table key, which is just an offset into the section | 
|  | // data, return a pointer to the corresponding constant. | 
|  | const unsigned char* | 
|  | constant(Merge_data_key k) const | 
|  | { | 
|  | gold_assert(k >= 0 && k < static_cast<section_offset_type>(this->len_)); | 
|  | return this->p_ + k; | 
|  | } | 
|  |  | 
|  | // Add a constant to the output. | 
|  | void | 
|  | add_constant(const unsigned char*); | 
|  |  | 
|  | // The accumulated data. | 
|  | unsigned char* p_; | 
|  | // The length of the accumulated data. | 
|  | section_size_type len_; | 
|  | // The size of the allocated buffer. | 
|  | section_size_type alc_; | 
|  | // The number of entries seen in input files. | 
|  | size_t input_count_; | 
|  | // The hash table. | 
|  | Merge_data_hashtable hashtable_; | 
|  | }; | 
|  |  | 
|  | // Handle SHF_MERGE sections with string data.  This is a template | 
|  | // based on the type of the characters in the string. | 
|  |  | 
|  | template<typename Char_type> | 
|  | class Output_merge_string : public Output_merge_base | 
|  | { | 
|  | public: | 
|  | Output_merge_string(uint64_t addralign) | 
|  | : Output_merge_base(sizeof(Char_type), addralign), stringpool_(addralign), | 
|  | merged_strings_lists_(), input_count_(0), input_size_(0) | 
|  | { | 
|  | this->stringpool_.set_no_zero_null(); | 
|  | } | 
|  |  | 
|  | protected: | 
|  | // Add an input section. | 
|  | bool | 
|  | do_add_input_section(Relobj* object, unsigned int shndx); | 
|  |  | 
|  | // Do all the final processing after the input sections are read in. | 
|  | // Returns the final data size. | 
|  | section_size_type | 
|  | finalize_merged_data(); | 
|  |  | 
|  | // Set the final data size. | 
|  | void | 
|  | set_final_data_size(); | 
|  |  | 
|  | // Write the data to the file. | 
|  | void | 
|  | do_write(Output_file*); | 
|  |  | 
|  | // Write the data to a buffer. | 
|  | void | 
|  | do_write_to_buffer(unsigned char*); | 
|  |  | 
|  | // Write to a map file. | 
|  | void | 
|  | do_print_to_mapfile(Mapfile* mapfile) const | 
|  | { mapfile->print_output_data(this, _("** merge strings")); } | 
|  |  | 
|  | // Print merge stats to stderr. | 
|  | void | 
|  | do_print_merge_stats(const char* section_name); | 
|  |  | 
|  | // Writes the stringpool to a buffer. | 
|  | void | 
|  | stringpool_to_buffer(unsigned char* buffer, section_size_type buffer_size) | 
|  | { this->stringpool_.write_to_buffer(buffer, buffer_size); } | 
|  |  | 
|  | // Clears all the data in the stringpool, to save on memory. | 
|  | void | 
|  | clear_stringpool() | 
|  | { this->stringpool_.clear(); } | 
|  |  | 
|  | // Whether this is a merge string section. | 
|  | virtual bool | 
|  | do_is_string() | 
|  | { return true; } | 
|  |  | 
|  | // Set keeps-input-sections flag. | 
|  | void | 
|  | do_set_keeps_input_sections() | 
|  | { | 
|  | gold_assert(this->input_count_ == 0); | 
|  | Output_merge_base::do_set_keeps_input_sections(); | 
|  | } | 
|  |  | 
|  | private: | 
|  | // The name of the string type, for stats. | 
|  | const char* | 
|  | string_name(); | 
|  |  | 
|  | // As we see input sections, we build a mapping from object, section | 
|  | // index and offset to strings. | 
|  | struct Merged_string | 
|  | { | 
|  | // The offset in the input section. | 
|  | section_offset_type offset; | 
|  | // The key in the Stringpool. | 
|  | Stringpool::Key stringpool_key; | 
|  |  | 
|  | Merged_string(section_offset_type offseta, Stringpool::Key stringpool_keya) | 
|  | : offset(offseta), stringpool_key(stringpool_keya) | 
|  | { } | 
|  | }; | 
|  |  | 
|  | typedef std::vector<Merged_string> Merged_strings; | 
|  |  | 
|  | struct Merged_strings_list | 
|  | { | 
|  | // The input object where the strings were found. | 
|  | Relobj* object; | 
|  | // The input section in the input object. | 
|  | unsigned int shndx; | 
|  | // The list of merged strings. | 
|  | Merged_strings merged_strings; | 
|  |  | 
|  | Merged_strings_list(Relobj* objecta, unsigned int shndxa) | 
|  | : object(objecta), shndx(shndxa), merged_strings() | 
|  | { } | 
|  | }; | 
|  |  | 
|  | typedef std::vector<Merged_strings_list*> Merged_strings_lists; | 
|  |  | 
|  | // As we see the strings, we add them to a Stringpool. | 
|  | Stringpool_template<Char_type> stringpool_; | 
|  | // Map from a location in an input object to an entry in the | 
|  | // Stringpool. | 
|  | Merged_strings_lists merged_strings_lists_; | 
|  | // The number of entries seen in input files. | 
|  | size_t input_count_; | 
|  | // The total size of input sections. | 
|  | size_t input_size_; | 
|  | }; | 
|  |  | 
|  | } // End namespace gold. | 
|  |  | 
|  | #endif // !defined(GOLD_MERGE_H) |