123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515 |
- // merge.h -- handle section merging for gold -*- C++ -*-
- // Copyright (C) 2006-2015 Free Software Foundation, Inc.
- // Written by Ian Lance Taylor <iant@google.com>.
- // This file is part of gold.
- // This program is free software; you can redistribute it and/or modify
- // it under the terms of the GNU General Public License as published by
- // the Free Software Foundation; either version 3 of the License, or
- // (at your option) any later version.
- // This program is distributed in the hope that it will be useful,
- // but WITHOUT ANY WARRANTY; without even the implied warranty of
- // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- // GNU General Public License for more details.
- // You should have received a copy of the GNU General Public License
- // along with this program; if not, write to the Free Software
- // Foundation, Inc., 51 Franklin Street - Fifth Floor, Boston,
- // MA 02110-1301, USA.
- #ifndef GOLD_MERGE_H
- #define GOLD_MERGE_H
- #include <climits>
- #include <map>
- #include <vector>
- #include "stringpool.h"
- #include "output.h"
- namespace gold
- {
- // For each object with merge sections, we store an Object_merge_map.
- // This is used to map locations in input sections to a merged output
- // section. The output section itself is not recorded here--it can be
- // found in the output_sections_ field of the Object.
- class Object_merge_map
- {
- public:
- Object_merge_map()
- : section_merge_maps_()
- { }
- ~Object_merge_map();
- // Add a mapping for MERGE_MAP (the first, unnamed argument), for the
- // bytes from OFFSET to OFFSET + LENGTH in the input section SHNDX to
- // OUTPUT_OFFSET in the output section. An OUTPUT_OFFSET of -1 means
- // that the bytes are discarded. OUTPUT_OFFSET is relative to the
- // start of the merged data in the output section.
- void
- add_mapping(const Output_section_data*, unsigned int shndx,
- section_offset_type offset, section_size_type length,
- section_offset_type output_offset);
- // Get the output offset for an input address. The input address
- // is at offset OFFSET in section SHNDX. This sets *OUTPUT_OFFSET
- // to the offset in the output section; this will be -1 if the bytes
- // are not being copied to the output. This returns true if the
- // mapping is known, false otherwise. *OUTPUT_OFFSET is relative to
- // the start of the merged data in the output section. There is no
- // MERGE_MAP argument; the input section is identified by SHNDX alone.
- bool
- get_output_offset(unsigned int shndx,
- section_offset_type offset,
- section_offset_type* output_offset);
- const Output_section_data*
- find_merge_section(unsigned int shndx) const;  // NOTE(review): presumably the merge data recorded for SHNDX, NULL if none -- confirm.
- // Initialize a mapping from input offsets to output addresses for
- // section SHNDX; the map to fill is the last (unnamed) argument.
- // STARTING_ADDRESS is the output address of the merged section.
- template<int size>
- void
- initialize_input_to_output_map(
- unsigned int shndx,
- typename elfcpp::Elf_types<size>::Elf_Addr starting_address,
- Unordered_map<section_offset_type,
- typename elfcpp::Elf_types<size>::Elf_Addr>*);
- // Map input section offsets to a length and an output section
- // offset. An output section offset of -1 means that this part of
- // the input section is being discarded.
- struct Input_merge_entry
- {
- // The offset in the input section.
- section_offset_type input_offset;
- // The length.
- section_size_type length;
- // The offset in the output section.
- section_offset_type output_offset;
- };
- // A list of entries for a particular input section.
- struct Input_merge_map
- {
- void add_mapping(section_offset_type input_offset, section_size_type length,
- section_offset_type output_offset);  // NOTE(review): presumably appends an Input_merge_entry to ENTRIES -- confirm.
- typedef std::vector<Input_merge_entry> Entries;
- // We store these with the Relobj, and we look them up by input
- // section. It is possible to have two different merge maps
- // associated with a single output section. For example, this
- // happens routinely with .rodata, when merged string constants
- // and merged fixed size constants are both put into .rodata. The
- // output offset that we store is not the offset from the start of
- // the output section; it is the offset from the start of the
- // merged data in the output section. That means that the caller
- // is going to add the offset of the merged data within the output
- // section, which means that the caller needs to know which set of
- // merged data it found the entry in. So it's not enough to find
- // this data based on the input section and the output section; we
- // also have to find it based on a set of merged data in the
- // output section. In order to verify that we are looking at the
- // right data, we store a pointer to the merged data (the
- // Output_section_data these comments call MERGE_MAP) here.
- // NOTE(review): the text here used to describe callers passing in
- // a pointer to compare against; get_output_offset as declared in
- // this class takes no such pointer -- confirm how this is checked.
- const Output_section_data* output_data;
- // The list of mappings.
- Entries entries;
- // Whether the ENTRIES field is sorted by input_offset.
- bool sorted;
- Input_merge_map()
- : output_data(NULL), entries(), sorted(true)
- { }
- };
- // Get or make the Input_merge_map to use for the section SHNDX
- // with MERGE_MAP.
- Input_merge_map*
- get_or_make_input_merge_map(const Output_section_data* merge_map,
- unsigned int shndx);
- private:
- // A less-than comparison routine for Input_merge_entry; it orders
- // entries by input_offset only.
- struct Input_merge_compare
- {
- bool
- operator()(const Input_merge_entry& i1, const Input_merge_entry& i2) const
- { return i1.input_offset < i2.input_offset; }
- };
- // Map input section indices to merge maps.
- typedef std::vector<std::pair<unsigned int, Input_merge_map*> >
- Section_merge_maps;
- // Return a pointer to the Input_merge_map to use for the input
- // section SHNDX, or NULL.
- const Input_merge_map*
- get_input_merge_map(unsigned int shndx) const;
- Input_merge_map *  // Non-const overload: reuses the const lookup and casts away constness of the result.
- get_input_merge_map(unsigned int shndx) {
- return const_cast<Input_merge_map *>(static_cast<const Object_merge_map *>(
- this)->get_input_merge_map(shndx));
- }
- Section_merge_maps section_merge_maps_;  // The (section index, merge map) pairs for this object.
- };
- // A general class for SHF_MERGE data, to hold functions shared by
- // fixed-size constant data and string data.
- class Output_merge_base : public Output_section_data
- {
- public:
- Output_merge_base(uint64_t entsize, uint64_t addralign)
- : Output_section_data(addralign), entsize_(entsize),
- keeps_input_sections_(false), first_relobj_(NULL), first_shndx_(-1),
- input_sections_()
- { }
- // Return the entry size.
- uint64_t
- entsize() const
- { return this->entsize_; }
- // Whether this is a merge string section. This is only true of
- // Output_merge_string.
- bool
- is_string()
- { return this->do_is_string(); }
- // Whether this keeps input sections.
- bool
- keeps_input_sections() const
- { return this->keeps_input_sections_; }
- // Set the keeps-input-sections flag. This forwards to the virtual
- // do_set_keeps_input_sections so that sub-classes can perform additional checks.
- void
- set_keeps_input_sections()
- { this->do_set_keeps_input_sections(); }
- // Return the object of the first merged input section. This is used
- // for script processing. This is NULL if merge section is empty.
- Relobj*
- first_relobj() const
- { return this->first_relobj_; }
- // Return the section index of the first merged input section. This
- // is used for script processing. This is valid only if merge section
- // is not empty; it asserts that first_relobj_ is not NULL.
- unsigned int
- first_shndx() const
- {
- gold_assert(this->first_relobj_ != NULL);
- return this->first_shndx_;
- }
- 
- // Set of merged input sections.
- typedef Unordered_set<Section_id, Section_id_hash> Input_sections;
- // Beginning of merged input sections. Asserts keeps_input_sections_.
- Input_sections::const_iterator
- input_sections_begin() const
- {
- gold_assert(this->keeps_input_sections_);
- return this->input_sections_.begin();
- }
- // End of merged input sections. Asserts keeps_input_sections_.
- Input_sections::const_iterator
- input_sections_end() const
- {
- gold_assert(this->keeps_input_sections_);
- return this->input_sections_.end();
- }
- 
- protected:
- // Return the output offset for an input offset.
- bool
- do_output_offset(const Relobj* object, unsigned int shndx,
- section_offset_type offset,
- section_offset_type* poutput) const;
- // This may be overridden by the child class. The default is false.
- virtual bool
- do_is_string()
- { return false; }
- // This may be overridden by the child class. The default just sets the flag.
- virtual void
- do_set_keeps_input_sections()
- { this->keeps_input_sections_ = true; }
- // Record the merged input section for script processing.
- void
- record_input_section(Relobj* relobj, unsigned int shndx);
- private:
- // The entry size. For fixed-size constants, this is the size of
- // the constants. For strings, this is the size of a character.
- uint64_t entsize_;
- // Whether we keep input sections.
- bool keeps_input_sections_;
- // Object of the first merged input section. We use this for script
- // processing.
- Relobj* first_relobj_;
- // Section index of the first merged input section.
- unsigned int first_shndx_;
- // Input sections. We only keep them if keeps_input_sections_ is true.
- Input_sections input_sections_;
- };
- // Handle SHF_MERGE sections with fixed-size constant data.
- class Output_merge_data : public Output_merge_base
- {
- public:
- Output_merge_data(uint64_t entsize, uint64_t addralign)
- : Output_merge_base(entsize, addralign), p_(NULL), len_(0), alc_(0),
- input_count_(0),
- hashtable_(128, Merge_data_hash(this), Merge_data_eq(this))
- { }
- protected:
- // Add an input section.
- bool
- do_add_input_section(Relobj* object, unsigned int shndx);
- // Set the final data size.
- void
- set_final_data_size();
- // Write the data to the file.
- void
- do_write(Output_file*);
- // Write the data to a buffer.
- void
- do_write_to_buffer(unsigned char*);
- // Write to a map file.
- void
- do_print_to_mapfile(Mapfile* mapfile) const
- { mapfile->print_output_data(this, _("** merge constants")); }
- // Print merge stats to stderr.
- void
- do_print_merge_stats(const char* section_name);
- // Set keeps-input-sections flag. Asserts that input_count_ is still zero.
- void
- do_set_keeps_input_sections()
- {
- gold_assert(this->input_count_ == 0);
- Output_merge_base::do_set_keeps_input_sections();
- }
- private:
- // We build a hash table of the fixed-size constants. Each constant
- // is stored as an offset into the section data we are accumulating.
- // A key in the hash table. This is an offset in the section
- // contents we are building.
- typedef section_offset_type Merge_data_key;
- // Compute the hash code. To do this we need a pointer back to the
- // object holding the data.
- class Merge_data_hash
- {
- public:
- Merge_data_hash(const Output_merge_data* pomd)
- : pomd_(pomd)
- { }
- size_t
- operator()(Merge_data_key) const;
- private:
- const Output_merge_data* pomd_;
- };
- friend class Merge_data_hash;
- // Compare two entries in the hash table for equality. To do this
- // we need a pointer back to the object holding the data. Note that
- // we now have a pointer to the object stored in two places in the
- // hash table. Fixing this would require specializing the hash
- // table, which would be hard to do portably.
- class Merge_data_eq
- {
- public:
- Merge_data_eq(const Output_merge_data* pomd)
- : pomd_(pomd)
- { }
- bool
- operator()(Merge_data_key k1, Merge_data_key k2) const;
- private:
- const Output_merge_data* pomd_;
- };
- friend class Merge_data_eq;
- // The type of the hash table.
- typedef Unordered_set<Merge_data_key, Merge_data_hash, Merge_data_eq>
- Merge_data_hashtable;
- // Given a hash table key, which is just an offset into the section
- // data, return a pointer to the corresponding constant. Asserts 0 <= K < len_.
- const unsigned char*
- constant(Merge_data_key k) const
- {
- gold_assert(k >= 0 && k < static_cast<section_offset_type>(this->len_));
- return this->p_ + k;
- }
- // Add a constant to the output.
- void
- add_constant(const unsigned char*);
- // The accumulated data.
- unsigned char* p_;
- // The length of the accumulated data.
- section_size_type len_;
- // The size of the allocated buffer.
- section_size_type alc_;
- // The number of entries seen in input files.
- size_t input_count_;
- // The hash table.
- Merge_data_hashtable hashtable_;
- };
- // Handle SHF_MERGE sections with string data. This is a template
- // based on the type of the characters in the string.
- template<typename Char_type>
- class Output_merge_string : public Output_merge_base
- {
- public:
- Output_merge_string(uint64_t addralign)
- : Output_merge_base(sizeof(Char_type), addralign), stringpool_(addralign),
- merged_strings_lists_(), input_count_(0), input_size_(0)
- {
- this->stringpool_.set_no_zero_null();
- }
- protected:
- // Add an input section.
- bool
- do_add_input_section(Relobj* object, unsigned int shndx);
- // Do all the final processing after the input sections are read in.
- // Returns the final data size.
- section_size_type
- finalize_merged_data();
- // Set the final data size.
- void
- set_final_data_size();
- // Write the data to the file.
- void
- do_write(Output_file*);
- // Write the data to a buffer.
- void
- do_write_to_buffer(unsigned char*);
- // Write to a map file.
- void
- do_print_to_mapfile(Mapfile* mapfile) const
- { mapfile->print_output_data(this, _("** merge strings")); }
- // Print merge stats to stderr.
- void
- do_print_merge_stats(const char* section_name);
- // Writes the stringpool to a buffer of BUFFER_SIZE bytes at BUFFER.
- void
- stringpool_to_buffer(unsigned char* buffer, section_size_type buffer_size)
- { this->stringpool_.write_to_buffer(buffer, buffer_size); }
- // Clears all the data in the stringpool, to save on memory.
- void
- clear_stringpool()
- { this->stringpool_.clear(); }
- // Whether this is a merge string section. Always true for this class.
- virtual bool
- do_is_string()
- { return true; }
- // Set keeps-input-sections flag. Asserts that input_count_ is still zero.
- void
- do_set_keeps_input_sections()
- {
- gold_assert(this->input_count_ == 0);
- Output_merge_base::do_set_keeps_input_sections();
- }
- private:
- // The name of the string type, for stats.
- const char*
- string_name();
- // As we see input sections, we build a mapping from object, section
- // index and offset to strings.
- struct Merged_string
- {
- // The offset in the input section.
- section_offset_type offset;
- // The key in the Stringpool.
- Stringpool::Key stringpool_key;
- Merged_string(section_offset_type offseta, Stringpool::Key stringpool_keya)
- : offset(offseta), stringpool_key(stringpool_keya)
- { }
- };
- typedef std::vector<Merged_string> Merged_strings;
- struct Merged_strings_list  // The merged strings found in one input section of one object.
- {
- // The input object where the strings were found.
- Relobj* object;
- // The input section in the input object.
- unsigned int shndx;
- // The list of merged strings.
- Merged_strings merged_strings;
- Merged_strings_list(Relobj* objecta, unsigned int shndxa)
- : object(objecta), shndx(shndxa), merged_strings()
- { }
- };
- typedef std::vector<Merged_strings_list*> Merged_strings_lists;
- // As we see the strings, we add them to a Stringpool.
- Stringpool_template<Char_type> stringpool_;
- // Map from a location in an input object to an entry in the
- // Stringpool.
- Merged_strings_lists merged_strings_lists_;
- // The number of entries seen in input files.
- size_t input_count_;
- // The total size of input sections.
- size_t input_size_;
- };
- } // End namespace gold.
- #endif // !defined(GOLD_MERGE_H)
|