| // script.h -- handle linker scripts for gold -*- C++ -*- |
| |
| // Copyright (C) 2006-2024 Free Software Foundation, Inc. |
| // Written by Ian Lance Taylor <iant@google.com>. |
| |
| // This file is part of gold. |
| |
| // This program is free software; you can redistribute it and/or modify |
| // it under the terms of the GNU General Public License as published by |
| // the Free Software Foundation; either version 3 of the License, or |
| // (at your option) any later version. |
| |
| // This program is distributed in the hope that it will be useful, |
| // but WITHOUT ANY WARRANTY; without even the implied warranty of |
| // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
| // GNU General Public License for more details. |
| |
| // You should have received a copy of the GNU General Public License |
| // along with this program; if not, write to the Free Software |
| // Foundation, Inc., 51 Franklin Street - Fifth Floor, Boston, |
| // MA 02110-1301, USA. |
| |
| // We implement a subset of the original GNU ld linker script language |
| // for compatibility. The goal is not to implement the entire |
| // language. It is merely to implement enough to handle common uses. |
| // In particular we need to handle /usr/lib/libc.so on a typical |
| // GNU/Linux system, and we want to handle linker scripts used by the |
| // Linux kernel build. |
| |
| #ifndef GOLD_SCRIPT_H |
| #define GOLD_SCRIPT_H |
| |
| #include <cstdio> |
| #include <string> |
| #include <vector> |
| |
| #include "elfcpp.h" |
| #include "script-sections.h" |
| |
| namespace gold |
| { |
| |
| class General_options; |
| class Command_line; |
| class Symbol_table; |
| class Layout; |
| class Mapfile; |
| class Input_argument; |
| class Input_arguments; |
| class Input_objects; |
| class Input_group; |
| class Input_file; |
| class Output_segment; |
| class Task_token; |
| class Workqueue; |
| struct Version_dependency_list; |
| struct Version_expression_list; |
| struct Version_tree; |
| struct Version_expression; |
| class Lazy_demangler; |
| class Incremental_script_entry; |
| |
| // This class represents an expression in a linker script. |
| |
| class Expression |
| { |
| protected: |
| // These should only be created by child classes. |
| Expression() |
| { } |
| |
| public: |
| virtual ~Expression() |
| { } |
| |
| // Return the value of the expression which is not permitted to |
| // refer to the dot symbol. CHECK_ASSERTIONS is true if we should |
| // check whether assertions are true. |
| uint64_t |
| eval(const Symbol_table*, const Layout*, bool check_assertions); |
| |
| // Return the value of an expression which is permitted to refer to |
| // the dot symbol. DOT_VALUE is the absolute value of the dot |
| // symbol. DOT_SECTION is the section in which dot is defined; it |
| // should be NULL if the dot symbol has an absolute value (e.g., is |
| // defined in a SECTIONS clause outside of any output section |
| // definition). This sets *RESULT_SECTION to indicate where the |
| // value is defined. If the value is absolute *RESULT_SECTION will |
| // be NULL. Note that the returned value is still an absolute |
| // value; to get a section relative value the caller must subtract |
| // the section address. If RESULT_ALIGNMENT is not NULL, this sets |
| // *RESULT_ALIGNMENT to the alignment of the value of that alignment |
| // is larger than *RESULT_ALIGNMENT; this will only be non-zero if |
| // this is an ALIGN expression. If IS_SECTION_DOT_ASSIGMENT is true, |
| // we are evaluating an assignment to dot within an output section, |
| // and an absolute value should be interpreted as an offset within |
| // the section. |
| uint64_t |
| eval_with_dot(const Symbol_table*, const Layout*, bool check_assertions, |
| uint64_t dot_value, Output_section* dot_section, |
| Output_section** result_section, uint64_t* result_alignment, |
| bool is_section_dot_assignment); |
| |
| // Return the value of an expression which may or may not be |
| // permitted to refer to the dot symbol, depending on |
| // is_dot_available. If IS_SECTION_DOT_ASSIGMENT is true, |
| // we are evaluating an assignment to dot within an output section, |
| // and an absolute value should be interpreted as an offset within |
| // the section. |
| uint64_t |
| eval_maybe_dot(const Symbol_table*, const Layout*, bool check_assertions, |
| bool is_dot_available, uint64_t dot_value, |
| Output_section* dot_section, |
| Output_section** result_section, uint64_t* result_alignment, |
| elfcpp::STT* type, elfcpp::STV* vis, unsigned char* nonvis, |
| bool is_section_dot_assignment, bool* is_valid_pointer); |
| |
| // Print the expression to the FILE. This is for debugging. |
| virtual void |
| print(FILE*) const = 0; |
| |
| protected: |
| struct Expression_eval_info; |
| |
| public: |
| // Compute the value of the expression (implemented by child class). |
| // This is public rather than protected because it is called |
| // directly by children of Expression on other Expression objects. |
| virtual uint64_t |
| value(const Expression_eval_info*) = 0; |
| |
| // Sets all symbols used in expressions as seen in a real ELF object. |
| virtual void |
| set_expr_sym_in_real_elf(Symbol_table*) const |
| { return; } |
| |
| private: |
| // May not be copied. |
| Expression(const Expression&); |
| Expression& operator=(const Expression&); |
| }; |
| |
| // Version_script_info stores information parsed from the version |
| // script, either provided by --version-script or as part of a linker |
| // script. A single Version_script_info object per target is owned by |
| // Script_options. |
| |
| class Version_script_info |
| { |
| public: |
| // The languages which can be specified in a versionn script. |
| enum Language |
| { |
| LANGUAGE_C, // No demangling. |
| LANGUAGE_CXX, // C++ demangling. |
| LANGUAGE_JAVA, // Java demangling. |
| LANGUAGE_COUNT |
| }; |
| |
| Version_script_info(); |
| |
| ~Version_script_info(); |
| |
| // Clear everything. |
| void |
| clear(); |
| |
| // Finalize the version control information. |
| void |
| finalize(); |
| |
| // Return whether the information is finalized. |
| bool |
| is_finalized() const |
| { return this->is_finalized_; } |
| |
| // Return whether any version were defined in the version script. |
| bool |
| empty() const |
| { return this->version_trees_.empty(); } |
| |
| // If there is a version associated with SYMBOL, return true, and |
| // set *VERSION to the version, and *IS_GLOBAL to whether the symbol |
| // should be global. Otherwise, return false. |
| bool |
| get_symbol_version(const char* symbol, std::string* version, |
| bool* is_global) const; |
| |
| // Return whether this symbol matches the local: section of some |
| // version. |
| bool |
| symbol_is_local(const char* symbol) const |
| { |
| bool is_global; |
| return (this->get_symbol_version(symbol, NULL, &is_global) |
| && !is_global); |
| } |
| |
| // Return the names of versions defined in the version script. |
| std::vector<std::string> |
| get_versions() const; |
| |
| // Return the list of dependencies for this version. |
| std::vector<std::string> |
| get_dependencies(const char* version) const; |
| |
| // The following functions should only be used by the bison helper |
| // functions. They allocate new structs whose memory belongs to |
| // Version_script_info. The bison functions copy the information |
| // from the version script into these structs. |
| struct Version_dependency_list* |
| allocate_dependency_list(); |
| |
| struct Version_expression_list* |
| allocate_expression_list(); |
| |
| struct Version_tree* |
| allocate_version_tree(); |
| |
| // Build the lookup tables after all data have been read. |
| void |
| build_lookup_tables(); |
| |
| // Give an error if there are any unmatched names in the version |
| // script. |
| void |
| check_unmatched_names(const Symbol_table*) const; |
| |
| // Print contents to the FILE. This is for debugging. |
| void |
| print(FILE*) const; |
| |
| private: |
| void |
| print_expression_list(FILE* f, const Version_expression_list*) const; |
| |
| bool |
| get_symbol_version_helper(const char* symbol, |
| bool check_global, |
| std::string* pversion) const; |
| |
| // Fast lookup information for a given language. |
| |
| // We map from exact match strings to Version_tree's. Historically |
| // version scripts sometimes have the same symbol multiple times, |
| // which is ambiguous. We warn about that case by storing the |
| // second Version_tree we see. |
| struct Version_tree_match |
| { |
| Version_tree_match(const Version_tree* r, bool ig, |
| const Version_expression* e) |
| : real(r), is_global(ig), expression(e), ambiguous(NULL) |
| { } |
| |
| // The Version_tree that we return. |
| const Version_tree* real; |
| // True if this is a global match for the REAL member, false if it |
| // is a local match. |
| bool is_global; |
| // Point back to the Version_expression for which we created this |
| // match. |
| const Version_expression* expression; |
| // If not NULL, another Version_tree that defines the symbol. |
| const Version_tree* ambiguous; |
| }; |
| |
| // Map from an exact match string to a Version_tree. |
| |
| typedef Unordered_map<std::string, Version_tree_match> Exact; |
| |
| // Fast lookup information for a glob pattern. |
| struct Glob |
| { |
| Glob() |
| : expression(NULL), version(NULL), is_global(false) |
| { } |
| |
| Glob(const Version_expression* e, const Version_tree* v, bool ig) |
| : expression(e), version(v), is_global(ig) |
| { } |
| |
| // A pointer to the version expression holding the pattern to |
| // match and the language to use for demangling the symbol before |
| // doing the match. |
| const Version_expression* expression; |
| // The Version_tree we use if this pattern matches. |
| const Version_tree* version; |
| // True if this is a global symbol. |
| bool is_global; |
| }; |
| |
| typedef std::vector<Glob> Globs; |
| |
| bool |
| unquote(std::string*) const; |
| |
| void |
| add_exact_match(const std::string&, const Version_tree*, bool is_global, |
| const Version_expression*, Exact*); |
| |
| void |
| build_expression_list_lookup(const Version_expression_list*, |
| const Version_tree*, bool); |
| |
| const char* |
| get_name_to_match(const char*, int, |
| Lazy_demangler*, Lazy_demangler*) const; |
| |
| // All the version dependencies we allocate. |
| std::vector<Version_dependency_list*> dependency_lists_; |
| // All the version expressions we allocate. |
| std::vector<Version_expression_list*> expression_lists_; |
| // The list of versions. |
| std::vector<Version_tree*> version_trees_; |
| // Exact matches for global symbols, by language. |
| Exact* exact_[LANGUAGE_COUNT]; |
| // A vector of glob patterns mapping to Version_trees. |
| Globs globs_; |
| // The default version to use, if there is one. This is from a |
| // pattern of "*". |
| const Version_tree* default_version_; |
| // True if the default version is global. |
| bool default_is_global_; |
| // Whether this has been finalized. |
| bool is_finalized_; |
| }; |
| |
| // This class manages assignments to symbols. These can appear in |
| // three different locations in scripts: outside of a SECTIONS clause, |
| // within a SECTIONS clause, and within an output section definition |
| // within a SECTIONS clause. This can also appear on the command line |
| // via the --defsym command line option. |
| |
| class Symbol_assignment |
| { |
| public: |
| Symbol_assignment(const char* name, size_t namelen, bool is_defsym, |
| Expression* val, bool provide, bool hidden) |
| : name_(name, namelen), val_(val), is_defsym_(is_defsym), |
| provide_(provide), hidden_(hidden), sym_(NULL) |
| { } |
| |
| // Add the symbol to the symbol table. |
| void |
| add_to_table(Symbol_table*); |
| |
| // Finalize the symbol value. |
| void |
| finalize(Symbol_table*, const Layout*); |
| |
| bool |
| is_defsym() const |
| { return is_defsym_; } |
| |
| Expression * |
| value() const |
| { return val_; } |
| |
| // Finalize the symbol value when it can refer to the dot symbol. |
| void |
| finalize_with_dot(Symbol_table*, const Layout*, uint64_t dot_value, |
| Output_section* dot_section); |
| |
| // Set the symbol value, but only if the value is absolute or relative to |
| // DOT_SECTION. This is used while processing a SECTIONS clause. |
| // We assume that dot is an absolute value here. We do not check assertions. |
| void |
| set_if_absolute(Symbol_table*, const Layout*, bool is_dot_available, |
| uint64_t dot_value, Output_section* dot_section); |
| |
| const std::string& |
| name() const |
| { return this->name_; } |
| |
| // Print the assignment to the FILE. This is for debugging. |
| void |
| print(FILE*) const; |
| |
| private: |
| // Shared by finalize and finalize_with_dot. |
| void |
| finalize_maybe_dot(Symbol_table*, const Layout*, bool is_dot_available, |
| uint64_t dot_value, Output_section* dot_section); |
| |
| // Sized version of finalize. |
| template<int size> |
| void |
| sized_finalize(Symbol_table*, const Layout*, bool is_dot_available, |
| uint64_t dot_value, Output_section*); |
| |
| // Symbol name. |
| std::string name_; |
| // Expression to assign to symbol. |
| Expression* val_; |
| // True if this symbol is defined by a --defsym, false if it is |
| // defined in a linker script. |
| bool is_defsym_; |
| // Whether the assignment should be provided (only set if there is |
| // an undefined reference to the symbol. |
| bool provide_; |
| // Whether the assignment should be hidden. |
| bool hidden_; |
| // The entry in the symbol table. |
| Symbol* sym_; |
| }; |
| |
| // This class manages assertions in linker scripts. These can appear |
| // in all the places where a Symbol_assignment can appear. |
| |
| class Script_assertion |
| { |
| public: |
| Script_assertion(Expression* check, const char* message, |
| size_t messagelen) |
| : check_(check), message_(message, messagelen) |
| { } |
| |
| // Check the assertion. |
| void |
| check(const Symbol_table*, const Layout*); |
| |
| // Print the assertion to the FILE. This is for debugging. |
| void |
| print(FILE*) const; |
| |
| private: |
| // The expression to check. |
| Expression* check_; |
| // The message to issue if the expression fails. |
| std::string message_; |
| }; |
| |
| // We can read a linker script in two different contexts: when |
| // initially parsing the command line, and when we find an input file |
| // which is actually a linker script. Also some of the data which can |
| // be set by a linker script can also be set via command line options |
| // like -e and --defsym. This means that we have a type of data which |
| // can be set both during command line option parsing and while |
| // reading input files. We store that data in an instance of this |
| // object. We will keep pointers to that instance in both the |
| // Command_line and Layout objects. |
| |
| class Script_options |
| { |
| public: |
| Script_options(); |
| |
| // Add a symbol to be defined. |
| void |
| add_symbol_assignment(const char* name, size_t length, bool is_defsym, |
| Expression* value, bool provide, bool hidden); |
| |
| // Look for an assigned symbol. |
| bool |
| is_pending_assignment(const char* name); |
| |
| // Add a reference to a symbol. |
| void |
| add_symbol_reference(const char* name, size_t length); |
| |
| // Add an assertion. |
| void |
| add_assertion(Expression* check, const char* message, size_t messagelen); |
| |
| // Define a symbol from the command line. |
| bool |
| define_symbol(const char* definition); |
| |
| // Populates the set with symbol names used in LHS of defsym. |
| void |
| find_defsym_defs(Unordered_set<std::string>&); |
| |
| // Set symbols used in defsym expressions as seen in a real ELF object. |
| void set_defsym_uses_in_real_elf(Symbol_table*) const; |
| |
| // Create sections required by any linker scripts. |
| void |
| create_script_sections(Layout*); |
| |
| // Add all symbol definitions to the symbol table. |
| void |
| add_symbols_to_table(Symbol_table*); |
| |
| // Used to iterate over symbols which are referenced in expressions |
| // but not defined. |
| typedef Unordered_set<std::string>::const_iterator referenced_const_iterator; |
| |
| referenced_const_iterator |
| referenced_begin() const |
| { return this->symbol_references_.begin(); } |
| |
| referenced_const_iterator |
| referenced_end() const |
| { return this->symbol_references_.end(); } |
| |
| // Return whether a symbol is referenced but not defined. |
| bool |
| is_referenced(const std::string& name) const |
| { |
| return (this->symbol_references_.find(name) |
| != this->symbol_references_.end()); |
| } |
| |
| // Return whether there are any symbols which were referenced but |
| // not defined. |
| bool |
| any_unreferenced() const |
| { return !this->symbol_references_.empty(); } |
| |
| // Finalize the symbol values. Also check assertions. |
| void |
| finalize_symbols(Symbol_table*, const Layout*); |
| |
| // Version information parsed from a version script. Everything |
| // else has a pointer to this object. |
| Version_script_info* |
| version_script_info() |
| { return &this->version_script_info_; } |
| |
| const Version_script_info* |
| version_script_info() const |
| { return &this->version_script_info_; } |
| |
| // A SECTIONS clause parsed from a linker script. Everything else |
| // has a pointer to this object. |
| Script_sections* |
| script_sections() |
| { return &this->script_sections_; } |
| |
| const Script_sections* |
| script_sections() const |
| { return &this->script_sections_; } |
| |
| // Whether we saw a SECTIONS clause. |
| bool |
| saw_sections_clause() const |
| { return this->script_sections_.saw_sections_clause(); } |
| |
| // Whether we saw a PHDRS clause. |
| bool |
| saw_phdrs_clause() const |
| { return this->script_sections_.saw_phdrs_clause(); } |
| |
| // Set section addresses using a SECTIONS clause. Return the |
| // segment which should hold the file header and segment headers; |
| // this may return NULL, in which case the headers are not in a |
| // loadable segment. |
| Output_segment* |
| set_section_addresses(Symbol_table*, Layout*); |
| |
| // Print the script to the FILE. This is for debugging. |
| void |
| print(FILE*) const; |
| |
| private: |
| // We keep a list of symbol assignments which occur outside of a |
| // SECTIONS clause. |
| typedef std::vector<Symbol_assignment*> Symbol_assignments; |
| |
| // We keep a list of all assertions which occur outside of a |
| // SECTIONS clause. |
| typedef std::vector<Script_assertion*> Assertions; |
| |
| // The entry address. This will be empty if not set. |
| std::string entry_; |
| // Symbols to set. |
| Symbol_assignments symbol_assignments_; |
| // Symbols defined in an expression, for faster lookup. |
| Unordered_set<std::string> symbol_definitions_; |
| // Symbols referenced in an expression. |
| Unordered_set<std::string> symbol_references_; |
| // Assertions to check. |
| Assertions assertions_; |
| // Version information parsed from a version script. |
| Version_script_info version_script_info_; |
| // Information from any SECTIONS clauses. |
| Script_sections script_sections_; |
| }; |
| |
| // FILE was found as an argument on the command line, but was not |
| // recognized as an ELF file. Try to read it as a script. Return |
| // true if the file was handled. This has to handle /usr/lib/libc.so |
| // on a GNU/Linux system. *USED_NEXT_BLOCKER is set to indicate |
| // whether the function took over NEXT_BLOCKER. |
| |
| bool |
| read_input_script(Workqueue*, Symbol_table*, Layout*, Dirsearch*, int, |
| Input_objects*, Mapfile*, Input_group*, |
| const Input_argument*, Input_file*, |
| Task_token* next_blocker, bool* used_next_blocker); |
| |
| // FILE was found as an argument to --script (-T). |
| // Read it as a script, and execute its contents immediately. |
| |
| bool |
| read_commandline_script(const char* filename, Command_line* cmdline); |
| |
| // FILE was found as an argument to --version-script. Read it as a |
| // version script, and store its contents in |
| // cmdline->script_options()->version_script_info(). |
| |
| bool |
| read_version_script(const char* filename, Command_line* cmdline); |
| |
| // FILENAME was found as an argument to --dynamic-list. Read it as a |
| // version script (actually, a versym_node from a version script), and |
| // store its contents in DYNAMIC_LIST. |
| |
| bool |
| read_dynamic_list(const char* filename, Command_line* cmdline, |
| Script_options* dynamic_list); |
| |
| } // End namespace gold. |
| |
| #endif // !defined(GOLD_SCRIPT_H) |