|  | // script.h -- handle linker scripts for gold   -*- C++ -*- | 
|  |  | 
|  | // Copyright (C) 2006-2023 Free Software Foundation, Inc. | 
|  | // Written by Ian Lance Taylor <iant@google.com>. | 
|  |  | 
|  | // This file is part of gold. | 
|  |  | 
|  | // This program is free software; you can redistribute it and/or modify | 
|  | // it under the terms of the GNU General Public License as published by | 
|  | // the Free Software Foundation; either version 3 of the License, or | 
|  | // (at your option) any later version. | 
|  |  | 
|  | // This program is distributed in the hope that it will be useful, | 
|  | // but WITHOUT ANY WARRANTY; without even the implied warranty of | 
|  | // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the | 
|  | // GNU General Public License for more details. | 
|  |  | 
|  | // You should have received a copy of the GNU General Public License | 
|  | // along with this program; if not, write to the Free Software | 
|  | // Foundation, Inc., 51 Franklin Street - Fifth Floor, Boston, | 
|  | // MA 02110-1301, USA. | 
|  |  | 
|  | // We implement a subset of the original GNU ld linker script language | 
|  | // for compatibility.  The goal is not to implement the entire | 
|  | // language.  It is merely to implement enough to handle common uses. | 
|  | // In particular we need to handle /usr/lib/libc.so on a typical | 
|  | // GNU/Linux system, and we want to handle linker scripts used by the | 
|  | // Linux kernel build. | 
|  |  | 
|  | #ifndef GOLD_SCRIPT_H | 
|  | #define GOLD_SCRIPT_H | 
|  |  | 
|  | #include <cstdio> | 
|  | #include <string> | 
|  | #include <vector> | 
|  |  | 
|  | #include "elfcpp.h" | 
|  | #include "script-sections.h" | 
|  |  | 
|  | namespace gold | 
|  | { | 
|  |  | 
|  | class General_options; | 
|  | class Command_line; | 
|  | class Symbol_table; | 
|  | class Layout; | 
|  | class Mapfile; | 
|  | class Input_argument; | 
|  | class Input_arguments; | 
|  | class Input_objects; | 
|  | class Input_group; | 
|  | class Input_file; | 
|  | class Output_segment; | 
|  | class Task_token; | 
|  | class Workqueue; | 
|  | struct Version_dependency_list; | 
|  | struct Version_expression_list; | 
|  | struct Version_tree; | 
|  | struct Version_expression; | 
|  | class Lazy_demangler; | 
|  | class Incremental_script_entry; | 
|  |  | 
|  | // This class represents an expression in a linker script. | 
|  |  | 
|  | class Expression | 
|  | { | 
|  | protected: | 
|  | // These should only be created by child classes. | 
|  | Expression() | 
|  | { } | 
|  |  | 
|  | public: | 
|  | virtual ~Expression() | 
|  | { } | 
|  |  | 
|  | // Return the value of the expression which is not permitted to | 
|  | // refer to the dot symbol.  CHECK_ASSERTIONS is true if we should | 
|  | // check whether assertions are true. | 
|  | uint64_t | 
|  | eval(const Symbol_table*, const Layout*, bool check_assertions); | 
|  |  | 
|  | // Return the value of an expression which is permitted to refer to | 
|  | // the dot symbol.  DOT_VALUE is the absolute value of the dot | 
|  | // symbol.  DOT_SECTION is the section in which dot is defined; it | 
|  | // should be NULL if the dot symbol has an absolute value (e.g., is | 
|  | // defined in a SECTIONS clause outside of any output section | 
|  | // definition).  This sets *RESULT_SECTION to indicate where the | 
|  | // value is defined.  If the value is absolute *RESULT_SECTION will | 
|  | // be NULL.  Note that the returned value is still an absolute | 
|  | // value; to get a section relative value the caller must subtract | 
|  | // the section address.  If RESULT_ALIGNMENT is not NULL, this sets | 
|  | // *RESULT_ALIGNMENT to the alignment of the value of that alignment | 
|  | // is larger than *RESULT_ALIGNMENT; this will only be non-zero if | 
|  | // this is an ALIGN expression.  If IS_SECTION_DOT_ASSIGMENT is true, | 
|  | // we are evaluating an assignment to dot within an output section, | 
|  | // and an absolute value should be interpreted as an offset within | 
|  | // the section. | 
|  | uint64_t | 
|  | eval_with_dot(const Symbol_table*, const Layout*, bool check_assertions, | 
|  | uint64_t dot_value, Output_section* dot_section, | 
|  | Output_section** result_section, uint64_t* result_alignment, | 
|  | bool is_section_dot_assignment); | 
|  |  | 
|  | // Return the value of an expression which may or may not be | 
|  | // permitted to refer to the dot symbol, depending on | 
|  | // is_dot_available.  If IS_SECTION_DOT_ASSIGMENT is true, | 
|  | // we are evaluating an assignment to dot within an output section, | 
|  | // and an absolute value should be interpreted as an offset within | 
|  | // the section. | 
|  | uint64_t | 
|  | eval_maybe_dot(const Symbol_table*, const Layout*, bool check_assertions, | 
|  | bool is_dot_available, uint64_t dot_value, | 
|  | Output_section* dot_section, | 
|  | Output_section** result_section, uint64_t* result_alignment, | 
|  | elfcpp::STT* type, elfcpp::STV* vis, unsigned char* nonvis, | 
|  | bool is_section_dot_assignment, bool* is_valid_pointer); | 
|  |  | 
|  | // Print the expression to the FILE.  This is for debugging. | 
|  | virtual void | 
|  | print(FILE*) const = 0; | 
|  |  | 
|  | protected: | 
|  | struct Expression_eval_info; | 
|  |  | 
|  | public: | 
|  | // Compute the value of the expression (implemented by child class). | 
|  | // This is public rather than protected because it is called | 
|  | // directly by children of Expression on other Expression objects. | 
|  | virtual uint64_t | 
|  | value(const Expression_eval_info*) = 0; | 
|  |  | 
|  | // Sets all symbols used in expressions as seen in a real ELF object. | 
|  | virtual void | 
|  | set_expr_sym_in_real_elf(Symbol_table*) const | 
|  | { return; } | 
|  |  | 
|  | private: | 
|  | // May not be copied. | 
|  | Expression(const Expression&); | 
|  | Expression& operator=(const Expression&); | 
|  | }; | 
|  |  | 
|  | // Version_script_info stores information parsed from the version | 
|  | // script, either provided by --version-script or as part of a linker | 
|  | // script.  A single Version_script_info object per target is owned by | 
|  | // Script_options. | 
|  |  | 
|  | class Version_script_info | 
|  | { | 
|  | public: | 
|  | // The languages which can be specified in a versionn script. | 
|  | enum Language | 
|  | { | 
|  | LANGUAGE_C,		// No demangling. | 
|  | LANGUAGE_CXX,	// C++ demangling. | 
|  | LANGUAGE_JAVA,	// Java demangling. | 
|  | LANGUAGE_COUNT | 
|  | }; | 
|  |  | 
|  | Version_script_info(); | 
|  |  | 
|  | ~Version_script_info(); | 
|  |  | 
|  | // Clear everything. | 
|  | void | 
|  | clear(); | 
|  |  | 
|  | // Finalize the version control information. | 
|  | void | 
|  | finalize(); | 
|  |  | 
|  | // Return whether the information is finalized. | 
|  | bool | 
|  | is_finalized() const | 
|  | { return this->is_finalized_; } | 
|  |  | 
|  | // Return whether any version were defined in the version script. | 
|  | bool | 
|  | empty() const | 
|  | { return this->version_trees_.empty(); } | 
|  |  | 
|  | // If there is a version associated with SYMBOL, return true, and | 
|  | // set *VERSION to the version, and *IS_GLOBAL to whether the symbol | 
|  | // should be global.  Otherwise, return false. | 
|  | bool | 
|  | get_symbol_version(const char* symbol, std::string* version, | 
|  | bool* is_global) const; | 
|  |  | 
|  | // Return whether this symbol matches the local: section of some | 
|  | // version. | 
|  | bool | 
|  | symbol_is_local(const char* symbol) const | 
|  | { | 
|  | bool is_global; | 
|  | return (this->get_symbol_version(symbol, NULL, &is_global) | 
|  | && !is_global); | 
|  | } | 
|  |  | 
|  | // Return the names of versions defined in the version script. | 
|  | std::vector<std::string> | 
|  | get_versions() const; | 
|  |  | 
|  | // Return the list of dependencies for this version. | 
|  | std::vector<std::string> | 
|  | get_dependencies(const char* version) const; | 
|  |  | 
|  | // The following functions should only be used by the bison helper | 
|  | // functions.  They allocate new structs whose memory belongs to | 
|  | // Version_script_info.  The bison functions copy the information | 
|  | // from the version script into these structs. | 
|  | struct Version_dependency_list* | 
|  | allocate_dependency_list(); | 
|  |  | 
|  | struct Version_expression_list* | 
|  | allocate_expression_list(); | 
|  |  | 
|  | struct Version_tree* | 
|  | allocate_version_tree(); | 
|  |  | 
|  | // Build the lookup tables after all data have been read. | 
|  | void | 
|  | build_lookup_tables(); | 
|  |  | 
|  | // Give an error if there are any unmatched names in the version | 
|  | // script. | 
|  | void | 
|  | check_unmatched_names(const Symbol_table*) const; | 
|  |  | 
|  | // Print contents to the FILE.  This is for debugging. | 
|  | void | 
|  | print(FILE*) const; | 
|  |  | 
|  | private: | 
|  | void | 
|  | print_expression_list(FILE* f, const Version_expression_list*) const; | 
|  |  | 
|  | bool | 
|  | get_symbol_version_helper(const char* symbol, | 
|  | bool check_global, | 
|  | std::string* pversion) const; | 
|  |  | 
|  | // Fast lookup information for a given language. | 
|  |  | 
|  | // We map from exact match strings to Version_tree's.  Historically | 
|  | // version scripts sometimes have the same symbol multiple times, | 
|  | // which is ambiguous.  We warn about that case by storing the | 
|  | // second Version_tree we see. | 
|  | struct Version_tree_match | 
|  | { | 
|  | Version_tree_match(const Version_tree* r, bool ig, | 
|  | const Version_expression* e) | 
|  | : real(r), is_global(ig), expression(e), ambiguous(NULL) | 
|  | { } | 
|  |  | 
|  | // The Version_tree that we return. | 
|  | const Version_tree* real; | 
|  | // True if this is a global match for the REAL member, false if it | 
|  | // is a local match. | 
|  | bool is_global; | 
|  | // Point back to the Version_expression for which we created this | 
|  | // match. | 
|  | const Version_expression* expression; | 
|  | // If not NULL, another Version_tree that defines the symbol. | 
|  | const Version_tree* ambiguous; | 
|  | }; | 
|  |  | 
|  | // Map from an exact match string to a Version_tree. | 
|  |  | 
|  | typedef Unordered_map<std::string, Version_tree_match> Exact; | 
|  |  | 
|  | // Fast lookup information for a glob pattern. | 
|  | struct Glob | 
|  | { | 
|  | Glob() | 
|  | : expression(NULL), version(NULL), is_global(false) | 
|  | { } | 
|  |  | 
|  | Glob(const Version_expression* e, const Version_tree* v, bool ig) | 
|  | : expression(e), version(v), is_global(ig) | 
|  | { } | 
|  |  | 
|  | // A pointer to the version expression holding the pattern to | 
|  | // match and the language to use for demangling the symbol before | 
|  | // doing the match. | 
|  | const Version_expression* expression; | 
|  | // The Version_tree we use if this pattern matches. | 
|  | const Version_tree* version; | 
|  | // True if this is a global symbol. | 
|  | bool is_global; | 
|  | }; | 
|  |  | 
|  | typedef std::vector<Glob> Globs; | 
|  |  | 
|  | bool | 
|  | unquote(std::string*) const; | 
|  |  | 
|  | void | 
|  | add_exact_match(const std::string&, const Version_tree*, bool is_global, | 
|  | const Version_expression*, Exact*); | 
|  |  | 
|  | void | 
|  | build_expression_list_lookup(const Version_expression_list*, | 
|  | const Version_tree*, bool); | 
|  |  | 
|  | const char* | 
|  | get_name_to_match(const char*, int, | 
|  | Lazy_demangler*, Lazy_demangler*) const; | 
|  |  | 
|  | // All the version dependencies we allocate. | 
|  | std::vector<Version_dependency_list*> dependency_lists_; | 
|  | // All the version expressions we allocate. | 
|  | std::vector<Version_expression_list*> expression_lists_; | 
|  | // The list of versions. | 
|  | std::vector<Version_tree*> version_trees_; | 
|  | // Exact matches for global symbols, by language. | 
|  | Exact* exact_[LANGUAGE_COUNT]; | 
|  | // A vector of glob patterns mapping to Version_trees. | 
|  | Globs globs_; | 
|  | // The default version to use, if there is one.  This is from a | 
|  | // pattern of "*". | 
|  | const Version_tree* default_version_; | 
|  | // True if the default version is global. | 
|  | bool default_is_global_; | 
|  | // Whether this has been finalized. | 
|  | bool is_finalized_; | 
|  | }; | 
|  |  | 
|  | // This class manages assignments to symbols.  These can appear in | 
|  | // three different locations in scripts: outside of a SECTIONS clause, | 
|  | // within a SECTIONS clause, and within an output section definition | 
|  | // within a SECTIONS clause.  This can also appear on the command line | 
|  | // via the --defsym command line option. | 
|  |  | 
|  | class Symbol_assignment | 
|  | { | 
|  | public: | 
|  | Symbol_assignment(const char* name, size_t namelen, bool is_defsym, | 
|  | Expression* val, bool provide, bool hidden) | 
|  | : name_(name, namelen), val_(val), is_defsym_(is_defsym), | 
|  | provide_(provide), hidden_(hidden), sym_(NULL) | 
|  | { } | 
|  |  | 
|  | // Add the symbol to the symbol table. | 
|  | void | 
|  | add_to_table(Symbol_table*); | 
|  |  | 
|  | // Finalize the symbol value. | 
|  | void | 
|  | finalize(Symbol_table*, const Layout*); | 
|  |  | 
|  | bool | 
|  | is_defsym() const | 
|  | { return is_defsym_; } | 
|  |  | 
|  | Expression * | 
|  | value() const | 
|  | { return val_; } | 
|  |  | 
|  | // Finalize the symbol value when it can refer to the dot symbol. | 
|  | void | 
|  | finalize_with_dot(Symbol_table*, const Layout*, uint64_t dot_value, | 
|  | Output_section* dot_section); | 
|  |  | 
|  | // Set the symbol value, but only if the value is absolute or relative to | 
|  | // DOT_SECTION.  This is used while processing a SECTIONS clause. | 
|  | // We assume that dot is an absolute value here.  We do not check assertions. | 
|  | void | 
|  | set_if_absolute(Symbol_table*, const Layout*, bool is_dot_available, | 
|  | uint64_t dot_value, Output_section* dot_section); | 
|  |  | 
|  | const std::string& | 
|  | name() const | 
|  | { return this->name_; } | 
|  |  | 
|  | // Print the assignment to the FILE.  This is for debugging. | 
|  | void | 
|  | print(FILE*) const; | 
|  |  | 
|  | private: | 
|  | // Shared by finalize and finalize_with_dot. | 
|  | void | 
|  | finalize_maybe_dot(Symbol_table*, const Layout*, bool is_dot_available, | 
|  | uint64_t dot_value, Output_section* dot_section); | 
|  |  | 
|  | // Sized version of finalize. | 
|  | template<int size> | 
|  | void | 
|  | sized_finalize(Symbol_table*, const Layout*, bool is_dot_available, | 
|  | uint64_t dot_value, Output_section*); | 
|  |  | 
|  | // Symbol name. | 
|  | std::string name_; | 
|  | // Expression to assign to symbol. | 
|  | Expression* val_; | 
|  | // True if this symbol is defined by a --defsym, false if it is | 
|  | // defined in a linker script. | 
|  | bool is_defsym_; | 
|  | // Whether the assignment should be provided (only set if there is | 
|  | // an undefined reference to the symbol. | 
|  | bool provide_; | 
|  | // Whether the assignment should be hidden. | 
|  | bool hidden_; | 
|  | // The entry in the symbol table. | 
|  | Symbol* sym_; | 
|  | }; | 
|  |  | 
|  | // This class manages assertions in linker scripts.  These can appear | 
|  | // in all the places where a Symbol_assignment can appear. | 
|  |  | 
|  | class Script_assertion | 
|  | { | 
|  | public: | 
|  | Script_assertion(Expression* check, const char* message, | 
|  | size_t messagelen) | 
|  | : check_(check), message_(message, messagelen) | 
|  | { } | 
|  |  | 
|  | // Check the assertion. | 
|  | void | 
|  | check(const Symbol_table*, const Layout*); | 
|  |  | 
|  | // Print the assertion to the FILE.  This is for debugging. | 
|  | void | 
|  | print(FILE*) const; | 
|  |  | 
|  | private: | 
|  | // The expression to check. | 
|  | Expression* check_; | 
|  | // The message to issue if the expression fails. | 
|  | std::string message_; | 
|  | }; | 
|  |  | 
|  | // We can read a linker script in two different contexts: when | 
|  | // initially parsing the command line, and when we find an input file | 
|  | // which is actually a linker script.  Also some of the data which can | 
|  | // be set by a linker script can also be set via command line options | 
|  | // like -e and --defsym.  This means that we have a type of data which | 
|  | // can be set both during command line option parsing and while | 
|  | // reading input files.  We store that data in an instance of this | 
|  | // object.  We will keep pointers to that instance in both the | 
|  | // Command_line and Layout objects. | 
|  |  | 
|  | class Script_options | 
|  | { | 
|  | public: | 
|  | Script_options(); | 
|  |  | 
|  | // Add a symbol to be defined. | 
|  | void | 
|  | add_symbol_assignment(const char* name, size_t length, bool is_defsym, | 
|  | Expression* value, bool provide, bool hidden); | 
|  |  | 
|  | // Look for an assigned symbol. | 
|  | bool | 
|  | is_pending_assignment(const char* name); | 
|  |  | 
|  | // Add a reference to a symbol. | 
|  | void | 
|  | add_symbol_reference(const char* name, size_t length); | 
|  |  | 
|  | // Add an assertion. | 
|  | void | 
|  | add_assertion(Expression* check, const char* message, size_t messagelen); | 
|  |  | 
|  | // Define a symbol from the command line. | 
|  | bool | 
|  | define_symbol(const char* definition); | 
|  |  | 
|  | // Populates the set with symbol names used in LHS of defsym. | 
|  | void | 
|  | find_defsym_defs(Unordered_set<std::string>&); | 
|  |  | 
|  | // Set symbols used in defsym expressions as seen in a real ELF object. | 
|  | void set_defsym_uses_in_real_elf(Symbol_table*) const; | 
|  |  | 
|  | // Create sections required by any linker scripts. | 
|  | void | 
|  | create_script_sections(Layout*); | 
|  |  | 
|  | // Add all symbol definitions to the symbol table. | 
|  | void | 
|  | add_symbols_to_table(Symbol_table*); | 
|  |  | 
|  | // Used to iterate over symbols which are referenced in expressions | 
|  | // but not defined. | 
|  | typedef Unordered_set<std::string>::const_iterator referenced_const_iterator; | 
|  |  | 
|  | referenced_const_iterator | 
|  | referenced_begin() const | 
|  | { return this->symbol_references_.begin(); } | 
|  |  | 
|  | referenced_const_iterator | 
|  | referenced_end() const | 
|  | { return this->symbol_references_.end(); } | 
|  |  | 
|  | // Return whether a symbol is referenced but not defined. | 
|  | bool | 
|  | is_referenced(const std::string& name) const | 
|  | { | 
|  | return (this->symbol_references_.find(name) | 
|  | != this->symbol_references_.end()); | 
|  | } | 
|  |  | 
|  | // Return whether there are any symbols which were referenced but | 
|  | // not defined. | 
|  | bool | 
|  | any_unreferenced() const | 
|  | { return !this->symbol_references_.empty(); } | 
|  |  | 
|  | // Finalize the symbol values.  Also check assertions. | 
|  | void | 
|  | finalize_symbols(Symbol_table*, const Layout*); | 
|  |  | 
|  | // Version information parsed from a version script.  Everything | 
|  | // else has a pointer to this object. | 
|  | Version_script_info* | 
|  | version_script_info() | 
|  | { return &this->version_script_info_; } | 
|  |  | 
|  | const Version_script_info* | 
|  | version_script_info() const | 
|  | { return &this->version_script_info_; } | 
|  |  | 
|  | // A SECTIONS clause parsed from a linker script.  Everything else | 
|  | // has a pointer to this object. | 
|  | Script_sections* | 
|  | script_sections() | 
|  | { return &this->script_sections_; } | 
|  |  | 
|  | const Script_sections* | 
|  | script_sections() const | 
|  | { return &this->script_sections_; } | 
|  |  | 
|  | // Whether we saw a SECTIONS clause. | 
|  | bool | 
|  | saw_sections_clause() const | 
|  | { return this->script_sections_.saw_sections_clause(); } | 
|  |  | 
|  | // Whether we saw a PHDRS clause. | 
|  | bool | 
|  | saw_phdrs_clause() const | 
|  | { return this->script_sections_.saw_phdrs_clause(); } | 
|  |  | 
|  | // Set section addresses using a SECTIONS clause.  Return the | 
|  | // segment which should hold the file header and segment headers; | 
|  | // this may return NULL, in which case the headers are not in a | 
|  | // loadable segment. | 
|  | Output_segment* | 
|  | set_section_addresses(Symbol_table*, Layout*); | 
|  |  | 
|  | // Print the script to the FILE.  This is for debugging. | 
|  | void | 
|  | print(FILE*) const; | 
|  |  | 
|  | private: | 
|  | // We keep a list of symbol assignments which occur outside of a | 
|  | // SECTIONS clause. | 
|  | typedef std::vector<Symbol_assignment*> Symbol_assignments; | 
|  |  | 
|  | // We keep a list of all assertions which occur outside of a | 
|  | // SECTIONS clause. | 
|  | typedef std::vector<Script_assertion*> Assertions; | 
|  |  | 
|  | // The entry address.  This will be empty if not set. | 
|  | std::string entry_; | 
|  | // Symbols to set. | 
|  | Symbol_assignments symbol_assignments_; | 
|  | // Symbols defined in an expression, for faster lookup. | 
|  | Unordered_set<std::string> symbol_definitions_; | 
|  | // Symbols referenced in an expression. | 
|  | Unordered_set<std::string> symbol_references_; | 
|  | // Assertions to check. | 
|  | Assertions assertions_; | 
|  | // Version information parsed from a version script. | 
|  | Version_script_info version_script_info_; | 
|  | // Information from any SECTIONS clauses. | 
|  | Script_sections script_sections_; | 
|  | }; | 
|  |  | 
|  | // FILE was found as an argument on the command line, but was not | 
|  | // recognized as an ELF file.  Try to read it as a script.  Return | 
|  | // true if the file was handled.  This has to handle /usr/lib/libc.so | 
|  | // on a GNU/Linux system.  *USED_NEXT_BLOCKER is set to indicate | 
|  | // whether the function took over NEXT_BLOCKER. | 
|  |  | 
|  | bool | 
|  | read_input_script(Workqueue*, Symbol_table*, Layout*, Dirsearch*, int, | 
|  | Input_objects*, Mapfile*, Input_group*, | 
|  | const Input_argument*, Input_file*, | 
|  | Task_token* next_blocker, bool* used_next_blocker); | 
|  |  | 
|  | // FILE was found as an argument to --script (-T). | 
|  | // Read it as a script, and execute its contents immediately. | 
|  |  | 
|  | bool | 
|  | read_commandline_script(const char* filename, Command_line* cmdline); | 
|  |  | 
|  | // FILE was found as an argument to --version-script.  Read it as a | 
|  | // version script, and store its contents in | 
|  | // cmdline->script_options()->version_script_info(). | 
|  |  | 
|  | bool | 
|  | read_version_script(const char* filename, Command_line* cmdline); | 
|  |  | 
|  | // FILENAME was found as an argument to --dynamic-list.  Read it as a | 
|  | // version script (actually, a versym_node from a version script), and | 
|  | // store its contents in DYNAMIC_LIST. | 
|  |  | 
|  | bool | 
|  | read_dynamic_list(const char* filename, Command_line* cmdline, | 
|  | Script_options* dynamic_list); | 
|  |  | 
|  | } // End namespace gold. | 
|  |  | 
|  | #endif // !defined(GOLD_SCRIPT_H) |