// script.h -- handle linker scripts for gold   -*- C++ -*-

// Copyright 2006, 2007, 2008, 2009, 2010 Free Software Foundation, Inc.
// Written by Ian Lance Taylor <iant@google.com>.

// This file is part of gold.

// This program is free software; you can redistribute it and/or modify
// it under the terms of the GNU General Public License as published by
// the Free Software Foundation; either version 3 of the License, or
// (at your option) any later version.

// This program is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
// GNU General Public License for more details.

// You should have received a copy of the GNU General Public License
// along with this program; if not, write to the Free Software
// Foundation, Inc., 51 Franklin Street - Fifth Floor, Boston,
// MA 02110-1301, USA.

// We implement a subset of the original GNU ld linker script language
// for compatibility.  The goal is not to implement the entire
// language.  It is merely to implement enough to handle common uses.
// In particular we need to handle /usr/lib/libc.so on a typical
// GNU/Linux system, and we want to handle linker scripts used by the
// Linux kernel build.
29 30 #ifndef GOLD_SCRIPT_H 31 #define GOLD_SCRIPT_H 32 33 #include <cstdio> 34 #include <string> 35 #include <vector> 36 37 #include "script-sections.h" 38 39 namespace gold 40 { 41 42 class General_options; 43 class Command_line; 44 class Symbol_table; 45 class Layout; 46 class Mapfile; 47 class Input_argument; 48 class Input_arguments; 49 class Input_objects; 50 class Input_group; 51 class Input_file; 52 class Output_segment; 53 class Task_token; 54 class Workqueue; 55 struct Version_dependency_list; 56 struct Version_expression_list; 57 struct Version_tree; 58 struct Version_expression; 59 class Lazy_demangler; 60 61 // This class represents an expression in a linker script. 62 63 class Expression 64 { 65 protected: 66 // These should only be created by child classes. 67 Expression() 68 { } 69 70 public: 71 virtual ~Expression() 72 { } 73 74 // Return the value of the expression which is not permitted to 75 // refer to the dot symbol. CHECK_ASSERTIONS is true if we should 76 // check whether assertions are true. 77 uint64_t 78 eval(const Symbol_table*, const Layout*, bool check_assertions); 79 80 // Return the value of an expression which is permitted to refer to 81 // the dot symbol. DOT_VALUE is the absolute value of the dot 82 // symbol. DOT_SECTION is the section in which dot is defined; it 83 // should be NULL if the dot symbol has an absolute value (e.g., is 84 // defined in a SECTIONS clause outside of any output section 85 // definition). This sets *RESULT_SECTION to indicate where the 86 // value is defined. If the value is absolute *RESULT_SECTION will 87 // be NULL. Note that the returned value is still an absolute 88 // value; to get a section relative value the caller must subtract 89 // the section address. If RESULT_ALIGNMENT is not NULL, this sets 90 // *RESULT_ALIGNMENT to the alignment of the value of that alignment 91 // is larger than *RESULT_ALIGNMENT; this will only be non-zero if 92 // this is an ALIGN expression. 
93 uint64_t 94 eval_with_dot(const Symbol_table*, const Layout*, bool check_assertions, 95 uint64_t dot_value, Output_section* dot_section, 96 Output_section** result_section, uint64_t* result_alignment); 97 98 // Return the value of an expression which may or may not be 99 // permitted to refer to the dot symbol, depending on 100 // is_dot_available. 101 uint64_t 102 eval_maybe_dot(const Symbol_table*, const Layout*, bool check_assertions, 103 bool is_dot_available, uint64_t dot_value, 104 Output_section* dot_section, 105 Output_section** result_section, uint64_t* result_alignment); 106 107 // Print the expression to the FILE. This is for debugging. 108 virtual void 109 print(FILE*) const = 0; 110 111 protected: 112 struct Expression_eval_info; 113 114 public: 115 // Compute the value of the expression (implemented by child class). 116 // This is public rather than protected because it is called 117 // directly by children of Expression on other Expression objects. 118 virtual uint64_t 119 value(const Expression_eval_info*) = 0; 120 121 private: 122 // May not be copied. 123 Expression(const Expression&); 124 Expression& operator=(const Expression&); 125 }; 126 127 128 // Version_script_info stores information parsed from the version 129 // script, either provided by --version-script or as part of a linker 130 // script. A single Version_script_info object per target is owned by 131 // Script_options. 132 133 class Version_script_info 134 { 135 public: 136 // The languages which can be specified in a versionn script. 137 enum Language 138 { 139 LANGUAGE_C, // No demangling. 140 LANGUAGE_CXX, // C++ demangling. 141 LANGUAGE_JAVA, // Java demangling. 142 LANGUAGE_COUNT 143 }; 144 145 Version_script_info(); 146 147 ~Version_script_info(); 148 149 // Clear everything. 150 void 151 clear(); 152 153 // Finalize the version control information. 154 void 155 finalize(); 156 157 // Return whether the information is finalized. 
158 bool 159 is_finalized() const 160 { return this->is_finalized_; } 161 162 // Return whether any version were defined in the version script. 163 bool 164 empty() const 165 { return this->version_trees_.empty(); } 166 167 // If there is a version associated with SYMBOL, return true, and 168 // set *VERSION to the version, and *IS_GLOBAL to whether the symbol 169 // should be global. Otherwise, return false. 170 bool 171 get_symbol_version(const char* symbol, std::string* version, 172 bool* is_global) const; 173 174 // Return whether this symbol matches the local: section of some 175 // version. 176 bool 177 symbol_is_local(const char* symbol) const 178 { 179 bool is_global; 180 return (this->get_symbol_version(symbol, NULL, &is_global) 181 && !is_global); 182 } 183 184 // Return the names of versions defined in the version script. 185 std::vector<std::string> 186 get_versions() const; 187 188 // Return the list of dependencies for this version. 189 std::vector<std::string> 190 get_dependencies(const char* version) const; 191 192 // The following functions should only be used by the bison helper 193 // functions. They allocate new structs whose memory belongs to 194 // Version_script_info. The bison functions copy the information 195 // from the version script into these structs. 196 struct Version_dependency_list* 197 allocate_dependency_list(); 198 199 struct Version_expression_list* 200 allocate_expression_list(); 201 202 struct Version_tree* 203 allocate_version_tree(); 204 205 // Build the lookup tables after all data have been read. 206 void 207 build_lookup_tables(); 208 209 // Give an error if there are any unmatched names in the version 210 // script. 211 void 212 check_unmatched_names(const Symbol_table*) const; 213 214 // Print contents to the FILE. This is for debugging. 
215 void 216 print(FILE*) const; 217 218 private: 219 void 220 print_expression_list(FILE* f, const Version_expression_list*) const; 221 222 bool 223 get_symbol_version_helper(const char* symbol, 224 bool check_global, 225 std::string* pversion) const; 226 227 // Fast lookup information for a given language. 228 229 // We map from exact match strings to Version_tree's. Historically 230 // version scripts sometimes have the same symbol multiple times, 231 // which is ambiguous. We warn about that case by storing the 232 // second Version_tree we see. 233 struct Version_tree_match 234 { 235 Version_tree_match(const Version_tree* r, bool ig, 236 const Version_expression* e) 237 : real(r), is_global(ig), expression(e), ambiguous(NULL) 238 { } 239 240 // The Version_tree that we return. 241 const Version_tree* real; 242 // True if this is a global match for the REAL member, false if it 243 // is a local match. 244 bool is_global; 245 // Point back to the Version_expression for which we created this 246 // match. 247 const Version_expression* expression; 248 // If not NULL, another Version_tree that defines the symbol. 249 const Version_tree* ambiguous; 250 }; 251 252 // Map from an exact match string to a Version_tree. 253 254 typedef Unordered_map<std::string, Version_tree_match> Exact; 255 256 // Fast lookup information for a glob pattern. 257 struct Glob 258 { 259 Glob() 260 : expression(NULL), version(NULL), is_global(false) 261 { } 262 263 Glob(const Version_expression* e, const Version_tree* v, bool ig) 264 : expression(e), version(v), is_global(ig) 265 { } 266 267 // A pointer to the version expression holding the pattern to 268 // match and the language to use for demangling the symbol before 269 // doing the match. 270 const Version_expression* expression; 271 // The Version_tree we use if this pattern matches. 272 const Version_tree* version; 273 // True if this is a global symbol. 
274 bool is_global; 275 }; 276 277 typedef std::vector<Glob> Globs; 278 279 bool 280 unquote(std::string*) const; 281 282 void 283 add_exact_match(const std::string&, const Version_tree*, bool is_global, 284 const Version_expression*, Exact*); 285 286 void 287 build_expression_list_lookup(const Version_expression_list*, 288 const Version_tree*, bool); 289 290 const char* 291 get_name_to_match(const char*, int, 292 Lazy_demangler*, Lazy_demangler*) const; 293 294 // All the version dependencies we allocate. 295 std::vector<Version_dependency_list*> dependency_lists_; 296 // All the version expressions we allocate. 297 std::vector<Version_expression_list*> expression_lists_; 298 // The list of versions. 299 std::vector<Version_tree*> version_trees_; 300 // Exact matches for global symbols, by language. 301 Exact* exact_[LANGUAGE_COUNT]; 302 // A vector of glob patterns mapping to Version_trees. 303 Globs globs_; 304 // The default version to use, if there is one. This is from a 305 // pattern of "*". 306 const Version_tree* default_version_; 307 // True if the default version is global. 308 bool default_is_global_; 309 // Whether this has been finalized. 310 bool is_finalized_; 311 }; 312 313 // This class manages assignments to symbols. These can appear in 314 // three different locations in scripts: outside of a SECTIONS clause, 315 // within a SECTIONS clause, and within an output section definition 316 // within a SECTIONS clause. This can also appear on the command line 317 // via the --defsym command line option. 318 319 class Symbol_assignment 320 { 321 public: 322 Symbol_assignment(const char* name, size_t namelen, bool is_defsym, 323 Expression* val, bool provide, bool hidden) 324 : name_(name, namelen), val_(val), is_defsym_(is_defsym), 325 provide_(provide), hidden_(hidden), sym_(NULL) 326 { } 327 328 // Add the symbol to the symbol table. 329 void 330 add_to_table(Symbol_table*); 331 332 // Finalize the symbol value. 
333 void 334 finalize(Symbol_table*, const Layout*); 335 336 // Finalize the symbol value when it can refer to the dot symbol. 337 void 338 finalize_with_dot(Symbol_table*, const Layout*, uint64_t dot_value, 339 Output_section* dot_section); 340 341 // Set the symbol value, but only if the value is absolute. This is 342 // used while processing a SECTIONS clause. We assume that dot is 343 // an absolute value here. We do not check assertions. 344 void 345 set_if_absolute(Symbol_table*, const Layout*, bool is_dot_available, 346 uint64_t dot_value); 347 348 const std::string& 349 name() const 350 { return this->name_; } 351 352 // Print the assignment to the FILE. This is for debugging. 353 void 354 print(FILE*) const; 355 356 private: 357 // Shared by finalize and finalize_with_dot. 358 void 359 finalize_maybe_dot(Symbol_table*, const Layout*, bool is_dot_available, 360 uint64_t dot_value, Output_section* dot_section); 361 362 // Sized version of finalize. 363 template<int size> 364 void 365 sized_finalize(Symbol_table*, const Layout*, bool is_dot_available, 366 uint64_t dot_value, Output_section*); 367 368 // Symbol name. 369 std::string name_; 370 // Expression to assign to symbol. 371 Expression* val_; 372 // True if this symbol is defined by a --defsym, false if it is 373 // defined in a linker script. 374 bool is_defsym_; 375 // Whether the assignment should be provided (only set if there is 376 // an undefined reference to the symbol. 377 bool provide_; 378 // Whether the assignment should be hidden. 379 bool hidden_; 380 // The entry in the symbol table. 381 Symbol* sym_; 382 }; 383 384 // This class manages assertions in linker scripts. These can appear 385 // in all the places where a Symbol_assignment can appear. 386 387 class Script_assertion 388 { 389 public: 390 Script_assertion(Expression* check, const char* message, 391 size_t messagelen) 392 : check_(check), message_(message, messagelen) 393 { } 394 395 // Check the assertion. 
396 void 397 check(const Symbol_table*, const Layout*); 398 399 // Print the assertion to the FILE. This is for debugging. 400 void 401 print(FILE*) const; 402 403 private: 404 // The expression to check. 405 Expression* check_; 406 // The message to issue if the expression fails. 407 std::string message_; 408 }; 409 410 // We can read a linker script in two different contexts: when 411 // initially parsing the command line, and when we find an input file 412 // which is actually a linker script. Also some of the data which can 413 // be set by a linker script can also be set via command line options 414 // like -e and --defsym. This means that we have a type of data which 415 // can be set both during command line option parsing and while 416 // reading input files. We store that data in an instance of this 417 // object. We will keep pointers to that instance in both the 418 // Command_line and Layout objects. 419 420 class Script_options 421 { 422 public: 423 Script_options(); 424 425 // Add a symbol to be defined. 426 void 427 add_symbol_assignment(const char* name, size_t length, bool is_defsym, 428 Expression* value, bool provide, bool hidden); 429 430 // Look for an assigned symbol. 431 bool 432 is_pending_assignment(const char* name); 433 434 // Add a reference to a symbol. 435 void 436 add_symbol_reference(const char* name, size_t length); 437 438 // Add an assertion. 439 void 440 add_assertion(Expression* check, const char* message, size_t messagelen); 441 442 // Define a symbol from the command line. 443 bool 444 define_symbol(const char* definition); 445 446 // Create sections required by any linker scripts. 447 void 448 create_script_sections(Layout*); 449 450 // Add all symbol definitions to the symbol table. 451 void 452 add_symbols_to_table(Symbol_table*); 453 454 // Used to iterate over symbols which are referenced in expressions 455 // but not defined. 
456 typedef Unordered_set<std::string>::const_iterator referenced_const_iterator; 457 458 referenced_const_iterator 459 referenced_begin() const 460 { return this->symbol_references_.begin(); } 461 462 referenced_const_iterator 463 referenced_end() const 464 { return this->symbol_references_.end(); } 465 466 // Return whether a symbol is referenced but not defined. 467 bool 468 is_referenced(const std::string& name) const 469 { 470 return (this->symbol_references_.find(name) 471 != this->symbol_references_.end()); 472 } 473 474 // Return whether there are any symbols which were referenced but 475 // not defined. 476 bool 477 any_unreferenced() const 478 { return !this->symbol_references_.empty(); } 479 480 // Finalize the symbol values. Also check assertions. 481 void 482 finalize_symbols(Symbol_table*, const Layout*); 483 484 // Version information parsed from a version script. Everything 485 // else has a pointer to this object. 486 Version_script_info* 487 version_script_info() 488 { return &this->version_script_info_; } 489 490 const Version_script_info* 491 version_script_info() const 492 { return &this->version_script_info_; } 493 494 // A SECTIONS clause parsed from a linker script. Everything else 495 // has a pointer to this object. 496 Script_sections* 497 script_sections() 498 { return &this->script_sections_; } 499 500 const Script_sections* 501 script_sections() const 502 { return &this->script_sections_; } 503 504 // Whether we saw a SECTIONS clause. 505 bool 506 saw_sections_clause() const 507 { return this->script_sections_.saw_sections_clause(); } 508 509 // Whether we saw a PHDRS clause. 510 bool 511 saw_phdrs_clause() const 512 { return this->script_sections_.saw_phdrs_clause(); } 513 514 // Set section addresses using a SECTIONS clause. Return the 515 // segment which should hold the file header and segment headers; 516 // this may return NULL, in which case the headers are not in a 517 // loadable segment. 
518 Output_segment* 519 set_section_addresses(Symbol_table*, Layout*); 520 521 // Print the script to the FILE. This is for debugging. 522 void 523 print(FILE*) const; 524 525 private: 526 // We keep a list of symbol assignments which occur outside of a 527 // SECTIONS clause. 528 typedef std::vector<Symbol_assignment*> Symbol_assignments; 529 530 // We keep a list of all assertions whcih occur outside of a 531 // SECTIONS clause. 532 typedef std::vector<Script_assertion*> Assertions; 533 534 // The entry address. This will be empty if not set. 535 std::string entry_; 536 // Symbols to set. 537 Symbol_assignments symbol_assignments_; 538 // Symbols defined in an expression, for faster lookup. 539 Unordered_set<std::string> symbol_definitions_; 540 // Symbols referenced in an expression. 541 Unordered_set<std::string> symbol_references_; 542 // Assertions to check. 543 Assertions assertions_; 544 // Version information parsed from a version script. 545 Version_script_info version_script_info_; 546 // Information from any SECTIONS clauses. 547 Script_sections script_sections_; 548 }; 549 550 // Information about a script input that will persist during the whole linker 551 // run. Needed only during an incremental build to retrieve the input files 552 // added by this script. 553 554 class Script_info 555 { 556 public: 557 Script_info(Input_arguments* inputs) 558 : inputs_(inputs) 559 { } 560 561 // Returns the input files included because of this script. 562 Input_arguments* 563 inputs() 564 { return this->inputs_; } 565 566 private: 567 Input_arguments* inputs_; 568 }; 569 570 // FILE was found as an argument on the command line, but was not 571 // recognized as an ELF file. Try to read it as a script. Return 572 // true if the file was handled. This has to handle /usr/lib/libc.so 573 // on a GNU/Linux system. *USED_NEXT_BLOCKER is set to indicate 574 // whether the function took over NEXT_BLOCKER. 
575 576 bool 577 read_input_script(Workqueue*, Symbol_table*, Layout*, Dirsearch*, int, 578 Input_objects*, Mapfile*, Input_group*, 579 const Input_argument*, Input_file*, 580 Task_token* next_blocker, bool* used_next_blocker); 581 582 // FILE was found as an argument to --script (-T). 583 // Read it as a script, and execute its contents immediately. 584 585 bool 586 read_commandline_script(const char* filename, Command_line* cmdline); 587 588 // FILE was found as an argument to --version-script. Read it as a 589 // version script, and store its contents in 590 // cmdline->script_options()->version_script_info(). 591 592 bool 593 read_version_script(const char* filename, Command_line* cmdline); 594 595 // FILENAME was found as an argument to --dynamic-list. Read it as a 596 // version script (actually, a versym_node from a version script), and 597 // store its contents in DYNAMIC_LIST. 598 599 bool 600 read_dynamic_list(const char* filename, Command_line* cmdline, 601 Script_options* dynamic_list); 602 603 } // End namespace gold. 604 605 #endif // !defined(GOLD_SCRIPT_H) 606