1 // fileread.h -- read files for gold -*- C++ -*- 2 3 // Copyright 2006, 2007, 2008, 2009, 2010, 2011 Free Software Foundation, Inc. 4 // Written by Ian Lance Taylor <iant@google.com>. 5 6 // This file is part of gold. 7 8 // This program is free software; you can redistribute it and/or modify 9 // it under the terms of the GNU General Public License as published by 10 // the Free Software Foundation; either version 3 of the License, or 11 // (at your option) any later version. 12 13 // This program is distributed in the hope that it will be useful, 14 // but WITHOUT ANY WARRANTY; without even the implied warranty of 15 // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 16 // GNU General Public License for more details. 17 18 // You should have received a copy of the GNU General Public License 19 // along with this program; if not, write to the Free Software 20 // Foundation, Inc., 51 Franklin Street - Fifth Floor, Boston, 21 // MA 02110-1301, USA. 22 23 // Classes used to read data from binary input files. 24 25 #ifndef GOLD_FILEREAD_H 26 #define GOLD_FILEREAD_H 27 28 #include <list> 29 #include <map> 30 #include <string> 31 #include <vector> 32 33 #include "token.h" 34 35 namespace gold 36 { 37 38 // Since not all system supports stat.st_mtim and struct timespec, 39 // we define our own structure and fill the nanoseconds if we can. 40 41 struct Timespec 42 { 43 Timespec() 44 : seconds(0), nanoseconds(0) 45 { } 46 47 Timespec(time_t a_seconds, int a_nanoseconds) 48 : seconds(a_seconds), nanoseconds(a_nanoseconds) 49 { } 50 51 time_t seconds; 52 int nanoseconds; 53 }; 54 55 class Position_dependent_options; 56 class Input_file_argument; 57 class Dirsearch; 58 class File_view; 59 60 // File_read manages a file descriptor and mappings for a file we are 61 // reading. 62 63 class File_read 64 { 65 public: 66 File_read() 67 : name_(), descriptor_(-1), is_descriptor_opened_(false), object_count_(0), 68 size_(0), token_(false), views_(), saved_views_(), mapped_bytes_(0), 69 released_(true), whole_file_view_(NULL) 70 { } 71 72 ~File_read(); 73 74 // Open a file. 75 bool 76 open(const Task*, const std::string& name); 77 78 // Pretend to open the file, but provide the file contents. No 79 // actual file system activity will occur. This is used for 80 // testing. 81 bool 82 open(const Task*, const std::string& name, const unsigned char* contents, 83 off_t size); 84 85 // Return the file name. 86 const std::string& 87 filename() const 88 { return this->name_; } 89 90 // Add an object associated with a file. 91 void 92 add_object() 93 { ++this->object_count_; } 94 95 // Remove an object associated with a file. 96 void 97 remove_object() 98 { --this->object_count_; } 99 100 // Lock the file for exclusive access within a particular Task::run 101 // execution. This routine may only be called when the workqueue 102 // lock is held. 103 void 104 lock(const Task* t); 105 106 // Unlock the file. 107 void 108 unlock(const Task* t); 109 110 // Test whether the object is locked. 111 bool 112 is_locked() const; 113 114 // Return the token, so that the task can be queued. 115 Task_token* 116 token() 117 { return &this->token_; } 118 119 // Release the file. This indicates that we aren't going to do 120 // anything further with it until it is unlocked. This is used 121 // because a Task which locks the file never calls either lock or 122 // unlock; it just locks the token. The basic rule is that a Task 123 // which locks a file via the Task::locks interface must explicitly 124 // call release() when it is done. This is not necessary for code 125 // which calls unlock() on the file. 126 void 127 release(); 128 129 // Return the size of the file. 130 off_t 131 filesize() const 132 { return this->size_; } 133 134 // Return a view into the file starting at file offset START for 135 // SIZE bytes. OFFSET is the offset into the input file for the 136 // file we are reading; this is zero for a normal object file, 137 // non-zero for an object file in an archive. ALIGNED is true if 138 // the data must be naturally aligned; this only matters when OFFSET 139 // is not zero. The pointer will remain valid until the File_read 140 // is unlocked. It is an error if we can not read enough data from 141 // the file. The CACHE parameter is a hint as to whether it will be 142 // useful to cache this data for later accesses--i.e., later calls 143 // to get_view, read, or get_lasting_view which retrieve the same 144 // data. 145 const unsigned char* 146 get_view(off_t offset, off_t start, section_size_type size, bool aligned, 147 bool cache); 148 149 // Read data from the file into the buffer P starting at file offset 150 // START for SIZE bytes. 151 void 152 read(off_t start, section_size_type size, void* p); 153 154 // Return a lasting view into the file starting at file offset START 155 // for SIZE bytes. This is allocated with new, and the caller is 156 // responsible for deleting it when done. The data associated with 157 // this view will remain valid until the view is deleted. It is an 158 // error if we can not read enough data from the file. The OFFSET, 159 // ALIGNED and CACHE parameters are as in get_view. 160 File_view* 161 get_lasting_view(off_t offset, off_t start, section_size_type size, 162 bool aligned, bool cache); 163 164 // Mark all views as no longer cached. 165 void 166 clear_view_cache_marks(); 167 168 // Discard all uncached views. This is normally done by release(), 169 // but not for objects in archives. FIXME: This is a complicated 170 // interface, and it would be nice to have something more automatic. 171 void 172 clear_uncached_views() 173 { this->clear_views(CLEAR_VIEWS_ARCHIVE); } 174 175 // A struct used to do a multiple read. 176 struct Read_multiple_entry 177 { 178 // The file offset of the data to read. 179 off_t file_offset; 180 // The amount of data to read. 181 section_size_type size; 182 // The buffer where the data should be placed. 183 unsigned char* buffer; 184 185 Read_multiple_entry(off_t o, section_size_type s, unsigned char* b) 186 : file_offset(o), size(s), buffer(b) 187 { } 188 }; 189 190 typedef std::vector<Read_multiple_entry> Read_multiple; 191 192 // Read a bunch of data from the file into various different 193 // locations. The vector must be sorted by ascending file_offset. 194 // BASE is a base offset to be added to all the offsets in the 195 // vector. 196 void 197 read_multiple(off_t base, const Read_multiple&); 198 199 // Dump statistical information to stderr. 200 static void 201 print_stats(); 202 203 // Return the open file descriptor (for plugins). 204 int 205 descriptor() 206 { 207 this->reopen_descriptor(); 208 return this->descriptor_; 209 } 210 211 // Return the file last modification time. Calls gold_fatal if the stat 212 // system call failed. 213 Timespec 214 get_mtime(); 215 216 private: 217 // Control for what views to clear. 218 enum Clear_views_mode 219 { 220 // Clear uncached views not used by an archive. 221 CLEAR_VIEWS_NORMAL, 222 // Clear all uncached views (including in an archive). 223 CLEAR_VIEWS_ARCHIVE, 224 // Clear all views (i.e., we're destroying the file). 225 CLEAR_VIEWS_ALL 226 }; 227 228 // This class may not be copied. 229 File_read(const File_read&); 230 File_read& operator=(const File_read&); 231 232 // Total bytes mapped into memory during the link if --stats. 233 static unsigned long long total_mapped_bytes; 234 235 // Current number of bytes mapped into memory during the link if 236 // --stats. 237 static unsigned long long current_mapped_bytes; 238 239 // High water mark of bytes mapped into memory during the link if 240 // --stats. 241 static unsigned long long maximum_mapped_bytes; 242 243 // A view into the file. 244 class View 245 { 246 public: 247 // Specifies how to dispose the data on destruction of the view. 248 enum Data_ownership 249 { 250 // Data owned by File object - nothing done in destructor. 251 DATA_NOT_OWNED, 252 // Data alocated with new[] and owned by this object - should 253 // use delete[]. 254 DATA_ALLOCATED_ARRAY, 255 // Data mmapped and owned by this object - should munmap. 256 DATA_MMAPPED 257 }; 258 259 View(off_t start, section_size_type size, const unsigned char* data, 260 unsigned int byteshift, bool cache, Data_ownership data_ownership) 261 : start_(start), size_(size), data_(data), lock_count_(0), 262 byteshift_(byteshift), cache_(cache), data_ownership_(data_ownership), 263 accessed_(true) 264 { } 265 266 ~View(); 267 268 off_t 269 start() const 270 { return this->start_; } 271 272 section_size_type 273 size() const 274 { return this->size_; } 275 276 const unsigned char* 277 data() const 278 { return this->data_; } 279 280 void 281 lock(); 282 283 void 284 unlock(); 285 286 bool 287 is_locked(); 288 289 unsigned int 290 byteshift() const 291 { return this->byteshift_; } 292 293 void 294 set_cache() 295 { this->cache_ = true; } 296 297 void 298 clear_cache() 299 { this->cache_ = false; } 300 301 bool 302 should_cache() const 303 { return this->cache_; } 304 305 void 306 set_accessed() 307 { this->accessed_ = true; } 308 309 void 310 clear_accessed() 311 { this->accessed_= false; } 312 313 bool 314 accessed() const 315 { return this->accessed_; } 316 317 // Returns TRUE if this view contains permanent data -- e.g., data that 318 // was supplied by the owner of the File object. 319 bool 320 is_permanent_view() const 321 { return this->data_ownership_ == DATA_NOT_OWNED; } 322 323 private: 324 View(const View&); 325 View& operator=(const View&); 326 327 // The file offset of the start of the view. 328 off_t start_; 329 // The size of the view. 330 section_size_type size_; 331 // A pointer to the actual bytes. 332 const unsigned char* data_; 333 // The number of locks on this view. 334 int lock_count_; 335 // The number of bytes that the view is shifted relative to the 336 // underlying file. This is used to align data. This is normally 337 // zero, except possibly for an object in an archive. 338 unsigned int byteshift_; 339 // Whether the view is cached. 340 bool cache_; 341 // Whether the view is mapped into memory. If not, data_ points 342 // to memory allocated using new[]. 343 Data_ownership data_ownership_; 344 // Whether the view has been accessed recently. 345 bool accessed_; 346 }; 347 348 friend class View; 349 friend class File_view; 350 351 // The type of a mapping from page start and byte shift to views. 352 typedef std::map<std::pair<off_t, unsigned int>, View*> Views; 353 354 // A simple list of Views. 355 typedef std::list<View*> Saved_views; 356 357 // Open the descriptor if necessary. 358 void 359 reopen_descriptor(); 360 361 // Find a view into the file. 362 View* 363 find_view(off_t start, section_size_type size, unsigned int byteshift, 364 View** vshifted) const; 365 366 // Read data from the file into a buffer. 367 void 368 do_read(off_t start, section_size_type size, void* p); 369 370 // Add a view. 371 void 372 add_view(View*); 373 374 // Make a view into the file. 375 View* 376 make_view(off_t start, section_size_type size, unsigned int byteshift, 377 bool cache); 378 379 // Find or make a view into the file. 380 View* 381 find_or_make_view(off_t offset, off_t start, section_size_type size, 382 bool aligned, bool cache); 383 384 // Clear the file views. 385 void 386 clear_views(Clear_views_mode); 387 388 // The size of a file page for buffering data. 389 static const off_t page_size = 8192; 390 391 // Given a file offset, return the page offset. 392 static off_t 393 page_offset(off_t file_offset) 394 { return file_offset & ~ (page_size - 1); } 395 396 // Given a file size, return the size to read integral pages. 397 static off_t 398 pages(off_t file_size) 399 { return (file_size + (page_size - 1)) & ~ (page_size - 1); } 400 401 // The maximum number of entries we will pass to ::readv. 402 static const size_t max_readv_entries = 128; 403 404 // Use readv to read data. 405 void 406 do_readv(off_t base, const Read_multiple&, size_t start, size_t count); 407 408 // File name. 409 std::string name_; 410 // File descriptor. 411 int descriptor_; 412 // Whether we have regained the descriptor after releasing the file. 413 bool is_descriptor_opened_; 414 // The number of objects associated with this file. This will be 415 // more than 1 in the case of an archive. 416 int object_count_; 417 // File size. 418 off_t size_; 419 // A token used to lock the file. 420 Task_token token_; 421 // Buffered views into the file. 422 Views views_; 423 // List of views which were locked but had to be removed from views_ 424 // because they were not large enough. 425 Saved_views saved_views_; 426 // Total amount of space mapped into memory. This is only changed 427 // while the file is locked. When we unlock the file, we transfer 428 // the total to total_mapped_bytes, and reset this to zero. 429 size_t mapped_bytes_; 430 // Whether the file was released. 431 bool released_; 432 // A view containing the whole file. May be NULL if we mmap only 433 // the relevant parts of the file. Not NULL if: 434 // - Flag --mmap_whole_files is set (default on 64-bit hosts). 435 // - The contents was specified in the constructor. Used only for 436 // testing purposes). 437 View* whole_file_view_; 438 }; 439 440 // A view of file data that persists even when the file is unlocked. 441 // Callers should destroy these when no longer required. These are 442 // obtained form File_read::get_lasting_view. They may only be 443 // destroyed when the underlying File_read is locked. 444 445 class File_view 446 { 447 public: 448 // This may only be called when the underlying File_read is locked. 449 ~File_view(); 450 451 // Return a pointer to the data associated with this view. 452 const unsigned char* 453 data() const 454 { return this->data_; } 455 456 private: 457 File_view(const File_view&); 458 File_view& operator=(const File_view&); 459 460 friend class File_read; 461 462 // Callers have to get these via File_read::get_lasting_view. 463 File_view(File_read& file, File_read::View* view, const unsigned char* data) 464 : file_(file), view_(view), data_(data) 465 { } 466 467 File_read& file_; 468 File_read::View* view_; 469 const unsigned char* data_; 470 }; 471 472 // All the information we hold for a single input file. This can be 473 // an object file, a shared library, or an archive. 474 475 class Input_file 476 { 477 public: 478 enum Format 479 { 480 FORMAT_NONE, 481 FORMAT_ELF, 482 FORMAT_BINARY 483 }; 484 485 Input_file(const Input_file_argument* input_argument) 486 : input_argument_(input_argument), found_name_(), file_(), 487 is_in_sysroot_(false), format_(FORMAT_NONE) 488 { } 489 490 // Create an input file with the contents already provided. This is 491 // only used for testing. With this path, don't call the open 492 // method. 493 Input_file(const Task*, const char* name, const unsigned char* contents, 494 off_t size); 495 496 // Return the command line argument. 497 const Input_file_argument* 498 input_file_argument() const 499 { return this->input_argument_; } 500 501 // Return whether this is a file that we will search for in the list 502 // of directories. 503 bool 504 will_search_for() const; 505 506 // Open the file. If the open fails, this will report an error and 507 // return false. If there is a search, it starts at directory 508 // *PINDEX. *PINDEX should be initialized to zero. It may be 509 // restarted to find the next file with a matching name by 510 // incrementing the result and calling this again. 511 bool 512 open(const Dirsearch&, const Task*, int* pindex); 513 514 // Return the name given by the user. For -lc this will return "c". 515 const char* 516 name() const; 517 518 // Return the file name. For -lc this will return something like 519 // "/usr/lib/libc.so". 520 const std::string& 521 filename() const 522 { return this->file_.filename(); } 523 524 // Return the name under which we found the file, corresponding to 525 // the command line. For -lc this will return something like 526 // "libc.so". 527 const std::string& 528 found_name() const 529 { return this->found_name_; } 530 531 // Return the position dependent options. 532 const Position_dependent_options& 533 options() const; 534 535 // Return the file. 536 File_read& 537 file() 538 { return this->file_; } 539 540 const File_read& 541 file() const 542 { return this->file_; } 543 544 // Whether we found the file in a directory in the system root. 545 bool 546 is_in_sysroot() const 547 { return this->is_in_sysroot_; } 548 549 // Whether this file is in a system directory. 550 bool 551 is_in_system_directory() const; 552 553 // Return whether this file is to be read only for its symbols. 554 bool 555 just_symbols() const; 556 557 // Return the format of the unconverted input file. 558 Format 559 format() const 560 { return this->format_; } 561 562 // Try to find a file in the extra search dirs. Returns true on success. 563 static bool 564 try_extra_search_path(int* pindex, 565 const Input_file_argument* input_argument, 566 std::string filename, std::string* found_name, 567 std::string* namep); 568 569 // Find the actual file. 570 static bool 571 find_file(const Dirsearch& dirpath, int* pindex, 572 const Input_file_argument* input_argument, 573 bool* is_in_sysroot, 574 std::string* found_name, std::string* namep); 575 576 private: 577 Input_file(const Input_file&); 578 Input_file& operator=(const Input_file&); 579 580 // Open a binary file. 581 bool 582 open_binary(const Task* task, const std::string& name); 583 584 // The argument from the command line. 585 const Input_file_argument* input_argument_; 586 // The name under which we opened the file. This is like the name 587 // on the command line, but -lc turns into libc.so (or whatever). 588 // It only includes the full path if the path was on the command 589 // line. 590 std::string found_name_; 591 // The file after we open it. 592 File_read file_; 593 // Whether we found the file in a directory in the system root. 594 bool is_in_sysroot_; 595 // Format of unconverted input file. 596 Format format_; 597 }; 598 599 } // end namespace gold 600 601 #endif // !defined(GOLD_FILEREAD_H) 602