2009-07-03 Tristan Gingold <gingold@adacore.com>
[binutils.git] / gold / fileread.h
blob4d19824f04174e181fc29d70ee726e92cf6a6a3e
1 // fileread.h -- read files for gold -*- C++ -*-
3 // Copyright 2006, 2007, 2008, 2009 Free Software Foundation, Inc.
4 // Written by Ian Lance Taylor <iant@google.com>.
6 // This file is part of gold.
8 // This program is free software; you can redistribute it and/or modify
9 // it under the terms of the GNU General Public License as published by
10 // the Free Software Foundation; either version 3 of the License, or
11 // (at your option) any later version.
13 // This program is distributed in the hope that it will be useful,
14 // but WITHOUT ANY WARRANTY; without even the implied warranty of
15 // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 // GNU General Public License for more details.
18 // You should have received a copy of the GNU General Public License
19 // along with this program; if not, write to the Free Software
20 // Foundation, Inc., 51 Franklin Street - Fifth Floor, Boston,
21 // MA 02110-1301, USA.
23 // Classes used to read data from binary input files.
25 #ifndef GOLD_FILEREAD_H
26 #define GOLD_FILEREAD_H
28 #include <list>
29 #include <map>
30 #include <string>
31 #include <vector>
33 #include "token.h"
35 namespace gold
// Forward declarations.  Position_dependent_options, Input_file_argument
// and Dirsearch are only used by pointer or reference in this header;
// File_view is defined later in this header, after File_read.
class Position_dependent_options;
class Input_file_argument;
class Dirsearch;
class File_view;
43 // File_read manages a file descriptor and mappings for a file we are
44 // reading.
46 class File_read
48 public:
49 File_read()
50 : name_(), descriptor_(-1), is_descriptor_opened_(false), object_count_(0),
51 size_(0), token_(false), views_(), saved_views_(), contents_(NULL),
52 mapped_bytes_(0), released_(true)
53 { }
55 ~File_read();
57 // Open a file.
58 bool
59 open(const Task*, const std::string& name);
61 // Pretend to open the file, but provide the file contents. No
62 // actual file system activity will occur. This is used for
63 // testing.
64 bool
65 open(const Task*, const std::string& name, const unsigned char* contents,
66 off_t size);
68 // Return the file name.
69 const std::string&
70 filename() const
71 { return this->name_; }
73 // Add an object associated with a file.
74 void
75 add_object()
76 { ++this->object_count_; }
78 // Remove an object associated with a file.
79 void
80 remove_object()
81 { --this->object_count_; }
83 // Lock the file for exclusive access within a particular Task::run
84 // execution. This routine may only be called when the workqueue
85 // lock is held.
86 void
87 lock(const Task* t);
89 // Unlock the file.
90 void
91 unlock(const Task* t);
93 // Test whether the object is locked.
94 bool
95 is_locked() const;
97 // Return the token, so that the task can be queued.
98 Task_token*
99 token()
100 { return &this->token_; }
102 // Release the file. This indicates that we aren't going to do
103 // anything further with it until it is unlocked. This is used
104 // because a Task which locks the file never calls either lock or
105 // unlock; it just locks the token. The basic rule is that a Task
106 // which locks a file via the Task::locks interface must explicitly
107 // call release() when it is done. This is not necessary for code
108 // which calls unlock() on the file.
109 void
110 release();
112 // Return the size of the file.
113 off_t
114 filesize() const
115 { return this->size_; }
117 // Return a view into the file starting at file offset START for
118 // SIZE bytes. OFFSET is the offset into the input file for the
119 // file we are reading; this is zero for a normal object file,
120 // non-zero for an object file in an archive. ALIGNED is true if
121 // the data must be naturally aligned; this only matters when OFFSET
122 // is not zero. The pointer will remain valid until the File_read
123 // is unlocked. It is an error if we can not read enough data from
124 // the file. The CACHE parameter is a hint as to whether it will be
125 // useful to cache this data for later accesses--i.e., later calls
126 // to get_view, read, or get_lasting_view which retrieve the same
127 // data.
128 const unsigned char*
129 get_view(off_t offset, off_t start, section_size_type size, bool aligned,
130 bool cache);
132 // Read data from the file into the buffer P starting at file offset
133 // START for SIZE bytes.
134 void
135 read(off_t start, section_size_type size, void* p);
137 // Return a lasting view into the file starting at file offset START
138 // for SIZE bytes. This is allocated with new, and the caller is
139 // responsible for deleting it when done. The data associated with
140 // this view will remain valid until the view is deleted. It is an
141 // error if we can not read enough data from the file. The OFFSET,
142 // ALIGNED and CACHE parameters are as in get_view.
143 File_view*
144 get_lasting_view(off_t offset, off_t start, section_size_type size,
145 bool aligned, bool cache);
147 // Mark all views as no longer cached.
148 void
149 clear_view_cache_marks();
151 // Discard all uncached views. This is normally done by release(),
152 // but not for objects in archives. FIXME: This is a complicated
153 // interface, and it would be nice to have something more automatic.
154 void
155 clear_uncached_views()
156 { this->clear_views(false); }
158 // A struct used to do a multiple read.
159 struct Read_multiple_entry
161 // The file offset of the data to read.
162 off_t file_offset;
163 // The amount of data to read.
164 section_size_type size;
165 // The buffer where the data should be placed.
166 unsigned char* buffer;
168 Read_multiple_entry(off_t o, section_size_type s, unsigned char* b)
169 : file_offset(o), size(s), buffer(b)
173 typedef std::vector<Read_multiple_entry> Read_multiple;
175 // Read a bunch of data from the file into various different
176 // locations. The vector must be sorted by ascending file_offset.
177 // BASE is a base offset to be added to all the offsets in the
178 // vector.
179 void
180 read_multiple(off_t base, const Read_multiple&);
182 // Dump statistical information to stderr.
183 static void
184 print_stats();
186 // Return the open file descriptor (for plugins).
188 descriptor()
190 this->reopen_descriptor();
191 return this->descriptor_;
194 private:
195 // This class may not be copied.
196 File_read(const File_read&);
197 File_read& operator=(const File_read&);
199 // Total bytes mapped into memory during the link. This variable
200 // may not be accurate when running multi-threaded.
201 static unsigned long long total_mapped_bytes;
203 // Current number of bytes mapped into memory during the link. This
204 // variable may not be accurate when running multi-threaded.
205 static unsigned long long current_mapped_bytes;
207 // High water mark of bytes mapped into memory during the link.
208 // This variable may not be accurate when running multi-threaded.
209 static unsigned long long maximum_mapped_bytes;
211 // A view into the file.
212 class View
214 public:
215 View(off_t start, section_size_type size, const unsigned char* data,
216 unsigned int byteshift, bool cache, bool mapped)
217 : start_(start), size_(size), data_(data), lock_count_(0),
218 byteshift_(byteshift), cache_(cache), mapped_(mapped), accessed_(true)
221 ~View();
223 off_t
224 start() const
225 { return this->start_; }
227 section_size_type
228 size() const
229 { return this->size_; }
231 const unsigned char*
232 data() const
233 { return this->data_; }
235 void
236 lock();
238 void
239 unlock();
241 bool
242 is_locked();
244 unsigned int
245 byteshift() const
246 { return this->byteshift_; }
248 void
249 set_cache()
250 { this->cache_ = true; }
252 void
253 clear_cache()
254 { this->cache_ = false; }
256 bool
257 should_cache() const
258 { return this->cache_; }
260 void
261 set_accessed()
262 { this->accessed_ = true; }
264 void
265 clear_accessed()
266 { this->accessed_= false; }
268 bool
269 accessed() const
270 { return this->accessed_; }
272 private:
273 View(const View&);
274 View& operator=(const View&);
276 // The file offset of the start of the view.
277 off_t start_;
278 // The size of the view.
279 section_size_type size_;
280 // A pointer to the actual bytes.
281 const unsigned char* data_;
282 // The number of locks on this view.
283 int lock_count_;
284 // The number of bytes that the view is shifted relative to the
285 // underlying file. This is used to align data. This is normally
286 // zero, except possibly for an object in an archive.
287 unsigned int byteshift_;
288 // Whether the view is cached.
289 bool cache_;
290 // Whether the view is mapped into memory. If not, data_ points
291 // to memory allocated using new[].
292 bool mapped_;
293 // Whether the view has been accessed recently.
294 bool accessed_;
297 friend class View;
298 friend class File_view;
300 // The type of a mapping from page start and byte shift to views.
301 typedef std::map<std::pair<off_t, unsigned int>, View*> Views;
303 // A simple list of Views.
304 typedef std::list<View*> Saved_views;
306 // Open the descriptor if necessary.
307 void
308 reopen_descriptor();
310 // Find a view into the file.
311 View*
312 find_view(off_t start, section_size_type size, unsigned int byteshift,
313 View** vshifted) const;
315 // Read data from the file into a buffer.
316 void
317 do_read(off_t start, section_size_type size, void* p);
319 // Add a view.
320 void
321 add_view(View*);
323 // Make a view into the file.
324 View*
325 make_view(off_t start, section_size_type size, unsigned int byteshift,
326 bool cache);
328 // Find or make a view into the file.
329 View*
330 find_or_make_view(off_t offset, off_t start, section_size_type size,
331 bool aligned, bool cache);
333 // Clear the file views.
334 void
335 clear_views(bool);
337 // The size of a file page for buffering data.
338 static const off_t page_size = 8192;
340 // Given a file offset, return the page offset.
341 static off_t
342 page_offset(off_t file_offset)
343 { return file_offset & ~ (page_size - 1); }
345 // Given a file size, return the size to read integral pages.
346 static off_t
347 pages(off_t file_size)
348 { return (file_size + (page_size - 1)) & ~ (page_size - 1); }
350 // The maximum number of entries we will pass to ::readv.
351 static const size_t max_readv_entries = 128;
353 // Use readv to read data.
354 void
355 do_readv(off_t base, const Read_multiple&, size_t start, size_t count);
357 // File name.
358 std::string name_;
359 // File descriptor.
360 int descriptor_;
361 // Whether we have regained the descriptor after releasing the file.
362 bool is_descriptor_opened_;
363 // The number of objects associated with this file. This will be
364 // more than 1 in the case of an archive.
365 int object_count_;
366 // File size.
367 off_t size_;
368 // A token used to lock the file.
369 Task_token token_;
370 // Buffered views into the file.
371 Views views_;
372 // List of views which were locked but had to be removed from views_
373 // because they were not large enough.
374 Saved_views saved_views_;
375 // Specified file contents. Used only for testing purposes.
376 const unsigned char* contents_;
377 // Total amount of space mapped into memory. This is only changed
378 // while the file is locked. When we unlock the file, we transfer
379 // the total to total_mapped_bytes, and reset this to zero.
380 size_t mapped_bytes_;
381 // Whether the file was released.
382 bool released_;
385 // A view of file data that persists even when the file is unlocked.
386 // Callers should destroy these when no longer required. These are
387 // obtained form File_read::get_lasting_view. They may only be
388 // destroyed when the underlying File_read is locked.
390 class File_view
392 public:
393 // This may only be called when the underlying File_read is locked.
394 ~File_view();
396 // Return a pointer to the data associated with this view.
397 const unsigned char*
398 data() const
399 { return this->data_; }
401 private:
402 File_view(const File_view&);
403 File_view& operator=(const File_view&);
405 friend class File_read;
407 // Callers have to get these via File_read::get_lasting_view.
408 File_view(File_read& file, File_read::View* view, const unsigned char* data)
409 : file_(file), view_(view), data_(data)
412 File_read& file_;
413 File_read::View* view_;
414 const unsigned char* data_;
417 // All the information we hold for a single input file. This can be
418 // an object file, a shared library, or an archive.
420 class Input_file
422 public:
423 Input_file(const Input_file_argument* input_argument)
424 : input_argument_(input_argument), found_name_(), file_(),
425 is_in_sysroot_(false)
428 // Create an input file with the contents already provided. This is
429 // only used for testing. With this path, don't call the open
430 // method.
431 Input_file(const Task*, const char* name, const unsigned char* contents,
432 off_t size);
434 // Return the command line argument.
435 const Input_file_argument*
436 input_file_argument() const
437 { return this->input_argument_; }
439 // Return whether this is a file that we will search for in the list
440 // of directories.
441 bool
442 will_search_for() const;
444 // Open the file. If the open fails, this will report an error and
445 // return false. If there is a search, it starts at directory
446 // *PINDEX. *PINDEX should be initialized to zero. It may be
447 // restarted to find the next file with a matching name by
448 // incrementing the result and calling this again.
449 bool
450 open(const Dirsearch&, const Task*, int *pindex);
452 // Return the name given by the user. For -lc this will return "c".
453 const char*
454 name() const;
456 // Return the file name. For -lc this will return something like
457 // "/usr/lib/libc.so".
458 const std::string&
459 filename() const
460 { return this->file_.filename(); }
462 // Return the name under which we found the file, corresponding to
463 // the command line. For -lc this will return something like
464 // "libc.so".
465 const std::string&
466 found_name() const
467 { return this->found_name_; }
469 // Return the position dependent options.
470 const Position_dependent_options&
471 options() const;
473 // Return the file.
474 File_read&
475 file()
476 { return this->file_; }
478 const File_read&
479 file() const
480 { return this->file_; }
482 // Whether we found the file in a directory in the system root.
483 bool
484 is_in_sysroot() const
485 { return this->is_in_sysroot_; }
487 // Whether this file is in a system directory.
488 bool
489 is_in_system_directory() const;
491 // Return whether this file is to be read only for its symbols.
492 bool
493 just_symbols() const;
495 private:
496 Input_file(const Input_file&);
497 Input_file& operator=(const Input_file&);
499 // Open a binary file.
500 bool
501 open_binary(const Task* task, const std::string& name);
503 // The argument from the command line.
504 const Input_file_argument* input_argument_;
505 // The name under which we opened the file. This is like the name
506 // on the command line, but -lc turns into libc.so (or whatever).
507 // It only includes the full path if the path was on the command
508 // line.
509 std::string found_name_;
510 // The file after we open it.
511 File_read file_;
512 // Whether we found the file in a directory in the system root.
513 bool is_in_sysroot_;
516 } // end namespace gold
518 #endif // !defined(GOLD_FILEREAD_H)