Fix "pushw imm16" for x86-64 disassembler.
[binutils.git] / gold / script.h
blob70e3a59e7b44814caecd08017dacea5f94518a1e
1 // script.h -- handle linker scripts for gold -*- C++ -*-
3 // Copyright 2006, 2007, 2008, 2009, 2010 Free Software Foundation, Inc.
4 // Written by Ian Lance Taylor <iant@google.com>.
6 // This file is part of gold.
8 // This program is free software; you can redistribute it and/or modify
9 // it under the terms of the GNU General Public License as published by
10 // the Free Software Foundation; either version 3 of the License, or
11 // (at your option) any later version.
13 // This program is distributed in the hope that it will be useful,
14 // but WITHOUT ANY WARRANTY; without even the implied warranty of
15 // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 // GNU General Public License for more details.
18 // You should have received a copy of the GNU General Public License
19 // along with this program; if not, write to the Free Software
20 // Foundation, Inc., 51 Franklin Street - Fifth Floor, Boston,
21 // MA 02110-1301, USA.
23 // We implement a subset of the original GNU ld linker script language
24 // for compatibility. The goal is not to implement the entire
25 // language. It is merely to implement enough to handle common uses.
26 // In particular we need to handle /usr/lib/libc.so on a typical
27 // GNU/Linux system, and we want to handle linker scripts used by the
28 // Linux kernel build.
30 #ifndef GOLD_SCRIPT_H
31 #define GOLD_SCRIPT_H
33 #include <cstdio>
34 #include <string>
35 #include <vector>
37 #include "script-sections.h"
39 namespace gold
// Forward declarations. Where these types appear in this header they
// are used only through pointers, so incomplete types are enough.
42 class General_options;
43 class Command_line;
44 class Symbol_table;
45 class Layout;
46 class Mapfile;
47 class Input_argument;
48 class Input_arguments;
49 class Input_objects;
50 class Input_group;
51 class Input_file;
52 class Output_segment;
53 class Task_token;
54 class Workqueue;
55 struct Version_dependency_list;
56 struct Version_expression_list;
57 struct Version_tree;
58 struct Version_expression;
59 class Lazy_demangler;
61 // This class represents an expression in a linker script. It is an
// abstract base: print() and value() are pure virtual and must be
// supplied by child classes.
63 class Expression
65 protected:
66 // These should only be created by child classes.
67 Expression()
68 { }
70 public:
71 virtual ~Expression()
72 { }
74 // Return the value of the expression which is not permitted to
75 // refer to the dot symbol. CHECK_ASSERTIONS is true if we should
76 // check whether assertions are true.
77 uint64_t
78 eval(const Symbol_table*, const Layout*, bool check_assertions);
80 // Return the value of an expression which is permitted to refer to
81 // the dot symbol. DOT_VALUE is the absolute value of the dot
82 // symbol. DOT_SECTION is the section in which dot is defined; it
83 // should be NULL if the dot symbol has an absolute value (e.g., is
84 // defined in a SECTIONS clause outside of any output section
85 // definition). This sets *RESULT_SECTION to indicate where the
86 // value is defined. If the value is absolute *RESULT_SECTION will
87 // be NULL. Note that the returned value is still an absolute
88 // value; to get a section relative value the caller must subtract
89 // the section address. If RESULT_ALIGNMENT is not NULL, this sets
90 // *RESULT_ALIGNMENT to the alignment of the value if that alignment
91 // is larger than *RESULT_ALIGNMENT; this will only be non-zero if
92 // this is an ALIGN expression.
93 uint64_t
94 eval_with_dot(const Symbol_table*, const Layout*, bool check_assertions,
95 uint64_t dot_value, Output_section* dot_section,
96 Output_section** result_section, uint64_t* result_alignment);
98 // Return the value of an expression which may or may not be
99 // permitted to refer to the dot symbol, depending on
100 // IS_DOT_AVAILABLE. The remaining parameters have the same names
// as those of eval_with_dot.
101 uint64_t
102 eval_maybe_dot(const Symbol_table*, const Layout*, bool check_assertions,
103 bool is_dot_available, uint64_t dot_value,
104 Output_section* dot_section,
105 Output_section** result_section, uint64_t* result_alignment);
107 // Print the expression to the FILE. This is for debugging.
108 virtual void
109 print(FILE*) const = 0;
111 protected:
// The evaluation context handed to value(). It is only declared
// here; its members are not visible in this header.
112 struct Expression_eval_info;
114 public:
115 // Compute the value of the expression (implemented by child class).
116 // This is public rather than protected because it is called
117 // directly by children of Expression on other Expression objects.
118 virtual uint64_t
119 value(const Expression_eval_info*) = 0;
121 private:
122 // May not be copied: the copy constructor and copy assignment
// operator are declared private and not defined in this header.
123 Expression(const Expression&);
124 Expression& operator=(const Expression&);
128 // Version_script_info stores information parsed from the version
129 // script, either provided by --version-script or as part of a linker
130 // script. A single Version_script_info object per target is owned by
131 // Script_options.
133 class Version_script_info
135 public:
136 // The languages which can be specified in a version script.
137 enum Language
139 LANGUAGE_C, // No demangling.
140 LANGUAGE_CXX, // C++ demangling.
141 LANGUAGE_JAVA, // Java demangling.
142 LANGUAGE_COUNT // Number of languages; sizes the exact_ array.
145 Version_script_info();
147 ~Version_script_info();
149 // Clear everything.
150 void
151 clear();
153 // Finalize the version control information.
154 void
155 finalize();
157 // Return whether the information is finalized.
158 bool
159 is_finalized() const
160 { return this->is_finalized_; }
162 // Return whether no versions were defined in the version script
// (i.e., whether the list of version trees is empty).
163 bool
164 empty() const
165 { return this->version_trees_.empty(); }
167 // If there is a version associated with SYMBOL, return true, and
168 // set *VERSION to the version, and *IS_GLOBAL to whether the symbol
169 // should be global. Otherwise, return false.
170 bool
171 get_symbol_version(const char* symbol, std::string* version,
172 bool* is_global) const;
174 // Return whether this symbol matches the local: section of some
175 // version.
176 bool
177 symbol_is_local(const char* symbol) const
// IS_GLOBAL is left uninitialized on purpose: it is only read when
// get_symbol_version returns true, because && short-circuits.
179 bool is_global;
// The version name is not needed here, so NULL is passed for VERSION.
180 return (this->get_symbol_version(symbol, NULL, &is_global)
181 && !is_global);
184 // Return the names of versions defined in the version script.
185 std::vector<std::string>
186 get_versions() const;
188 // Return the list of dependencies for this version.
189 std::vector<std::string>
190 get_dependencies(const char* version) const;
192 // The following functions should only be used by the bison helper
193 // functions. They allocate new structs whose memory belongs to
194 // Version_script_info. The bison functions copy the information
195 // from the version script into these structs.
196 struct Version_dependency_list*
197 allocate_dependency_list();
199 struct Version_expression_list*
200 allocate_expression_list();
202 struct Version_tree*
203 allocate_version_tree();
205 // Build the lookup tables after all data have been read.
206 void
207 build_lookup_tables();
209 // Give an error if there are any unmatched names in the version
210 // script.
211 void
212 check_unmatched_names(const Symbol_table*) const;
214 // Print contents to the FILE. This is for debugging.
215 void
216 print(FILE*) const;
218 private:
// Print one expression list to F.
// NOTE(review): presumably a helper for print(); confirm in the
// definition.
219 void
220 print_expression_list(FILE* f, const Version_expression_list*) const;
// NOTE(review): presumably the shared lookup behind
// get_symbol_version; the meaning of CHECK_GLOBAL is not visible in
// this header -- confirm in the definition.
222 bool
223 get_symbol_version_helper(const char* symbol,
224 bool check_global,
225 std::string* pversion) const;
227 // Fast lookup information for a given language.
229 // We map from exact match strings to Version_tree's. Historically
230 // version scripts sometimes have the same symbol multiple times,
231 // which is ambiguous. We warn about that case by storing the
232 // second Version_tree we see.
233 struct Version_tree_match
// A new match starts out unambiguous: AMBIGUOUS is set to NULL.
235 Version_tree_match(const Version_tree* r, bool ig,
236 const Version_expression* e)
237 : real(r), is_global(ig), expression(e), ambiguous(NULL)
240 // The Version_tree that we return.
241 const Version_tree* real;
242 // True if this is a global match for the REAL member, false if it
243 // is a local match.
244 bool is_global;
245 // Point back to the Version_expression for which we created this
246 // match.
247 const Version_expression* expression;
248 // If not NULL, another Version_tree that defines the symbol.
249 const Version_tree* ambiguous;
252 // Map from an exact match string to a Version_tree.
254 typedef Unordered_map<std::string, Version_tree_match> Exact;
256 // Fast lookup information for a glob pattern.
257 struct Glob
// The default-constructed Glob has NULL pointers and is not global.
259 Glob()
260 : expression(NULL), version(NULL), is_global(false)
263 Glob(const Version_expression* e, const Version_tree* v, bool ig)
264 : expression(e), version(v), is_global(ig)
267 // A pointer to the version expression holding the pattern to
268 // match and the language to use for demangling the symbol before
269 // doing the match.
270 const Version_expression* expression;
271 // The Version_tree we use if this pattern matches.
272 const Version_tree* version;
273 // True if this is a global symbol.
274 bool is_global;
277 typedef std::vector<Glob> Globs;
// NOTE(review): the contract of the four helpers below is not
// visible in this header; see their definitions before relying on
// them.
279 bool
280 unquote(std::string*) const;
282 void
283 add_exact_match(const std::string&, const Version_tree*, bool is_global,
284 const Version_expression*, Exact*);
286 void
287 build_expression_list_lookup(const Version_expression_list*,
288 const Version_tree*, bool);
290 const char*
291 get_name_to_match(const char*, int,
292 Lazy_demangler*, Lazy_demangler*) const;
294 // All the version dependencies we allocate.
295 std::vector<Version_dependency_list*> dependency_lists_;
296 // All the version expressions we allocate.
297 std::vector<Version_expression_list*> expression_lists_;
298 // The list of versions.
299 std::vector<Version_tree*> version_trees_;
300 // Exact matches for global symbols, by language.
301 Exact* exact_[LANGUAGE_COUNT];
302 // A vector of glob patterns mapping to Version_trees.
303 Globs globs_;
304 // The default version to use, if there is one. This is from a
305 // pattern of "*".
306 const Version_tree* default_version_;
307 // True if the default version is global.
308 bool default_is_global_;
309 // Whether this has been finalized.
310 bool is_finalized_;
313 // This class manages assignments to symbols. These can appear in
314 // three different locations in scripts: outside of a SECTIONS clause,
315 // within a SECTIONS clause, and within an output section definition
316 // within a SECTIONS clause. This can also appear on the command line
317 // via the --defsym command line option.
319 class Symbol_assignment
321 public:
// NAME need not be NUL-terminated: NAMELEN characters of it are
// copied into name_. VAL is stored as a raw pointer. The symbol
// table entry sym_ starts out NULL.
322 Symbol_assignment(const char* name, size_t namelen, bool is_defsym,
323 Expression* val, bool provide, bool hidden)
324 : name_(name, namelen), val_(val), is_defsym_(is_defsym),
325 provide_(provide), hidden_(hidden), sym_(NULL)
328 // Add the symbol to the symbol table.
329 void
330 add_to_table(Symbol_table*);
332 // Finalize the symbol value.
333 void
334 finalize(Symbol_table*, const Layout*);
336 // Finalize the symbol value when it can refer to the dot symbol.
337 void
338 finalize_with_dot(Symbol_table*, const Layout*, uint64_t dot_value,
339 Output_section* dot_section);
341 // Set the symbol value, but only if the value is absolute. This is
342 // used while processing a SECTIONS clause. We assume that dot is
343 // an absolute value here. We do not check assertions.
344 void
345 set_if_absolute(Symbol_table*, const Layout*, bool is_dot_available,
346 uint64_t dot_value);
348 // Print the assignment to the FILE. This is for debugging.
349 void
350 print(FILE*) const;
352 private:
353 // Shared by finalize and finalize_with_dot.
354 void
355 finalize_maybe_dot(Symbol_table*, const Layout*, bool is_dot_available,
356 uint64_t dot_value, Output_section* dot_section);
358 // Sized version of finalize. SIZE is a template parameter.
// NOTE(review): presumably the target word size in bits; confirm in
// the definition.
359 template<int size>
360 void
361 sized_finalize(Symbol_table*, const Layout*, bool is_dot_available,
362 uint64_t dot_value, Output_section*);
364 // Symbol name.
365 std::string name_;
366 // Expression to assign to symbol.
367 Expression* val_;
368 // True if this symbol is defined by a --defsym, false if it is
369 // defined in a linker script.
370 bool is_defsym_;
371 // Whether the assignment should be provided (only set if there is
372 // an undefined reference to the symbol).
373 bool provide_;
374 // Whether the assignment should be hidden.
375 bool hidden_;
376 // The entry in the symbol table.
377 Symbol* sym_;
380 // This class manages assertions in linker scripts. These can appear
381 // in all the places where a Symbol_assignment can appear.
383 class Script_assertion
385 public:
// MESSAGE need not be NUL-terminated: MESSAGELEN characters of it
// are copied into message_. CHECK is stored as a raw pointer.
386 Script_assertion(Expression* check, const char* message,
387 size_t messagelen)
388 : check_(check), message_(message, messagelen)
391 // Check the assertion.
392 void
393 check(const Symbol_table*, const Layout*);
395 // Print the assertion to the FILE. This is for debugging.
396 void
397 print(FILE*) const;
399 private:
400 // The expression to check.
401 Expression* check_;
402 // The message to issue if the expression fails.
403 std::string message_;
406 // We can read a linker script in two different contexts: when
407 // initially parsing the command line, and when we find an input file
408 // which is actually a linker script. Also some of the data which can
409 // be set by a linker script can also be set via command line options
410 // like -e and --defsym. This means that we have a type of data which
411 // can be set both during command line option parsing and while
412 // reading input files. We store that data in an instance of this
413 // object. We will keep pointers to that instance in both the
414 // Command_line and Layout objects.
416 class Script_options
418 public:
419 Script_options();
421 // Add a symbol to be defined.
422 void
423 add_symbol_assignment(const char* name, size_t length, bool is_defsym,
424 Expression* value, bool provide, bool hidden);
426 // Add a reference to a symbol.
427 void
428 add_symbol_reference(const char* name, size_t length);
430 // Add an assertion.
431 void
432 add_assertion(Expression* check, const char* message, size_t messagelen);
434 // Define a symbol from the command line.
435 bool
436 define_symbol(const char* definition);
438 // Create sections required by any linker scripts.
439 void
440 create_script_sections(Layout*);
442 // Add all symbol definitions to the symbol table.
443 void
444 add_symbols_to_table(Symbol_table*);
446 // Used to iterate over symbols which are referenced in expressions
447 // but not defined.
448 typedef Unordered_set<std::string>::const_iterator referenced_const_iterator;
450 referenced_const_iterator
451 referenced_begin() const
452 { return this->symbol_references_.begin(); }
454 referenced_const_iterator
455 referenced_end() const
456 { return this->symbol_references_.end(); }
458 // Return whether a symbol is referenced but not defined. This is
// a lookup of NAME in symbol_references_.
459 bool
460 is_referenced(const std::string& name) const
462 return (this->symbol_references_.find(name)
463 != this->symbol_references_.end());
466 // Return whether there are any symbols which were referenced but
467 // not defined. NOTE: despite the name, this returns true when
// symbol_references_ is non-empty.
468 bool
469 any_unreferenced() const
470 { return !this->symbol_references_.empty(); }
472 // Finalize the symbol values. Also check assertions.
473 void
474 finalize_symbols(Symbol_table*, const Layout*);
476 // Version information parsed from a version script. Everything
477 // else has a pointer to this object.
478 Version_script_info*
479 version_script_info()
480 { return &this->version_script_info_; }
482 const Version_script_info*
483 version_script_info() const
484 { return &this->version_script_info_; }
486 // A SECTIONS clause parsed from a linker script. Everything else
487 // has a pointer to this object.
488 Script_sections*
489 script_sections()
490 { return &this->script_sections_; }
492 const Script_sections*
493 script_sections() const
494 { return &this->script_sections_; }
496 // Whether we saw a SECTIONS clause.
497 bool
498 saw_sections_clause() const
499 { return this->script_sections_.saw_sections_clause(); }
501 // Whether we saw a PHDRS clause.
502 bool
503 saw_phdrs_clause() const
504 { return this->script_sections_.saw_phdrs_clause(); }
506 // Set section addresses using a SECTIONS clause. Return the
507 // segment which should hold the file header and segment headers;
508 // this may return NULL, in which case the headers are not in a
509 // loadable segment.
510 Output_segment*
511 set_section_addresses(Symbol_table*, Layout*);
513 // Print the script to the FILE. This is for debugging.
514 void
515 print(FILE*) const;
517 private:
518 // We keep a list of symbol assignments which occur outside of a
519 // SECTIONS clause.
520 typedef std::vector<Symbol_assignment*> Symbol_assignments;
522 // We keep a list of all assertions which occur outside of a
523 // SECTIONS clause.
524 typedef std::vector<Script_assertion*> Assertions;
526 // The entry address. This will be empty if not set.
527 std::string entry_;
528 // Symbols to set.
529 Symbol_assignments symbol_assignments_;
530 // Symbols defined in an expression, for faster lookup.
531 Unordered_set<std::string> symbol_definitions_;
532 // Symbols referenced in an expression.
533 Unordered_set<std::string> symbol_references_;
534 // Assertions to check.
535 Assertions assertions_;
536 // Version information parsed from a version script.
537 Version_script_info version_script_info_;
538 // Information from any SECTIONS clauses.
539 Script_sections script_sections_;
542 // Information about a script input that will persist during the whole linker
543 // run. Needed only during an incremental build to retrieve the input files
544 // added by this script.
546 class Script_info
548 public:
// INPUTS is stored as given; the pointed-to Input_arguments is not
// copied.
// NOTE(review): this single-argument constructor is not explicit, so
// an Input_arguments* converts implicitly to a Script_info.
549 Script_info(Input_arguments* inputs)
550 : inputs_(inputs)
553 // Returns the input files included because of this script.
554 Input_arguments*
555 inputs()
556 { return this->inputs_; }
558 private:
// The input files added by this script, as passed to the constructor.
559 Input_arguments* inputs_;
562 // FILE was found as an argument on the command line, but was not
563 // recognized as an ELF file. Try to read it as a script. Return
564 // true if the file was handled. This has to handle /usr/lib/libc.so
565 // on a GNU/Linux system. *USED_NEXT_BLOCKER is set to indicate
566 // whether the function took over NEXT_BLOCKER.
// Only NEXT_BLOCKER and USED_NEXT_BLOCKER are named in this
// declaration; the other parameters are unnamed here, so see the
// definition for their meaning.
568 bool
569 read_input_script(Workqueue*, Symbol_table*, Layout*, Dirsearch*, int,
570 Input_objects*, Mapfile*, Input_group*,
571 const Input_argument*, Input_file*,
572 Task_token* next_blocker, bool* used_next_blocker);
574 // FILENAME was found as an argument to --script (-T).
575 // Read it as a script, and execute its contents immediately.
577 bool
578 read_commandline_script(const char* filename, Command_line* cmdline);
580 // FILENAME was found as an argument to --version-script. Read it as a
581 // version script, and store its contents in
582 // cmdline->script_options()->version_script_info().
584 bool
585 read_version_script(const char* filename, Command_line* cmdline);
587 // FILENAME was found as an argument to --dynamic-list. Read it as a
588 // version script (actually, a versym_node from a version script), and
589 // store its contents in DYNAMIC_LIST.
// NOTE(review): the meaning of the bool result is not stated in this
// header; presumably true on success -- confirm in the definition.
591 bool
592 read_dynamic_list(const char* filename, Command_line* cmdline,
593 Script_options* dynamic_list);
595 } // End namespace gold.
597 #endif // !defined(GOLD_SCRIPT_H)