1 /* yyscript.y -- linker script grammar for gold. */
3 /* Copyright 2006, 2007, 2008 Free Software Foundation, Inc.
4 Written by Ian Lance Taylor <iant@google.com>.
6 This file is part of gold.
8 This program is free software; you can redistribute it and/or modify
9 it under the terms of the GNU General Public License as published by
10 the Free Software Foundation; either version 3 of the License, or
11 (at your option) any later version.
13 This program is distributed in the hope that it will be useful,
14 but WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 GNU General Public License for more details.
18 You should have received a copy of the GNU General Public License
19 along with this program; if not, write to the Free Software
20 Foundation, Inc., 51 Franklin Street - Fifth Floor, Boston,
21 MA 02110-1301, USA. */
23 /* This is a bison grammar to parse a subset of the original GNU ld
24 linker script language. */
39 /* We need to use a pure parser because we might be multi-threaded.
40 We pass some arguments through the parser to the lexer. */
44 %parse
-param
{void* closure
}
45 %lex
-param
{void* closure
}
47 /* Since we require bison anyhow, we take advantage of it. */
51 /* The values associated with tokens. */
55 struct Parser_string
string;
60 /* An output section header. */
61 struct Parser_output_section_header output_section_header
;
62 /* An output section trailer. */
63 struct Parser_output_section_trailer output_section_trailer
;
64 /* A section constraint. */
65 enum Section_constraint constraint
;
66 /* A complete input section specification. */
67 struct Input_section_spec input_section_spec
;
68 /* A list of wildcard specifications, with exclusions. */
69 struct Wildcard_sections wildcard_sections
;
70 /* A single wildcard specification. */
71 struct Wildcard_section wildcard_section
;
72 /* A list of strings. */
73 String_list_ptr string_list
;
74 /* Information for a program header. */
75 struct Phdr_info phdr_info
;
76 /* Used for version scripts and within VERSION {}. */
77 struct Version_dependency_list
* deplist
;
78 struct Version_expression_list
* versyms
;
79 struct Version_tree
* versnode
;
82 /* Operators, including a precedence table for expressions. */
/* The assignment operators ('=' and the compound forms) are declared
   right-associative.  */
84 %right PLUSEQ MINUSEQ MULTEQ DIVEQ
'=' LSHIFTEQ RSHIFTEQ ANDEQ OREQ
97 /* A fake operator used to indicate unary operator precedence. */
/* Terminals that carry a semantic value: STRING and QUOTED_STRING use
   the <string> value type, INTEGER uses the <integer> value type.  */
102 %token
<string> STRING
103 %token
<string> QUOTED_STRING
104 %token
<integer
> INTEGER
106 /* Keywords. This list is taken from ldgram.y and ldlex.l in the old
107 GNU linker, with the keywords which only appear in MRI mode
108 removed. Not all these keywords are actually used in this grammar.
109 In most cases the keyword is recognized as the token name in upper
110 case. The comments indicate where this is not the case. */
114 %token ALIGN_K
/* ALIGN */
116 %token ASSERT_K
/* ASSERT */
124 %token CREATE_OBJECT_SYMBOLS
125 %token DATA_SEGMENT_ALIGN
126 %token DATA_SEGMENT_END
127 %token DATA_SEGMENT_RELRO_END
134 %token FORCE_COMMON_ALLOCATION
135 %token GLOBAL
/* global */
139 %token INHIBIT_COMMON_ALLOCATION
142 %token LENGTH
/* LENGTH, l, len */
144 %token LOCAL
/* local */
147 %token MAX_K
/* MAX */
149 %token MIN_K
/* MIN */
155 %token ORIGIN
/* ORIGIN, o, org */
162 %token PROVIDE_HIDDEN
169 %token SIZEOF_HEADERS
/* SIZEOF_HEADERS, sizeof_headers */
170 %token SORT_BY_ALIGNMENT
177 %token TARGET_K
/* TARGET */
179 %token VERSIONK
/* VERSION */
181 /* Keywords, part 2. These are keywords that are unique to gold,
182 and not present in the old GNU linker. As before, unless the
183 comments say otherwise, the keyword is recognized as the token
184 name in upper case. */
188 /* Special tokens used to tell the grammar what type of tokens we are
189 parsing. The token stream always begins with one of these tokens.
190 We do this because version scripts can appear embedded within
191 linker scripts, and because --defsym uses the expression parser. */
193 %token PARSING_LINKER_SCRIPT
194 %token PARSING_VERSION_SCRIPT
195 %token PARSING_DEFSYM
197 /* Non-terminal types, where needed. */
199 %type
<expr
> parse_exp exp opt_address_and_section_type
200 %type
<expr
> opt_at opt_align opt_subalign opt_fill
201 %type
<output_section_header
> section_header
202 %type
<output_section_trailer
> section_trailer
203 %type
<constraint
> opt_constraint
204 %type
<string_list
> opt_phdr
205 %type
<integer
> data_length
206 %type
<input_section_spec
> input_section_no_keep
207 %type
<wildcard_sections
> wildcard_sections
208 %type
<wildcard_section
> wildcard_file wildcard_section
209 %type
<string_list
> exclude_names
210 %type
<string> wildcard_name
211 %type
<integer
> phdr_type
212 %type
<phdr_info
> phdr_info
213 %type
<versyms
> vers_defns
214 %type
<versnode
> vers_tag
215 %type
<deplist
> verdep
216 %type
<string> string
220 /* Read the special token to see what to read next. */
222 PARSING_LINKER_SCRIPT linker_script
223 | PARSING_VERSION_SCRIPT version_script
224 | PARSING_DEFSYM defsym_expr
227 /* A file contains a list of commands. */
229 linker_script file_cmd
233 /* A command which may appear at top level of a linker script. */
236 { script_start_group
(closure
); }
238 { script_end_group
(closure
); }
239 | OPTION
'(' string ')'
240 { script_parse_option
(closure
, $3.value
, $3.length
); }
241 | PHDRS
'{' phdrs_defs
'}'
242 | SEARCH_DIR
'(' string ')'
243 { script_add_search_dir
(closure
, $3.value
, $3.length
); }
245 { script_start_sections
(closure
); }
247 { script_finish_sections
(closure
); }
249 { script_push_lex_into_version_mode
(closure
); }
251 { script_pop_lex_mode
(closure
); }
252 | file_or_sections_cmd
257 /* Top level commands which we ignore. The GNU linker uses these to
258 select the output format, but we don't offer a choice. Ignoring
259 these is more-or-less OK since most scripts simply explicitly
260 choose the default. */
262 OUTPUT_FORMAT
'(' string ')'
263 | OUTPUT_FORMAT
'(' string ',' string ',' string ')'
264 | OUTPUT_ARCH
'(' string ')'
267 /* A list of input file names. */
270 | input_list opt_comma input_list_element
273 /* An input file name. */
276 { script_add_file
(closure
, $1.value
, $1.length
); }
278 { script_start_as_needed
(closure
); }
280 { script_end_as_needed
(closure
); }
283 /* Commands in a SECTIONS block. */
285 sections_block section_block_cmd
289 /* A command which may appear within a SECTIONS block. */
292 |
string section_header
293 { script_start_output_section
(closure
, $1.value
, $1.length
, &$2); }
294 '{' section_cmds
'}' section_trailer
295 { script_finish_output_section
(closure
, &$7); }
298 /* The header of an output section in a SECTIONS block--everything between the section name and the opening brace. */
301 { script_push_lex_into_expression_mode
(closure
); }
302 opt_address_and_section_type opt_at opt_align opt_subalign
303 { script_pop_lex_mode
(closure
); }
307 $$.load_address
= $3;
314 /* The optional address followed by the optional section type. This
315 is a separate nonterminal to avoid a shift/reduce conflict on
316 '(' in section_header. */
318 opt_address_and_section_type:
327 | exp
'(' string ')' ':'
329 yyerror(closure
, "section types are not supported");
334 /* The address at which an output section should be loaded. */
342 /* The alignment of an output section. */
346 | ALIGN_K
'(' exp
')'
350 /* The input section alignment within an output section. */
354 | SUBALIGN
'(' exp
')'
358 /* A section constraint. */
361 { $$
= CONSTRAINT_NONE
; }
363 { $$
= CONSTRAINT_ONLY_IF_RO
; }
365 { $$
= CONSTRAINT_ONLY_IF_RW
; }
367 { $$
= CONSTRAINT_SPECIAL
; }
370 /* The trailer of an output section in a SECTIONS block. */
372 opt_memspec opt_at_memspec opt_phdr opt_fill opt_comma
379 /* A memory specification for an output section. */
382 { yyerror(closure
, "memory regions are not supported"); }
386 /* A memory specification for where to load an output section. */
389 { yyerror(closure
, "memory regions are not supported"); }
393 /* The program segment an output section should go into. */
396 { $$
= script_string_list_push_back
($1, $3.value
, $3.length
); }
401 /* The value to use to fill an output section. FIXME: This does not
402 handle a string of arbitrary length. */
410 /* Commands which may appear within the description of an output
411 section in a SECTIONS block. */
414 | section_cmds section_cmd
417 /* A command which may appear within the description of an output
418 section in a SECTIONS block. */
422 | data_length
'(' parse_exp
')'
423 { script_add_data
(closure
, $1, $3); }
424 | ASSERT_K
'(' parse_exp
',' string ')'
425 { script_add_assertion
(closure
, $3, $5.value
, $5.length
); }
426 | FILL
'(' parse_exp
')'
427 { script_add_fill
(closure
, $3); }
430 /* The GNU linker uses CONSTRUCTORS for the a.out object
431 file format. It does nothing when using ELF. Since
432 some ELF linker scripts use it although it does
433 nothing, we accept it and ignore it. */
435 | SORT_BY_NAME
'(' CONSTRUCTORS
')'
439 /* The length of data which may appear within the description of an
440 output section in a SECTIONS block. */
454 /* An input section specification. This may appear within the
455 description of an output section in a SECTIONS block. */
457 input_section_no_keep
458 { script_add_input_section
(closure
, &$1, 0); }
459 | KEEP
'(' input_section_no_keep
')'
460 { script_add_input_section
(closure
, &$3, 1); }
463 /* An input section specification without the KEEP wrapper. It is used both on its own and inside a KEEP clause. */
464 input_section_no_keep:
468 $$.file.sort
= SORT_WILDCARD_NONE
;
469 $$.input_sections.sections
= NULL
;
470 $$.input_sections.exclude
= NULL
;
472 | wildcard_file
'(' wildcard_sections
')'
475 $$.input_sections
= $3;
479 /* A wildcard file specification. */
484 $$.sort
= SORT_WILDCARD_NONE
;
486 | SORT_BY_NAME
'(' wildcard_name
')'
489 $$.sort
= SORT_WILDCARD_BY_NAME
;
493 /* A list of wildcard section specifications. */
495 wildcard_sections opt_comma wildcard_section
497 $$.sections
= script_string_sort_list_add
($1.sections
, &$3);
498 $$.exclude
= $1.exclude
;
502 $$.sections
= script_new_string_sort_list
(&$1);
505 | wildcard_sections opt_comma EXCLUDE_FILE
'(' exclude_names
')'
507 $$.sections
= $1.sections
;
508 $$.exclude
= script_string_list_append
($1.exclude
, $5);
510 | EXCLUDE_FILE
'(' exclude_names
')'
517 /* A single wildcard specification. */
522 $$.sort
= SORT_WILDCARD_NONE
;
524 | SORT_BY_NAME
'(' wildcard_section
')'
529 case SORT_WILDCARD_NONE
:
530 $$.sort
= SORT_WILDCARD_BY_NAME
;
532 case SORT_WILDCARD_BY_NAME
:
533 case SORT_WILDCARD_BY_NAME_BY_ALIGNMENT
:
535 case SORT_WILDCARD_BY_ALIGNMENT
:
536 case SORT_WILDCARD_BY_ALIGNMENT_BY_NAME
:
537 $$.sort
= SORT_WILDCARD_BY_NAME_BY_ALIGNMENT
;
543 | SORT_BY_ALIGNMENT
'(' wildcard_section
')'
548 case SORT_WILDCARD_NONE
:
549 $$.sort
= SORT_WILDCARD_BY_ALIGNMENT
;
551 case SORT_WILDCARD_BY_ALIGNMENT
:
552 case SORT_WILDCARD_BY_ALIGNMENT_BY_NAME
:
554 case SORT_WILDCARD_BY_NAME
:
555 case SORT_WILDCARD_BY_NAME_BY_ALIGNMENT
:
556 $$.sort
= SORT_WILDCARD_BY_ALIGNMENT_BY_NAME
;
564 /* A list of file names to exclude. */
566 exclude_names opt_comma wildcard_name
567 { $$
= script_string_list_push_back
($1, $3.value
, $3.length
); }
569 { $$
= script_new_string_list
($1.value
, $1.length
); }
572 /* A single wildcard name. We recognize '*' and '?' specially since
573 they are expression tokens. */
589 /* A command which may appear at the top level of a linker script, or
590 within a SECTIONS block. */
591 file_or_sections_cmd:
593 { script_set_entry
(closure
, $3.value
, $3.length
); }
595 | ASSERT_K
'(' parse_exp
',' string ')'
596 { script_add_assertion
(closure
, $3, $5.value
, $5.length
); }
599 /* A list of program header definitions. */
605 /* A program header definition. */
607 string phdr_type phdr_info
';'
608 { script_add_phdr
(closure
, $1.value
, $1.length
, $2, &$3); }
611 /* A program header type. The GNU linker accepts a general expression
612 here, but that would be a pain because we would have to dig into
613 the expression structure. It's unlikely that anybody uses anything
614 other than a string or a number here, so that is all we expect. */
617 { $$
= script_phdr_string_to_type
(closure
, $1.value
, $1.length
); }
622 /* Additional information for a program header. */
625 { memset
(&$$
, 0, sizeof
(struct Phdr_info
)); }
629 if
($1.length
== 7 && strncmp
($1.value
, "FILEHDR", 7) == 0)
630 $$.includes_filehdr
= 1;
632 yyerror(closure
, "PHDRS syntax error");
637 $$.includes_phdrs
= 1;
639 |
string '(' INTEGER
')' phdr_info
642 if
($1.length
== 5 && strncmp
($1.value
, "FLAGS", 5) == 0)
644 $$.is_flags_valid
= 1;
648 yyerror(closure
, "PHDRS syntax error");
650 | AT
'(' parse_exp
')' phdr_info
653 $$.load_address
= $3;
657 /* Set a symbol to a value. */
660 { script_set_symbol
(closure
, $1.value
, $1.length
, $3, 0, 0); }
661 |
string PLUSEQ parse_exp
663 Expression_ptr s
= script_exp_string
($1.value
, $1.length
);
664 Expression_ptr e
= script_exp_binary_add
(s
, $3);
665 script_set_symbol
(closure
, $1.value
, $1.length
, e
, 0, 0);
667 |
string MINUSEQ parse_exp
669 Expression_ptr s
= script_exp_string
($1.value
, $1.length
);
670 Expression_ptr e
= script_exp_binary_sub
(s
, $3);
671 script_set_symbol
(closure
, $1.value
, $1.length
, e
, 0, 0);
673 |
string MULTEQ parse_exp
675 Expression_ptr s
= script_exp_string
($1.value
, $1.length
);
676 Expression_ptr e
= script_exp_binary_mult
(s
, $3);
677 script_set_symbol
(closure
, $1.value
, $1.length
, e
, 0, 0);
679 |
string DIVEQ parse_exp
681 Expression_ptr s
= script_exp_string
($1.value
, $1.length
);
682 Expression_ptr e
= script_exp_binary_div
(s
, $3);
683 script_set_symbol
(closure
, $1.value
, $1.length
, e
, 0, 0);
685 |
string LSHIFTEQ parse_exp
687 Expression_ptr s
= script_exp_string
($1.value
, $1.length
);
688 Expression_ptr e
= script_exp_binary_lshift
(s
, $3);
689 script_set_symbol
(closure
, $1.value
, $1.length
, e
, 0, 0);
691 |
string RSHIFTEQ parse_exp
693 Expression_ptr s
= script_exp_string
($1.value
, $1.length
);
694 Expression_ptr e
= script_exp_binary_rshift
(s
, $3);
695 script_set_symbol
(closure
, $1.value
, $1.length
, e
, 0, 0);
697 |
string ANDEQ parse_exp
699 Expression_ptr s
= script_exp_string
($1.value
, $1.length
);
700 Expression_ptr e
= script_exp_binary_bitwise_and
(s
, $3);
701 script_set_symbol
(closure
, $1.value
, $1.length
, e
, 0, 0);
703 |
string OREQ parse_exp
705 Expression_ptr s
= script_exp_string
($1.value
, $1.length
);
706 Expression_ptr e
= script_exp_binary_bitwise_or
(s
, $3);
707 script_set_symbol
(closure
, $1.value
, $1.length
, e
, 0, 0);
709 | PROVIDE
'(' string '=' parse_exp
')'
710 { script_set_symbol
(closure
, $3.value
, $3.length
, $5, 1, 0); }
711 | PROVIDE_HIDDEN
'(' string '=' parse_exp
')'
712 { script_set_symbol
(closure
, $3.value
, $3.length
, $5, 1, 1); }
715 /* Parse an expression, putting the lexer into the right mode. */
717 { script_push_lex_into_expression_mode
(closure
); }
720 script_pop_lex_mode
(closure
);
729 |
'-' exp %prec UNARY
730 { $$
= script_exp_unary_minus
($2); }
731 |
'!' exp %prec UNARY
732 { $$
= script_exp_unary_logical_not
($2); }
733 |
'~' exp %prec UNARY
734 { $$
= script_exp_unary_bitwise_not
($2); }
735 |
'+' exp %prec UNARY
738 { $$
= script_exp_binary_mult
($1, $3); }
740 { $$
= script_exp_binary_div
($1, $3); }
742 { $$
= script_exp_binary_mod
($1, $3); }
744 { $$
= script_exp_binary_add
($1, $3); }
746 { $$
= script_exp_binary_sub
($1, $3); }
748 { $$
= script_exp_binary_lshift
($1, $3); }
750 { $$
= script_exp_binary_rshift
($1, $3); }
752 { $$
= script_exp_binary_eq
($1, $3); }
754 { $$
= script_exp_binary_ne
($1, $3); }
756 { $$
= script_exp_binary_le
($1, $3); }
758 { $$
= script_exp_binary_ge
($1, $3); }
760 { $$
= script_exp_binary_lt
($1, $3); }
762 { $$
= script_exp_binary_gt
($1, $3); }
764 { $$
= script_exp_binary_bitwise_and
($1, $3); }
766 { $$
= script_exp_binary_bitwise_xor
($1, $3); }
768 { $$
= script_exp_binary_bitwise_or
($1, $3); }
770 { $$
= script_exp_binary_logical_and
($1, $3); }
772 { $$
= script_exp_binary_logical_or
($1, $3); }
773 | exp
'?' exp
':' exp
774 { $$
= script_exp_trinary_cond
($1, $3, $5); }
776 { $$
= script_exp_integer
($1); }
778 { $$
= script_exp_string
($1.value
, $1.length
); }
779 | MAX_K
'(' exp
',' exp
')'
780 { $$
= script_exp_function_max
($3, $5); }
781 | MIN_K
'(' exp
',' exp
')'
782 { $$
= script_exp_function_min
($3, $5); }
783 | DEFINED
'(' string ')'
784 { $$
= script_exp_function_defined
($3.value
, $3.length
); }
786 { $$
= script_exp_function_sizeof_headers
(); }
787 | ALIGNOF
'(' string ')'
788 { $$
= script_exp_function_alignof
($3.value
, $3.length
); }
789 | SIZEOF
'(' string ')'
790 { $$
= script_exp_function_sizeof
($3.value
, $3.length
); }
791 | ADDR
'(' string ')'
792 { $$
= script_exp_function_addr
($3.value
, $3.length
); }
793 | LOADADDR
'(' string ')'
794 { $$
= script_exp_function_loadaddr
($3.value
, $3.length
); }
795 | ORIGIN
'(' string ')'
796 { $$
= script_exp_function_origin
($3.value
, $3.length
); }
797 | LENGTH
'(' string ')'
798 { $$
= script_exp_function_length
($3.value
, $3.length
); }
799 | CONSTANT
'(' string ')'
800 { $$
= script_exp_function_constant
($3.value
, $3.length
); }
801 | ABSOLUTE
'(' exp
')'
802 { $$
= script_exp_function_absolute
($3); }
803 | ALIGN_K
'(' exp
')'
804 { $$
= script_exp_function_align
(script_exp_string
(".", 1), $3); }
805 | ALIGN_K
'(' exp
',' exp
')'
806 { $$
= script_exp_function_align
($3, $5); }
808 { $$
= script_exp_function_align
(script_exp_string
(".", 1), $3); }
809 | DATA_SEGMENT_ALIGN
'(' exp
',' exp
')'
810 { $$
= script_exp_function_data_segment_align
($3, $5); }
811 | DATA_SEGMENT_RELRO_END
'(' exp
',' exp
')'
812 { $$
= script_exp_function_data_segment_relro_end
($3, $5); }
813 | DATA_SEGMENT_END
'(' exp
')'
814 { $$
= script_exp_function_data_segment_end
($3); }
815 | SEGMENT_START
'(' string ',' exp
')'
817 $$
= script_exp_function_segment_start
($3.value
, $3.length
, $5);
819 | ASSERT_K
'(' exp
',' string ')'
820 { $$
= script_exp_function_assert
($3, $5.value
, $5.length
); }
823 /* Handle the --defsym option. */
826 { script_set_symbol
(closure
, $1.value
, $1.length
, $3, 0, 0); }
829 /* A version script. */
836 | vers_nodes vers_node
842 script_register_vers_node
(closure
, NULL
, 0, $2, NULL
);
844 |
string '{' vers_tag
'}' ';'
846 script_register_vers_node
(closure
, $1.value
, $1.length
, $3,
849 |
string '{' vers_tag
'}' verdep
';'
851 script_register_vers_node
(closure
, $1.value
, $1.length
, $3, $5);
858 $$
= script_add_vers_depend
(closure
, NULL
, $1.value
, $1.length
);
862 $$
= script_add_vers_depend
(closure
, $1, $2.value
, $2.length
);
868 { $$
= script_new_vers_node
(closure
, NULL
, NULL
); }
870 { $$
= script_new_vers_node
(closure
, $1, NULL
); }
871 | GLOBAL
':' vers_defns
';'
872 { $$
= script_new_vers_node
(closure
, $3, NULL
); }
873 | LOCAL
':' vers_defns
';'
874 { $$
= script_new_vers_node
(closure
, NULL
, $3); }
875 | GLOBAL
':' vers_defns
';' LOCAL
':' vers_defns
';'
876 { $$
= script_new_vers_node
(closure
, $3, $7); }
879 /* Here is one of the rare places we care about the distinction
880 between STRING and QUOTED_STRING. For QUOTED_STRING, we do exact
881 matching on the pattern, so we pass in true for the exact_match
882 parameter. For STRING, we do glob matching and pass in false. */
886 $$
= script_new_vers_pattern
(closure
, NULL
, $1.value
,
891 $$
= script_new_vers_pattern
(closure
, NULL
, $1.value
,
894 | vers_defns
';' STRING
896 $$
= script_new_vers_pattern
(closure
, $1, $3.value
,
899 | vers_defns
';' QUOTED_STRING
901 $$
= script_new_vers_pattern
(closure
, $1, $3.value
,
904 |
/* Push string on the language stack. */
906 { version_script_push_lang
(closure
, $2.value
, $2.length
); }
907 vers_defns opt_semicolon
'}'
910 version_script_pop_lang
(closure
);
912 |
/* Push string on the language stack. This is more complicated
913 than the other cases because we need to merge the linked-list
914 state from the pre-EXTERN defns and the post-EXTERN defns. */
915 vers_defns
';' EXTERN
string '{'
916 { version_script_push_lang
(closure
, $4.value
, $4.length
); }
917 vers_defns opt_semicolon
'}'
919 $$
= script_merge_expressions
($1, $7);
920 version_script_pop_lang
(closure
);
922 | EXTERN
// "extern" as a symbol name
924 $$
= script_new_vers_pattern
(closure
, NULL
, "extern",
925 sizeof
("extern") - 1, 1);
927 | vers_defns
';' EXTERN
929 $$
= script_new_vers_pattern
(closure
, $1, "extern",
930 sizeof
("extern") - 1, 1);
934 /* A string can be either a STRING or a QUOTED_STRING. Almost all the
935 time we don't care, and we use this rule. */
943 /* Some statements require a terminator, which may be a semicolon or a comma. */
950 /* An optional semicolon. */
956 /* An optional comma. */