1 /* Lexical analyzer for C and Objective C.
2 Copyright (C) 1987, 88, 89, 92, 94-96, 1997 Free Software Foundation, Inc.
4 This file is part of GNU CC.
6 GNU CC is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 2, or (at your option)
11 GNU CC is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with GNU CC; see the file COPYING. If not, write to
18 the Free Software Foundation, 59 Temple Place - Suite 330,
19 Boston, MA 02111-1307, USA. */
38 /* MULTIBYTE_CHARS support only works for native compilers.
39 ??? Ideally what we want is to model widechar support after
40 the current floating point support. */
42 #undef MULTIBYTE_CHARS
45 #ifdef MULTIBYTE_CHARS
57 cpp_options parse_options
;
58 static enum cpp_token cpp_token
;
61 /* The elements of `ridpointers' are identifier nodes
62 for the reserved type names and storage classes.
63 It is indexed by a RID_... value. */
64 tree ridpointers
[(int) RID_MAX
];
66 /* Cause the `yydebug' variable to be defined. */
70 static unsigned char *yy_cur
, *yy_lim
;
77 parse_in
.limit
= parse_in
.token_buffer
;
78 cpp_token
= cpp_get_token (&parse_in
);
79 if (cpp_token
== CPP_EOF
)
81 yy_lim
= CPP_PWRITTEN (&parse_in
);
82 yy_cur
= parse_in
.token_buffer
;
88 #define GETC() (yy_cur < yy_lim ? *yy_cur++ : yy_get_token ())
89 #define UNGETC(c) ((c), yy_cur--)
91 #define GETC() getc (finput)
92 #define UNGETC(c) ungetc (c, finput)
95 /* the declaration found for the last IDENTIFIER token read in.
96 yylex must look this up to detect typedefs, which get token type TYPENAME,
97 so it is left around in case the identifier is not a typedef but is
98 used in a context which makes it a reference to a variable. */
101 /* Nonzero enables objc features. */
103 int doing_objc_thang
;
105 extern tree
is_class_name ();
109 /* File used for outputting assembler code. */
110 extern FILE *asm_out_file
;
112 #ifndef WCHAR_TYPE_SIZE
114 #define WCHAR_TYPE_SIZE INT_TYPE_SIZE
116 #define WCHAR_TYPE_SIZE BITS_PER_WORD
120 /* Number of bytes in a wide character. */
121 #define WCHAR_BYTES (WCHAR_TYPE_SIZE / BITS_PER_UNIT)
123 static int maxtoken
; /* Current nominal length of token buffer. */
124 char *token_buffer
; /* Pointer to token buffer.
125 Actual allocated length is maxtoken + 2.
126 This is not static because objc-parse.y uses it. */
128 static int indent_level
= 0; /* Number of { minus number of }. */
130 /* Nonzero if end-of-file has been seen on input. */
131 static int end_of_file
;
134 /* Buffered-back input character; faster than using ungetc. */
135 static int nextchar
= -1;
138 static int skip_which_space
PROTO((int));
139 static char *extend_token_buffer
PROTO((char *));
140 static int readescape
PROTO((int *));
141 int check_newline ();
143 /* Do not insert generated code into the source, instead, include it.
144 This allows us to build gcc automatically even for targets that
145 need to add or modify the reserved keyword lists. */
148 /* Return something to represent absolute declarators containing a *.
149 TARGET is the absolute declarator that the * contains.
150 TYPE_QUALS is a list of modifiers such as const or volatile
151 to apply to the pointer type, represented as identifiers.
153 We return an INDIRECT_REF whose "contents" are TARGET
154 and whose type is the modifier list. */
/* Build the declarator node for `* TARGET' by a single call to build1.  */
157 make_pointer_declarator (type_quals
, target
)
/* Old-style parameter declarations: both arguments are trees.  */
158 tree type_quals
, target
;
/* The node has code INDIRECT_REF; TYPE_QUALS (the qualifier list) and
   TARGET (the inner declarator) are passed through unchanged, in that
   order, and the resulting node is returned as is.  */
160 return build1 (INDIRECT_REF
, type_quals
, target
);
/* Blank out the names of the protocol-qualifier entries in `wordlist'.
   Every entry whose rid lies in the inclusive range RID_IN .. RID_ONEWAY
   has its name replaced by the empty string.
   NOTE(review): presumably this keeps the reserved-word lookup from
   matching these words (UNSET_RESERVED_WORD uses the same `name = ""'
   technique); confirm against is_reserved_word.  The names are put back
   by remember_protocol_qualifiers.  */
164 forget_protocol_qualifiers ()
/* N is the number of elements in the wordlist array.  */
166 int i
, n
= sizeof wordlist
/ sizeof (struct resword
);
168 for (i
= 0; i
< n
; i
++)
/* Range test on the rid value; this relies on the qualifier rids being
   contiguous between RID_IN and RID_ONEWAY -- TODO confirm against the
   enum definition, which is not visible here.  */
169 if ((int) wordlist
[i
].rid
>= (int) RID_IN
170 && (int) wordlist
[i
].rid
<= (int) RID_ONEWAY
)
171 wordlist
[i
].name
= "";
/* Restore the names of the protocol-qualifier entries in `wordlist'.
   Each entry whose rid is RID_IN, RID_OUT, RID_INOUT, RID_BYCOPY or
   RID_ONEWAY gets its name set back to the corresponding keyword
   spelling ("in", "out", "inout", "bycopy", "oneway").  Entries with
   any other rid are left untouched.  This is the inverse of
   forget_protocol_qualifiers.  */
175 remember_protocol_qualifiers ()
/* N is the number of elements in the wordlist array.  */
177 int i
, n
= sizeof wordlist
/ sizeof (struct resword
);
179 for (i
= 0; i
< n
; i
++)
/* One branch per qualifier: match on the rid, store the spelling.  */
180 if (wordlist
[i
].rid
== RID_IN
)
181 wordlist
[i
].name
= "in";
182 else if (wordlist
[i
].rid
== RID_OUT
)
183 wordlist
[i
].name
= "out";
184 else if (wordlist
[i
].rid
== RID_INOUT
)
185 wordlist
[i
].name
= "inout";
186 else if (wordlist
[i
].rid
== RID_BYCOPY
)
187 wordlist
[i
].name
= "bycopy";
188 else if (wordlist
[i
].rid
== RID_ONEWAY
)
189 wordlist
[i
].name
= "oneway";
194 init_parse (filename
)
201 cpp_reader_init (&parse_in
);
202 parse_in
.data
= &parse_options
;
203 cpp_options_init (&parse_options
);
204 cpp_handle_options (&parse_in
, 0, NULL
); /* FIXME */
205 parse_in
.show_column
= 1;
206 if (! cpp_start_read (&parse_in
, filename
))
213 cpp_finish (&parse_in
);
220 /* Make identifier nodes long enough for the language-specific slots. */
221 set_identifier_size (sizeof (struct lang_identifier
));
223 /* Start it at 0, because check_newline is called at the very beginning
224 and will increment it to 1. */
227 #ifdef MULTIBYTE_CHARS
228 /* Change to the native locale for multibyte conversions. */
229 setlocale (LC_CTYPE
, "");
233 token_buffer
= (char *) xmalloc (maxtoken
+ 2);
235 ridpointers
[(int) RID_INT
] = get_identifier ("int");
236 ridpointers
[(int) RID_CHAR
] = get_identifier ("char");
237 ridpointers
[(int) RID_VOID
] = get_identifier ("void");
238 ridpointers
[(int) RID_FLOAT
] = get_identifier ("float");
239 ridpointers
[(int) RID_DOUBLE
] = get_identifier ("double");
240 ridpointers
[(int) RID_SHORT
] = get_identifier ("short");
241 ridpointers
[(int) RID_LONG
] = get_identifier ("long");
242 ridpointers
[(int) RID_UNSIGNED
] = get_identifier ("unsigned");
243 ridpointers
[(int) RID_SIGNED
] = get_identifier ("signed");
244 ridpointers
[(int) RID_INLINE
] = get_identifier ("inline");
245 ridpointers
[(int) RID_CONST
] = get_identifier ("const");
246 ridpointers
[(int) RID_VOLATILE
] = get_identifier ("volatile");
247 ridpointers
[(int) RID_AUTO
] = get_identifier ("auto");
248 ridpointers
[(int) RID_STATIC
] = get_identifier ("static");
249 ridpointers
[(int) RID_EXTERN
] = get_identifier ("extern");
250 ridpointers
[(int) RID_TYPEDEF
] = get_identifier ("typedef");
251 ridpointers
[(int) RID_REGISTER
] = get_identifier ("register");
252 ridpointers
[(int) RID_ITERATOR
] = get_identifier ("iterator");
253 ridpointers
[(int) RID_COMPLEX
] = get_identifier ("complex");
254 ridpointers
[(int) RID_ID
] = get_identifier ("id");
255 ridpointers
[(int) RID_IN
] = get_identifier ("in");
256 ridpointers
[(int) RID_OUT
] = get_identifier ("out");
257 ridpointers
[(int) RID_INOUT
] = get_identifier ("inout");
258 ridpointers
[(int) RID_BYCOPY
] = get_identifier ("bycopy");
259 ridpointers
[(int) RID_ONEWAY
] = get_identifier ("oneway");
260 forget_protocol_qualifiers();
262 /* Some options inhibit certain reserved words.
263 Clear those words out of the hash table so they won't be recognized. */
264 #define UNSET_RESERVED_WORD(STRING) \
265 do { struct resword *s = is_reserved_word (STRING, sizeof (STRING) - 1); \
266 if (s) s->name = ""; } while (0)
268 if (! doing_objc_thang
)
269 UNSET_RESERVED_WORD ("id");
271 if (flag_traditional
)
273 UNSET_RESERVED_WORD ("const");
274 UNSET_RESERVED_WORD ("volatile");
275 UNSET_RESERVED_WORD ("typeof");
276 UNSET_RESERVED_WORD ("signed");
277 UNSET_RESERVED_WORD ("inline");
278 UNSET_RESERVED_WORD ("iterator");
279 UNSET_RESERVED_WORD ("complex");
283 UNSET_RESERVED_WORD ("asm");
284 UNSET_RESERVED_WORD ("typeof");
285 UNSET_RESERVED_WORD ("inline");
286 UNSET_RESERVED_WORD ("iterator");
287 UNSET_RESERVED_WORD ("complex");
292 reinit_parse_for_function ()
296 /* Function used when yydebug is set, to print a token in more detail. */
299 yyprint (file
, yychar
, yylval
)
311 if (IDENTIFIER_POINTER (t
))
312 fprintf (file
, " `%s'", IDENTIFIER_POINTER (t
));
317 if (TREE_CODE (t
) == INTEGER_CST
)
319 #if HOST_BITS_PER_WIDE_INT == 64
320 #if HOST_BITS_PER_WIDE_INT != HOST_BITS_PER_INT
326 #if HOST_BITS_PER_WIDE_INT != HOST_BITS_PER_INT
332 TREE_INT_CST_HIGH (t
), TREE_INT_CST_LOW (t
));
337 /* If C is not whitespace, return C.
338 Otherwise skip whitespace and return first nonwhite char read. */
344 static int newline_warning
= 0;
350 /* We don't recognize comments here, because
351 cpp output can include / and * consecutively as operators.
352 Also, there's no need, since cpp removes all comments. */
355 c
= check_newline ();
367 /* ANSI C says the effects of a carriage return in a source file
369 if (pedantic
&& !newline_warning
)
371 warning ("carriage return in source file");
372 warning ("(we only warn about the first carriage return)");
383 error ("stray '\\' in program");
393 /* Skips all of the white space at the current location in the input file.
394 Must use and reset nextchar if it has the next character. */
397 position_after_white_space ()
403 c
= nextchar
, nextchar
= -1;
408 UNGETC (skip_white_space (c
));
411 /* Make the token buffer longer, preserving the data in it.
412 P should point to just beyond the last valid character in the old buffer.
413 The value we return is a pointer to the new buffer
414 at a place corresponding to P. */
/* Grow the global token_buffer and return the position in the new
   buffer that corresponds to P in the old one.  Updates both maxtoken
   and token_buffer.  */
417 extend_token_buffer (p
)
/* Remember P as an offset from the start of the buffer, since the
   token_buffer pointer is reassigned below.  */
420 int offset
= p
- token_buffer
;
/* New nominal length: double the old one plus 10.  */
422 maxtoken
= maxtoken
* 2 + 10;
/* The allocation is always maxtoken + 2 bytes, matching the note on
   the declaration of token_buffer.
   NOTE(review): the result is stored without a null check; presumably
   xrealloc does not return on failure -- confirm.  */
423 token_buffer
= (char *) xrealloc (token_buffer
, maxtoken
+ 2);
/* Translate the saved offset back into a pointer into the new buffer.  */
425 return token_buffer
+ offset
;
429 #define GET_DIRECTIVE_LINE() get_directive_line (finput)
430 #else /* USE_CPPLIB */
431 /* Read the rest of a #-directive from input stream FINPUT.
432 In normal use, the directive name and the white space after it
433 have already been read, so they won't be included in the result.
434 We allow for the fact that the directive line may contain
435 a newline embedded within a character or string literal which forms
436 a part of the directive.
438 The value is a string in a reusable buffer. It remains valid
439 only until the next time this function is called. */
442 GET_DIRECTIVE_LINE ()
444 static char *directive_buffer
= NULL
;
445 static unsigned buffer_length
= 0;
447 register char *buffer_limit
;
448 register int looking_for
= 0;
449 register int char_escaped
= 0;
451 if (buffer_length
== 0)
453 directive_buffer
= (char *)xmalloc (128);
457 buffer_limit
= &directive_buffer
[buffer_length
];
459 for (p
= directive_buffer
; ; )
463 /* Make buffer bigger if it is full. */
464 if (p
>= buffer_limit
)
466 register unsigned bytes_used
= (p
- directive_buffer
);
470 = (char *)xrealloc (directive_buffer
, buffer_length
);
471 p
= &directive_buffer
[bytes_used
];
472 buffer_limit
= &directive_buffer
[buffer_length
];
477 /* Discard initial whitespace. */
478 if ((c
== ' ' || c
== '\t') && p
== directive_buffer
)
481 /* Detect the end of the directive. */
482 if (c
== '\n' && looking_for
== 0)
491 return directive_buffer
;
493 /* Handle string and character constant syntax. */
496 if (looking_for
== c
&& !char_escaped
)
497 looking_for
= 0; /* Found terminator... stop looking. */
500 if (c
== '\'' || c
== '"')
501 looking_for
= c
; /* Don't stop buffering until we see another
502 one of these (or an EOF). */
504 /* Handle backslash. */
505 char_escaped
= (c
== '\\' && ! char_escaped
);
508 #endif /* USE_CPPLIB */
510 /* At the beginning of a line, increment the line number
511 and process any #-directive on this line.
512 If the line is a #-directive, read the entire line and return a newline.
513 Otherwise, return the line's first non-whitespace character. */
523 /* Read first nonwhite char on the line. */
526 while (c
== ' ' || c
== '\t')
531 /* If not #, return it so caller will use it. */
535 /* Read first nonwhite char after the `#'. */
538 while (c
== ' ' || c
== '\t')
541 /* If a letter follows, then if the word here is `line', skip
542 it and ignore it; otherwise, ignore the line, with an error
543 if the word isn't `pragma', `ident', `define', or `undef'. */
545 if ((c
>= 'a' && c
<= 'z') || (c
>= 'A' && c
<= 'Z'))
554 && ((c
= GETC()) == ' ' || c
== '\t' || c
== '\n'))
556 while (c
== ' ' || c
== '\t')
560 #ifdef HANDLE_SYSV_PRAGMA
563 if (token
!= IDENTIFIER
)
565 return handle_sysv_pragma (token
);
566 #else /* !HANDLE_SYSV_PRAGMA */
571 if (token
!= IDENTIFIER
)
573 if (HANDLE_PRAGMA (finput
, yylval
.ttype
))
579 ??? do not know what to
do ???;
580 #endif /* !USE_CPPLIB */
581 #endif /* HANDLE_PRAGMA */
582 #endif /* !HANDLE_SYSV_PRAGMA */
594 && ((c
= GETC()) == ' ' || c
== '\t' || c
== '\n'))
597 debug_define (lineno
, GET_DIRECTIVE_LINE ());
607 && ((c
= GETC()) == ' ' || c
== '\t' || c
== '\n'))
610 debug_undef (lineno
, GET_DIRECTIVE_LINE ());
619 && ((c
= GETC()) == ' ' || c
== '\t'))
628 && ((c
= GETC()) == ' ' || c
== '\t'))
630 /* #ident. The pedantic warning is now in cccp.c. */
632 /* Here we have just seen `#ident '.
633 A string constant should follow. */
635 while (c
== ' ' || c
== '\t')
638 /* If no argument, ignore the line. */
645 || TREE_CODE (yylval
.ttype
) != STRING_CST
)
647 error ("invalid #ident");
653 #ifdef ASM_OUTPUT_IDENT
654 ASM_OUTPUT_IDENT (asm_out_file
, TREE_STRING_POINTER (yylval
.ttype
));
658 /* Skip the rest of this line. */
663 error ("undefined or invalid # directive");
668 /* Here we have either `#line' or `# <nonletter>'.
669 In either case, it should be a line number; a digit should follow. */
671 while (c
== ' ' || c
== '\t')
674 /* If the # is the only nonwhite char on the line,
675 just ignore it. Check the new newline. */
679 /* Something follows the #; read a token. */
684 if (token
== CONSTANT
685 && TREE_CODE (yylval
.ttype
) == INTEGER_CST
)
687 int old_lineno
= lineno
;
689 /* subtract one, because it is the following line that
690 gets the specified number */
692 int l
= TREE_INT_CST_LOW (yylval
.ttype
) - 1;
694 /* Is this the last nonwhite stuff on the line? */
696 while (c
== ' ' || c
== '\t')
700 /* No more: store the line number and check following line. */
706 /* More follows: it must be a string constant (filename). */
708 /* Read the string constant. */
711 if (token
!= STRING
|| TREE_CODE (yylval
.ttype
) != STRING_CST
)
713 error ("invalid #line");
718 = (char *) permalloc (TREE_STRING_LENGTH (yylval
.ttype
) + 1);
719 strcpy (input_filename
, TREE_STRING_POINTER (yylval
.ttype
));
722 /* Each change of file name
723 reinitializes whether we are now in a system header. */
724 in_system_header
= 0;
726 if (main_input_filename
== 0)
727 main_input_filename
= input_filename
;
729 /* Is this the last nonwhite stuff on the line? */
731 while (c
== ' ' || c
== '\t')
735 /* Update the name in the top element of input_file_stack. */
736 if (input_file_stack
)
737 input_file_stack
->name
= input_filename
;
746 /* `1' after file name means entering new file.
747 `2' after file name means just left a file. */
749 if (token
== CONSTANT
750 && TREE_CODE (yylval
.ttype
) == INTEGER_CST
)
752 if (TREE_INT_CST_LOW (yylval
.ttype
) == 1)
754 /* Pushing to a new file. */
756 = (struct file_stack
*) xmalloc (sizeof (struct file_stack
));
757 input_file_stack
->line
= old_lineno
;
758 p
->next
= input_file_stack
;
759 p
->name
= input_filename
;
760 p
->indent_level
= indent_level
;
761 input_file_stack
= p
;
762 input_file_stack_tick
++;
763 debug_start_source_file (input_filename
);
766 else if (TREE_INT_CST_LOW (yylval
.ttype
) == 2)
768 /* Popping out of a file. */
769 if (input_file_stack
->next
)
771 struct file_stack
*p
= input_file_stack
;
772 if (indent_level
!= p
->indent_level
)
774 warning_with_file_and_line
775 (p
->name
, old_lineno
,
776 "This file contains more `%c's than `%c's.",
777 indent_level
> p
->indent_level
? '{' : '}',
778 indent_level
> p
->indent_level
? '}' : '{');
780 input_file_stack
= p
->next
;
782 input_file_stack_tick
++;
783 debug_end_source_file (input_file_stack
->line
);
786 error ("#-lines for entering and leaving files don't match");
792 /* Now that we've pushed or popped the input stack,
793 update the name in the top element. */
794 if (input_file_stack
)
795 input_file_stack
->name
= input_filename
;
797 /* If we have handled a `1' or a `2',
798 see if there is another number to read. */
801 /* Is this the last nonwhite stuff on the line? */
803 while (c
== ' ' || c
== '\t')
813 /* `3' after file name means this is a system header file. */
815 if (token
== CONSTANT
816 && TREE_CODE (yylval
.ttype
) == INTEGER_CST
817 && TREE_INT_CST_LOW (yylval
.ttype
) == 3)
818 in_system_header
= 1, used_up
= 1;
822 /* Is this the last nonwhite stuff on the line? */
824 while (c
== ' ' || c
== '\t')
831 warning ("unrecognized text at end of #line");
834 error ("invalid #-line");
836 /* skip the rest of this line. */
839 if (c
!= '\n' && c
!= EOF
&& nextchar
>= 0)
840 c
= nextchar
, nextchar
= -1;
842 while (c
!= '\n' && c
!= EOF
)
847 #ifdef HANDLE_SYSV_PRAGMA
849 /* Handle a #pragma directive.
850 TOKEN is the token we read after `#pragma'. Processes the entire input
851 line and returns a character for the caller to reread: either \n or EOF. */
853 /* This function has to be in this file, in order to get at
857 handle_sysv_pragma (token
)
870 handle_pragma_token (token_buffer
, yylval
.ttype
);
873 handle_pragma_token (token_buffer
, 0);
877 c
= nextchar
, nextchar
= -1;
882 while (c
== ' ' || c
== '\t')
884 if (c
== '\n' || c
== EOF
)
886 handle_pragma_token (0, 0);
894 #endif /* HANDLE_SYSV_PRAGMA */
896 #define ENDFILE -1 /* token that represents end-of-file */
898 /* Read an escape sequence, returning its equivalent as a character,
899 or store 1 in *ignore_ptr if it is backslash-newline. */
902 readescape (ignore_ptr
)
905 register int c
= GETC();
907 register unsigned count
;
908 unsigned firstdig
= 0;
914 if (warn_traditional
)
915 warning ("the meaning of `\\x' varies with -traditional");
917 if (flag_traditional
)
926 if (!(c
>= 'a' && c
<= 'f')
927 && !(c
>= 'A' && c
<= 'F')
928 && !(c
>= '0' && c
<= '9'))
934 if (c
>= 'a' && c
<= 'f')
935 code
+= c
- 'a' + 10;
936 if (c
>= 'A' && c
<= 'F')
937 code
+= c
- 'A' + 10;
938 if (c
>= '0' && c
<= '9')
940 if (code
!= 0 || count
!= 0)
949 error ("\\x used with no following hex digits");
951 /* Digits are all 0's. Ok. */
953 else if ((count
- 1) * 4 >= TYPE_PRECISION (integer_type_node
)
955 && ((1 << (TYPE_PRECISION (integer_type_node
) - (count
- 1) * 4))
957 pedwarn ("hex escape out of range");
960 case '0': case '1': case '2': case '3': case '4':
961 case '5': case '6': case '7':
964 while ((c
<= '7') && (c
>= '0') && (count
++ < 3))
966 code
= (code
* 8) + (c
- '0');
972 case '\\': case '\'': case '"':
981 return TARGET_NEWLINE
;
996 if (warn_traditional
)
997 warning ("the meaning of `\\a' varies with -traditional");
999 if (flag_traditional
)
1004 #if 0 /* Vertical tab is present in common usage compilers. */
1005 if (flag_traditional
)
1013 pedwarn ("non-ANSI-standard escape sequence, `\\%c'", c
);
1019 /* `\(', etc, are used at beginning of line to avoid confusing Emacs. */
1023 /* `\%' is used to prevent SCCS from getting confused. */
1026 pedwarn ("non-ANSI escape sequence `\\%c'", c
);
1029 if (c
>= 040 && c
< 0177)
1030 pedwarn ("unknown escape sequence `\\%c'", c
);
1032 pedwarn ("unknown escape sequence: `\\' followed by char code 0x%x", c
);
1042 strcpy (buf
, string
);
1044 /* We can't print string and character constants well
1045 because the token_buffer contains the result of processing escapes. */
1047 strcat (buf
, " at end of input");
1048 else if (token_buffer
[0] == 0)
1049 strcat (buf
, " at null character");
1050 else if (token_buffer
[0] == '"')
1051 strcat (buf
, " before string constant");
1052 else if (token_buffer
[0] == '\'')
1053 strcat (buf
, " before character constant");
1054 else if (token_buffer
[0] < 040 || (unsigned char) token_buffer
[0] >= 0177)
1055 sprintf (buf
+ strlen (buf
), " before character 0%o",
1056 (unsigned char) token_buffer
[0]);
1058 strcat (buf
, " before `%s'");
1060 error (buf
, token_buffer
);
1070 char long_long_flag
;
1073 struct try_type type_sequence
[] =
1075 { &integer_type_node
, 0, 0, 0},
1076 { &unsigned_type_node
, 1, 0, 0},
1077 { &long_integer_type_node
, 0, 1, 0},
1078 { &long_unsigned_type_node
, 1, 1, 0},
1079 { &long_long_integer_type_node
, 0, 1, 1},
1080 { &long_long_unsigned_type_node
, 1, 1, 1}
1095 c
= nextchar
, nextchar
= -1;
1100 /* Effectively do c = skip_white_space (c)
1101 but do it faster in the usual cases. */
1114 /* Call skip_white_space so we can warn if appropriate. */
1119 c
= skip_white_space (c
);
1121 goto found_nonwhite
;
1125 token_buffer
[0] = c
;
1126 token_buffer
[1] = 0;
1128 /* yylloc.first_line = lineno; */
1134 token_buffer
[0] = 0;
1139 /* Capital L may start a wide-string or wide-character constant. */
1141 register int c
= GETC();
1150 goto string_constant
;
1157 if (!doing_objc_thang
)
1164 /* '@' may start a constant string object. */
1165 register int c
= GETC ();
1169 goto string_constant
;
1172 /* Fall through to treat '@' as the start of an identifier. */
1175 case 'A': case 'B': case 'C': case 'D': case 'E':
1176 case 'F': case 'G': case 'H': case 'I': case 'J':
1177 case 'K': case 'M': case 'N': case 'O':
1178 case 'P': case 'Q': case 'R': case 'S': case 'T':
1179 case 'U': case 'V': case 'W': case 'X': case 'Y':
1181 case 'a': case 'b': case 'c': case 'd': case 'e':
1182 case 'f': case 'g': case 'h': case 'i': case 'j':
1183 case 'k': case 'l': case 'm': case 'n': case 'o':
1184 case 'p': case 'q': case 'r': case 's': case 't':
1185 case 'u': case 'v': case 'w': case 'x': case 'y':
1191 while (isalnum (c
) || c
== '_' || c
== '$' || c
== '@')
1193 /* Make sure this char really belongs in an identifier. */
1194 if (c
== '@' && ! doing_objc_thang
)
1198 if (! dollars_in_ident
)
1199 error ("`$' in identifier");
1201 pedwarn ("`$' in identifier");
1204 if (p
>= token_buffer
+ maxtoken
)
1205 p
= extend_token_buffer (p
);
1221 /* Try to recognize a keyword. Uses minimum-perfect hash function */
1224 register struct resword
*ptr
;
1226 if (ptr
= is_reserved_word (token_buffer
, p
- token_buffer
))
1229 yylval
.ttype
= ridpointers
[(int) ptr
->rid
];
1230 value
= (int) ptr
->token
;
1232 /* Only return OBJECTNAME if it is a typedef. */
1233 if (doing_objc_thang
&& value
== OBJECTNAME
)
1235 lastiddecl
= lookup_name(yylval
.ttype
);
1237 if (lastiddecl
== NULL_TREE
1238 || TREE_CODE (lastiddecl
) != TYPE_DECL
)
1242 /* Even if we decided to recognize asm, still perhaps warn. */
1244 && (value
== ASM_KEYWORD
|| value
== TYPEOF
1245 || ptr
->rid
== RID_INLINE
)
1246 && token_buffer
[0] != '_')
1247 pedwarn ("ANSI does not permit the keyword `%s'",
1252 /* If we did not find a keyword, look for an identifier
1255 if (value
== IDENTIFIER
)
1257 if (token_buffer
[0] == '@')
1258 error("invalid identifier `%s'", token_buffer
);
1260 yylval
.ttype
= get_identifier (token_buffer
);
1261 lastiddecl
= lookup_name (yylval
.ttype
);
1263 if (lastiddecl
!= 0 && TREE_CODE (lastiddecl
) == TYPE_DECL
)
1265 /* A user-invisible read-only initialized variable
1266 should be replaced by its value.
1267 We handle only strings since that's the only case used in C. */
1268 else if (lastiddecl
!= 0 && TREE_CODE (lastiddecl
) == VAR_DECL
1269 && DECL_IGNORED_P (lastiddecl
)
1270 && TREE_READONLY (lastiddecl
)
1271 && DECL_INITIAL (lastiddecl
) != 0
1272 && TREE_CODE (DECL_INITIAL (lastiddecl
)) == STRING_CST
)
1274 tree stringval
= DECL_INITIAL (lastiddecl
);
1276 /* Copy the string value so that we won't clobber anything
1277 if we put something in the TREE_CHAIN of this one. */
1278 yylval
.ttype
= build_string (TREE_STRING_LENGTH (stringval
),
1279 TREE_STRING_POINTER (stringval
));
1282 else if (doing_objc_thang
)
1284 tree objc_interface_decl
= is_class_name (yylval
.ttype
);
1286 if (objc_interface_decl
)
1289 yylval
.ttype
= objc_interface_decl
;
1299 /* Check first for common special case: single-digit 0 or 1. */
1302 UNGETC (next_c
); /* Always undo this lookahead. */
1303 if (!isalnum (next_c
) && next_c
!= '.')
1305 token_buffer
[0] = (char)c
, token_buffer
[1] = '\0';
1306 yylval
.ttype
= (c
== '0') ? integer_zero_node
: integer_one_node
;
1312 case '2': case '3': case '4':
1313 case '5': case '6': case '7': case '8': case '9':
1318 int largest_digit
= 0;
1320 /* for multi-precision arithmetic,
1321 we actually store only HOST_BITS_PER_CHAR bits in each part.
1322 The number of parts is chosen so as to be sufficient to hold
1323 enough bits to fit into the two HOST_WIDE_INTs that contain
1324 the integer value (this is always at least as many bits as are
1325 in a target `long long' value, but may be wider). */
1326 #define TOTAL_PARTS ((HOST_BITS_PER_WIDE_INT / HOST_BITS_PER_CHAR) * 2 + 2)
1327 int parts
[TOTAL_PARTS
];
1330 enum anon1
{ NOT_FLOAT
, AFTER_POINT
, TOO_MANY_POINTS
} floatflag
1333 for (count
= 0; count
< TOTAL_PARTS
; count
++)
1341 *p
++ = (c
= GETC());
1342 if ((c
== 'x') || (c
== 'X'))
1345 *p
++ = (c
= GETC());
1347 /* Leading 0 forces octal unless the 0 is the only digit. */
1348 else if (c
>= '0' && c
<= '9')
1357 /* Read all the digits-and-decimal-points. */
1360 || (isalnum (c
) && c
!= 'l' && c
!= 'L'
1361 && c
!= 'u' && c
!= 'U'
1362 && c
!= 'i' && c
!= 'I' && c
!= 'j' && c
!= 'J'
1363 && (floatflag
== NOT_FLOAT
|| ((c
!= 'f') && (c
!= 'F')))))
1368 error ("floating constant may not be in radix 16");
1369 if (floatflag
== TOO_MANY_POINTS
)
1370 /* We have already emitted an error. Don't need another. */
1372 else if (floatflag
== AFTER_POINT
)
1374 error ("malformed floating constant");
1375 floatflag
= TOO_MANY_POINTS
;
1376 /* Avoid another error from atof by forcing all characters
1377 from here on to be ignored. */
1381 floatflag
= AFTER_POINT
;
1385 /* Accept '.' as the start of a floating-point number
1386 only when it is followed by a digit.
1387 Otherwise, unread the following non-digit
1388 and use the '.' as a structural token. */
1389 if (p
== token_buffer
+ 2 && !isdigit (c
))
1400 error ("parse error at `..'");
1403 token_buffer
[1] = 0;
1410 /* It is not a decimal point.
1411 It should be a digit (perhaps a hex digit). */
1417 else if (base
<= 10)
1419 if (c
== 'e' || c
== 'E')
1422 floatflag
= AFTER_POINT
;
1423 break; /* start of exponent */
1425 error ("nondigits in number and not hexadecimal");
1436 if (c
>= largest_digit
)
1440 for (count
= 0; count
< TOTAL_PARTS
; count
++)
1442 parts
[count
] *= base
;
1446 += (parts
[count
-1] >> HOST_BITS_PER_CHAR
);
1448 &= (1 << HOST_BITS_PER_CHAR
) - 1;
1454 /* If the extra highest-order part ever gets anything in it,
1455 the number is certainly too big. */
1456 if (parts
[TOTAL_PARTS
- 1] != 0)
1459 if (p
>= token_buffer
+ maxtoken
- 3)
1460 p
= extend_token_buffer (p
);
1461 *p
++ = (c
= GETC());
1466 error ("numeric constant with no digits");
1468 if (largest_digit
>= base
)
1469 error ("numeric constant contains digits beyond the radix");
1471 /* Remove terminating char from the token buffer and delimit the string */
1474 if (floatflag
!= NOT_FLOAT
)
1476 tree type
= double_type_node
;
1477 int exceeds_double
= 0;
1479 REAL_VALUE_TYPE value
;
1482 /* Read explicit exponent if any, and put it in tokenbuf. */
1484 if ((c
== 'e') || (c
== 'E'))
1486 if (p
>= token_buffer
+ maxtoken
- 3)
1487 p
= extend_token_buffer (p
);
1490 if ((c
== '+') || (c
== '-'))
1496 error ("floating constant exponent has no digits");
1499 if (p
>= token_buffer
+ maxtoken
- 3)
1500 p
= extend_token_buffer (p
);
1509 /* Convert string to a double, checking for overflow. */
1510 if (setjmp (handler
))
1512 error ("floating constant out of range");
1517 int fflag
= 0, lflag
= 0;
1518 /* Copy token_buffer now, while it has just the number
1519 and not the suffixes; once we add `f' or `i',
1520 REAL_VALUE_ATOF may not work any more. */
1521 char *copy
= (char *) alloca (p
- token_buffer
+ 1);
1522 bcopy (token_buffer
, copy
, p
- token_buffer
+ 1);
1524 set_float_handler (handler
);
1530 /* Read the suffixes to choose a data type. */
1535 error ("more than one `f' in numeric constant");
1541 error ("more than one `l' in numeric constant");
1547 error ("more than one `i' or `j' in numeric constant");
1549 pedwarn ("ANSI C forbids imaginary numeric constants");
1560 if (p
>= token_buffer
+ maxtoken
- 3)
1561 p
= extend_token_buffer (p
);
1567 /* The second argument, machine_mode, of REAL_VALUE_ATOF
1568 tells the desired precision of the binary result
1569 of decimal-to-binary conversion. */
1574 error ("both `f' and `l' in floating constant");
1576 type
= float_type_node
;
1577 value
= REAL_VALUE_ATOF (copy
, TYPE_MODE (type
));
1578 /* A diagnostic is required here by some ANSI C testsuites.
1579 This is not pedwarn, because some people don't want
1580 an error for this. */
1581 if (REAL_VALUE_ISINF (value
) && pedantic
)
1582 warning ("floating point number exceeds range of `float'");
1586 type
= long_double_type_node
;
1587 value
= REAL_VALUE_ATOF (copy
, TYPE_MODE (type
));
1588 if (REAL_VALUE_ISINF (value
) && pedantic
)
1589 warning ("floating point number exceeds range of `long double'");
1593 value
= REAL_VALUE_ATOF (copy
, TYPE_MODE (type
));
1594 if (REAL_VALUE_ISINF (value
) && pedantic
)
1595 warning ("floating point number exceeds range of `double'");
1598 set_float_handler (NULL_PTR
);
1601 if (errno
== ERANGE
&& !flag_traditional
&& pedantic
)
1603 /* ERANGE is also reported for underflow,
1604 so test the value to distinguish overflow from that. */
1605 if (REAL_VALUES_LESS (dconst1
, value
)
1606 || REAL_VALUES_LESS (value
, dconstm1
))
1608 warning ("floating point number exceeds range of `double'");
1614 /* If the result is not a number, assume it must have been
1615 due to some error message above, so silently convert
1617 if (REAL_VALUE_ISNAN (value
))
1620 /* Create a node with determined type and value. */
1622 yylval
.ttype
= build_complex (NULL_TREE
,
1623 convert (type
, integer_zero_node
),
1624 build_real (type
, value
));
1626 yylval
.ttype
= build_real (type
, value
);
1630 tree traditional_type
, ansi_type
, type
;
1631 HOST_WIDE_INT high
, low
;
1632 int spec_unsigned
= 0;
1634 int spec_long_long
= 0;
1640 if (c
== 'u' || c
== 'U')
1643 error ("two `u's in integer constant");
1646 else if (c
== 'l' || c
== 'L')
1651 error ("three `l's in integer constant");
1653 pedwarn ("ANSI C forbids long long integer constants");
1658 else if (c
== 'i' || c
== 'j' || c
== 'I' || c
== 'J')
1661 error ("more than one `i' or `j' in numeric constant");
1663 pedwarn ("ANSI C forbids imaginary numeric constants");
1668 if (p
>= token_buffer
+ maxtoken
- 3)
1669 p
= extend_token_buffer (p
);
1674 /* If the constant won't fit in an unsigned long long,
1675 then warn that the constant is out of range. */
1677 /* ??? This assumes that long long and long integer types are
1678 a multiple of 8 bits. This is better than the original code
1679 though which assumed that long was exactly 32 bits and long
1680 long was exactly 64 bits. */
1682 bytes
= TYPE_PRECISION (long_long_integer_type_node
) / 8;
1685 for (i
= bytes
; i
< TOTAL_PARTS
; i
++)
1689 pedwarn ("integer constant out of range");
1691 /* This is simplified by the fact that our constant
1692 is always positive. */
1696 for (i
= 0; i
< HOST_BITS_PER_WIDE_INT
/ HOST_BITS_PER_CHAR
; i
++)
1698 high
|= ((HOST_WIDE_INT
) parts
[i
+ (HOST_BITS_PER_WIDE_INT
1699 / HOST_BITS_PER_CHAR
)]
1700 << (i
* HOST_BITS_PER_CHAR
));
1701 low
|= (HOST_WIDE_INT
) parts
[i
] << (i
* HOST_BITS_PER_CHAR
);
1704 yylval
.ttype
= build_int_2 (low
, high
);
1705 TREE_TYPE (yylval
.ttype
) = long_long_unsigned_type_node
;
1707 /* If warn_traditional, calculate both the ANSI type and the
1708 traditional type, then see if they disagree.
1709 Otherwise, calculate only the type for the dialect in use. */
1710 if (warn_traditional
|| flag_traditional
)
1712 /* Calculate the traditional type. */
1713 /* Traditionally, any constant is signed;
1714 but if unsigned is specified explicitly, obey that.
1715 Use the smallest size with the right number of bits,
1716 except for one special case with decimal constants. */
1717 if (! spec_long
&& base
!= 10
1718 && int_fits_type_p (yylval
.ttype
, unsigned_type_node
))
1719 traditional_type
= (spec_unsigned
? unsigned_type_node
1720 : integer_type_node
);
1721 /* A decimal constant must be long
1722 if it does not fit in type int.
1723 I think this is independent of whether
1724 the constant is signed. */
1725 else if (! spec_long
&& base
== 10
1726 && int_fits_type_p (yylval
.ttype
, integer_type_node
))
1727 traditional_type
= (spec_unsigned
? unsigned_type_node
1728 : integer_type_node
);
1729 else if (! spec_long_long
)
1730 traditional_type
= (spec_unsigned
? long_unsigned_type_node
1731 : long_integer_type_node
);
1733 traditional_type
= (spec_unsigned
1734 ? long_long_unsigned_type_node
1735 : long_long_integer_type_node
);
1737 if (warn_traditional
|| ! flag_traditional
)
1739 /* Calculate the ANSI type. */
1740 if (! spec_long
&& ! spec_unsigned
1741 && int_fits_type_p (yylval
.ttype
, integer_type_node
))
1742 ansi_type
= integer_type_node
;
1743 else if (! spec_long
&& (base
!= 10 || spec_unsigned
)
1744 && int_fits_type_p (yylval
.ttype
, unsigned_type_node
))
1745 ansi_type
= unsigned_type_node
;
1746 else if (! spec_unsigned
&& !spec_long_long
1747 && int_fits_type_p (yylval
.ttype
, long_integer_type_node
))
1748 ansi_type
= long_integer_type_node
;
1749 else if (! spec_long_long
1750 && int_fits_type_p (yylval
.ttype
,
1751 long_unsigned_type_node
))
1752 ansi_type
= long_unsigned_type_node
;
1753 else if (! spec_unsigned
1754 && int_fits_type_p (yylval
.ttype
,
1755 long_long_integer_type_node
))
1756 ansi_type
= long_long_integer_type_node
;
1758 ansi_type
= long_long_unsigned_type_node
;
1761 type
= flag_traditional
? traditional_type
: ansi_type
;
1763 if (warn_traditional
&& traditional_type
!= ansi_type
)
1765 if (TYPE_PRECISION (traditional_type
)
1766 != TYPE_PRECISION (ansi_type
))
1767 warning ("width of integer constant changes with -traditional");
1768 else if (TREE_UNSIGNED (traditional_type
)
1769 != TREE_UNSIGNED (ansi_type
))
1770 warning ("integer constant is unsigned in ANSI C, signed with -traditional");
1772 warning ("width of integer constant may change on other systems with -traditional");
1775 if (pedantic
&& !flag_traditional
&& !spec_long_long
&& !warn
1776 && (TYPE_PRECISION (long_integer_type_node
)
1777 < TYPE_PRECISION (type
)))
1778 pedwarn ("integer constant out of range");
1780 if (base
== 10 && ! spec_unsigned
&& TREE_UNSIGNED (type
))
1781 warning ("decimal constant is so large that it is unsigned");
1785 if (TYPE_PRECISION (type
)
1786 <= TYPE_PRECISION (integer_type_node
))
1788 = build_complex (NULL_TREE
, integer_zero_node
,
1789 convert (integer_type_node
,
1792 error ("complex integer constant is too wide for `complex int'");
1794 else if (flag_traditional
&& !int_fits_type_p (yylval
.ttype
, type
))
1795 /* The traditional constant 0x80000000 is signed
1796 but doesn't fit in the range of int.
1797 This will change it to -0x80000000, which does fit. */
1799 TREE_TYPE (yylval
.ttype
) = unsigned_type (type
);
1800 yylval
.ttype
= convert (type
, yylval
.ttype
);
1801 TREE_OVERFLOW (yylval
.ttype
)
1802 = TREE_CONSTANT_OVERFLOW (yylval
.ttype
) = 0;
1805 TREE_TYPE (yylval
.ttype
) = type
;
1811 if (isalnum (c
) || c
== '.' || c
== '_' || c
== '$'
1812 || (!flag_traditional
&& (c
== '-' || c
== '+')
1813 && (p
[-1] == 'e' || p
[-1] == 'E')))
1814 error ("missing white space after number `%s'", token_buffer
);
1816 value
= CONSTANT
; break;
1822 register int result
= 0;
1823 register int num_chars
= 0;
1824 unsigned width
= TYPE_PRECISION (char_type_node
);
1829 width
= WCHAR_TYPE_SIZE
;
1830 #ifdef MULTIBYTE_CHARS
1831 max_chars
= MB_CUR_MAX
;
1837 max_chars
= TYPE_PRECISION (integer_type_node
) / width
;
1845 if (c
== '\'' || c
== EOF
)
1851 c
= readescape (&ignore
);
1854 if (width
< HOST_BITS_PER_INT
1855 && (unsigned) c
>= (1 << width
))
1856 pedwarn ("escape sequence out of range for character");
1857 #ifdef MAP_CHARACTER
1859 c
= MAP_CHARACTER (c
);
1865 pedwarn ("ANSI C forbids newline in character constant");
1868 #ifdef MAP_CHARACTER
1870 c
= MAP_CHARACTER (c
);
1874 if (num_chars
> maxtoken
- 4)
1875 extend_token_buffer (token_buffer
);
1877 token_buffer
[num_chars
] = c
;
1879 /* Merge character into result; ignore excess chars. */
1880 if (num_chars
< max_chars
+ 1)
1882 if (width
< HOST_BITS_PER_INT
)
1883 result
= (result
<< width
) | (c
& ((1 << width
) - 1));
1889 token_buffer
[num_chars
+ 1] = '\'';
1890 token_buffer
[num_chars
+ 2] = 0;
1893 error ("malformatted character constant");
1894 else if (num_chars
== 0)
1895 error ("empty character constant");
1896 else if (num_chars
> max_chars
)
1898 num_chars
= max_chars
;
1899 error ("character constant too long");
1901 else if (num_chars
!= 1 && ! flag_traditional
)
1902 warning ("multi-character character constant");
1904 /* If char type is signed, sign-extend the constant. */
1907 int num_bits
= num_chars
* width
;
1909 /* We already got an error; avoid invalid shift. */
1910 yylval
.ttype
= build_int_2 (0, 0);
1911 else if (TREE_UNSIGNED (char_type_node
)
1912 || ((result
>> (num_bits
- 1)) & 1) == 0)
1914 = build_int_2 (result
& ((unsigned HOST_WIDE_INT
) ~0
1915 >> (HOST_BITS_PER_WIDE_INT
- num_bits
)),
1919 = build_int_2 (result
| ~((unsigned HOST_WIDE_INT
) ~0
1920 >> (HOST_BITS_PER_WIDE_INT
- num_bits
)),
1922 TREE_TYPE (yylval
.ttype
) = integer_type_node
;
1926 #ifdef MULTIBYTE_CHARS
1927 /* Set the initial shift state and convert the next sequence. */
1929 /* In all locales L'\0' is zero and mbtowc will return zero,
1932 || (num_chars
== 1 && token_buffer
[1] != '\0'))
1935 (void) mbtowc (NULL_PTR
, NULL_PTR
, 0);
1936 if (mbtowc (& wc
, token_buffer
+ 1, num_chars
) == num_chars
)
1939 warning ("Ignoring invalid multibyte character");
1942 yylval
.ttype
= build_int_2 (result
, 0);
1943 TREE_TYPE (yylval
.ttype
) = wchar_type_node
;
1954 p
= token_buffer
+ 1;
1956 while (c
!= '"' && c
>= 0)
1961 c
= readescape (&ignore
);
1965 && TYPE_PRECISION (char_type_node
) < HOST_BITS_PER_INT
1966 && c
>= (1 << TYPE_PRECISION (char_type_node
)))
1967 pedwarn ("escape sequence out of range for character");
1972 pedwarn ("ANSI C forbids newline in string constant");
1976 if (p
== token_buffer
+ maxtoken
)
1977 p
= extend_token_buffer (p
);
1986 error ("Unterminated string constant");
1988 /* We have read the entire constant.
1989 Construct a STRING_CST for the result. */
1993 /* If this is a L"..." wide-string, convert the multibyte string
1994 to a wide character string. */
1995 char *widep
= (char *) alloca ((p
- token_buffer
) * WCHAR_BYTES
);
1998 #ifdef MULTIBYTE_CHARS
1999 len
= mbstowcs ((wchar_t *) widep
, token_buffer
+ 1, p
- token_buffer
);
2000 if (len
< 0 || len
>= (p
- token_buffer
))
2002 warning ("Ignoring invalid multibyte string");
2005 bzero (widep
+ (len
* WCHAR_BYTES
), WCHAR_BYTES
);
2010 wp
= widep
+ (BYTES_BIG_ENDIAN
? WCHAR_BYTES
- 1 : 0);
2011 bzero (widep
, (p
- token_buffer
) * WCHAR_BYTES
);
2012 for (cp
= token_buffer
+ 1; cp
< p
; cp
++)
2013 *wp
= *cp
, wp
+= WCHAR_BYTES
;
2014 len
= p
- token_buffer
- 1;
2017 yylval
.ttype
= build_string ((len
+ 1) * WCHAR_BYTES
, widep
);
2018 TREE_TYPE (yylval
.ttype
) = wchar_array_type_node
;
2023 extern tree
build_objc_string();
2024 /* Return an Objective-C @"..." constant string object. */
2025 yylval
.ttype
= build_objc_string (p
- token_buffer
,
2027 TREE_TYPE (yylval
.ttype
) = char_array_type_node
;
2028 value
= OBJC_STRING
;
2032 yylval
.ttype
= build_string (p
- token_buffer
, token_buffer
+ 1);
2033 TREE_TYPE (yylval
.ttype
) = char_array_type_node
;
2064 yylval
.code
= PLUS_EXPR
; break;
2066 yylval
.code
= MINUS_EXPR
; break;
2068 yylval
.code
= BIT_AND_EXPR
; break;
2070 yylval
.code
= BIT_IOR_EXPR
; break;
2072 yylval
.code
= MULT_EXPR
; break;
2074 yylval
.code
= TRUNC_DIV_EXPR
; break;
2076 yylval
.code
= TRUNC_MOD_EXPR
; break;
2078 yylval
.code
= BIT_XOR_EXPR
; break;
2080 yylval
.code
= LSHIFT_EXPR
; break;
2082 yylval
.code
= RSHIFT_EXPR
; break;
2084 yylval
.code
= LT_EXPR
; break;
2086 yylval
.code
= GT_EXPR
; break;
2089 token_buffer
[1] = c1
= GETC();
2090 token_buffer
[2] = 0;
2097 value
= ARITHCOMPARE
; yylval
.code
= LE_EXPR
; goto done
;
2099 value
= ARITHCOMPARE
; yylval
.code
= GE_EXPR
; goto done
;
2101 value
= EQCOMPARE
; yylval
.code
= NE_EXPR
; goto done
;
2103 value
= EQCOMPARE
; yylval
.code
= EQ_EXPR
; goto done
;
2105 value
= ASSIGN
; goto done
;
2111 value
= PLUSPLUS
; goto done
;
2113 value
= MINUSMINUS
; goto done
;
2115 value
= ANDAND
; goto done
;
2117 value
= OROR
; goto done
;
2130 { value
= POINTSAT
; goto done
; }
2134 { value
= ']'; goto done
; }
2138 { value
= '{'; indent_level
++; goto done
; }
2140 { value
= '['; goto done
; }
2144 { value
= '}'; indent_level
--; goto done
; }
2148 token_buffer
[1] = 0;
2150 if ((c
== '<') || (c
== '>'))
2151 value
= ARITHCOMPARE
;
2157 /* Don't make yyparse think this is eof. */
2176 /* yylloc.last_line = lineno; */
2181 /* Sets the value of the 'yydebug' variable to VALUE.
2182 This is a function so we don't have to have YYDEBUG defined
2183 in order to build the compiler. */
2192 warning ("YYDEBUG not defined.");