1 /* Mainly the interface between cpplib and the C front ends.
2 Copyright (C) 1987, 1988, 1989, 1992, 1994, 1995, 1996, 1997
3 1998, 1999, 2000, 2001, 2002, 2003, 2004 Free Software Foundation, Inc.
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 2, or (at your option) any later
10 version.
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
15 for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING. If not, write to the Free
19 Software Foundation, 59 Temple Place - Suite 330, Boston, MA
20 02111-1307, USA. */
24 #include "coretypes.h"
41 #include "splay-tree.h"
44 /* We may keep statistics about how long which files took to compile. */
/* State for the optional timing report: header_time accumulates the time
   charged to headers, body_time holds the run time at which the current
   interval started, and file_info_tree holds the c_fileinfo records that
   get_fileinfo looks up and inserts by file name. */
45 static int header_time
, body_time
;
46 static splay_tree file_info_tree
;
/* Replace any earlier WCHAR_TYPE_SIZE with the precision of wchar_type_node. */
48 #undef WCHAR_TYPE_SIZE
49 #define WCHAR_TYPE_SIZE TYPE_PRECISION (wchar_type_node)
51 /* Number of bytes in a wide character. */
52 #define WCHAR_BYTES (WCHAR_TYPE_SIZE / BITS_PER_UNIT)
/* The two counters below are adjusted by fe_file_change as files are
   entered and left. */
54 int pending_lang_change
; /* If we need to switch languages - C++ only */
55 int c_header_level
; /* depth in C headers - C++ only */
57 /* If we need to translate characters received. This is tri-state:
58 0 means use only the untranslated string; 1 means use only
59 the translated string; -1 means chain the translated string
60 to the untranslated one. */
61 int c_lex_string_translate
= 1;
/* Forward declarations for the file-local helpers and the cpplib callbacks
   defined further down.
   NOTE(review): the callback prototypes spell their second parameter as
   unsigned int, while the definitions of cb_def_pragma, cb_define and
   cb_undef use source_location -- presumably the same underlying type;
   confirm. */
63 static tree
interpret_integer (const cpp_token
*, unsigned int);
64 static tree
interpret_float (const cpp_token
*, unsigned int);
65 static enum integer_type_kind
66 narrowest_unsigned_type (tree
, unsigned int);
67 static enum integer_type_kind
68 narrowest_signed_type (tree
, unsigned int);
69 static enum cpp_ttype
lex_string (const cpp_token
*, tree
*, bool);
70 static tree
lex_charconst (const cpp_token
*);
71 static void update_header_times (const char *);
72 static int dump_one_header (splay_tree_node
, void *);
73 static void cb_line_change (cpp_reader
*, const cpp_token
*, int);
74 static void cb_ident (cpp_reader
*, unsigned int, const cpp_string
*);
75 static void cb_def_pragma (cpp_reader
*, unsigned int);
76 static void cb_define (cpp_reader
*, unsigned int, cpp_hashnode
*);
77 static void cb_undef (cpp_reader
*, unsigned int, cpp_hashnode
*);
/* Body of the lexer set-up routine.  It creates the file-timing tree,
   registers the "<top level>" entry, and installs this file's callbacks on
   the cpp_callbacks table obtained from parse_in.
   NOTE(review): the function's own signature is not visible in this
   excerpt. */
82 struct cpp_callbacks
*cb
;
83 struct c_fileinfo
*toplevel
;
85 /* Set up filename timing. Must happen before cpp_read_main_file. */
/* The tree is given strcmp as its key comparison and free as the routine
   that releases stored values. */
86 file_info_tree
= splay_tree_new ((splay_tree_compare_fn
)strcmp
,
88 (splay_tree_delete_value_fn
)free
);
89 toplevel
= get_fileinfo ("<top level>");
/* With detailed statistics requested, start the body-time interval now and
   seed the top-level record's time with the same reading. */
90 if (flag_detailed_statistics
)
93 body_time
= get_run_time ();
94 toplevel
->time
= body_time
;
/* Install the line-change, ident, unknown-pragma and PCH callbacks. */
97 cb
= cpp_get_callbacks (parse_in
);
99 cb
->line_change
= cb_line_change
;
100 cb
->ident
= cb_ident
;
101 cb
->def_pragma
= cb_def_pragma
;
102 cb
->valid_pch
= c_common_valid_pch
;
103 cb
->read_pch
= c_common_read_pch
;
105 /* Set the debug callbacks if we can use them. */
/* "Can use them" here means verbose debug-info level combined with one of
   the DWARF, DWARF2 or VMS-and-DWARF2 writers. */
106 if (debug_info_level
== DINFO_LEVEL_VERBOSE
107 && (write_symbols
== DWARF_DEBUG
|| write_symbols
== DWARF2_DEBUG
108 || write_symbols
== VMS_AND_DWARF2_DEBUG
))
110 cb
->define
= cb_define
;
111 cb
->undef
= cb_undef
;
/* Look NAME up in file_info_tree and return the c_fileinfo stored for it.
   The remaining statements allocate a record with xmalloc, initialise its
   interface flags and insert it into the tree under NAME.  The NAME pointer
   itself is used as the key; no copy is made here.
   NOTE(review): the test guarding the early return and the final return are
   not visible in this excerpt; presumably the early return is taken only
   when the lookup finds a node. */
116 get_fileinfo (const char *name
)
119 struct c_fileinfo
*fi
;
121 n
= splay_tree_lookup (file_info_tree
, (splay_tree_key
) name
);
123 return (struct c_fileinfo
*) n
->value
;
125 fi
= xmalloc (sizeof (struct c_fileinfo
));
/* A fresh record starts as "not interface-only" with its interface status
   marked unknown. */
127 fi
->interface_only
= 0;
128 fi
->interface_unknown
= 1;
129 splay_tree_insert (file_info_tree
, (splay_tree_key
) name
,
130 (splay_tree_value
) fi
);
/* When flag_detailed_statistics is set, add the run time elapsed since
   body_time both to header_time and to the c_fileinfo record for NAME, then
   restart the interval by storing the current reading in body_time. */
135 update_header_times (const char *name
)
137 /* Changing files again. This means currently collected time
138 is charged against header time, and body time starts back at 0. */
139 if (flag_detailed_statistics
)
141 int this_time
= get_run_time ();
142 struct c_fileinfo
*file
= get_fileinfo (name
);
143 header_time
+= this_time
- body_time
;
144 file
->time
+= this_time
- body_time
;
145 body_time
= this_time
;
/* Per-node routine handed to splay_tree_foreach by dump_time_statistics.
   Prints one timing line, using N's key as the label and the time field of
   the c_fileinfo stored as N's value.  DUMMY is unused. */
150 dump_one_header (splay_tree_node n
, void *dummy ATTRIBUTE_UNUSED
)
152 print_time ((const char *) n
->key
,
153 ((struct c_fileinfo
*) n
->value
)->time
);
/* Write the timing report to stderr: the header total, the main-file
   figure, their ratio, and then one line per record in file_info_tree.
   Before printing, the time elapsed since body_time is added to the record
   for input_filename. */
158 dump_time_statistics (void)
160 struct c_fileinfo
*file
= get_fileinfo (input_filename
);
161 int this_time
= get_run_time ();
162 file
->time
+= this_time
- body_time
;
164 fprintf (stderr
, "\n******\n");
165 print_time ("header files (total)", header_time
);
166 print_time ("main file (total)", this_time
- body_time
);
/* NOTE(review): the divisor is this_time - body_time converted to double;
   if no time has elapsed since body_time it is zero -- confirm that the
   resulting output is acceptable. */
167 fprintf (stderr
, "ratio = %g : 1\n",
168 (double)header_time
/ (double)(this_time
- body_time
));
169 fprintf (stderr
, "\n******\n");
171 splay_tree_foreach (file_info_tree
, dump_one_header
, 0);
/* Callback installed as the reader's ident hook.  When ASM_OUTPUT_IDENT is
   defined, STR is interpreted as a single string with the wide flag false,
   the resulting text is passed to ASM_OUTPUT_IDENT together with
   asm_out_file, and the interpreted buffer is then freed.  LINE is not used
   by the visible code.  The parameters carry ATTRIBUTE_UNUSED because the
   code that reads them sits under the #ifdef. */
175 cb_ident (cpp_reader
*pfile ATTRIBUTE_UNUSED
,
176 unsigned int line ATTRIBUTE_UNUSED
,
177 const cpp_string
*str ATTRIBUTE_UNUSED
)
179 #ifdef ASM_OUTPUT_IDENT
182 /* Convert escapes in the string. */
183 cpp_string cstr
= { 0, 0 };
184 if (cpp_interpret_string (pfile
, str
, 1, &cstr
, false))
186 ASM_OUTPUT_IDENT (asm_out_file
, (const char *) cstr
.text
);
187 free ((void *)cstr
.text
);
193 /* Called at the start of every non-empty line. TOKEN is the first
194 lexed token on the line. Used for diagnostic line numbers. */
/* Nothing is updated for a CPP_EOF token or while parsing_args is set.
   Under USE_MAPPED_LOCATION the token's src_loc is stored directly in
   input_location.  The remaining statements instead look the location up in
   line_table and store only the source line in input_line.
   NOTE(review): the directive separating the two alternatives is not visible
   in this excerpt. */
196 cb_line_change (cpp_reader
*pfile ATTRIBUTE_UNUSED
, const cpp_token
*token
,
199 if (token
->type
!= CPP_EOF
&& !parsing_args
)
200 #ifdef USE_MAPPED_LOCATION
201 input_location
= token
->src_loc
;
204 source_location loc
= token
->src_loc
;
205 const struct line_map
*map
= linemap_lookup (&line_table
, loc
);
206 input_line
= SOURCE_LINE (map
, loc
);
/* React to the line-map change described by NEW_MAP.
   - LC_ENTER of a file that is not the main file: record the include point,
     push the new source location and call debug_hooks->start_source_file.
   - LC_LEAVE: unwind the C-header bookkeeping (c_header_level and
     pending_lang_change) and call debug_hooks->end_source_file.
   The trailing statements then charge header time to NEW_MAP's file, set
   in_system_header from its sysp field, update the current input location
   and call extract_interface_info.
   NOTE(review): braces and several #else/#endif lines are missing from this
   excerpt, so the exact nesting of the branches below should be confirmed
   against the full file. */
212 fe_file_change (const struct line_map
*new_map
)
217 if (new_map
->reason
== LC_ENTER
)
219 /* Don't stack the main buffer on the input stack;
220 we already did in compile_file. */
221 if (! MAIN_FILE_P (new_map
))
/* The include point is read from the map entry immediately before NEW_MAP
   (new_map - 1). */
223 #ifdef USE_MAPPED_LOCATION
224 int included_at
= LAST_SOURCE_LINE_LOCATION (new_map
- 1);
226 input_location
= included_at
;
227 push_srcloc (new_map
->start_location
);
229 int included_at
= LAST_SOURCE_LINE (new_map
- 1);
231 input_line
= included_at
;
232 push_srcloc (new_map
->to_file
, 1);
234 (*debug_hooks
->start_source_file
) (included_at
, new_map
->to_file
);
/* Unless NO_IMPLICIT_EXTERN_C is defined, a map whose sysp field is 2
   requests a language change. */
235 #ifndef NO_IMPLICIT_EXTERN_C
238 else if (new_map
->sysp
== 2)
241 ++pending_lang_change
;
246 else if (new_map
->reason
== LC_LEAVE
)
/* The decrement happens only while c_header_level is non-zero; the inner
   code runs when it reaches zero. */
248 #ifndef NO_IMPLICIT_EXTERN_C
249 if (c_header_level
&& --c_header_level
== 0)
251 if (new_map
->sysp
== 2)
252 warning ("badly nested C headers from preprocessor");
253 --pending_lang_change
;
258 (*debug_hooks
->end_source_file
) (new_map
->to_line
);
261 update_header_times (new_map
->to_file
);
262 in_system_header
= new_map
->sysp
!= 0;
263 #ifdef USE_MAPPED_LOCATION
264 input_location
= new_map
->start_location
;
266 input_filename
= new_map
->to_file
;
267 input_line
= new_map
->to_line
;
271 extract_interface_info ();
/* Callback installed as the reader's def_pragma hook.  When the warning is
   enabled, it reads up to two tokens from PFILE to recover the two words
   shown in the "ignoring #pragma" message, points the current input
   location at LOC, and issues the warning. */
275 cb_def_pragma (cpp_reader
*pfile
, source_location loc
)
277 /* Issue a warning message if we have been asked to do so. Ignore
278 unknown pragmas in system headers unless an explicit
279 -Wunknown-pragmas has been given. */
280 if (warn_unknown_pragmas
> in_system_header
)
282 #ifndef USE_MAPPED_LOCATION
283 const struct line_map
*map
= linemap_lookup (&line_table
, loc
);
285 const unsigned char *space
, *name
;
/* Both words default to the empty string.  The first is replaced when the
   first token is not CPP_EOF, the second only when the following token is a
   CPP_NAME. */
288 space
= name
= (const unsigned char *) "";
289 s
= cpp_get_token (pfile
);
290 if (s
->type
!= CPP_EOF
)
292 space
= cpp_token_as_text (pfile
, s
);
293 s
= cpp_get_token (pfile
);
294 if (s
->type
== CPP_NAME
)
295 name
= cpp_token_as_text (pfile
, s
);
298 #ifdef USE_MAPPED_LOCATION
299 input_location
= loc
;
301 input_line
= SOURCE_LINE (map
, loc
);
303 warning ("ignoring #pragma %s %s", space
, name
);
307 /* #define callback for DWARF and DWARF2 debug info. */
/* Maps LOC to a source line through line_table and passes that line,
   together with the text returned by cpp_macro_definition for NODE, to
   debug_hooks->define. */
309 cb_define (cpp_reader
*pfile
, source_location loc
, cpp_hashnode
*node
)
311 const struct line_map
*map
= linemap_lookup (&line_table
, loc
);
312 (*debug_hooks
->define
) (SOURCE_LINE (map
, loc
),
313 (const char *) cpp_macro_definition (pfile
, node
));
316 /* #undef callback for DWARF and DWARF2 debug info. */
/* Maps LOC to a source line through line_table and passes that line,
   together with NODE_NAME (node), to debug_hooks->undef.  PFILE is unused.
   NOTE(review): the end of the parameter list (where node is declared) is
   not visible in this excerpt. */
318 cb_undef (cpp_reader
*pfile ATTRIBUTE_UNUSED
, source_location loc
,
321 const struct line_map
*map
= linemap_lookup (&line_table
, loc
);
322 (*debug_hooks
->undef
) (SOURCE_LINE (map
, loc
),
323 (const char *) NODE_NAME (node
));
/* Fetch a token from parse_in, repeating while the token's type is
   CPP_PADDING.  The TV_CPP timer is pushed before the fetch and popped
   afterwards.
   NOTE(review): the keyword that opens the loop and the return statement are
   not visible in this excerpt; presumably this is a do/while that returns
   tok. */
326 static inline const cpp_token
*
327 get_nonpadding_token (void)
329 const cpp_token
*tok
;
330 timevar_push (TV_CPP
);
332 tok
= cpp_get_token (parse_in
);
333 while (tok
->type
== CPP_PADDING
);
334 timevar_pop (TV_CPP
);
/* Obtain the next non-padding token and translate it for the front end.
   The tree built for the token (identifier, number, character constant or
   string) is stored through VALUE, and the token's flags are stored through
   CPP_FLAGS.
   NOTE(review): the switch on the token type, most of its case labels and
   the braces are missing from this excerpt, so the comments below describe
   only the statements that are visible. */
340 c_lex_with_flags (tree
*value
, unsigned char *cpp_flags
)
342 const cpp_token
*tok
;
344 static bool no_more_pch
;
347 tok
= get_nonpadding_token ();
/* Identifier: hand back the front end's identifier node for the cpplib
   hash node. */
353 *value
= HT_IDENT_TO_GCC_IDENT (HT_NODE (tok
->val
.node
));
/* Number: let cpplib classify it, then dispatch on the category bits. */
358 unsigned int flags
= cpp_classify_number (parse_in
, tok
);
360 switch (flags
& CPP_N_CATEGORY
)
363 /* cpplib has issued an error. */
364 *value
= error_mark_node
;
368 *value
= interpret_integer (tok
, flags
);
372 *value
= interpret_float (tok
, flags
);
382 /* An @ may give the next token special significance in Objective-C. */
/* The location is saved first so the stray-'@' error below can point at it. */
383 atloc
= input_location
;
384 tok
= get_nonpadding_token ();
385 if (c_dialect_objc ())
391 val
= HT_IDENT_TO_GCC_IDENT (HT_NODE (tok
->val
.node
));
392 if (C_IS_RESERVED_WORD (val
)
393 && OBJC_IS_AT_KEYWORD (C_RID_CODE (val
)))
402 return lex_string (tok
, value
, true);
409 error ("%Hstray '@' in program", &atloc
);
/* Stray character: the message is chosen from the first character of the
   token's text -- an unterminated quote, a printable character, or an octal
   escape for anything else. */
414 cppchar_t c
= tok
->val
.str
.text
[0];
416 if (c
== '"' || c
== '\'')
417 error ("missing terminating %c character", (int) c
);
418 else if (ISGRAPH (c
))
419 error ("stray '%c' in program", (int) c
);
421 error ("stray '\\%o' in program", (int) c
);
427 *value
= lex_charconst (tok
);
432 return lex_string (tok
, value
, false);
435 /* These tokens should not be visible outside cpplib. */
436 case CPP_HEADER_NAME
:
449 c_common_no_more_pch ();
/* NOTE(review): the forwarding call at the end of this block passes NULL for
   cpp_flags; the guard that must protect this store is not visible in this
   excerpt -- confirm. */
453 *cpp_flags
= tok
->flags
;
/* Forwarding call that lexes a token without reporting its flags.
   NOTE(review): the header of the definition this return belongs to is not
   visible here; presumably it is a separate wrapper function. */
460 return c_lex_with_flags (value
, NULL
);
463 /* Returns the narrowest C-visible unsigned type, starting with the
464 minimum specified by FLAGS, that can fit VALUE, or itk_none if
465 there isn't one. */
/* The starting kind comes from the width bits of FLAGS: CPP_N_SMALL gives
   unsigned int, CPP_N_MEDIUM gives unsigned long, anything else unsigned
   long long.  The loop then steps two kinds at a time and tests each with
   int_fits_type_p.  Note that VALUE's TREE_TYPE is overwritten as a side
   effect.
   NOTE(review): the statements that return the result are not visible in
   this excerpt. */
466 static enum integer_type_kind
467 narrowest_unsigned_type (tree value
, unsigned int flags
)
469 enum integer_type_kind itk
;
471 if ((flags
& CPP_N_WIDTH
) == CPP_N_SMALL
)
472 itk
= itk_unsigned_int
;
473 else if ((flags
& CPP_N_WIDTH
) == CPP_N_MEDIUM
)
474 itk
= itk_unsigned_long
;
476 itk
= itk_unsigned_long_long
;
478 /* int_fits_type_p must think the type of its first argument is
479 wider than its second argument, or it won't do the proper check. */
480 TREE_TYPE (value
) = widest_unsigned_literal_type_node
;
/* Starting from an unsigned kind and advancing by two stays on unsigned
   kinds, so it is the signed kinds that are skipped (presumably the enum
   interleaves the two -- confirm).  The inline comment previously said
   "unsigned", which looks swapped with narrowest_signed_type. */
482 for (; itk
< itk_none
; itk
+= 2 /* skip signed types */)
483 if (int_fits_type_p (value
, integer_types
[itk
]))
489 /* Ditto, but narrowest signed type. */
/* Same shape as narrowest_unsigned_type: the width bits of FLAGS select the
   starting kind, and the loop steps two kinds at a time testing each with
   int_fits_type_p.  VALUE's TREE_TYPE is overwritten as a side effect.
   NOTE(review): the assignments of the starting kind and the statements that
   return the result are not visible in this excerpt. */
490 static enum integer_type_kind
491 narrowest_signed_type (tree value
, unsigned int flags
)
493 enum integer_type_kind itk
;
495 if ((flags
& CPP_N_WIDTH
) == CPP_N_SMALL
)
497 else if ((flags
& CPP_N_WIDTH
) == CPP_N_MEDIUM
)
502 /* int_fits_type_p must think the type of its first argument is
503 wider than its second argument, or it won't do the proper check. */
504 TREE_TYPE (value
) = widest_unsigned_literal_type_node
;
/* Presumably itk starts on a signed kind here, so advancing by two skips the
   unsigned kinds.  The inline comment previously said "signed", which looks
   swapped with narrowest_unsigned_type. */
506 for (; itk
< itk_none
; itk
+= 2 /* skip unsigned types */)
507 if (int_fits_type_p (value
, integer_types
[itk
]))
513 /* Interpret TOKEN, an integer with FLAGS as classified by cpplib. */
/* The value is read with cpp_interpret_integer, sign-extended to the
   precision recorded in the reader's options, and turned into a constant
   with build_int_2 from its low and high words.  The rest of the function
   chooses the constant's type from the suffix and radix bits of FLAGS, and
   wraps the result in a complex constant when CPP_N_IMAGINARY is set. */
515 interpret_integer (const cpp_token
*token
, unsigned int flags
)
518 enum integer_type_kind itk
;
520 cpp_options
*options
= cpp_get_options (parse_in
);
522 integer
= cpp_interpret_integer (parse_in
, token
, flags
);
523 integer
= cpp_num_sign_extend (integer
, options
->precision
);
524 value
= build_int_2 (integer
.low
, integer
.high
);
526 /* The type of a constant with a U suffix is straightforward. */
527 if (flags
& CPP_N_UNSIGNED
)
528 itk
= narrowest_unsigned_type (value
, flags
);
/* NOTE(review): the comment that starts on the next line has lost its
   closing delimiter in this copy, so as written it runs on through the
   itk_u and itk_s declarations until the end of the following comment. */
531 /* The type of a potentially-signed integer constant varies
532 depending on the base it's in, the standard in use, and the
534 enum integer_type_kind itk_u
= narrowest_unsigned_type (value
, flags
);
535 enum integer_type_kind itk_s
= narrowest_signed_type (value
, flags
);
537 /* In both C89 and C99, octal and hex constants may be signed or
538 unsigned, whichever fits tighter. We do not warn about this
539 choice differing from the traditional choice, as the constant
540 is probably a bit pattern and either way will work. */
541 if ((flags
& CPP_N_RADIX
) != CPP_N_DECIMAL
)
542 itk
= MIN (itk_u
, itk_s
);
545 /* In C99, decimal constants are always signed.
546 In C89, decimal constants that don't fit in long have
547 undefined behavior; we try to make them unsigned long.
548 In GCC's extended C89, that last is true of decimal
549 constants that don't fit in long long, too. */
552 if (itk_s
> itk_u
&& itk_s
> itk_long
)
556 if (itk_u
< itk_unsigned_long
)
557 itk_u
= itk_unsigned_long
;
559 warning ("this decimal constant is unsigned only in ISO C90");
561 else if (warn_traditional
)
562 warning ("this decimal constant would be unsigned in ISO C90");
568 /* cpplib has already issued a warning for overflow. */
569 type
= ((flags
& CPP_N_UNSIGNED
)
570 ? widest_unsigned_literal_type_node
571 : widest_integer_literal_type_node
);
573 type
= integer_types
[itk
];
/* Pedantic warning: the chosen kind is beyond unsigned long although the
   width bits of FLAGS are not CPP_N_LARGE.  Suppressed in system headers and
   when flag_isoc99 is set. */
575 if (itk
> itk_unsigned_long
576 && (flags
& CPP_N_WIDTH
) != CPP_N_LARGE
577 && ! in_system_header
&& ! flag_isoc99
)
578 pedwarn ("integer constant is too large for \"%s\" type",
579 (flags
& CPP_N_UNSIGNED
) ? "unsigned long" : "long");
581 TREE_TYPE (value
) = type
;
583 /* Convert imaginary to a complex type. */
584 if (flags
& CPP_N_IMAGINARY
)
585 value
= build_complex (NULL_TREE
, convert (type
, integer_zero_node
), value
);
590 /* Interpret TOKEN, a floating point number with FLAGS as classified
591 by cpplib. */
/* The width bits of FLAGS choose the type: CPP_N_LARGE gives long double,
   CPP_N_SMALL (or flag_single_precision_constant) gives float, and the
   remaining case gives double.  A copy of the token's spelling is parsed
   with real_from_string and converted to the chosen type's mode.  The result
   is built with build_real and wrapped in a complex constant when
   CPP_N_IMAGINARY is set.
   NOTE(review): the statements that shorten copylen for the suffixes, and
   the typename assignments for float and double, are not visible in this
   excerpt. */
593 interpret_float (const cpp_token
*token
, unsigned int flags
)
597 REAL_VALUE_TYPE real
;
600 const char *typename
;
602 /* FIXME: make %T work in error/warning, then we don't need typename. */
603 if ((flags
& CPP_N_WIDTH
) == CPP_N_LARGE
)
605 type
= long_double_type_node
;
606 typename
= "long double";
608 else if ((flags
& CPP_N_WIDTH
) == CPP_N_SMALL
609 || flag_single_precision_constant
)
611 type
= float_type_node
;
616 type
= double_type_node
;
620 /* Copy the constant to a nul-terminated buffer. If the constant
621 has any suffixes, cut them off; REAL_VALUE_ATOF/ REAL_VALUE_HTOF
622 can't handle them. */
623 copylen
= token
->val
.str
.len
;
624 if ((flags
& CPP_N_WIDTH
) != CPP_N_MEDIUM
)
625 /* Must be an F or L suffix. */
627 if (flags
& CPP_N_IMAGINARY
)
/* The copy is allocated with alloca, one byte longer than copylen to hold
   the terminating nul. */
631 copy
= alloca (copylen
+ 1);
632 memcpy (copy
, token
->val
.str
.text
, copylen
);
633 copy
[copylen
] = '\0';
635 real_from_string (&real
, copy
);
636 real_convert (&real
, TYPE_MODE (type
), &real
);
638 /* A diagnostic is required for "soft" overflow by some ISO C
639 testsuites. This is not pedwarn, because some people don't want
641 ??? That's a dubious reason... is this a mandatory diagnostic or
642 isn't it? -- zw, 2001-08-21. */
643 if (REAL_VALUE_ISINF (real
) && pedantic
)
644 warning ("floating constant exceeds range of \"%s\"", typename
);
646 /* Create a node with determined type and value. */
647 value
= build_real (type
, real
);
648 if (flags
& CPP_N_IMAGINARY
)
649 value
= build_complex (NULL_TREE
, convert (type
, integer_zero_node
), value
);
654 /* Convert a series of STRING and/or WSTRING tokens into a tree,
655 performing string constant concatenation. TOK is the first of
656 these. VALP is the location to write the string into. OBJC_STRING
657 indicates whether an '@' token preceded the incoming token.
658 Returns the CPP token type of the result (CPP_STRING, CPP_WSTRING,
661 This is unfortunately more work than it should be. If any of the
662 strings in the series has an L prefix, the result is a wide string
663 (6.4.5p4). Whether or not the result is a wide string affects the
664 meaning of octal and hexadecimal escapes (6.4.4.4p6,9). But escape
665 sequences do not continue across the boundary between two strings in
666 a series (6.4.5p7), so we must not lose the boundaries. Therefore
667 cpp_interpret_string takes a vector of cpp_string structures, which
668 we must arrange to provide. */
/* The returned kind is CPP_OBJC_STRING when OBJC_STRING is set, otherwise
   CPP_WSTRING for a wide result and CPP_STRING for a narrow one (see the
   final return).
   NOTE(review): several comments in the second half of this function have
   lost their closing lines in this copy, and the declarations of count,
   wide, istr and value are not visible; confirm against the full file
   before editing that part. */
670 static enum cpp_ttype
671 lex_string (const cpp_token
*tok
, tree
*valp
, bool objc_string
)
676 struct obstack str_ob
;
679 /* Try to avoid the overhead of creating and destroying an obstack
680 for the common case of just one string. */
681 cpp_string str
= tok
->val
.str
;
682 cpp_string
*strs
= &str
;
684 if (tok
->type
== CPP_WSTRING
)
/* Look at the following token.  In Objective-C an '@' token in that position
   is followed by another fetch. */
687 tok
= get_nonpadding_token ();
688 if (c_dialect_objc () && tok
->type
== CPP_ATSIGN
)
691 tok
= get_nonpadding_token ();
/* Another string follows: gather every cpp_string, starting with the first
   one saved in str, into the obstack so that they can be handed over as one
   vector. */
693 if (tok
->type
== CPP_STRING
|| tok
->type
== CPP_WSTRING
)
695 gcc_obstack_init (&str_ob
);
696 obstack_grow (&str_ob
, &str
, sizeof (cpp_string
));
701 if (tok
->type
== CPP_WSTRING
)
703 obstack_grow (&str_ob
, &tok
->val
.str
, sizeof (cpp_string
));
705 tok
= get_nonpadding_token ();
706 if (c_dialect_objc () && tok
->type
== CPP_ATSIGN
)
709 tok
= get_nonpadding_token ();
712 while (tok
->type
== CPP_STRING
|| tok
->type
== CPP_WSTRING
);
713 strs
= obstack_finish (&str_ob
);
716 /* We have read one more token than we want. */
717 _cpp_backup_tokens (parse_in
, 1);
719 if (count
> 1 && !objc_string
&& warn_traditional
&& !in_system_header
)
720 warning ("traditional C rejects string constant concatenation");
/* A non-zero c_lex_string_translate selects the translating interpreter and
   zero the non-translating one.  The interpreted bytes are copied into a
   string node and the temporary buffer is freed. */
722 if ((c_lex_string_translate
723 ? cpp_interpret_string
: cpp_interpret_string_notranslate
)
724 (parse_in
, strs
, count
, &istr
, wide
))
726 value
= build_string (istr
.len
, (char *)istr
.text
);
727 free ((void *)istr
.text
);
729 if (c_lex_string_translate
== -1)
731 if (!cpp_interpret_string_notranslate (parse_in
, strs
, count
,
733 /* Assume that, if we managed to translate the string
734 above, then the untranslated parsing will always
738 if (TREE_STRING_LENGTH (value
) != (int)istr
.len
739 || 0 != strncmp (TREE_STRING_POINTER (value
), (char *)istr
.text
,
742 /* Arrange for us to return the untranslated string in
743 *valp, but to set up the C type of the translated
745 *valp
= build_string (istr
.len
, (char *)istr
.text
);
746 valp
= &TREE_CHAIN (*valp
);
748 free ((void *)istr
.text
);
753 /* Callers cannot generally handle error_mark_node in this context,
754 so return the empty string instead. cpp_interpret_string has
757 value
= build_string (TYPE_PRECISION (wchar_type_node
)
758 / TYPE_PRECISION (char_type_node
),
759 "\0\0\0"); /* widest supported wchar_t
762 value
= build_string (1, "");
765 TREE_TYPE (value
) = wide
? wchar_array_type_node
: char_array_type_node
;
766 *valp
= fix_string_type (value
);
769 obstack_free (&str_ob
, 0);
771 return objc_string
? CPP_OBJC_STRING
: wide
? CPP_WSTRING
: CPP_STRING
;
774 /* Converts a (possibly wide) character constant token into a tree. */
/* The numeric value comes from cpp_interpret_charconst, which also reports
   how many characters were seen and whether the value is unsigned.  The
   constant is built with build_int_2: unsigned or non-negative results get a
   high word of 0, negative ones a high word of -1.  Its type is
   wchar_type_node for CPP_WCHAR tokens, integer_type_node when not compiling
   C++ or when more than one character was seen, and char_type_node
   otherwise.
   NOTE(review): the local declarations other than chars_seen and the final
   return are not visible in this excerpt. */
776 lex_charconst (const cpp_token
*token
)
780 unsigned int chars_seen
;
783 result
= cpp_interpret_charconst (parse_in
, token
,
784 &chars_seen
, &unsignedp
);
786 /* Cast to cppchar_signed_t to get correct sign-extension of RESULT
787 before possibly widening to HOST_WIDE_INT for build_int_2. */
788 if (unsignedp
|| (cppchar_signed_t
) result
>= 0)
789 value
= build_int_2 (result
, 0);
791 value
= build_int_2 ((cppchar_signed_t
) result
, -1);
793 if (token
->type
== CPP_WCHAR
)
794 type
= wchar_type_node
;
795 /* In C, a character constant has type 'int'.
796 In C++ 'char', but multi-char charconsts have type 'int'. */
797 else if (!c_dialect_cxx () || chars_seen
> 1)
798 type
= integer_type_node
;
800 type
= char_type_node
;
802 TREE_TYPE (value
) = type
;