Add emergency dump after an ICE
[official-gcc.git] / gcc / c-family / c-lex.c
blobb1cef2345f491a600eaae4173b05b49e5bdf954b
1 /* Mainly the interface between cpplib and the C front ends.
2 Copyright (C) 1987-2020 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify it under
7 the terms of the GNU General Public License as published by the Free
8 Software Foundation; either version 3, or (at your option) any later
9 version.
11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
13 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
14 for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "target.h"
24 #include "c-common.h"
25 #include "timevar.h"
26 #include "stringpool.h"
27 #include "stor-layout.h"
28 #include "c-pragma.h"
29 #include "debug.h"
30 #include "file-prefix-map.h" /* remap_macro_filename() */
32 #include "attribs.h"
34 /* We may keep statistics about how long which files took to compile. */
35 static int header_time, body_time;
36 static splay_tree file_info_tree;
38 int pending_lang_change; /* If we need to switch languages - C++ only */
39 int c_header_level; /* depth in C headers - C++ only */
41 static tree interpret_integer (const cpp_token *, unsigned int,
42 enum overflow_type *);
43 static tree interpret_float (const cpp_token *, unsigned int, const char *,
44 enum overflow_type *);
45 static tree interpret_fixed (const cpp_token *, unsigned int);
46 static enum integer_type_kind narrowest_unsigned_type
47 (const widest_int &, unsigned int);
48 static enum integer_type_kind narrowest_signed_type
49 (const widest_int &, unsigned int);
50 static enum cpp_ttype lex_string (const cpp_token *, tree *, bool, bool);
51 static tree lex_charconst (const cpp_token *);
52 static void update_header_times (const char *);
53 static int dump_one_header (splay_tree_node, void *);
54 static void cb_line_change (cpp_reader *, const cpp_token *, int);
55 static void cb_ident (cpp_reader *, unsigned int, const cpp_string *);
56 static void cb_def_pragma (cpp_reader *, unsigned int);
57 static void cb_define (cpp_reader *, unsigned int, cpp_hashnode *);
58 static void cb_undef (cpp_reader *, unsigned int, cpp_hashnode *);
60 void
61 init_c_lex (void)
63 struct c_fileinfo *toplevel;
65 /* The get_fileinfo data structure must be initialized before
66 cpp_read_main_file is called. */
67 toplevel = get_fileinfo ("<top level>");
68 if (flag_detailed_statistics)
70 header_time = 0;
71 body_time = get_run_time ();
72 toplevel->time = body_time;
75 struct cpp_callbacks *cb = cpp_get_callbacks (parse_in);
77 cb->line_change = cb_line_change;
78 cb->ident = cb_ident;
79 cb->def_pragma = cb_def_pragma;
80 cb->valid_pch = c_common_valid_pch;
81 cb->read_pch = c_common_read_pch;
82 cb->has_attribute = c_common_has_attribute;
83 cb->has_builtin = c_common_has_builtin;
84 cb->get_source_date_epoch = cb_get_source_date_epoch;
85 cb->get_suggestion = cb_get_suggestion;
86 cb->remap_filename = remap_macro_filename;
88 /* Set the debug callbacks if we can use them. */
89 if ((debug_info_level == DINFO_LEVEL_VERBOSE
90 && (write_symbols == DWARF2_DEBUG
91 || write_symbols == VMS_AND_DWARF2_DEBUG))
92 || flag_dump_go_spec != NULL)
94 cb->define = cb_define;
95 cb->undef = cb_undef;
99 struct c_fileinfo *
100 get_fileinfo (const char *name)
102 splay_tree_node n;
103 struct c_fileinfo *fi;
105 if (!file_info_tree)
106 file_info_tree = splay_tree_new (splay_tree_compare_strings,
108 splay_tree_delete_pointers);
110 n = splay_tree_lookup (file_info_tree, (splay_tree_key) name);
111 if (n)
112 return (struct c_fileinfo *) n->value;
114 fi = XNEW (struct c_fileinfo);
115 fi->time = 0;
116 fi->interface_only = 0;
117 fi->interface_unknown = 1;
118 splay_tree_insert (file_info_tree, (splay_tree_key) name,
119 (splay_tree_value) fi);
120 return fi;
123 static void
124 update_header_times (const char *name)
126 /* Changing files again. This means currently collected time
127 is charged against header time, and body time starts back at 0. */
128 if (flag_detailed_statistics)
130 int this_time = get_run_time ();
131 struct c_fileinfo *file = get_fileinfo (name);
132 header_time += this_time - body_time;
133 file->time += this_time - body_time;
134 body_time = this_time;
138 static int
139 dump_one_header (splay_tree_node n, void * ARG_UNUSED (dummy))
141 print_time ((const char *) n->key,
142 ((struct c_fileinfo *) n->value)->time);
143 return 0;
146 void
147 dump_time_statistics (void)
149 struct c_fileinfo *file = get_fileinfo (LOCATION_FILE (input_location));
150 int this_time = get_run_time ();
151 file->time += this_time - body_time;
153 fprintf (stderr, "\n******\n");
154 print_time ("header files (total)", header_time);
155 print_time ("main file (total)", this_time - body_time);
156 fprintf (stderr, "ratio = %g : 1\n",
157 (double) header_time / (double) (this_time - body_time));
158 fprintf (stderr, "\n******\n");
160 splay_tree_foreach (file_info_tree, dump_one_header, 0);
163 static void
164 cb_ident (cpp_reader * ARG_UNUSED (pfile),
165 unsigned int ARG_UNUSED (line),
166 const cpp_string * ARG_UNUSED (str))
168 if (!flag_no_ident)
170 /* Convert escapes in the string. */
171 cpp_string cstr = { 0, 0 };
172 if (cpp_interpret_string (pfile, str, 1, &cstr, CPP_STRING))
174 targetm.asm_out.output_ident ((const char *) cstr.text);
175 free (CONST_CAST (unsigned char *, cstr.text));
180 /* Called at the start of every non-empty line. TOKEN is the first
181 lexed token on the line. Used for diagnostic line numbers. */
182 static void
183 cb_line_change (cpp_reader * ARG_UNUSED (pfile), const cpp_token *token,
184 int parsing_args)
186 if (token->type != CPP_EOF && !parsing_args)
187 input_location = token->src_loc;
190 void
191 fe_file_change (const line_map_ordinary *new_map)
193 if (new_map == NULL)
194 return;
196 if (new_map->reason == LC_ENTER)
198 /* Don't stack the main buffer on the input stack;
199 we already did in compile_file. */
200 if (!MAIN_FILE_P (new_map))
202 location_t included_at = linemap_included_from (new_map);
203 int line = 0;
204 if (included_at > BUILTINS_LOCATION)
205 line = SOURCE_LINE (new_map - 1, included_at);
207 input_location = new_map->start_location;
208 (*debug_hooks->start_source_file) (line, LINEMAP_FILE (new_map));
209 #ifdef SYSTEM_IMPLICIT_EXTERN_C
210 if (c_header_level)
211 ++c_header_level;
212 else if (LINEMAP_SYSP (new_map) == 2)
214 c_header_level = 1;
215 ++pending_lang_change;
217 #endif
220 else if (new_map->reason == LC_LEAVE)
222 #ifdef SYSTEM_IMPLICIT_EXTERN_C
223 if (c_header_level && --c_header_level == 0)
225 if (LINEMAP_SYSP (new_map) == 2)
226 warning (0, "badly nested C headers from preprocessor");
227 --pending_lang_change;
229 #endif
230 input_location = new_map->start_location;
232 (*debug_hooks->end_source_file) (LINEMAP_LINE (new_map));
235 update_header_times (LINEMAP_FILE (new_map));
236 input_location = new_map->start_location;
239 static void
240 cb_def_pragma (cpp_reader *pfile, location_t loc)
242 /* Issue a warning message if we have been asked to do so. Ignore
243 unknown pragmas in system headers unless an explicit
244 -Wunknown-pragmas has been given. */
245 if (warn_unknown_pragmas > in_system_header_at (input_location))
247 const unsigned char *space, *name;
248 const cpp_token *s;
249 location_t fe_loc = loc;
251 space = name = (const unsigned char *) "";
252 s = cpp_get_token (pfile);
253 if (s->type != CPP_EOF)
255 space = cpp_token_as_text (pfile, s);
256 s = cpp_get_token (pfile);
257 if (s->type == CPP_NAME)
258 name = cpp_token_as_text (pfile, s);
261 warning_at (fe_loc, OPT_Wunknown_pragmas, "ignoring %<#pragma %s %s%>",
262 space, name);
266 /* #define callback for DWARF and DWARF2 debug info. */
267 static void
268 cb_define (cpp_reader *pfile, location_t loc, cpp_hashnode *node)
270 const struct line_map *map = linemap_lookup (line_table, loc);
271 (*debug_hooks->define) (SOURCE_LINE (linemap_check_ordinary (map), loc),
272 (const char *) cpp_macro_definition (pfile, node));
275 /* #undef callback for DWARF and DWARF2 debug info. */
276 static void
277 cb_undef (cpp_reader * ARG_UNUSED (pfile), location_t loc,
278 cpp_hashnode *node)
280 const struct line_map *map = linemap_lookup (line_table, loc);
281 (*debug_hooks->undef) (SOURCE_LINE (linemap_check_ordinary (map), loc),
282 (const char *) NODE_NAME (node));
285 /* Wrapper around cpp_get_token to skip CPP_PADDING tokens
286 and not consume CPP_EOF. */
287 static const cpp_token *
288 get_token_no_padding (cpp_reader *pfile)
290 for (;;)
292 const cpp_token *ret = cpp_peek_token (pfile, 0);
293 if (ret->type == CPP_EOF)
294 return ret;
295 ret = cpp_get_token (pfile);
296 if (ret->type != CPP_PADDING)
297 return ret;
301 /* Callback for has_attribute. */
303 c_common_has_attribute (cpp_reader *pfile)
305 int result = 0;
306 tree attr_name = NULL_TREE;
307 const cpp_token *token;
309 token = get_token_no_padding (pfile);
310 if (token->type != CPP_OPEN_PAREN)
312 cpp_error (pfile, CPP_DL_ERROR,
313 "missing '(' after \"__has_attribute\"");
314 return 0;
316 token = get_token_no_padding (pfile);
317 if (token->type == CPP_NAME)
319 attr_name = get_identifier ((const char *)
320 cpp_token_as_text (pfile, token));
321 attr_name = canonicalize_attr_name (attr_name);
322 if (c_dialect_cxx ())
324 int idx = 0;
325 const cpp_token *nxt_token;
327 nxt_token = cpp_peek_token (pfile, idx++);
328 while (nxt_token->type == CPP_PADDING);
329 if (nxt_token->type == CPP_SCOPE)
331 get_token_no_padding (pfile); // Eat scope.
332 nxt_token = get_token_no_padding (pfile);
333 if (nxt_token->type == CPP_NAME)
335 tree attr_ns = attr_name;
336 tree attr_id
337 = get_identifier ((const char *)
338 cpp_token_as_text (pfile, nxt_token));
339 attr_name = build_tree_list (attr_ns, attr_id);
341 else
343 cpp_error (pfile, CPP_DL_ERROR,
344 "attribute identifier required after scope");
345 attr_name = NULL_TREE;
348 else
350 /* Some standard attributes need special handling. */
351 if (is_attribute_p ("noreturn", attr_name))
352 result = 200809;
353 else if (is_attribute_p ("deprecated", attr_name))
354 result = 201309;
355 else if (is_attribute_p ("maybe_unused", attr_name)
356 || is_attribute_p ("fallthrough", attr_name))
357 result = 201603;
358 else if (is_attribute_p ("no_unique_address", attr_name)
359 || is_attribute_p ("likely", attr_name)
360 || is_attribute_p ("unlikely", attr_name))
361 result = 201803;
362 else if (is_attribute_p ("nodiscard", attr_name))
363 result = 201907;
364 if (result)
365 attr_name = NULL_TREE;
368 if (attr_name)
370 init_attributes ();
371 const struct attribute_spec *attr = lookup_attribute_spec (attr_name);
372 if (attr)
373 result = 1;
376 else
378 cpp_error (pfile, CPP_DL_ERROR,
379 "macro \"__has_attribute\" requires an identifier");
380 return 0;
383 if (get_token_no_padding (pfile)->type != CPP_CLOSE_PAREN)
384 cpp_error (pfile, CPP_DL_ERROR,
385 "missing ')' after \"__has_attribute\"");
387 return result;
390 /* Callback for has_builtin. */
393 c_common_has_builtin (cpp_reader *pfile)
395 const cpp_token *token = get_token_no_padding (pfile);
396 if (token->type != CPP_OPEN_PAREN)
398 cpp_error (pfile, CPP_DL_ERROR,
399 "missing '(' after \"__has_builtin\"");
400 return 0;
403 const char *name = "";
404 token = get_token_no_padding (pfile);
405 if (token->type == CPP_NAME)
407 name = (const char *) cpp_token_as_text (pfile, token);
408 token = get_token_no_padding (pfile);
409 if (token->type != CPP_CLOSE_PAREN)
411 cpp_error (pfile, CPP_DL_ERROR,
412 "expected ')' after \"%s\"", name);
413 name = "";
416 else
418 cpp_error (pfile, CPP_DL_ERROR,
419 "macro \"__has_builtin\" requires an identifier");
420 if (token->type == CPP_CLOSE_PAREN)
421 return 0;
424 /* Consume tokens up to the closing parenthesis, including any nested
425 pairs of parentheses, to avoid confusing redundant errors. */
426 for (unsigned nparen = 1; ; token = get_token_no_padding (pfile))
428 if (token->type == CPP_OPEN_PAREN)
429 ++nparen;
430 else if (token->type == CPP_CLOSE_PAREN)
431 --nparen;
432 else if (token->type == CPP_EOF)
433 break;
434 if (!nparen)
435 break;
438 return names_builtin_p (name);
442 /* Read a token and return its type. Fill *VALUE with its value, if
443 applicable. Fill *CPP_FLAGS with the token's flags, if it is
444 non-NULL. */
446 enum cpp_ttype
447 c_lex_with_flags (tree *value, location_t *loc, unsigned char *cpp_flags,
448 int lex_flags)
450 const cpp_token *tok;
451 enum cpp_ttype type;
452 unsigned char add_flags = 0;
453 enum overflow_type overflow = OT_NONE;
455 timevar_push (TV_CPP);
456 retry:
457 tok = cpp_get_token_with_location (parse_in, loc);
458 type = tok->type;
460 retry_after_at:
461 switch (type)
463 case CPP_PADDING:
464 goto retry;
466 case CPP_NAME:
467 *value = HT_IDENT_TO_GCC_IDENT (HT_NODE (tok->val.node.node));
468 break;
470 case CPP_NUMBER:
472 const char *suffix = NULL;
473 unsigned int flags = cpp_classify_number (parse_in, tok, &suffix, *loc);
475 switch (flags & CPP_N_CATEGORY)
477 case CPP_N_INVALID:
478 /* cpplib has issued an error. */
479 *value = error_mark_node;
480 break;
482 case CPP_N_INTEGER:
483 /* C++ uses '0' to mark virtual functions as pure.
484 Set PURE_ZERO to pass this information to the C++ parser. */
485 if (tok->val.str.len == 1 && *tok->val.str.text == '0')
486 add_flags = PURE_ZERO;
487 *value = interpret_integer (tok, flags, &overflow);
488 break;
490 case CPP_N_FLOATING:
491 *value = interpret_float (tok, flags, suffix, &overflow);
492 break;
494 default:
495 gcc_unreachable ();
498 if (flags & CPP_N_USERDEF)
500 char *str;
501 tree literal;
502 tree suffix_id = get_identifier (suffix);
503 int len = tok->val.str.len - strlen (suffix);
504 /* If this is going to be used as a C string to pass to a
505 raw literal operator, we need to add a trailing NUL. */
506 tree num_string = build_string (len + 1,
507 (const char *) tok->val.str.text);
508 TREE_TYPE (num_string) = char_array_type_node;
509 num_string = fix_string_type (num_string);
510 str = CONST_CAST (char *, TREE_STRING_POINTER (num_string));
511 str[len] = '\0';
512 literal = build_userdef_literal (suffix_id, *value, overflow,
513 num_string);
514 *value = literal;
517 break;
519 case CPP_ATSIGN:
520 /* An @ may give the next token special significance in Objective-C. */
521 if (c_dialect_objc ())
523 location_t atloc = *loc;
524 location_t newloc;
526 retry_at:
527 tok = cpp_get_token_with_location (parse_in, &newloc);
528 type = tok->type;
529 switch (type)
531 case CPP_PADDING:
532 goto retry_at;
534 case CPP_STRING:
535 case CPP_WSTRING:
536 case CPP_STRING16:
537 case CPP_STRING32:
538 case CPP_UTF8STRING:
539 type = lex_string (tok, value, true, true);
540 break;
542 case CPP_NAME:
543 *value = HT_IDENT_TO_GCC_IDENT (HT_NODE (tok->val.node.node));
544 if (OBJC_IS_AT_KEYWORD (C_RID_CODE (*value))
545 || OBJC_IS_CXX_KEYWORD (C_RID_CODE (*value)))
547 type = CPP_AT_NAME;
548 /* Note the complication: if we found an OBJC_CXX
549 keyword, for example, 'class', we will be
550 returning a token of type CPP_AT_NAME and rid
551 code RID_CLASS (not RID_AT_CLASS). The language
552 parser needs to convert that to RID_AT_CLASS.
554 break;
556 /* FALLTHROUGH */
558 default:
559 /* ... or not. */
560 error_at (atloc, "stray %<@%> in program");
561 *loc = newloc;
562 goto retry_after_at;
564 break;
567 /* FALLTHROUGH */
568 case CPP_HASH:
569 case CPP_PASTE:
571 unsigned char name[8];
573 *cpp_spell_token (parse_in, tok, name, true) = 0;
575 error_at (*loc, "stray %qs in program", name);
578 goto retry;
580 case CPP_OTHER:
582 cppchar_t c = tok->val.str.text[0];
584 if (c == '"' || c == '\'')
585 error_at (*loc, "missing terminating %c character", (int) c);
586 else if (ISGRAPH (c))
587 error_at (*loc, "stray %qc in program", (int) c);
588 else
589 error_at (*loc, "stray %<\\%o%> in program", (int) c);
591 goto retry;
593 case CPP_CHAR_USERDEF:
594 case CPP_WCHAR_USERDEF:
595 case CPP_CHAR16_USERDEF:
596 case CPP_CHAR32_USERDEF:
597 case CPP_UTF8CHAR_USERDEF:
599 tree literal;
600 cpp_token temp_tok = *tok;
601 const char *suffix = cpp_get_userdef_suffix (tok);
602 temp_tok.val.str.len -= strlen (suffix);
603 temp_tok.type = cpp_userdef_char_remove_type (type);
604 literal = build_userdef_literal (get_identifier (suffix),
605 lex_charconst (&temp_tok),
606 OT_NONE, NULL_TREE);
607 *value = literal;
609 break;
611 case CPP_CHAR:
612 case CPP_WCHAR:
613 case CPP_CHAR16:
614 case CPP_CHAR32:
615 case CPP_UTF8CHAR:
616 *value = lex_charconst (tok);
617 break;
619 case CPP_STRING_USERDEF:
620 case CPP_WSTRING_USERDEF:
621 case CPP_STRING16_USERDEF:
622 case CPP_STRING32_USERDEF:
623 case CPP_UTF8STRING_USERDEF:
625 tree literal, string;
626 const char *suffix = cpp_get_userdef_suffix (tok);
627 string = build_string (tok->val.str.len - strlen (suffix),
628 (const char *) tok->val.str.text);
629 literal = build_userdef_literal (get_identifier (suffix),
630 string, OT_NONE, NULL_TREE);
631 *value = literal;
633 break;
635 case CPP_STRING:
636 case CPP_WSTRING:
637 case CPP_STRING16:
638 case CPP_STRING32:
639 case CPP_UTF8STRING:
640 if ((lex_flags & C_LEX_STRING_NO_JOIN) == 0)
642 type = lex_string (tok, value, false,
643 (lex_flags & C_LEX_STRING_NO_TRANSLATE) == 0);
644 break;
646 *value = build_string (tok->val.str.len, (const char *) tok->val.str.text);
647 break;
649 case CPP_PRAGMA:
650 *value = build_int_cst (integer_type_node, tok->val.pragma);
651 break;
653 /* These tokens should not be visible outside cpplib. */
654 case CPP_HEADER_NAME:
655 case CPP_MACRO_ARG:
656 gcc_unreachable ();
658 /* CPP_COMMENT will appear when compiling with -C. Ignore, except
659 when it is a FALLTHROUGH comment, in that case set
660 PREV_FALLTHROUGH flag on the next non-comment token. */
661 case CPP_COMMENT:
662 if (tok->flags & PREV_FALLTHROUGH)
666 tok = cpp_get_token_with_location (parse_in, loc);
667 type = tok->type;
669 while (type == CPP_PADDING || type == CPP_COMMENT);
670 add_flags |= PREV_FALLTHROUGH;
671 goto retry_after_at;
673 goto retry;
675 default:
676 *value = NULL_TREE;
677 break;
680 if (cpp_flags)
681 *cpp_flags = tok->flags | add_flags;
683 timevar_pop (TV_CPP);
685 return type;
688 /* Returns the narrowest C-visible unsigned type, starting with the
689 minimum specified by FLAGS, that can fit HIGH:LOW, or itk_none if
690 there isn't one. */
692 static enum integer_type_kind
693 narrowest_unsigned_type (const widest_int &val, unsigned int flags)
695 int itk;
697 if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
698 itk = itk_unsigned_int;
699 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
700 itk = itk_unsigned_long;
701 else
702 itk = itk_unsigned_long_long;
704 for (; itk < itk_none; itk += 2 /* skip unsigned types */)
706 tree upper;
708 if (integer_types[itk] == NULL_TREE)
709 continue;
710 upper = TYPE_MAX_VALUE (integer_types[itk]);
712 if (wi::geu_p (wi::to_widest (upper), val))
713 return (enum integer_type_kind) itk;
716 return itk_none;
719 /* Ditto, but narrowest signed type. */
720 static enum integer_type_kind
721 narrowest_signed_type (const widest_int &val, unsigned int flags)
723 int itk;
725 if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
726 itk = itk_int;
727 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
728 itk = itk_long;
729 else
730 itk = itk_long_long;
732 for (; itk < itk_none; itk += 2 /* skip signed types */)
734 tree upper;
736 if (integer_types[itk] == NULL_TREE)
737 continue;
738 upper = TYPE_MAX_VALUE (integer_types[itk]);
740 if (wi::geu_p (wi::to_widest (upper), val))
741 return (enum integer_type_kind) itk;
744 return itk_none;
747 /* Interpret TOKEN, an integer with FLAGS as classified by cpplib. */
748 static tree
749 interpret_integer (const cpp_token *token, unsigned int flags,
750 enum overflow_type *overflow)
752 tree value, type;
753 enum integer_type_kind itk;
754 cpp_num integer;
755 HOST_WIDE_INT ival[3];
757 *overflow = OT_NONE;
759 integer = cpp_interpret_integer (parse_in, token, flags);
760 if (integer.overflow)
761 *overflow = OT_OVERFLOW;
763 ival[0] = integer.low;
764 ival[1] = integer.high;
765 ival[2] = 0;
766 widest_int wval = widest_int::from_array (ival, 3);
768 /* The type of a constant with a U suffix is straightforward. */
769 if (flags & CPP_N_UNSIGNED)
770 itk = narrowest_unsigned_type (wval, flags);
771 else
773 /* The type of a potentially-signed integer constant varies
774 depending on the base it's in, the standard in use, and the
775 length suffixes. */
776 enum integer_type_kind itk_u
777 = narrowest_unsigned_type (wval, flags);
778 enum integer_type_kind itk_s
779 = narrowest_signed_type (wval, flags);
781 /* In both C89 and C99, octal and hex constants may be signed or
782 unsigned, whichever fits tighter. We do not warn about this
783 choice differing from the traditional choice, as the constant
784 is probably a bit pattern and either way will work. */
785 if ((flags & CPP_N_RADIX) != CPP_N_DECIMAL)
786 itk = MIN (itk_u, itk_s);
787 else
789 /* In C99, decimal constants are always signed.
790 In C89, decimal constants that don't fit in long have
791 undefined behavior; we try to make them unsigned long.
792 In GCC's extended C89, that last is true of decimal
793 constants that don't fit in long long, too. */
795 itk = itk_s;
796 if (itk_s > itk_u && itk_s > itk_long)
798 if (!flag_isoc99)
800 if (itk_u < itk_unsigned_long)
801 itk_u = itk_unsigned_long;
802 itk = itk_u;
803 warning (0, "this decimal constant is unsigned only in ISO C90");
805 else
806 warning (OPT_Wtraditional,
807 "this decimal constant would be unsigned in ISO C90");
812 if (itk == itk_none)
813 /* cpplib has already issued a warning for overflow. */
814 type = ((flags & CPP_N_UNSIGNED)
815 ? widest_unsigned_literal_type_node
816 : widest_integer_literal_type_node);
817 else
819 type = integer_types[itk];
820 if (itk > itk_unsigned_long
821 && (flags & CPP_N_WIDTH) != CPP_N_LARGE)
822 emit_diagnostic
823 ((c_dialect_cxx () ? cxx_dialect == cxx98 : !flag_isoc99)
824 ? DK_PEDWARN : DK_WARNING,
825 input_location, OPT_Wlong_long,
826 (flags & CPP_N_UNSIGNED)
827 ? "integer constant is too large for %<unsigned long%> type"
828 : "integer constant is too large for %<long%> type");
831 value = wide_int_to_tree (type, wval);
833 /* Convert imaginary to a complex type. */
834 if (flags & CPP_N_IMAGINARY)
835 value = build_complex (NULL_TREE, build_int_cst (type, 0), value);
837 return value;
840 /* Interpret TOKEN, a floating point number with FLAGS as classified
841 by cpplib. For C++11 SUFFIX may contain a user-defined literal suffix. */
842 static tree
843 interpret_float (const cpp_token *token, unsigned int flags,
844 const char *suffix, enum overflow_type *overflow)
846 tree type;
847 tree const_type;
848 tree value;
849 REAL_VALUE_TYPE real;
850 REAL_VALUE_TYPE real_trunc;
851 char *copy;
852 size_t copylen;
854 *overflow = OT_NONE;
856 /* Default (no suffix) depends on whether the FLOAT_CONST_DECIMAL64
857 pragma has been used and is either double or _Decimal64. Types
858 that are not allowed with decimal float default to double. */
859 if (flags & CPP_N_DEFAULT)
861 flags ^= CPP_N_DEFAULT;
862 flags |= CPP_N_MEDIUM;
864 if (((flags & CPP_N_HEX) == 0) && ((flags & CPP_N_IMAGINARY) == 0))
866 warning (OPT_Wunsuffixed_float_constants,
867 "unsuffixed floating constant");
868 if (float_const_decimal64_p ())
869 flags |= CPP_N_DFLOAT;
873 /* Decode _Fract and _Accum. */
874 if (flags & CPP_N_FRACT || flags & CPP_N_ACCUM)
875 return interpret_fixed (token, flags);
877 /* Decode type based on width and properties. */
878 if (flags & CPP_N_DFLOAT)
879 if (!targetm.decimal_float_supported_p ())
881 error ("decimal floating-point not supported for this target");
882 return error_mark_node;
884 else if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
885 type = dfloat128_type_node;
886 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
887 type = dfloat32_type_node;
888 else
889 type = dfloat64_type_node;
890 else
891 if (flags & CPP_N_WIDTH_MD)
893 char suffix;
894 machine_mode mode;
896 if ((flags & CPP_N_WIDTH_MD) == CPP_N_MD_W)
897 suffix = 'w';
898 else
899 suffix = 'q';
901 mode = targetm.c.mode_for_suffix (suffix);
902 if (mode == VOIDmode)
904 error ("unsupported non-standard suffix on floating constant");
906 return error_mark_node;
908 else
909 pedwarn (input_location, OPT_Wpedantic, "non-standard suffix on floating constant");
911 type = c_common_type_for_mode (mode, 0);
912 gcc_assert (type);
914 else if ((flags & (CPP_N_FLOATN | CPP_N_FLOATNX)) != 0)
916 unsigned int n = (flags & CPP_N_WIDTH_FLOATN_NX) >> CPP_FLOATN_SHIFT;
917 bool extended = (flags & CPP_N_FLOATNX) != 0;
918 type = NULL_TREE;
919 for (int i = 0; i < NUM_FLOATN_NX_TYPES; i++)
920 if (floatn_nx_types[i].n == (int) n
921 && floatn_nx_types[i].extended == extended)
923 type = FLOATN_NX_TYPE_NODE (i);
924 break;
926 if (type == NULL_TREE)
928 error ("unsupported non-standard suffix on floating constant");
929 return error_mark_node;
931 else
932 pedwarn (input_location, OPT_Wpedantic, "non-standard suffix on floating constant");
934 else if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
935 type = long_double_type_node;
936 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL
937 || flag_single_precision_constant)
938 type = float_type_node;
939 else
940 type = double_type_node;
942 const_type = excess_precision_type (type);
943 if (!const_type)
944 const_type = type;
946 /* Copy the constant to a nul-terminated buffer. If the constant
947 has any suffixes, cut them off; REAL_VALUE_ATOF/ REAL_VALUE_HTOF
948 can't handle them. */
949 copylen = token->val.str.len;
950 if (flags & CPP_N_USERDEF)
951 copylen -= strlen (suffix);
952 else if (flags & CPP_N_DFLOAT)
953 copylen -= 2;
954 else
956 if ((flags & CPP_N_WIDTH) != CPP_N_MEDIUM)
957 /* Must be an F or L or machine defined suffix. */
958 copylen--;
959 if (flags & CPP_N_IMAGINARY)
960 /* I or J suffix. */
961 copylen--;
962 if (flags & CPP_N_FLOATNX)
963 copylen--;
964 if (flags & (CPP_N_FLOATN | CPP_N_FLOATNX))
966 unsigned int n = (flags & CPP_N_WIDTH_FLOATN_NX) >> CPP_FLOATN_SHIFT;
967 while (n > 0)
969 copylen--;
970 n /= 10;
975 copy = (char *) alloca (copylen + 1);
976 if (cxx_dialect > cxx11)
978 size_t maxlen = 0;
979 for (size_t i = 0; i < copylen; ++i)
980 if (token->val.str.text[i] != '\'')
981 copy[maxlen++] = token->val.str.text[i];
982 copy[maxlen] = '\0';
984 else
986 memcpy (copy, token->val.str.text, copylen);
987 copy[copylen] = '\0';
990 real_from_string3 (&real, copy, TYPE_MODE (const_type));
991 if (const_type != type)
992 /* Diagnosing if the result of converting the value with excess
993 precision to the semantic type would overflow (with associated
994 double rounding) is more appropriate than diagnosing if the
995 result of converting the string directly to the semantic type
996 would overflow. */
997 real_convert (&real_trunc, TYPE_MODE (type), &real);
999 /* Both C and C++ require a diagnostic for a floating constant
1000 outside the range of representable values of its type. Since we
1001 have __builtin_inf* to produce an infinity, this is now a
1002 mandatory pedwarn if the target does not support infinities. */
1003 if (REAL_VALUE_ISINF (real)
1004 || (const_type != type && REAL_VALUE_ISINF (real_trunc)))
1006 *overflow = OT_OVERFLOW;
1007 if (!(flags & CPP_N_USERDEF))
1009 if (!MODE_HAS_INFINITIES (TYPE_MODE (type)))
1010 pedwarn (input_location, 0,
1011 "floating constant exceeds range of %qT", type);
1012 else
1013 warning (OPT_Woverflow,
1014 "floating constant exceeds range of %qT", type);
1017 /* We also give a warning if the value underflows. */
1018 else if (real_equal (&real, &dconst0)
1019 || (const_type != type
1020 && real_equal (&real_trunc, &dconst0)))
1022 REAL_VALUE_TYPE realvoidmode;
1023 int oflow = real_from_string (&realvoidmode, copy);
1024 *overflow = (oflow == 0 ? OT_NONE
1025 : (oflow < 0 ? OT_UNDERFLOW : OT_OVERFLOW));
1026 if (!(flags & CPP_N_USERDEF))
1028 if (oflow < 0 || !real_equal (&realvoidmode, &dconst0))
1029 warning (OPT_Woverflow, "floating constant truncated to zero");
1033 /* Create a node with determined type and value. */
1034 value = build_real (const_type, real);
1035 if (flags & CPP_N_IMAGINARY)
1037 value = build_complex (NULL_TREE,
1038 fold_convert (const_type,
1039 integer_zero_node), value);
1040 if (type != const_type)
1042 const_type = TREE_TYPE (value);
1043 type = build_complex_type (type);
1047 if (type != const_type)
1048 value = build1_loc (token->src_loc, EXCESS_PRECISION_EXPR, type, value);
1050 return value;
1053 /* Interpret TOKEN, a fixed-point number with FLAGS as classified
1054 by cpplib. */
1056 static tree
1057 interpret_fixed (const cpp_token *token, unsigned int flags)
1059 tree type;
1060 tree value;
1061 FIXED_VALUE_TYPE fixed;
1062 char *copy;
1063 size_t copylen;
1065 copylen = token->val.str.len;
1067 if (flags & CPP_N_FRACT) /* _Fract. */
1069 if (flags & CPP_N_UNSIGNED) /* Unsigned _Fract. */
1071 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
1073 type = unsigned_long_long_fract_type_node;
1074 copylen -= 4;
1076 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
1078 type = unsigned_long_fract_type_node;
1079 copylen -= 3;
1081 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
1083 type = unsigned_short_fract_type_node;
1084 copylen -= 3;
1086 else
1088 type = unsigned_fract_type_node;
1089 copylen -= 2;
1092 else /* Signed _Fract. */
1094 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
1096 type = long_long_fract_type_node;
1097 copylen -= 3;
1099 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
1101 type = long_fract_type_node;
1102 copylen -= 2;
1104 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
1106 type = short_fract_type_node;
1107 copylen -= 2;
1109 else
1111 type = fract_type_node;
1112 copylen --;
1116 else /* _Accum. */
1118 if (flags & CPP_N_UNSIGNED) /* Unsigned _Accum. */
1120 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
1122 type = unsigned_long_long_accum_type_node;
1123 copylen -= 4;
1125 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
1127 type = unsigned_long_accum_type_node;
1128 copylen -= 3;
1130 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
1132 type = unsigned_short_accum_type_node;
1133 copylen -= 3;
1135 else
1137 type = unsigned_accum_type_node;
1138 copylen -= 2;
1141 else /* Signed _Accum. */
1143 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
1145 type = long_long_accum_type_node;
1146 copylen -= 3;
1148 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
1150 type = long_accum_type_node;
1151 copylen -= 2;
1153 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
1155 type = short_accum_type_node;
1156 copylen -= 2;
1158 else
1160 type = accum_type_node;
1161 copylen --;
1166 copy = (char *) alloca (copylen + 1);
1167 memcpy (copy, token->val.str.text, copylen);
1168 copy[copylen] = '\0';
1170 fixed_from_string (&fixed, copy, SCALAR_TYPE_MODE (type));
1172 /* Create a node with determined type and value. */
1173 value = build_fixed (type, fixed);
1175 return value;
1178 /* Convert a series of STRING, WSTRING, STRING16, STRING32 and/or
1179 UTF8STRING tokens into a tree, performing string constant
1180 concatenation. TOK is the first of these. VALP is the location to
1181 write the string into. OBJC_STRING indicates whether an '@' token
1182 preceded the incoming token (in that case, the strings can either
1183 be ObjC strings, preceded by a single '@', or normal strings, not
1184 preceded by '@'. The result will be a CPP_OBJC_STRING). Returns
1185 the CPP token type of the result (CPP_STRING, CPP_WSTRING,
1186 CPP_STRING32, CPP_STRING16, CPP_UTF8STRING, or CPP_OBJC_STRING).
1188 This is unfortunately more work than it should be. If any of the
1189 strings in the series has an L prefix, the result is a wide string
1190 (6.4.5p4). Whether or not the result is a wide string affects the
1191 meaning of octal and hexadecimal escapes (6.4.4.4p6,9). But escape
1192 sequences do not continue across the boundary between two strings in
1193 a series (6.4.5p7), so we must not lose the boundaries. Therefore
1194 cpp_interpret_string takes a vector of cpp_string structures, which
1195 we must arrange to provide. */
1197 static enum cpp_ttype
1198 lex_string (const cpp_token *tok, tree *valp, bool objc_string, bool translate)
1200 tree value;
1201 size_t concats = 0;
1202 struct obstack str_ob;
1203 struct obstack loc_ob;
1204 cpp_string istr;
1205 enum cpp_ttype type = tok->type;
1207 /* Try to avoid the overhead of creating and destroying an obstack
1208 for the common case of just one string. */
1209 cpp_string str = tok->val.str;
1210 location_t init_loc = tok->src_loc;
1211 cpp_string *strs = &str;
1212 location_t *locs = NULL;
1214 /* objc_at_sign_was_seen is only used when doing Objective-C string
1215 concatenation. It is 'true' if we have seen an '@' before the
1216 current string, and 'false' if not. We must see exactly one or
1217 zero '@' before each string. */
1218 bool objc_at_sign_was_seen = false;
1220 retry:
1221 tok = cpp_get_token (parse_in);
1222 switch (tok->type)
1224 case CPP_PADDING:
1225 goto retry;
1226 case CPP_ATSIGN:
1227 if (objc_string)
1229 if (objc_at_sign_was_seen)
1230 error ("repeated %<@%> before Objective-C string");
1232 objc_at_sign_was_seen = true;
1233 goto retry;
1235 /* FALLTHROUGH */
1237 default:
1238 break;
1240 case CPP_WSTRING:
1241 case CPP_STRING16:
1242 case CPP_STRING32:
1243 case CPP_UTF8STRING:
1244 if (type != tok->type)
1246 if (type == CPP_STRING)
1247 type = tok->type;
1248 else
1249 error ("unsupported non-standard concatenation of string literals");
1251 /* FALLTHROUGH */
1253 case CPP_STRING:
1254 if (!concats)
1256 gcc_obstack_init (&str_ob);
1257 gcc_obstack_init (&loc_ob);
1258 obstack_grow (&str_ob, &str, sizeof (cpp_string));
1259 obstack_grow (&loc_ob, &init_loc, sizeof (location_t));
1262 concats++;
1263 obstack_grow (&str_ob, &tok->val.str, sizeof (cpp_string));
1264 obstack_grow (&loc_ob, &tok->src_loc, sizeof (location_t));
1266 if (objc_string)
1267 objc_at_sign_was_seen = false;
1268 goto retry;
1271 /* It is an error if we saw a '@' with no following string. */
1272 if (objc_at_sign_was_seen)
1273 error ("stray %<@%> in program");
1275 /* We have read one more token than we want. */
1276 _cpp_backup_tokens (parse_in, 1);
1277 if (concats)
1279 strs = XOBFINISH (&str_ob, cpp_string *);
1280 locs = XOBFINISH (&loc_ob, location_t *);
1283 if (concats && !objc_string && !in_system_header_at (input_location))
1284 warning (OPT_Wtraditional,
1285 "traditional C rejects string constant concatenation");
1287 if ((translate
1288 ? cpp_interpret_string : cpp_interpret_string_notranslate)
1289 (parse_in, strs, concats + 1, &istr, type))
1291 value = build_string (istr.len, (const char *) istr.text);
1292 free (CONST_CAST (unsigned char *, istr.text));
1293 if (concats)
1295 gcc_assert (locs);
1296 gcc_assert (g_string_concat_db);
1297 g_string_concat_db->record_string_concatenation (concats + 1, locs);
1300 else
1302 /* Callers cannot generally handle error_mark_node in this context,
1303 so return the empty string instead. cpp_interpret_string has
1304 issued an error. */
1305 switch (type)
1307 default:
1308 case CPP_STRING:
1309 case CPP_UTF8STRING:
1310 value = build_string (1, "");
1311 break;
1312 case CPP_STRING16:
1313 value = build_string (TYPE_PRECISION (char16_type_node)
1314 / TYPE_PRECISION (char_type_node),
1315 "\0"); /* char16_t is 16 bits */
1316 break;
1317 case CPP_STRING32:
1318 value = build_string (TYPE_PRECISION (char32_type_node)
1319 / TYPE_PRECISION (char_type_node),
1320 "\0\0\0"); /* char32_t is 32 bits */
1321 break;
1322 case CPP_WSTRING:
1323 value = build_string (TYPE_PRECISION (wchar_type_node)
1324 / TYPE_PRECISION (char_type_node),
1325 "\0\0\0"); /* widest supported wchar_t
1326 is 32 bits */
1327 break;
1331 switch (type)
1333 default:
1334 case CPP_STRING:
1335 TREE_TYPE (value) = char_array_type_node;
1336 break;
1337 case CPP_UTF8STRING:
1338 if (flag_char8_t)
1339 TREE_TYPE (value) = char8_array_type_node;
1340 else
1341 TREE_TYPE (value) = char_array_type_node;
1342 break;
1343 case CPP_STRING16:
1344 TREE_TYPE (value) = char16_array_type_node;
1345 break;
1346 case CPP_STRING32:
1347 TREE_TYPE (value) = char32_array_type_node;
1348 break;
1349 case CPP_WSTRING:
1350 TREE_TYPE (value) = wchar_array_type_node;
1352 *valp = fix_string_type (value);
1354 if (concats)
1356 obstack_free (&str_ob, 0);
1357 obstack_free (&loc_ob, 0);
1360 return objc_string ? CPP_OBJC_STRING : type;
1363 /* Converts a (possibly wide) character constant token into a tree. */
1364 static tree
1365 lex_charconst (const cpp_token *token)
1367 cppchar_t result;
1368 tree type, value;
1369 unsigned int chars_seen;
1370 int unsignedp = 0;
1372 result = cpp_interpret_charconst (parse_in, token,
1373 &chars_seen, &unsignedp);
1375 if (token->type == CPP_WCHAR)
1376 type = wchar_type_node;
1377 else if (token->type == CPP_CHAR32)
1378 type = char32_type_node;
1379 else if (token->type == CPP_CHAR16)
1380 type = char16_type_node;
1381 else if (token->type == CPP_UTF8CHAR)
1383 if (!c_dialect_cxx ())
1384 type = unsigned_char_type_node;
1385 else if (flag_char8_t)
1386 type = char8_type_node;
1387 else
1388 type = char_type_node;
1390 /* In C, a character constant has type 'int'.
1391 In C++ 'char', but multi-char charconsts have type 'int'. */
1392 else if (!c_dialect_cxx () || chars_seen > 1)
1393 type = integer_type_node;
1394 else
1395 type = char_type_node;
1397 /* Cast to cppchar_signed_t to get correct sign-extension of RESULT
1398 before possibly widening to HOST_WIDE_INT for build_int_cst. */
1399 if (unsignedp || (cppchar_signed_t) result >= 0)
1400 value = build_int_cst (type, result);
1401 else
1402 value = build_int_cst (type, (cppchar_signed_t) result);
1404 return value;
1407 /* Helper function for c_parser_peek_conflict_marker
1408 and cp_lexer_peek_conflict_marker.
1409 Given a possible conflict marker token of kind TOK1_KIND
1410 consisting of a pair of characters, get the token kind for the
1411 standalone final character. */
1413 enum cpp_ttype
1414 conflict_marker_get_final_tok_kind (enum cpp_ttype tok1_kind)
1416 switch (tok1_kind)
1418 default: gcc_unreachable ();
1419 case CPP_LSHIFT:
1420 /* "<<" and '<' */
1421 return CPP_LESS;
1423 case CPP_EQ_EQ:
1424 /* "==" and '=' */
1425 return CPP_EQ;
1427 case CPP_RSHIFT:
1428 /* ">>" and '>' */
1429 return CPP_GREATER;