c++: fix array cleanup with throwing temp dtor
[official-gcc.git] / gcc / c-family / c-lex.c
blob2651331e683162cadd16e5e313006e0437e66fa1
1 /* Mainly the interface between cpplib and the C front ends.
2 Copyright (C) 1987-2021 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify it under
7 the terms of the GNU General Public License as published by the Free
8 Software Foundation; either version 3, or (at your option) any later
9 version.
11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
13 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
14 for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "target.h"
24 #include "c-common.h"
25 #include "timevar.h"
26 #include "stringpool.h"
27 #include "stor-layout.h"
28 #include "c-pragma.h"
29 #include "debug.h"
30 #include "flags.h"
31 #include "file-prefix-map.h" /* remap_macro_filename() */
32 #include "langhooks.h"
33 #include "attribs.h"
35 /* We may keep statistics about how long which files took to compile. */
36 static int header_time, body_time;
37 static splay_tree file_info_tree;
39 int pending_lang_change; /* If we need to switch languages - C++ only */
40 int c_header_level; /* depth in C headers - C++ only */
42 static tree interpret_integer (const cpp_token *, unsigned int,
43 enum overflow_type *);
44 static tree interpret_float (const cpp_token *, unsigned int, const char *,
45 enum overflow_type *);
46 static tree interpret_fixed (const cpp_token *, unsigned int);
47 static enum integer_type_kind narrowest_unsigned_type
48 (const widest_int &, unsigned int);
49 static enum integer_type_kind narrowest_signed_type
50 (const widest_int &, unsigned int);
51 static enum cpp_ttype lex_string (const cpp_token *, tree *, bool, bool);
52 static tree lex_charconst (const cpp_token *);
53 static void update_header_times (const char *);
54 static int dump_one_header (splay_tree_node, void *);
55 static void cb_line_change (cpp_reader *, const cpp_token *, int);
56 static void cb_ident (cpp_reader *, unsigned int, const cpp_string *);
57 static void cb_def_pragma (cpp_reader *, unsigned int);
58 static void cb_define (cpp_reader *, unsigned int, cpp_hashnode *);
59 static void cb_undef (cpp_reader *, unsigned int, cpp_hashnode *);
61 void
62 init_c_lex (void)
64 struct c_fileinfo *toplevel;
66 /* The get_fileinfo data structure must be initialized before
67 cpp_read_main_file is called. */
68 toplevel = get_fileinfo ("<top level>");
69 if (flag_detailed_statistics)
71 header_time = 0;
72 body_time = get_run_time ();
73 toplevel->time = body_time;
76 struct cpp_callbacks *cb = cpp_get_callbacks (parse_in);
78 cb->line_change = cb_line_change;
79 cb->ident = cb_ident;
80 cb->def_pragma = cb_def_pragma;
81 cb->valid_pch = c_common_valid_pch;
82 cb->read_pch = c_common_read_pch;
83 cb->has_attribute = c_common_has_attribute;
84 cb->has_builtin = c_common_has_builtin;
85 cb->get_source_date_epoch = cb_get_source_date_epoch;
86 cb->get_suggestion = cb_get_suggestion;
87 cb->remap_filename = remap_macro_filename;
89 /* Set the debug callbacks if we can use them. */
90 if ((debug_info_level == DINFO_LEVEL_VERBOSE
91 && dwarf_debuginfo_p ())
92 || flag_dump_go_spec != NULL)
94 cb->define = cb_define;
95 cb->undef = cb_undef;
99 struct c_fileinfo *
100 get_fileinfo (const char *name)
102 splay_tree_node n;
103 struct c_fileinfo *fi;
105 if (!file_info_tree)
106 file_info_tree = splay_tree_new (splay_tree_compare_strings,
108 splay_tree_delete_pointers);
110 n = splay_tree_lookup (file_info_tree, (splay_tree_key) name);
111 if (n)
112 return (struct c_fileinfo *) n->value;
114 fi = XNEW (struct c_fileinfo);
115 fi->time = 0;
116 fi->interface_only = 0;
117 fi->interface_unknown = 1;
118 splay_tree_insert (file_info_tree, (splay_tree_key) name,
119 (splay_tree_value) fi);
120 return fi;
123 static void
124 update_header_times (const char *name)
126 /* Changing files again. This means currently collected time
127 is charged against header time, and body time starts back at 0. */
128 if (flag_detailed_statistics)
130 int this_time = get_run_time ();
131 struct c_fileinfo *file = get_fileinfo (name);
132 header_time += this_time - body_time;
133 file->time += this_time - body_time;
134 body_time = this_time;
138 static int
139 dump_one_header (splay_tree_node n, void * ARG_UNUSED (dummy))
141 print_time ((const char *) n->key,
142 ((struct c_fileinfo *) n->value)->time);
143 return 0;
146 void
147 dump_time_statistics (void)
149 struct c_fileinfo *file = get_fileinfo (LOCATION_FILE (input_location));
150 int this_time = get_run_time ();
151 file->time += this_time - body_time;
153 fprintf (stderr, "\n******\n");
154 print_time ("header files (total)", header_time);
155 print_time ("main file (total)", this_time - body_time);
156 fprintf (stderr, "ratio = %g : 1\n",
157 (double) header_time / (double) (this_time - body_time));
158 fprintf (stderr, "\n******\n");
160 splay_tree_foreach (file_info_tree, dump_one_header, 0);
163 static void
164 cb_ident (cpp_reader * ARG_UNUSED (pfile),
165 unsigned int ARG_UNUSED (line),
166 const cpp_string * ARG_UNUSED (str))
168 if (!flag_no_ident)
170 /* Convert escapes in the string. */
171 cpp_string cstr = { 0, 0 };
172 if (cpp_interpret_string (pfile, str, 1, &cstr, CPP_STRING))
174 targetm.asm_out.output_ident ((const char *) cstr.text);
175 free (CONST_CAST (unsigned char *, cstr.text));
180 /* Called at the start of every non-empty line. TOKEN is the first
181 lexed token on the line. Used for diagnostic line numbers. */
182 static void
183 cb_line_change (cpp_reader * ARG_UNUSED (pfile), const cpp_token *token,
184 int parsing_args)
186 if (token->type != CPP_EOF && !parsing_args)
187 input_location = token->src_loc;
190 void
191 fe_file_change (const line_map_ordinary *new_map)
193 if (new_map == NULL)
194 return;
196 if (new_map->reason == LC_ENTER)
198 /* Don't stack the main buffer on the input stack;
199 we already did in compile_file. */
200 if (!MAIN_FILE_P (new_map))
202 location_t included_at = linemap_included_from (new_map);
203 int line = 0;
204 if (included_at > BUILTINS_LOCATION)
205 line = SOURCE_LINE (new_map - 1, included_at);
207 input_location = new_map->start_location;
208 (*debug_hooks->start_source_file) (line, LINEMAP_FILE (new_map));
209 #ifdef SYSTEM_IMPLICIT_EXTERN_C
210 if (c_header_level)
211 ++c_header_level;
212 else if (LINEMAP_SYSP (new_map) == 2)
214 c_header_level = 1;
215 ++pending_lang_change;
217 #endif
220 else if (new_map->reason == LC_LEAVE)
222 #ifdef SYSTEM_IMPLICIT_EXTERN_C
223 if (c_header_level && --c_header_level == 0)
225 if (LINEMAP_SYSP (new_map) == 2)
226 warning (0, "badly nested C headers from preprocessor");
227 --pending_lang_change;
229 #endif
230 input_location = new_map->start_location;
232 (*debug_hooks->end_source_file) (LINEMAP_LINE (new_map));
235 update_header_times (LINEMAP_FILE (new_map));
236 input_location = new_map->start_location;
239 static void
240 cb_def_pragma (cpp_reader *pfile, location_t loc)
242 /* Issue a warning message if we have been asked to do so. Ignore
243 unknown pragmas in system headers unless an explicit
244 -Wunknown-pragmas has been given. */
245 if (warn_unknown_pragmas > in_system_header_at (input_location))
247 const unsigned char *space, *name;
248 const cpp_token *s;
249 location_t fe_loc = loc;
251 space = name = (const unsigned char *) "";
252 s = cpp_get_token (pfile);
253 if (s->type != CPP_EOF)
255 space = cpp_token_as_text (pfile, s);
256 s = cpp_get_token (pfile);
257 if (s->type == CPP_NAME)
258 name = cpp_token_as_text (pfile, s);
261 warning_at (fe_loc, OPT_Wunknown_pragmas, "ignoring %<#pragma %s %s%>",
262 space, name);
266 /* #define callback for DWARF and DWARF2 debug info. */
267 static void
268 cb_define (cpp_reader *pfile, location_t loc, cpp_hashnode *node)
270 const struct line_map *map = linemap_lookup (line_table, loc);
271 (*debug_hooks->define) (SOURCE_LINE (linemap_check_ordinary (map), loc),
272 (const char *) cpp_macro_definition (pfile, node));
275 /* #undef callback for DWARF and DWARF2 debug info. */
276 static void
277 cb_undef (cpp_reader *pfile, location_t loc, cpp_hashnode *node)
279 if (lang_hooks.preprocess_undef)
280 lang_hooks.preprocess_undef (pfile, loc, node);
282 const struct line_map *map = linemap_lookup (line_table, loc);
283 (*debug_hooks->undef) (SOURCE_LINE (linemap_check_ordinary (map), loc),
284 (const char *) NODE_NAME (node));
287 /* Wrapper around cpp_get_token to skip CPP_PADDING tokens
288 and not consume CPP_EOF. */
289 static const cpp_token *
290 get_token_no_padding (cpp_reader *pfile)
292 for (;;)
294 const cpp_token *ret = cpp_peek_token (pfile, 0);
295 if (ret->type == CPP_EOF)
296 return ret;
297 ret = cpp_get_token (pfile);
298 if (ret->type != CPP_PADDING)
299 return ret;
303 /* Callback for has_attribute. */
305 c_common_has_attribute (cpp_reader *pfile, bool std_syntax)
307 int result = 0;
308 tree attr_name = NULL_TREE;
309 const cpp_token *token;
311 token = get_token_no_padding (pfile);
312 if (token->type != CPP_OPEN_PAREN)
314 cpp_error (pfile, CPP_DL_ERROR,
315 "missing '(' after \"__has_attribute\"");
316 return 0;
318 token = get_token_no_padding (pfile);
319 if (token->type == CPP_NAME)
321 attr_name = get_identifier ((const char *)
322 cpp_token_as_text (pfile, token));
323 attr_name = canonicalize_attr_name (attr_name);
324 bool have_scope = false;
325 int idx = 0;
326 const cpp_token *nxt_token;
328 nxt_token = cpp_peek_token (pfile, idx++);
329 while (nxt_token->type == CPP_PADDING);
330 if (nxt_token->type == CPP_SCOPE)
332 have_scope = true;
333 get_token_no_padding (pfile); // Eat scope.
334 nxt_token = get_token_no_padding (pfile);
335 if (nxt_token->type == CPP_NAME)
337 tree attr_ns = attr_name;
338 tree attr_id
339 = get_identifier ((const char *)
340 cpp_token_as_text (pfile, nxt_token));
341 attr_id = canonicalize_attr_name (attr_id);
342 if (c_dialect_cxx ())
344 /* OpenMP attributes need special handling. */
345 if ((flag_openmp || flag_openmp_simd)
346 && is_attribute_p ("omp", attr_ns)
347 && (is_attribute_p ("directive", attr_id)
348 || is_attribute_p ("sequence", attr_id)))
349 result = 1;
351 if (result)
352 attr_name = NULL_TREE;
353 else
354 attr_name = build_tree_list (attr_ns, attr_id);
356 else
358 cpp_error (pfile, CPP_DL_ERROR,
359 "attribute identifier required after scope");
360 attr_name = NULL_TREE;
363 else
365 /* Some standard attributes need special handling. */
366 if (c_dialect_cxx ())
368 if (is_attribute_p ("noreturn", attr_name))
369 result = 200809;
370 else if (is_attribute_p ("deprecated", attr_name))
371 result = 201309;
372 else if (is_attribute_p ("maybe_unused", attr_name)
373 || is_attribute_p ("fallthrough", attr_name))
374 result = 201603;
375 else if (is_attribute_p ("no_unique_address", attr_name)
376 || is_attribute_p ("likely", attr_name)
377 || is_attribute_p ("unlikely", attr_name))
378 result = 201803;
379 else if (is_attribute_p ("nodiscard", attr_name))
380 result = 201907;
382 else
384 if (is_attribute_p ("deprecated", attr_name)
385 || is_attribute_p ("maybe_unused", attr_name)
386 || is_attribute_p ("fallthrough", attr_name))
387 result = 201904;
388 else if (is_attribute_p ("nodiscard", attr_name))
389 result = 202003;
391 if (result)
392 attr_name = NULL_TREE;
394 if (attr_name && (have_scope || !std_syntax))
396 init_attributes ();
397 const struct attribute_spec *attr = lookup_attribute_spec (attr_name);
398 if (attr)
399 result = 1;
402 else
404 cpp_error (pfile, CPP_DL_ERROR,
405 "macro \"__has_attribute\" requires an identifier");
406 return 0;
409 if (get_token_no_padding (pfile)->type != CPP_CLOSE_PAREN)
410 cpp_error (pfile, CPP_DL_ERROR,
411 "missing ')' after \"__has_attribute\"");
413 return result;
416 /* Callback for has_builtin. */
419 c_common_has_builtin (cpp_reader *pfile)
421 const cpp_token *token = get_token_no_padding (pfile);
422 if (token->type != CPP_OPEN_PAREN)
424 cpp_error (pfile, CPP_DL_ERROR,
425 "missing '(' after \"__has_builtin\"");
426 return 0;
429 const char *name = "";
430 token = get_token_no_padding (pfile);
431 if (token->type == CPP_NAME)
433 name = (const char *) cpp_token_as_text (pfile, token);
434 token = get_token_no_padding (pfile);
435 if (token->type != CPP_CLOSE_PAREN)
437 cpp_error (pfile, CPP_DL_ERROR,
438 "expected ')' after \"%s\"", name);
439 name = "";
442 else
444 cpp_error (pfile, CPP_DL_ERROR,
445 "macro \"__has_builtin\" requires an identifier");
446 if (token->type == CPP_CLOSE_PAREN)
447 return 0;
450 /* Consume tokens up to the closing parenthesis, including any nested
451 pairs of parentheses, to avoid confusing redundant errors. */
452 for (unsigned nparen = 1; ; token = get_token_no_padding (pfile))
454 if (token->type == CPP_OPEN_PAREN)
455 ++nparen;
456 else if (token->type == CPP_CLOSE_PAREN)
457 --nparen;
458 else if (token->type == CPP_EOF)
459 break;
460 if (!nparen)
461 break;
464 return names_builtin_p (name);
468 /* Read a token and return its type. Fill *VALUE with its value, if
469 applicable. Fill *CPP_FLAGS with the token's flags, if it is
470 non-NULL. */
/* Parameters, as used below:
   VALUE     receives the tree built for the token (identifier, constant,
	     string, ...); set to NULL_TREE for token types that carry no
	     value.
   LOC       receives the token's location from
	     cpp_get_token_with_location; for an Objective-C '@' keyword
	     it is widened to cover both the '@' and the keyword.
   CPP_FLAGS if non-null, receives the token's flags combined with the
	     flags synthesized here (PURE_ZERO, PREV_FALLTHROUGH).
   LEX_FLAGS C_LEX_STRING_NO_JOIN / C_LEX_STRING_NO_TRANSLATE bits
	     controlling how string tokens are handled.
   Returns the type of the token produced, which lex_string or the '@'
   handling may have changed from the type cpplib reported.  */
472 enum cpp_ttype
473 c_lex_with_flags (tree *value, location_t *loc, unsigned char *cpp_flags,
474 int lex_flags)
476 const cpp_token *tok;
477 enum cpp_ttype type;
478 unsigned char add_flags = 0;
479 enum overflow_type overflow = OT_NONE;
481 timevar_push (TV_CPP);
/* Fetch a fresh token; jumped to whenever the current token is
   discarded (padding, stray characters, ordinary comments).  */
482 retry:
483 tok = cpp_get_token_with_location (parse_in, loc);
484 type = tok->type;
/* Dispatch on a token that has already been fetched into TOK/TYPE.  */
486 retry_after_at:
487 switch (type)
489 case CPP_PADDING:
490 goto retry;
492 case CPP_NAME:
493 *value = HT_IDENT_TO_GCC_IDENT (HT_NODE (tok->val.node.node));
494 break;
496 case CPP_NUMBER:
498 const char *suffix = NULL;
499 unsigned int flags = cpp_classify_number (parse_in, tok, &suffix, *loc);
501 switch (flags & CPP_N_CATEGORY)
503 case CPP_N_INVALID:
504 /* cpplib has issued an error. */
505 *value = error_mark_node;
506 break;
508 case CPP_N_INTEGER:
509 /* C++ uses '0' to mark virtual functions as pure.
510 Set PURE_ZERO to pass this information to the C++ parser. */
511 if (tok->val.str.len == 1 && *tok->val.str.text == '0')
512 add_flags = PURE_ZERO;
513 *value = interpret_integer (tok, flags, &overflow);
514 break;
516 case CPP_N_FLOATING:
517 *value = interpret_float (tok, flags, suffix, &overflow);
518 break;
520 default:
521 gcc_unreachable ();
/* For a user-defined literal, wrap the interpreted value together with
   the spelling of the number (suffix removed) and the suffix
   identifier.  */
524 if (flags & CPP_N_USERDEF)
526 char *str;
527 tree literal;
528 tree suffix_id = get_identifier (suffix);
529 int len = tok->val.str.len - strlen (suffix);
530 /* If this is going to be used as a C string to pass to a
531 raw literal operator, we need to add a trailing NUL. */
532 tree num_string = build_string (len + 1,
533 (const char *) tok->val.str.text);
534 TREE_TYPE (num_string) = char_array_type_node;
535 num_string = fix_string_type (num_string);
536 str = CONST_CAST (char *, TREE_STRING_POINTER (num_string));
537 str[len] = '\0';
538 literal = build_userdef_literal (suffix_id, *value, overflow,
539 num_string);
540 *value = literal;
543 break;
545 case CPP_ATSIGN:
546 /* An @ may give the next token special significance in Objective-C. */
547 if (c_dialect_objc ())
549 location_t atloc = *loc;
550 location_t newloc;
/* Fetch the token following the '@', skipping padding.  */
552 retry_at:
553 tok = cpp_get_token_with_location (parse_in, &newloc);
554 type = tok->type;
555 switch (type)
557 case CPP_PADDING:
558 goto retry_at;
560 case CPP_STRING:
561 case CPP_WSTRING:
562 case CPP_STRING16:
563 case CPP_STRING32:
564 case CPP_UTF8STRING:
565 type = lex_string (tok, value, true, true);
566 break;
568 case CPP_NAME:
569 *value = HT_IDENT_TO_GCC_IDENT (HT_NODE (tok->val.node.node));
570 if (OBJC_IS_AT_KEYWORD (C_RID_CODE (*value))
571 || OBJC_IS_CXX_KEYWORD (C_RID_CODE (*value)))
573 type = CPP_AT_NAME;
574 /* Note the complication: if we found an OBJC_CXX
575 keyword, for example, 'class', we will be
576 returning a token of type CPP_AT_NAME and rid
577 code RID_CLASS (not RID_AT_CLASS). The language
578 parser needs to convert that to RID_AT_CLASS.
579 However, we've now spliced the '@' together with the
580 keyword that follows; Adjust the location so that we
581 get a source range covering the composite.
583 *loc = make_location (atloc, atloc, newloc);
584 break;
586 /* FALLTHROUGH */
588 default:
589 /* ... or not. */
590 error_at (atloc, "stray %<@%> in program");
591 *loc = newloc;
592 goto retry_after_at;
594 break;
597 /* FALLTHROUGH */
/* Outside Objective-C an '@' is reported as stray, exactly like '#'
   and '##', and lexing continues with the next token.  */
598 case CPP_HASH:
599 case CPP_PASTE:
601 unsigned char name[8];
603 *cpp_spell_token (parse_in, tok, name, true) = 0;
605 error_at (*loc, "stray %qs in program", name);
608 goto retry;
610 case CPP_OTHER:
612 cppchar_t c = tok->val.str.text[0];
614 if (c == '"' || c == '\'')
615 error_at (*loc, "missing terminating %c character", (int) c);
616 else if (ISGRAPH (c))
617 error_at (*loc, "stray %qc in program", (int) c);
618 else
620 rich_location rich_loc (line_table, *loc);
621 rich_loc.set_escape_on_output (true);
622 error_at (&rich_loc, "stray %<\\%o%> in program", (int) c);
625 goto retry;
/* User-defined character literal: lex a copy of the token with the
   suffix cut off and the plain character type restored, then wrap the
   result with the suffix identifier.  */
627 case CPP_CHAR_USERDEF:
628 case CPP_WCHAR_USERDEF:
629 case CPP_CHAR16_USERDEF:
630 case CPP_CHAR32_USERDEF:
631 case CPP_UTF8CHAR_USERDEF:
633 tree literal;
634 cpp_token temp_tok = *tok;
635 const char *suffix = cpp_get_userdef_suffix (tok);
636 temp_tok.val.str.len -= strlen (suffix);
637 temp_tok.type = cpp_userdef_char_remove_type (type);
638 literal = build_userdef_literal (get_identifier (suffix),
639 lex_charconst (&temp_tok),
640 OT_NONE, NULL_TREE);
641 *value = literal;
643 break;
645 case CPP_CHAR:
646 case CPP_WCHAR:
647 case CPP_CHAR16:
648 case CPP_CHAR32:
649 case CPP_UTF8CHAR:
650 *value = lex_charconst (tok);
651 break;
/* User-defined string literal: the string is built from the token text
   without its suffix; no joining or translation happens here.  */
653 case CPP_STRING_USERDEF:
654 case CPP_WSTRING_USERDEF:
655 case CPP_STRING16_USERDEF:
656 case CPP_STRING32_USERDEF:
657 case CPP_UTF8STRING_USERDEF:
659 tree literal, string;
660 const char *suffix = cpp_get_userdef_suffix (tok);
661 string = build_string (tok->val.str.len - strlen (suffix),
662 (const char *) tok->val.str.text);
663 literal = build_userdef_literal (get_identifier (suffix),
664 string, OT_NONE, NULL_TREE);
665 *value = literal;
667 break;
/* Plain string tokens go through lex_string unless the caller set
   C_LEX_STRING_NO_JOIN, in which case the raw token text is returned
   as is.  */
669 case CPP_STRING:
670 case CPP_WSTRING:
671 case CPP_STRING16:
672 case CPP_STRING32:
673 case CPP_UTF8STRING:
674 if ((lex_flags & C_LEX_STRING_NO_JOIN) == 0)
676 type = lex_string (tok, value, false,
677 (lex_flags & C_LEX_STRING_NO_TRANSLATE) == 0);
678 break;
680 *value = build_string (tok->val.str.len, (const char *) tok->val.str.text);
681 break;
683 case CPP_PRAGMA:
684 *value = build_int_cst (integer_type_node, tok->val.pragma);
685 break;
687 case CPP_HEADER_NAME:
688 *value = build_string (tok->val.str.len, (const char *)tok->val.str.text);
689 break;
691 /* This token should not be visible outside cpplib. */
692 case CPP_MACRO_ARG:
693 gcc_unreachable ();
695 /* CPP_COMMENT will appear when compiling with -C. Ignore, except
696 when it is a FALLTHROUGH comment, in that case set
697 PREV_FALLTHROUGH flag on the next non-comment token. */
698 case CPP_COMMENT:
699 if (tok->flags & PREV_FALLTHROUGH)
703 tok = cpp_get_token_with_location (parse_in, loc);
704 type = tok->type;
706 while (type == CPP_PADDING || type == CPP_COMMENT);
707 add_flags |= PREV_FALLTHROUGH;
708 goto retry_after_at;
710 goto retry;
712 default:
713 *value = NULL_TREE;
714 break;
/* Hand back the token's own flags plus those synthesized above.  */
717 if (cpp_flags)
718 *cpp_flags = tok->flags | add_flags;
720 timevar_pop (TV_CPP);
722 return type;
725 /* Returns the narrowest C-visible unsigned type, starting with the
726 minimum specified by FLAGS, that can fit HIGH:LOW, or itk_none if
727 there isn't one. */
729 static enum integer_type_kind
730 narrowest_unsigned_type (const widest_int &val, unsigned int flags)
732 int itk;
734 if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
735 itk = itk_unsigned_int;
736 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
737 itk = itk_unsigned_long;
738 else
739 itk = itk_unsigned_long_long;
741 for (; itk < itk_none; itk += 2 /* skip unsigned types */)
743 tree upper;
745 if (integer_types[itk] == NULL_TREE)
746 continue;
747 upper = TYPE_MAX_VALUE (integer_types[itk]);
749 if (wi::geu_p (wi::to_widest (upper), val))
750 return (enum integer_type_kind) itk;
753 return itk_none;
756 /* Ditto, but narrowest signed type. */
757 static enum integer_type_kind
758 narrowest_signed_type (const widest_int &val, unsigned int flags)
760 int itk;
762 if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
763 itk = itk_int;
764 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
765 itk = itk_long;
766 else
767 itk = itk_long_long;
769 for (; itk < itk_none; itk += 2 /* skip signed types */)
771 tree upper;
773 if (integer_types[itk] == NULL_TREE)
774 continue;
775 upper = TYPE_MAX_VALUE (integer_types[itk]);
777 if (wi::geu_p (wi::to_widest (upper), val))
778 return (enum integer_type_kind) itk;
781 return itk_none;
784 /* Interpret TOKEN, an integer with FLAGS as classified by cpplib. */
785 static tree
786 interpret_integer (const cpp_token *token, unsigned int flags,
787 enum overflow_type *overflow)
789 tree value, type;
790 enum integer_type_kind itk;
791 cpp_num integer;
792 HOST_WIDE_INT ival[3];
794 *overflow = OT_NONE;
796 integer = cpp_interpret_integer (parse_in, token, flags);
797 if (integer.overflow)
798 *overflow = OT_OVERFLOW;
800 ival[0] = integer.low;
801 ival[1] = integer.high;
802 ival[2] = 0;
803 widest_int wval = widest_int::from_array (ival, 3);
805 /* The type of a constant with a U suffix is straightforward. */
806 if (flags & CPP_N_UNSIGNED)
807 itk = narrowest_unsigned_type (wval, flags);
808 else
810 /* The type of a potentially-signed integer constant varies
811 depending on the base it's in, the standard in use, and the
812 length suffixes. */
813 enum integer_type_kind itk_u
814 = narrowest_unsigned_type (wval, flags);
815 enum integer_type_kind itk_s
816 = narrowest_signed_type (wval, flags);
818 /* In both C89 and C99, octal and hex constants may be signed or
819 unsigned, whichever fits tighter. We do not warn about this
820 choice differing from the traditional choice, as the constant
821 is probably a bit pattern and either way will work. */
822 if ((flags & CPP_N_RADIX) != CPP_N_DECIMAL)
823 itk = MIN (itk_u, itk_s);
824 else
826 /* In C99, decimal constants are always signed.
827 In C89, decimal constants that don't fit in long have
828 undefined behavior; we try to make them unsigned long.
829 In GCC's extended C89, that last is true of decimal
830 constants that don't fit in long long, too. */
832 itk = itk_s;
833 if (itk_s > itk_u && itk_s > itk_long)
835 if (!flag_isoc99)
837 if (itk_u < itk_unsigned_long)
838 itk_u = itk_unsigned_long;
839 itk = itk_u;
840 warning (0, "this decimal constant is unsigned only in ISO C90");
842 else
843 warning (OPT_Wtraditional,
844 "this decimal constant would be unsigned in ISO C90");
849 if (itk == itk_none)
850 /* cpplib has already issued a warning for overflow. */
851 type = ((flags & CPP_N_UNSIGNED)
852 ? widest_unsigned_literal_type_node
853 : widest_integer_literal_type_node);
854 else if (flags & CPP_N_SIZE_T)
856 /* itk refers to fundamental types not aliased size types. */
857 if (flags & CPP_N_UNSIGNED)
858 type = size_type_node;
859 else
860 type = signed_size_type_node;
862 else
864 type = integer_types[itk];
865 if (itk > itk_unsigned_long
866 && (flags & CPP_N_WIDTH) != CPP_N_LARGE)
867 emit_diagnostic
868 ((c_dialect_cxx () ? cxx_dialect == cxx98 : !flag_isoc99)
869 ? DK_PEDWARN : DK_WARNING,
870 input_location, OPT_Wlong_long,
871 (flags & CPP_N_UNSIGNED)
872 ? "integer constant is too large for %<unsigned long%> type"
873 : "integer constant is too large for %<long%> type");
876 value = wide_int_to_tree (type, wval);
878 /* Convert imaginary to a complex type. */
879 if (flags & CPP_N_IMAGINARY)
880 value = build_complex (NULL_TREE, build_int_cst (type, 0), value);
882 return value;
885 /* Interpret TOKEN, a floating point number with FLAGS as classified
886 by cpplib. For C++11 SUFFIX may contain a user-defined literal suffix. */
887 static tree
888 interpret_float (const cpp_token *token, unsigned int flags,
889 const char *suffix, enum overflow_type *overflow)
891 tree type;
892 tree const_type;
893 tree value;
894 REAL_VALUE_TYPE real;
895 REAL_VALUE_TYPE real_trunc;
896 char *copy;
897 size_t copylen;
899 *overflow = OT_NONE;
901 /* Default (no suffix) depends on whether the FLOAT_CONST_DECIMAL64
902 pragma has been used and is either double or _Decimal64. Types
903 that are not allowed with decimal float default to double. */
904 if (flags & CPP_N_DEFAULT)
906 flags ^= CPP_N_DEFAULT;
907 flags |= CPP_N_MEDIUM;
909 if (((flags & CPP_N_HEX) == 0) && ((flags & CPP_N_IMAGINARY) == 0))
911 warning (OPT_Wunsuffixed_float_constants,
912 "unsuffixed floating constant");
913 if (float_const_decimal64_p ())
914 flags |= CPP_N_DFLOAT;
918 /* Decode _Fract and _Accum. */
919 if (flags & CPP_N_FRACT || flags & CPP_N_ACCUM)
920 return interpret_fixed (token, flags);
922 /* Decode type based on width and properties. */
923 if (flags & CPP_N_DFLOAT)
924 if (!targetm.decimal_float_supported_p ())
926 error ("decimal floating-point not supported for this target");
927 return error_mark_node;
929 else if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
930 type = dfloat128_type_node;
931 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
932 type = dfloat32_type_node;
933 else
934 type = dfloat64_type_node;
935 else
936 if (flags & CPP_N_WIDTH_MD)
938 char suffix;
939 machine_mode mode;
941 if ((flags & CPP_N_WIDTH_MD) == CPP_N_MD_W)
942 suffix = 'w';
943 else
944 suffix = 'q';
946 mode = targetm.c.mode_for_suffix (suffix);
947 if (mode == VOIDmode)
949 error ("unsupported non-standard suffix on floating constant");
951 return error_mark_node;
953 else
954 pedwarn (input_location, OPT_Wpedantic, "non-standard suffix on floating constant");
956 type = c_common_type_for_mode (mode, 0);
957 gcc_assert (type);
959 else if ((flags & (CPP_N_FLOATN | CPP_N_FLOATNX)) != 0)
961 unsigned int n = (flags & CPP_N_WIDTH_FLOATN_NX) >> CPP_FLOATN_SHIFT;
962 bool extended = (flags & CPP_N_FLOATNX) != 0;
963 type = NULL_TREE;
964 for (int i = 0; i < NUM_FLOATN_NX_TYPES; i++)
965 if (floatn_nx_types[i].n == (int) n
966 && floatn_nx_types[i].extended == extended)
968 type = FLOATN_NX_TYPE_NODE (i);
969 break;
971 if (type == NULL_TREE)
973 error ("unsupported non-standard suffix on floating constant");
974 return error_mark_node;
976 else
977 pedwarn (input_location, OPT_Wpedantic, "non-standard suffix on floating constant");
979 else if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
980 type = long_double_type_node;
981 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL
982 || flag_single_precision_constant)
983 type = float_type_node;
984 else
985 type = double_type_node;
987 const_type = excess_precision_type (type);
988 if (!const_type)
989 const_type = type;
991 /* Copy the constant to a nul-terminated buffer. If the constant
992 has any suffixes, cut them off; REAL_VALUE_ATOF/ REAL_VALUE_HTOF
993 can't handle them. */
994 copylen = token->val.str.len;
995 if (flags & CPP_N_USERDEF)
996 copylen -= strlen (suffix);
997 else if (flags & CPP_N_DFLOAT)
998 copylen -= 2;
999 else
1001 if ((flags & CPP_N_WIDTH) != CPP_N_MEDIUM)
1002 /* Must be an F or L or machine defined suffix. */
1003 copylen--;
1004 if (flags & CPP_N_IMAGINARY)
1005 /* I or J suffix. */
1006 copylen--;
1007 if (flags & CPP_N_FLOATNX)
1008 copylen--;
1009 if (flags & (CPP_N_FLOATN | CPP_N_FLOATNX))
1011 unsigned int n = (flags & CPP_N_WIDTH_FLOATN_NX) >> CPP_FLOATN_SHIFT;
1012 while (n > 0)
1014 copylen--;
1015 n /= 10;
1020 copy = (char *) alloca (copylen + 1);
1021 if (c_dialect_cxx () ? cxx_dialect > cxx11 : flag_isoc2x)
1023 size_t maxlen = 0;
1024 for (size_t i = 0; i < copylen; ++i)
1025 if (token->val.str.text[i] != '\'')
1026 copy[maxlen++] = token->val.str.text[i];
1027 copy[maxlen] = '\0';
1029 else
1031 memcpy (copy, token->val.str.text, copylen);
1032 copy[copylen] = '\0';
1035 real_from_string3 (&real, copy, TYPE_MODE (const_type));
1036 if (const_type != type)
1037 /* Diagnosing if the result of converting the value with excess
1038 precision to the semantic type would overflow (with associated
1039 double rounding) is more appropriate than diagnosing if the
1040 result of converting the string directly to the semantic type
1041 would overflow. */
1042 real_convert (&real_trunc, TYPE_MODE (type), &real);
1044 /* Both C and C++ require a diagnostic for a floating constant
1045 outside the range of representable values of its type. Since we
1046 have __builtin_inf* to produce an infinity, this is now a
1047 mandatory pedwarn if the target does not support infinities. */
1048 if (REAL_VALUE_ISINF (real)
1049 || (const_type != type && REAL_VALUE_ISINF (real_trunc)))
1051 *overflow = OT_OVERFLOW;
1052 if (!(flags & CPP_N_USERDEF))
1054 if (!MODE_HAS_INFINITIES (TYPE_MODE (type)))
1055 pedwarn (input_location, 0,
1056 "floating constant exceeds range of %qT", type);
1057 else
1058 warning (OPT_Woverflow,
1059 "floating constant exceeds range of %qT", type);
1062 /* We also give a warning if the value underflows. */
1063 else if (real_equal (&real, &dconst0)
1064 || (const_type != type
1065 && real_equal (&real_trunc, &dconst0)))
1067 REAL_VALUE_TYPE realvoidmode;
1068 int oflow = real_from_string (&realvoidmode, copy);
1069 *overflow = (oflow == 0 ? OT_NONE
1070 : (oflow < 0 ? OT_UNDERFLOW : OT_OVERFLOW));
1071 if (!(flags & CPP_N_USERDEF))
1073 if (oflow < 0 || !real_equal (&realvoidmode, &dconst0))
1074 warning (OPT_Woverflow, "floating constant truncated to zero");
1078 /* Create a node with determined type and value. */
1079 value = build_real (const_type, real);
1080 if (flags & CPP_N_IMAGINARY)
1082 value = build_complex (NULL_TREE,
1083 fold_convert (const_type,
1084 integer_zero_node), value);
1085 if (type != const_type)
1087 const_type = TREE_TYPE (value);
1088 type = build_complex_type (type);
1092 if (type != const_type)
1093 value = build1_loc (token->src_loc, EXCESS_PRECISION_EXPR, type, value);
1095 return value;
1098 /* Interpret TOKEN, a fixed-point number with FLAGS as classified
1099 by cpplib. */
1101 static tree
1102 interpret_fixed (const cpp_token *token, unsigned int flags)
1104 tree type;
1105 tree value;
1106 FIXED_VALUE_TYPE fixed;
1107 char *copy;
1108 size_t copylen;
1110 copylen = token->val.str.len;
1112 if (flags & CPP_N_FRACT) /* _Fract. */
1114 if (flags & CPP_N_UNSIGNED) /* Unsigned _Fract. */
1116 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
1118 type = unsigned_long_long_fract_type_node;
1119 copylen -= 4;
1121 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
1123 type = unsigned_long_fract_type_node;
1124 copylen -= 3;
1126 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
1128 type = unsigned_short_fract_type_node;
1129 copylen -= 3;
1131 else
1133 type = unsigned_fract_type_node;
1134 copylen -= 2;
1137 else /* Signed _Fract. */
1139 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
1141 type = long_long_fract_type_node;
1142 copylen -= 3;
1144 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
1146 type = long_fract_type_node;
1147 copylen -= 2;
1149 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
1151 type = short_fract_type_node;
1152 copylen -= 2;
1154 else
1156 type = fract_type_node;
1157 copylen --;
1161 else /* _Accum. */
1163 if (flags & CPP_N_UNSIGNED) /* Unsigned _Accum. */
1165 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
1167 type = unsigned_long_long_accum_type_node;
1168 copylen -= 4;
1170 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
1172 type = unsigned_long_accum_type_node;
1173 copylen -= 3;
1175 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
1177 type = unsigned_short_accum_type_node;
1178 copylen -= 3;
1180 else
1182 type = unsigned_accum_type_node;
1183 copylen -= 2;
1186 else /* Signed _Accum. */
1188 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
1190 type = long_long_accum_type_node;
1191 copylen -= 3;
1193 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
1195 type = long_accum_type_node;
1196 copylen -= 2;
1198 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
1200 type = short_accum_type_node;
1201 copylen -= 2;
1203 else
1205 type = accum_type_node;
1206 copylen --;
1211 copy = (char *) alloca (copylen + 1);
1212 memcpy (copy, token->val.str.text, copylen);
1213 copy[copylen] = '\0';
1215 fixed_from_string (&fixed, copy, SCALAR_TYPE_MODE (type));
1217 /* Create a node with determined type and value. */
1218 value = build_fixed (type, fixed);
1220 return value;
1223 /* Convert a series of STRING, WSTRING, STRING16, STRING32 and/or
1224 UTF8STRING tokens into a tree, performing string constant
1225 concatenation. TOK is the first of these. VALP is the location to
1226 write the string into. OBJC_STRING indicates whether an '@' token
1227 preceded the incoming token (in that case, the strings can either
1228 be ObjC strings, preceded by a single '@', or normal strings, not
1229 preceded by '@'. The result will be a CPP_OBJC_STRING). Returns
1230 the CPP token type of the result (CPP_STRING, CPP_WSTRING,
1231 CPP_STRING32, CPP_STRING16, CPP_UTF8STRING, or CPP_OBJC_STRING).
1233 This is unfortunately more work than it should be. If any of the
1234 strings in the series has an L prefix, the result is a wide string
1235 (6.4.5p4). Whether or not the result is a wide string affects the
1236 meaning of octal and hexadecimal escapes (6.4.4.4p6,9). But escape
1237 sequences do not continue across the boundary between two strings in
1238 a series (6.4.5p7), so we must not lose the boundaries. Therefore
1239 cpp_interpret_string takes a vector of cpp_string structures, which
1240 we must arrange to provide. */
1242 static enum cpp_ttype
1243 lex_string (const cpp_token *tok, tree *valp, bool objc_string, bool translate)
1245 tree value;
1246 size_t concats = 0;
1247 struct obstack str_ob;
1248 struct obstack loc_ob;
1249 cpp_string istr;
1250 enum cpp_ttype type = tok->type;
1252 /* Try to avoid the overhead of creating and destroying an obstack
1253 for the common case of just one string. */
1254 cpp_string str = tok->val.str;
1255 location_t init_loc = tok->src_loc;
1256 cpp_string *strs = &str;
1257 location_t *locs = NULL;
1259 /* objc_at_sign_was_seen is only used when doing Objective-C string
1260 concatenation. It is 'true' if we have seen an '@' before the
1261 current string, and 'false' if not. We must see exactly one or
1262 zero '@' before each string. */
1263 bool objc_at_sign_was_seen = false;
1265 retry:
1266 tok = cpp_get_token (parse_in);
1267 switch (tok->type)
1269 case CPP_PADDING:
1270 goto retry;
1271 case CPP_ATSIGN:
1272 if (objc_string)
1274 if (objc_at_sign_was_seen)
1275 error ("repeated %<@%> before Objective-C string");
1277 objc_at_sign_was_seen = true;
1278 goto retry;
1280 /* FALLTHROUGH */
1282 default:
1283 break;
1285 case CPP_WSTRING:
1286 case CPP_STRING16:
1287 case CPP_STRING32:
1288 case CPP_UTF8STRING:
1289 if (type != tok->type)
1291 if (type == CPP_STRING)
1292 type = tok->type;
1293 else
1294 error ("unsupported non-standard concatenation of string literals");
1296 /* FALLTHROUGH */
1298 case CPP_STRING:
1299 if (!concats)
1301 gcc_obstack_init (&str_ob);
1302 gcc_obstack_init (&loc_ob);
1303 obstack_grow (&str_ob, &str, sizeof (cpp_string));
1304 obstack_grow (&loc_ob, &init_loc, sizeof (location_t));
1307 concats++;
1308 obstack_grow (&str_ob, &tok->val.str, sizeof (cpp_string));
1309 obstack_grow (&loc_ob, &tok->src_loc, sizeof (location_t));
1311 if (objc_string)
1312 objc_at_sign_was_seen = false;
1313 goto retry;
1316 /* It is an error if we saw a '@' with no following string. */
1317 if (objc_at_sign_was_seen)
1318 error ("stray %<@%> in program");
1320 /* We have read one more token than we want. */
1321 _cpp_backup_tokens (parse_in, 1);
1322 if (concats)
1324 strs = XOBFINISH (&str_ob, cpp_string *);
1325 locs = XOBFINISH (&loc_ob, location_t *);
1328 if (concats && !objc_string && !in_system_header_at (input_location))
1329 warning (OPT_Wtraditional,
1330 "traditional C rejects string constant concatenation");
1332 if ((translate
1333 ? cpp_interpret_string : cpp_interpret_string_notranslate)
1334 (parse_in, strs, concats + 1, &istr, type))
1336 value = build_string (istr.len, (const char *) istr.text);
1337 free (CONST_CAST (unsigned char *, istr.text));
1338 if (concats)
1340 gcc_assert (locs);
1341 gcc_assert (g_string_concat_db);
1342 g_string_concat_db->record_string_concatenation (concats + 1, locs);
1345 else
1347 /* Callers cannot generally handle error_mark_node in this context,
1348 so return the empty string instead. cpp_interpret_string has
1349 issued an error. */
1350 switch (type)
1352 default:
1353 case CPP_STRING:
1354 case CPP_UTF8STRING:
1355 value = build_string (1, "");
1356 break;
1357 case CPP_STRING16:
1358 value = build_string (TYPE_PRECISION (char16_type_node)
1359 / TYPE_PRECISION (char_type_node),
1360 "\0"); /* char16_t is 16 bits */
1361 break;
1362 case CPP_STRING32:
1363 value = build_string (TYPE_PRECISION (char32_type_node)
1364 / TYPE_PRECISION (char_type_node),
1365 "\0\0\0"); /* char32_t is 32 bits */
1366 break;
1367 case CPP_WSTRING:
1368 value = build_string (TYPE_PRECISION (wchar_type_node)
1369 / TYPE_PRECISION (char_type_node),
1370 "\0\0\0"); /* widest supported wchar_t
1371 is 32 bits */
1372 break;
1376 switch (type)
1378 default:
1379 case CPP_STRING:
1380 TREE_TYPE (value) = char_array_type_node;
1381 break;
1382 case CPP_UTF8STRING:
1383 if (flag_char8_t)
1384 TREE_TYPE (value) = char8_array_type_node;
1385 else
1386 TREE_TYPE (value) = char_array_type_node;
1387 break;
1388 case CPP_STRING16:
1389 TREE_TYPE (value) = char16_array_type_node;
1390 break;
1391 case CPP_STRING32:
1392 TREE_TYPE (value) = char32_array_type_node;
1393 break;
1394 case CPP_WSTRING:
1395 TREE_TYPE (value) = wchar_array_type_node;
1397 *valp = fix_string_type (value);
1399 if (concats)
1401 obstack_free (&str_ob, 0);
1402 obstack_free (&loc_ob, 0);
1405 return objc_string ? CPP_OBJC_STRING : type;
1408 /* Converts a (possibly wide) character constant token into a tree. */
1409 static tree
1410 lex_charconst (const cpp_token *token)
1412 cppchar_t result;
1413 tree type, value;
1414 unsigned int chars_seen;
1415 int unsignedp = 0;
1417 result = cpp_interpret_charconst (parse_in, token,
1418 &chars_seen, &unsignedp);
1420 if (token->type == CPP_WCHAR)
1421 type = wchar_type_node;
1422 else if (token->type == CPP_CHAR32)
1423 type = char32_type_node;
1424 else if (token->type == CPP_CHAR16)
1425 type = char16_type_node;
1426 else if (token->type == CPP_UTF8CHAR)
1428 if (!c_dialect_cxx ())
1429 type = unsigned_char_type_node;
1430 else if (flag_char8_t)
1431 type = char8_type_node;
1432 else
1433 type = char_type_node;
1435 /* In C, a character constant has type 'int'.
1436 In C++ 'char', but multi-char charconsts have type 'int'. */
1437 else if (!c_dialect_cxx () || chars_seen > 1)
1438 type = integer_type_node;
1439 else
1440 type = char_type_node;
1442 /* Cast to cppchar_signed_t to get correct sign-extension of RESULT
1443 before possibly widening to HOST_WIDE_INT for build_int_cst. */
1444 if (unsignedp || (cppchar_signed_t) result >= 0)
1445 value = build_int_cst (type, result);
1446 else
1447 value = build_int_cst (type, (cppchar_signed_t) result);
1449 return value;
1452 /* Helper function for c_parser_peek_conflict_marker
1453 and cp_lexer_peek_conflict_marker.
1454 Given a possible conflict marker token of kind TOK1_KIND
1455 consisting of a pair of characters, get the token kind for the
1456 standalone final character. */
1458 enum cpp_ttype
1459 conflict_marker_get_final_tok_kind (enum cpp_ttype tok1_kind)
1461 switch (tok1_kind)
1463 default: gcc_unreachable ();
1464 case CPP_LSHIFT:
1465 /* "<<" and '<' */
1466 return CPP_LESS;
1468 case CPP_EQ_EQ:
1469 /* "==" and '=' */
1470 return CPP_EQ;
1472 case CPP_RSHIFT:
1473 /* ">>" and '>' */
1474 return CPP_GREATER;