Fix ICE with SLP and -fdbg-cnt
[official-gcc.git] / gcc / c-family / c-lex.cc
blob06c2453c89a6c543dbb1f39d9d32ede18b299cf4
1 /* Mainly the interface between cpplib and the C front ends.
2 Copyright (C) 1987-2023 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify it under
7 the terms of the GNU General Public License as published by the Free
8 Software Foundation; either version 3, or (at your option) any later
9 version.
11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
13 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
14 for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "target.h"
24 #include "c-common.h"
25 #include "timevar.h"
26 #include "stringpool.h"
27 #include "stor-layout.h"
28 #include "c-pragma.h"
29 #include "debug.h"
30 #include "flags.h"
31 #include "file-prefix-map.h" /* remap_macro_filename() */
32 #include "langhooks.h"
33 #include "attribs.h"
35 /* We may keep statistics about how long which files took to compile. */
36 static int header_time, body_time;
37 static splay_tree file_info_tree;
39 int pending_lang_change; /* If we need to switch languages - C++ only */
40 int c_header_level; /* depth in C headers - C++ only */
42 static tree interpret_integer (const cpp_token *, unsigned int,
43 enum overflow_type *);
44 static tree interpret_float (const cpp_token *, unsigned int, const char *,
45 enum overflow_type *);
46 static tree interpret_fixed (const cpp_token *, unsigned int);
47 static enum integer_type_kind narrowest_unsigned_type
48 (const widest_int &, unsigned int);
49 static enum integer_type_kind narrowest_signed_type
50 (const widest_int &, unsigned int);
51 static enum cpp_ttype lex_string (const cpp_token *, tree *, bool, bool);
52 static tree lex_charconst (const cpp_token *);
53 static void update_header_times (const char *);
54 static int dump_one_header (splay_tree_node, void *);
55 static void cb_line_change (cpp_reader *, const cpp_token *, int);
56 static void cb_ident (cpp_reader *, unsigned int, const cpp_string *);
57 static void cb_def_pragma (cpp_reader *, unsigned int);
58 static void cb_define (cpp_reader *, unsigned int, cpp_hashnode *);
59 static void cb_undef (cpp_reader *, unsigned int, cpp_hashnode *);
61 void
62 init_c_lex (void)
64 struct c_fileinfo *toplevel;
66 /* The get_fileinfo data structure must be initialized before
67 cpp_read_main_file is called. */
68 toplevel = get_fileinfo ("<top level>");
69 if (flag_detailed_statistics)
71 header_time = 0;
72 body_time = get_run_time ();
73 toplevel->time = body_time;
76 struct cpp_callbacks *cb = cpp_get_callbacks (parse_in);
78 cb->line_change = cb_line_change;
79 cb->ident = cb_ident;
80 cb->def_pragma = cb_def_pragma;
81 cb->valid_pch = c_common_valid_pch;
82 cb->read_pch = c_common_read_pch;
83 cb->has_attribute = c_common_has_attribute;
84 cb->has_builtin = c_common_has_builtin;
85 cb->get_source_date_epoch = cb_get_source_date_epoch;
86 cb->get_suggestion = cb_get_suggestion;
87 cb->remap_filename = remap_macro_filename;
89 /* Set the debug callbacks if we can use them. */
90 if ((debug_info_level == DINFO_LEVEL_VERBOSE
91 && dwarf_debuginfo_p ())
92 || flag_dump_go_spec != NULL)
94 cb->define = cb_define;
95 cb->undef = cb_undef;
99 struct c_fileinfo *
100 get_fileinfo (const char *name)
102 splay_tree_node n;
103 struct c_fileinfo *fi;
105 if (!file_info_tree)
106 file_info_tree = splay_tree_new (splay_tree_compare_strings,
108 splay_tree_delete_pointers);
110 n = splay_tree_lookup (file_info_tree, (splay_tree_key) name);
111 if (n)
112 return (struct c_fileinfo *) n->value;
114 fi = XNEW (struct c_fileinfo);
115 fi->time = 0;
116 fi->interface_only = 0;
117 fi->interface_unknown = 1;
118 splay_tree_insert (file_info_tree, (splay_tree_key) name,
119 (splay_tree_value) fi);
120 return fi;
123 static void
124 update_header_times (const char *name)
126 /* Changing files again. This means currently collected time
127 is charged against header time, and body time starts back at 0. */
128 if (flag_detailed_statistics)
130 int this_time = get_run_time ();
131 struct c_fileinfo *file = get_fileinfo (name);
132 header_time += this_time - body_time;
133 file->time += this_time - body_time;
134 body_time = this_time;
138 static int
139 dump_one_header (splay_tree_node n, void * ARG_UNUSED (dummy))
141 print_time ((const char *) n->key,
142 ((struct c_fileinfo *) n->value)->time);
143 return 0;
146 void
147 dump_time_statistics (void)
149 struct c_fileinfo *file = get_fileinfo (LOCATION_FILE (input_location));
150 int this_time = get_run_time ();
151 file->time += this_time - body_time;
153 fprintf (stderr, "\n******\n");
154 print_time ("header files (total)", header_time);
155 print_time ("main file (total)", this_time - body_time);
156 fprintf (stderr, "ratio = %g : 1\n",
157 (double) header_time / (double) (this_time - body_time));
158 fprintf (stderr, "\n******\n");
160 splay_tree_foreach (file_info_tree, dump_one_header, 0);
163 static void
164 cb_ident (cpp_reader * ARG_UNUSED (pfile),
165 unsigned int ARG_UNUSED (line),
166 const cpp_string * ARG_UNUSED (str))
168 if (!flag_no_ident)
170 /* Convert escapes in the string. */
171 cpp_string cstr = { 0, 0 };
172 if (cpp_interpret_string (pfile, str, 1, &cstr, CPP_STRING))
174 targetm.asm_out.output_ident ((const char *) cstr.text);
175 free (CONST_CAST (unsigned char *, cstr.text));
180 /* Called at the start of every non-empty line. TOKEN is the first
181 lexed token on the line. Used for diagnostic line numbers. */
182 static void
183 cb_line_change (cpp_reader * ARG_UNUSED (pfile), const cpp_token *token,
184 int parsing_args)
186 if (token->type != CPP_EOF && !parsing_args)
187 input_location = token->src_loc;
190 void
191 fe_file_change (const line_map_ordinary *new_map)
193 if (new_map == NULL)
194 return;
196 if (new_map->reason == LC_ENTER)
198 /* Don't stack the main buffer on the input stack;
199 we already did in compile_file. */
200 if (!MAIN_FILE_P (new_map))
202 location_t included_at = linemap_included_from (new_map);
203 int line = 0;
204 if (included_at > BUILTINS_LOCATION)
205 line = SOURCE_LINE (new_map - 1, included_at);
207 input_location = new_map->start_location;
208 (*debug_hooks->start_source_file) (line, LINEMAP_FILE (new_map));
209 #ifdef SYSTEM_IMPLICIT_EXTERN_C
210 if (c_header_level)
211 ++c_header_level;
212 else if (LINEMAP_SYSP (new_map) == 2)
214 c_header_level = 1;
215 ++pending_lang_change;
217 #endif
220 else if (new_map->reason == LC_LEAVE)
222 #ifdef SYSTEM_IMPLICIT_EXTERN_C
223 if (c_header_level && --c_header_level == 0)
225 if (LINEMAP_SYSP (new_map) == 2)
226 warning (0, "badly nested C headers from preprocessor");
227 --pending_lang_change;
229 #endif
230 input_location = new_map->start_location;
232 (*debug_hooks->end_source_file) (LINEMAP_LINE (new_map));
235 update_header_times (LINEMAP_FILE (new_map));
236 input_location = new_map->start_location;
239 static void
240 cb_def_pragma (cpp_reader *pfile, location_t loc)
242 /* Issue a warning message if we have been asked to do so. Ignore
243 unknown pragmas in system headers unless an explicit
244 -Wunknown-pragmas has been given. */
245 if (warn_unknown_pragmas > in_system_header_at (input_location))
247 const unsigned char *space, *name;
248 const cpp_token *s;
249 location_t fe_loc = loc;
251 space = name = (const unsigned char *) "";
253 /* N.B. It's fine to call cpp_get_token () directly here (rather than our
254 local wrapper get_token ()), because this callback is not used with
255 flag_preprocess_only==true. */
256 s = cpp_get_token (pfile);
257 if (s->type != CPP_EOF)
259 space = cpp_token_as_text (pfile, s);
260 s = cpp_get_token (pfile);
261 if (s->type == CPP_NAME)
262 name = cpp_token_as_text (pfile, s);
265 warning_at (fe_loc, OPT_Wunknown_pragmas, "ignoring %<#pragma %s %s%>",
266 space, name);
270 /* #define callback for DWARF and DWARF2 debug info. */
271 static void
272 cb_define (cpp_reader *pfile, location_t loc, cpp_hashnode *node)
274 const struct line_map *map = linemap_lookup (line_table, loc);
275 (*debug_hooks->define) (SOURCE_LINE (linemap_check_ordinary (map), loc),
276 (const char *) cpp_macro_definition (pfile, node));
279 /* #undef callback for DWARF and DWARF2 debug info. */
280 static void
281 cb_undef (cpp_reader *pfile, location_t loc, cpp_hashnode *node)
283 if (lang_hooks.preprocess_undef)
284 lang_hooks.preprocess_undef (pfile, loc, node);
286 const struct line_map *map = linemap_lookup (line_table, loc);
287 (*debug_hooks->undef) (SOURCE_LINE (linemap_check_ordinary (map), loc),
288 (const char *) NODE_NAME (node));
291 /* Wrapper around cpp_get_token_with_location to stream the token to the
292 preprocessor so it can output it. This is necessary with
293 flag_preprocess_only if we are obtaining tokens here instead of from the loop
294 in c-ppoutput.cc, such as while processing a #pragma. */
296 static const cpp_token *
297 get_token (cpp_reader *pfile, location_t *loc = nullptr)
299 if (flag_preprocess_only)
301 location_t x;
302 if (!loc)
303 loc = &x;
304 const auto tok = cpp_get_token_with_location (pfile, loc);
305 c_pp_stream_token (pfile, tok, *loc);
306 return tok;
308 else
309 return cpp_get_token_with_location (pfile, loc);
312 /* Wrapper around cpp_get_token to skip CPP_PADDING tokens
313 and not consume CPP_EOF. This does not perform the optional
314 streaming in preprocess_only mode, so is suitable to be used
315 when processing builtin expansions such as c_common_has_attribute. */
317 static const cpp_token *
318 get_token_no_padding (cpp_reader *pfile)
320 for (;;)
322 const cpp_token *ret = cpp_peek_token (pfile, 0);
323 if (ret->type == CPP_EOF)
324 return ret;
325 ret = cpp_get_token (pfile);
326 if (ret->type != CPP_PADDING)
327 return ret;
331 /* Callback for has_attribute. */
333 c_common_has_attribute (cpp_reader *pfile, bool std_syntax)
335 int result = 0;
336 tree attr_name = NULL_TREE;
337 const cpp_token *token;
339 token = get_token_no_padding (pfile);
340 if (token->type != CPP_OPEN_PAREN)
342 cpp_error (pfile, CPP_DL_ERROR,
343 "missing '(' after \"__has_attribute\"");
344 return 0;
346 token = get_token_no_padding (pfile);
347 if (token->type == CPP_NAME)
349 attr_name = get_identifier ((const char *)
350 cpp_token_as_text (pfile, token));
351 attr_name = canonicalize_attr_name (attr_name);
352 bool have_scope = false;
353 int idx = 0;
354 const cpp_token *nxt_token;
356 nxt_token = cpp_peek_token (pfile, idx++);
357 while (nxt_token->type == CPP_PADDING);
358 if (nxt_token->type == CPP_SCOPE)
360 have_scope = true;
361 get_token_no_padding (pfile); // Eat scope.
362 nxt_token = get_token_no_padding (pfile);
363 if (nxt_token->type == CPP_NAME)
365 tree attr_ns = attr_name;
366 tree attr_id
367 = get_identifier ((const char *)
368 cpp_token_as_text (pfile, nxt_token));
369 attr_id = canonicalize_attr_name (attr_id);
370 /* OpenMP attributes need special handling. */
371 if ((flag_openmp || flag_openmp_simd)
372 && is_attribute_p ("omp", attr_ns)
373 && (is_attribute_p ("directive", attr_id)
374 || is_attribute_p ("sequence", attr_id)
375 || is_attribute_p ("decl", attr_id)))
376 result = 1;
377 if (result)
378 attr_name = NULL_TREE;
379 else
380 attr_name = build_tree_list (attr_ns, attr_id);
382 else
384 cpp_error (pfile, CPP_DL_ERROR,
385 "attribute identifier required after scope");
386 attr_name = NULL_TREE;
389 else
391 /* Some standard attributes need special handling. */
392 if (c_dialect_cxx ())
394 if (is_attribute_p ("noreturn", attr_name))
395 result = 200809;
396 else if (is_attribute_p ("deprecated", attr_name))
397 result = 201309;
398 else if (is_attribute_p ("maybe_unused", attr_name)
399 || is_attribute_p ("fallthrough", attr_name))
400 result = 201603;
401 else if (is_attribute_p ("no_unique_address", attr_name)
402 || is_attribute_p ("likely", attr_name)
403 || is_attribute_p ("unlikely", attr_name))
404 result = 201803;
405 else if (is_attribute_p ("nodiscard", attr_name))
406 result = 201907;
407 else if (is_attribute_p ("assume", attr_name))
408 result = 202207;
409 else if (is_attribute_p ("init_priority", attr_name))
411 /* The (non-standard) init_priority attribute is always
412 included in the attribute table, but we don't want to
413 advertise the attribute unless the target actually
414 supports init priorities. */
415 result = SUPPORTS_INIT_PRIORITY ? 1 : 0;
416 attr_name = NULL_TREE;
419 else
421 if (is_attribute_p ("deprecated", attr_name)
422 || is_attribute_p ("fallthrough", attr_name)
423 || is_attribute_p ("maybe_unused", attr_name)
424 || is_attribute_p ("nodiscard", attr_name)
425 || is_attribute_p ("noreturn", attr_name)
426 || is_attribute_p ("_Noreturn", attr_name))
427 result = 202311;
429 if (result)
430 attr_name = NULL_TREE;
432 if (attr_name && (have_scope || !std_syntax))
434 init_attributes ();
435 const struct attribute_spec *attr = lookup_attribute_spec (attr_name);
436 if (attr)
437 result = 1;
440 else
442 cpp_error (pfile, CPP_DL_ERROR,
443 "macro \"__has_attribute\" requires an identifier");
444 return 0;
447 if (get_token_no_padding (pfile)->type != CPP_CLOSE_PAREN)
448 cpp_error (pfile, CPP_DL_ERROR,
449 "missing ')' after \"__has_attribute\"");
451 return result;
454 /* Callback for has_builtin. */
457 c_common_has_builtin (cpp_reader *pfile)
459 const cpp_token *token = get_token_no_padding (pfile);
460 if (token->type != CPP_OPEN_PAREN)
462 cpp_error (pfile, CPP_DL_ERROR,
463 "missing '(' after \"__has_builtin\"");
464 return 0;
467 const char *name = "";
468 token = get_token_no_padding (pfile);
469 if (token->type == CPP_NAME)
471 name = (const char *) cpp_token_as_text (pfile, token);
472 token = get_token_no_padding (pfile);
473 if (token->type != CPP_CLOSE_PAREN)
475 cpp_error (pfile, CPP_DL_ERROR,
476 "expected ')' after \"%s\"", name);
477 name = "";
480 else
482 cpp_error (pfile, CPP_DL_ERROR,
483 "macro \"__has_builtin\" requires an identifier");
484 if (token->type == CPP_CLOSE_PAREN)
485 return 0;
488 /* Consume tokens up to the closing parenthesis, including any nested
489 pairs of parentheses, to avoid confusing redundant errors. */
490 for (unsigned nparen = 1; ; token = get_token_no_padding (pfile))
492 if (token->type == CPP_OPEN_PAREN)
493 ++nparen;
494 else if (token->type == CPP_CLOSE_PAREN)
495 --nparen;
496 else if (token->type == CPP_EOF)
497 break;
498 if (!nparen)
499 break;
502 return names_builtin_p (name);
506 /* Read a token and return its type. Fill *VALUE with its value, if
507 applicable. Fill *CPP_FLAGS with the token's flags, if it is
508 non-NULL. */
510 enum cpp_ttype
511 c_lex_with_flags (tree *value, location_t *loc, unsigned char *cpp_flags,
512 int lex_flags)
514 const cpp_token *tok;
515 enum cpp_ttype type;
516 unsigned char add_flags = 0;
517 enum overflow_type overflow = OT_NONE;
519 timevar_push (TV_CPP);
520 retry:
521 tok = get_token (parse_in, loc);
522 type = tok->type;
524 retry_after_at:
525 switch (type)
527 case CPP_PADDING:
528 goto retry;
530 case CPP_NAME:
531 *value = HT_IDENT_TO_GCC_IDENT (HT_NODE (tok->val.node.node));
532 break;
534 case CPP_NUMBER:
536 const char *suffix = NULL;
537 unsigned int flags = cpp_classify_number (parse_in, tok, &suffix, *loc);
539 switch (flags & CPP_N_CATEGORY)
541 case CPP_N_INVALID:
542 /* cpplib has issued an error. */
543 *value = error_mark_node;
544 break;
546 case CPP_N_INTEGER:
547 /* C++ uses '0' to mark virtual functions as pure.
548 Set PURE_ZERO to pass this information to the C++ parser. */
549 if (tok->val.str.len == 1 && *tok->val.str.text == '0')
550 add_flags = PURE_ZERO | DECIMAL_INT;
551 else if ((flags & CPP_N_INTEGER) && (flags & CPP_N_DECIMAL))
552 /* -Wxor-used-as-pow is only active for LHS of ^ expressed
553 as a decimal integer. */
554 add_flags = DECIMAL_INT;
555 *value = interpret_integer (tok, flags, &overflow);
556 break;
558 case CPP_N_FLOATING:
559 *value = interpret_float (tok, flags, suffix, &overflow);
560 break;
562 default:
563 gcc_unreachable ();
566 if (flags & CPP_N_USERDEF)
568 char *str;
569 tree literal;
570 tree suffix_id = get_identifier (suffix);
571 int len = tok->val.str.len - strlen (suffix);
572 /* If this is going to be used as a C string to pass to a
573 raw literal operator, we need to add a trailing NUL. */
574 tree num_string = build_string (len + 1,
575 (const char *) tok->val.str.text);
576 TREE_TYPE (num_string) = char_array_type_node;
577 num_string = fix_string_type (num_string);
578 str = CONST_CAST (char *, TREE_STRING_POINTER (num_string));
579 str[len] = '\0';
580 literal = build_userdef_literal (suffix_id, *value, overflow,
581 num_string);
582 *value = literal;
585 break;
587 case CPP_ATSIGN:
588 /* An @ may give the next token special significance in Objective-C. */
589 if (c_dialect_objc ())
591 location_t atloc = *loc;
592 location_t newloc;
594 retry_at:
595 tok = get_token (parse_in, &newloc);
596 type = tok->type;
597 switch (type)
599 case CPP_PADDING:
600 goto retry_at;
602 case CPP_STRING:
603 case CPP_WSTRING:
604 case CPP_STRING16:
605 case CPP_STRING32:
606 case CPP_UTF8STRING:
607 type = lex_string (tok, value, true, true);
608 break;
610 case CPP_NAME:
611 *value = HT_IDENT_TO_GCC_IDENT (HT_NODE (tok->val.node.node));
612 if (OBJC_IS_AT_KEYWORD (C_RID_CODE (*value))
613 || OBJC_IS_CXX_KEYWORD (C_RID_CODE (*value)))
615 type = CPP_AT_NAME;
616 /* Note the complication: if we found an OBJC_CXX
617 keyword, for example, 'class', we will be
618 returning a token of type CPP_AT_NAME and rid
619 code RID_CLASS (not RID_AT_CLASS). The language
620 parser needs to convert that to RID_AT_CLASS.
621 However, we've now spliced the '@' together with the
622 keyword that follows; Adjust the location so that we
623 get a source range covering the composite.
625 *loc = make_location (atloc, atloc, newloc);
626 break;
628 /* FALLTHROUGH */
630 default:
631 /* ... or not. */
632 error_at (atloc, "stray %<@%> in program");
633 *loc = newloc;
634 goto retry_after_at;
636 break;
639 /* FALLTHROUGH */
640 case CPP_HASH:
641 case CPP_PASTE:
643 unsigned char name[8];
645 *cpp_spell_token (parse_in, tok, name, true) = 0;
647 error_at (*loc, "stray %qs in program", name);
650 goto retry;
652 case CPP_OTHER:
654 cppchar_t c = tok->val.str.text[0];
656 if (c == '"' || c == '\'')
657 error_at (*loc, "missing terminating %c character", (int) c);
658 else if (ISGRAPH (c))
659 error_at (*loc, "stray %qc in program", (int) c);
660 else
662 rich_location rich_loc (line_table, *loc);
663 rich_loc.set_escape_on_output (true);
664 error_at (&rich_loc, "stray %<\\%o%> in program", (int) c);
667 goto retry;
669 case CPP_CHAR_USERDEF:
670 case CPP_WCHAR_USERDEF:
671 case CPP_CHAR16_USERDEF:
672 case CPP_CHAR32_USERDEF:
673 case CPP_UTF8CHAR_USERDEF:
675 tree literal;
676 cpp_token temp_tok = *tok;
677 const char *suffix = cpp_get_userdef_suffix (tok);
678 temp_tok.val.str.len -= strlen (suffix);
679 temp_tok.type = cpp_userdef_char_remove_type (type);
680 literal = build_userdef_literal (get_identifier (suffix),
681 lex_charconst (&temp_tok),
682 OT_NONE, NULL_TREE);
683 *value = literal;
685 break;
687 case CPP_CHAR:
688 case CPP_WCHAR:
689 case CPP_CHAR16:
690 case CPP_CHAR32:
691 case CPP_UTF8CHAR:
692 *value = lex_charconst (tok);
693 break;
695 case CPP_STRING_USERDEF:
696 case CPP_WSTRING_USERDEF:
697 case CPP_STRING16_USERDEF:
698 case CPP_STRING32_USERDEF:
699 case CPP_UTF8STRING_USERDEF:
701 tree literal, string;
702 const char *suffix = cpp_get_userdef_suffix (tok);
703 string = build_string (tok->val.str.len - strlen (suffix),
704 (const char *) tok->val.str.text);
705 literal = build_userdef_literal (get_identifier (suffix),
706 string, OT_NONE, NULL_TREE);
707 *value = literal;
709 break;
711 case CPP_STRING:
712 case CPP_WSTRING:
713 case CPP_STRING16:
714 case CPP_STRING32:
715 case CPP_UTF8STRING:
716 if ((lex_flags & C_LEX_STRING_NO_JOIN) == 0)
718 type = lex_string (tok, value, false,
719 (lex_flags & C_LEX_STRING_NO_TRANSLATE) == 0);
720 break;
722 *value = build_string (tok->val.str.len, (const char *) tok->val.str.text);
723 break;
725 case CPP_PRAGMA:
726 *value = build_int_cst (integer_type_node, tok->val.pragma);
727 break;
729 case CPP_HEADER_NAME:
730 *value = build_string (tok->val.str.len, (const char *)tok->val.str.text);
731 break;
733 /* This token should not be visible outside cpplib. */
734 case CPP_MACRO_ARG:
735 gcc_unreachable ();
737 /* CPP_COMMENT will appear when compiling with -C. Ignore, except
738 when it is a FALLTHROUGH comment, in that case set
739 PREV_FALLTHROUGH flag on the next non-comment token. */
740 case CPP_COMMENT:
741 if (tok->flags & PREV_FALLTHROUGH)
745 tok = get_token (parse_in, loc);
746 type = tok->type;
748 while (type == CPP_PADDING || type == CPP_COMMENT);
749 add_flags |= PREV_FALLTHROUGH;
750 goto retry_after_at;
752 goto retry;
754 default:
755 *value = NULL_TREE;
756 break;
759 if (cpp_flags)
760 *cpp_flags = tok->flags | add_flags;
762 timevar_pop (TV_CPP);
764 return type;
767 /* Returns the narrowest C-visible unsigned type, starting with the
768 minimum specified by FLAGS, that can fit HIGH:LOW, or itk_none if
769 there isn't one. */
771 static enum integer_type_kind
772 narrowest_unsigned_type (const widest_int &val, unsigned int flags)
774 int itk;
776 if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
777 itk = itk_unsigned_int;
778 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
779 itk = itk_unsigned_long;
780 else
781 itk = itk_unsigned_long_long;
783 for (; itk < itk_none; itk += 2 /* skip unsigned types */)
785 tree upper;
787 if (integer_types[itk] == NULL_TREE)
788 continue;
789 upper = TYPE_MAX_VALUE (integer_types[itk]);
791 if (wi::geu_p (wi::to_widest (upper), val))
792 return (enum integer_type_kind) itk;
795 return itk_none;
798 /* Ditto, but narrowest signed type. */
799 static enum integer_type_kind
800 narrowest_signed_type (const widest_int &val, unsigned int flags)
802 int itk;
804 if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
805 itk = itk_int;
806 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
807 itk = itk_long;
808 else
809 itk = itk_long_long;
811 for (; itk < itk_none; itk += 2 /* skip signed types */)
813 tree upper;
815 if (integer_types[itk] == NULL_TREE)
816 continue;
817 upper = TYPE_MAX_VALUE (integer_types[itk]);
819 if (wi::geu_p (wi::to_widest (upper), val))
820 return (enum integer_type_kind) itk;
823 return itk_none;
826 /* Interpret TOKEN, an integer with FLAGS as classified by cpplib. */
827 static tree
828 interpret_integer (const cpp_token *token, unsigned int flags,
829 enum overflow_type *overflow)
831 tree value, type;
832 enum integer_type_kind itk;
833 cpp_num integer;
834 HOST_WIDE_INT ival[3];
836 *overflow = OT_NONE;
838 if (UNLIKELY (flags & CPP_N_BITINT))
840 unsigned int suffix_len = 2 + ((flags & CPP_N_UNSIGNED) ? 1 : 0);
841 int max_bits_per_digit = 4; // ceil (log2 (10))
842 unsigned int prefix_len = 0;
843 bool hex = false;
844 const int bitint_maxwidth = WIDE_INT_MAX_PRECISION - 1;
845 if ((flags & CPP_N_RADIX) == CPP_N_OCTAL)
847 max_bits_per_digit = 3;
848 prefix_len = 1;
850 else if ((flags & CPP_N_RADIX) == CPP_N_HEX)
852 max_bits_per_digit = 4;
853 prefix_len = 2;
854 hex = true;
856 else if ((flags & CPP_N_RADIX) == CPP_N_BINARY)
858 max_bits_per_digit = 1;
859 prefix_len = 2;
861 int max_digits
862 = TYPE_PRECISION (intmax_type_node) >> max_bits_per_digit;
863 const int max_buf = 128;
864 if (max_digits > max_buf)
865 max_digits = max_buf;
867 widest_int wval;
868 unsigned int prec;
869 gcc_checking_assert (token->val.str.len > prefix_len + suffix_len
870 || token->val.str.len == 1 + suffix_len);
871 if (token->val.str.len - (prefix_len + suffix_len)
872 <= (unsigned) max_digits)
874 integer = cpp_interpret_integer (parse_in, token,
875 (flags & CPP_N_RADIX)
876 | CPP_N_UNSIGNED);
877 ival[0] = integer.low;
878 ival[1] = integer.high;
879 ival[2] = 0;
880 wval = widest_int::from_array (ival, 3);
882 else
884 unsigned char buf[3 + max_buf];
885 memcpy (buf, token->val.str.text, prefix_len);
886 wval = 0U;
887 const unsigned char *p = token->val.str.text + prefix_len;
888 cpp_token tok = *token;
889 tok.val.str.text = buf;
890 if (!prefix_len)
891 max_digits = 19;
894 unsigned char *q = buf + prefix_len;
897 unsigned char c = *p++;
898 if (ISDIGIT (c) || (hex && ISXDIGIT (c)))
900 *q++ = c;
901 if (q == buf + prefix_len + max_digits)
902 break;
904 else if (c != '\'')
906 --p;
907 break;
910 while (1);
911 if (q == buf + prefix_len)
912 break;
913 else
915 wi::overflow_type wioverflow;
916 *q = '\0';
917 tok.val.str.len = q - buf;
918 if (wval == 0)
920 else if (prefix_len)
922 prec = wi::min_precision (wval, UNSIGNED);
923 unsigned HOST_WIDE_INT shift
924 = (tok.val.str.len - prefix_len) * max_bits_per_digit;
925 if (prec + shift > bitint_maxwidth)
926 goto bitint_overflow;
927 wval = wi::lshift (wval, shift);
929 else
931 static unsigned HOST_WIDE_INT tens[]
932 = { 1U, 10U, 100U, 1000U,
933 HOST_WIDE_INT_UC (10000),
934 HOST_WIDE_INT_UC (100000),
935 HOST_WIDE_INT_UC (1000000),
936 HOST_WIDE_INT_UC (10000000),
937 HOST_WIDE_INT_UC (100000000),
938 HOST_WIDE_INT_UC (1000000000),
939 HOST_WIDE_INT_UC (10000000000),
940 HOST_WIDE_INT_UC (100000000000),
941 HOST_WIDE_INT_UC (1000000000000),
942 HOST_WIDE_INT_UC (10000000000000),
943 HOST_WIDE_INT_UC (100000000000000),
944 HOST_WIDE_INT_UC (1000000000000000),
945 HOST_WIDE_INT_UC (10000000000000000),
946 HOST_WIDE_INT_UC (100000000000000000),
947 HOST_WIDE_INT_UC (1000000000000000000),
948 HOST_WIDE_INT_UC (10000000000000000000) };
949 widest_int ten = tens[q - buf];
950 wval = wi::umul (wval, ten, &wioverflow);
951 if (wioverflow)
952 goto bitint_overflow;
954 integer = cpp_interpret_integer (parse_in, &tok,
955 (flags & CPP_N_RADIX)
956 | CPP_N_UNSIGNED);
957 ival[0] = integer.low;
958 ival[1] = integer.high;
959 ival[2] = 0;
960 if (prefix_len)
961 wval = wval + widest_int::from_array (ival, 3);
962 else
964 widest_int addend = widest_int::from_array (ival, 3);
965 wval = wi::add (wval, addend, UNSIGNED, &wioverflow);
966 if (wioverflow)
967 goto bitint_overflow;
971 while (1);
974 prec = wi::min_precision (wval, UNSIGNED);
975 if (prec == 0)
976 prec = 1;
977 if ((flags & CPP_N_UNSIGNED) == 0)
978 ++prec;
979 if (prec > bitint_maxwidth)
981 bitint_overflow:
982 if ((flags & CPP_N_UNSIGNED) != 0)
983 error ("integer constant is too large for "
984 "%<unsigned _BitInt(%d)%> type", bitint_maxwidth);
985 else
986 error ("integer constant is too large for "
987 "%<_BitInt(%d)%> type", bitint_maxwidth);
988 return integer_zero_node;
991 struct bitint_info info;
992 if (!targetm.c.bitint_type_info (prec, &info))
994 sorry ("%<_BitInt(%d)%> is not supported on this target", prec);
995 return integer_zero_node;
998 type = build_bitint_type (prec, (flags & CPP_N_UNSIGNED) != 0);
999 return wide_int_to_tree (type, wval);
1002 integer = cpp_interpret_integer (parse_in, token, flags);
1003 if (integer.overflow)
1004 *overflow = OT_OVERFLOW;
1006 ival[0] = integer.low;
1007 ival[1] = integer.high;
1008 ival[2] = 0;
1009 widest_int wval = widest_int::from_array (ival, 3);
1011 /* The type of a constant with a U suffix is straightforward. */
1012 if (flags & CPP_N_UNSIGNED)
1013 itk = narrowest_unsigned_type (wval, flags);
1014 else
1016 /* The type of a potentially-signed integer constant varies
1017 depending on the base it's in, the standard in use, and the
1018 length suffixes. */
1019 enum integer_type_kind itk_u
1020 = narrowest_unsigned_type (wval, flags);
1021 enum integer_type_kind itk_s
1022 = narrowest_signed_type (wval, flags);
1024 /* In both C89 and C99, octal and hex constants may be signed or
1025 unsigned, whichever fits tighter. We do not warn about this
1026 choice differing from the traditional choice, as the constant
1027 is probably a bit pattern and either way will work. */
1028 if ((flags & CPP_N_RADIX) != CPP_N_DECIMAL)
1029 itk = MIN (itk_u, itk_s);
1030 else
1032 /* In C99, decimal constants are always signed.
1033 In C89, decimal constants that don't fit in long have
1034 undefined behavior; we try to make them unsigned long.
1035 In GCC's extended C89, that last is true of decimal
1036 constants that don't fit in long long, too. */
1038 itk = itk_s;
1039 if (itk_s > itk_u && itk_s > itk_long)
1041 if (!flag_isoc99)
1043 if (itk_u < itk_unsigned_long)
1044 itk_u = itk_unsigned_long;
1045 itk = itk_u;
1046 warning (0, "this decimal constant is unsigned only in ISO C90");
1048 else
1049 warning (OPT_Wtraditional,
1050 "this decimal constant would be unsigned in ISO C90");
1055 if (itk == itk_none)
1056 /* cpplib has already issued a warning for overflow. */
1057 type = ((flags & CPP_N_UNSIGNED)
1058 ? widest_unsigned_literal_type_node
1059 : widest_integer_literal_type_node);
1060 else if (flags & CPP_N_SIZE_T)
1062 /* itk refers to fundamental types not aliased size types. */
1063 if (flags & CPP_N_UNSIGNED)
1064 type = size_type_node;
1065 else
1066 type = signed_size_type_node;
1068 else
1070 type = integer_types[itk];
1071 if (itk > itk_unsigned_long
1072 && (flags & CPP_N_WIDTH) != CPP_N_LARGE)
1073 emit_diagnostic
1074 ((c_dialect_cxx () ? cxx_dialect == cxx98 : !flag_isoc99)
1075 ? DK_PEDWARN : DK_WARNING,
1076 input_location, OPT_Wlong_long,
1077 (flags & CPP_N_UNSIGNED)
1078 ? "integer constant is too large for %<unsigned long%> type"
1079 : "integer constant is too large for %<long%> type");
1082 value = wide_int_to_tree (type, wval);
1084 /* Convert imaginary to a complex type. */
1085 if (flags & CPP_N_IMAGINARY)
1086 value = build_complex (NULL_TREE, build_int_cst (type, 0), value);
1088 return value;
1091 /* Interpret TOKEN, a floating point number with FLAGS as classified
1092 by cpplib. For C++11 SUFFIX may contain a user-defined literal suffix. */
1093 static tree
1094 interpret_float (const cpp_token *token, unsigned int flags,
1095 const char *suffix, enum overflow_type *overflow)
1097 tree type;
1098 tree const_type;
1099 tree value;
1100 REAL_VALUE_TYPE real;
1101 REAL_VALUE_TYPE real_trunc;
1102 char *copy;
1103 size_t copylen;
1105 *overflow = OT_NONE;
1107 /* Default (no suffix) depends on whether the FLOAT_CONST_DECIMAL64
1108 pragma has been used and is either double or _Decimal64. Types
1109 that are not allowed with decimal float default to double. */
1110 if (flags & CPP_N_DEFAULT)
1112 flags ^= CPP_N_DEFAULT;
1113 flags |= CPP_N_MEDIUM;
1115 if (((flags & CPP_N_HEX) == 0) && ((flags & CPP_N_IMAGINARY) == 0))
1117 warning (OPT_Wunsuffixed_float_constants,
1118 "unsuffixed floating constant");
1119 if (float_const_decimal64_p ())
1120 flags |= CPP_N_DFLOAT;
1124 /* Decode _Fract and _Accum. */
1125 if (flags & CPP_N_FRACT || flags & CPP_N_ACCUM)
1126 return interpret_fixed (token, flags);
1128 /* Decode type based on width and properties. */
1129 if (flags & CPP_N_DFLOAT)
1130 if (!targetm.decimal_float_supported_p ())
1132 error ("decimal floating-point not supported for this target");
1133 return error_mark_node;
1135 else if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
1136 type = dfloat128_type_node;
1137 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
1138 type = dfloat32_type_node;
1139 else
1140 type = dfloat64_type_node;
1141 else
1142 if (flags & CPP_N_WIDTH_MD)
1144 char suffix;
1145 machine_mode mode;
1147 if ((flags & CPP_N_WIDTH_MD) == CPP_N_MD_W)
1148 suffix = 'w';
1149 else
1150 suffix = 'q';
1152 mode = targetm.c.mode_for_suffix (suffix);
1153 if (mode == VOIDmode)
1155 error ("unsupported non-standard suffix on floating constant");
1157 return error_mark_node;
1159 else
1160 pedwarn (input_location, OPT_Wpedantic, "non-standard suffix on floating constant");
1162 type = c_common_type_for_mode (mode, 0);
1163 /* For Q suffix, prefer float128t_type_node (__float128) type
1164 over float128_type_node (_Float128) type if they are distinct. */
1165 if (type == float128_type_node && float128t_type_node)
1166 type = float128t_type_node;
1167 gcc_assert (type);
1169 else if ((flags & (CPP_N_FLOATN | CPP_N_FLOATNX)) != 0)
1171 unsigned int n = (flags & CPP_N_WIDTH_FLOATN_NX) >> CPP_FLOATN_SHIFT;
1172 bool extended = (flags & CPP_N_FLOATNX) != 0;
1173 type = NULL_TREE;
1174 for (int i = 0; i < NUM_FLOATN_NX_TYPES; i++)
1175 if (floatn_nx_types[i].n == (int) n
1176 && floatn_nx_types[i].extended == extended)
1178 type = FLOATN_NX_TYPE_NODE (i);
1179 break;
1181 if (type == NULL_TREE)
1183 error ("unsupported non-standard suffix on floating constant");
1184 return error_mark_node;
1186 else if (!c_dialect_cxx ())
1188 if (warn_c11_c23_compat > 0)
1190 if (pedantic && !flag_isoc23)
1191 pedwarn (input_location, OPT_Wc11_c23_compat,
1192 "non-standard suffix on floating constant "
1193 "before C23");
1194 else
1195 warning (OPT_Wc11_c23_compat,
1196 "non-standard suffix on floating constant "
1197 "before C23");
1199 else if (warn_c11_c23_compat != 0 && pedantic && !flag_isoc23)
1200 pedwarn (input_location, OPT_Wpedantic,
1201 "non-standard suffix on floating constant "
1202 "before C23");
1204 else if (!extended)
1206 if (cxx_dialect < cxx23)
1207 pedwarn (input_location, OPT_Wpedantic,
1208 "%<f%d%> or %<F%d%> suffix on floating constant only "
1209 "available with %<-std=c++2b%> or %<-std=gnu++2b%>",
1210 n, n);
1212 else
1213 pedwarn (input_location, OPT_Wpedantic,
1214 "non-standard suffix on floating constant");
1216 else if ((flags & CPP_N_BFLOAT16) != 0)
1218 type = bfloat16_type_node;
1219 if (type == NULL_TREE)
1221 error ("unsupported non-standard suffix on floating constant");
1222 return error_mark_node;
1224 if (!c_dialect_cxx ())
1225 pedwarn (input_location, OPT_Wpedantic,
1226 "non-standard suffix on floating constant");
1227 else if (cxx_dialect < cxx23)
1228 pedwarn (input_location, OPT_Wpedantic,
1229 "%<bf16%> or %<BF16%> suffix on floating constant only "
1230 "available with %<-std=c++2b%> or %<-std=gnu++2b%>");
1232 else if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
1233 type = long_double_type_node;
1234 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL
1235 || flag_single_precision_constant)
1236 type = float_type_node;
1237 else
1238 type = double_type_node;
1240 const_type = excess_precision_type (type);
1241 if (!const_type)
1242 const_type = type;
1244 /* Copy the constant to a nul-terminated buffer. If the constant
1245 has any suffixes, cut them off; REAL_VALUE_ATOF/ REAL_VALUE_HTOF
1246 can't handle them. */
1247 copylen = token->val.str.len;
1248 if (flags & CPP_N_USERDEF)
1249 copylen -= strlen (suffix);
1250 else if (flags & CPP_N_DFLOAT)
1251 copylen -= 2;
1252 else
1254 if ((flags & CPP_N_WIDTH) != CPP_N_MEDIUM)
1255 /* Must be an F or L or machine defined suffix. */
1256 copylen--;
1257 if (flags & CPP_N_IMAGINARY)
1258 /* I or J suffix. */
1259 copylen--;
1260 if (flags & CPP_N_FLOATNX)
1261 copylen--;
1262 if (flags & (CPP_N_FLOATN | CPP_N_FLOATNX))
1264 unsigned int n = (flags & CPP_N_WIDTH_FLOATN_NX) >> CPP_FLOATN_SHIFT;
1265 while (n > 0)
1267 copylen--;
1268 n /= 10;
1273 copy = (char *) alloca (copylen + 1);
1274 if (c_dialect_cxx () ? cxx_dialect > cxx11 : flag_isoc23)
1276 size_t maxlen = 0;
1277 for (size_t i = 0; i < copylen; ++i)
1278 if (token->val.str.text[i] != '\'')
1279 copy[maxlen++] = token->val.str.text[i];
1280 copy[maxlen] = '\0';
1282 else
1284 memcpy (copy, token->val.str.text, copylen);
1285 copy[copylen] = '\0';
1288 real_from_string3 (&real, copy, TYPE_MODE (const_type));
1289 if (const_type != type)
1290 /* Diagnosing if the result of converting the value with excess
1291 precision to the semantic type would overflow (with associated
1292 double rounding) is more appropriate than diagnosing if the
1293 result of converting the string directly to the semantic type
1294 would overflow. */
1295 real_convert (&real_trunc, TYPE_MODE (type), &real);
1297 /* Both C and C++ require a diagnostic for a floating constant
1298 outside the range of representable values of its type. Since we
1299 have __builtin_inf* to produce an infinity, this is now a
1300 mandatory pedwarn if the target does not support infinities. */
1301 if (REAL_VALUE_ISINF (real)
1302 || (const_type != type && REAL_VALUE_ISINF (real_trunc)))
1304 *overflow = OT_OVERFLOW;
1305 if (!(flags & CPP_N_USERDEF))
1307 if (!MODE_HAS_INFINITIES (TYPE_MODE (type)))
1308 pedwarn (input_location, 0,
1309 "floating constant exceeds range of %qT", type);
1310 else
1311 warning (OPT_Woverflow,
1312 "floating constant exceeds range of %qT", type);
1315 /* We also give a warning if the value underflows. */
1316 else if (real_equal (&real, &dconst0)
1317 || (const_type != type
1318 && real_equal (&real_trunc, &dconst0)))
1320 REAL_VALUE_TYPE realvoidmode;
1321 int oflow = real_from_string (&realvoidmode, copy);
1322 *overflow = (oflow == 0 ? OT_NONE
1323 : (oflow < 0 ? OT_UNDERFLOW : OT_OVERFLOW));
1324 if (!(flags & CPP_N_USERDEF))
1326 if (oflow < 0 || !real_equal (&realvoidmode, &dconst0))
1327 warning (OPT_Woverflow, "floating constant truncated to zero");
1331 /* Create a node with determined type and value. */
1332 value = build_real (const_type, real);
1333 if (flags & CPP_N_IMAGINARY)
1335 value = build_complex (NULL_TREE,
1336 fold_convert (const_type,
1337 integer_zero_node), value);
1338 if (type != const_type)
1340 const_type = TREE_TYPE (value);
1341 type = build_complex_type (type);
1345 if (type != const_type)
1346 value = build1_loc (token->src_loc, EXCESS_PRECISION_EXPR, type, value);
1348 return value;
1351 /* Interpret TOKEN, a fixed-point number with FLAGS as classified
1352 by cpplib. */
1354 static tree
1355 interpret_fixed (const cpp_token *token, unsigned int flags)
1357 tree type;
1358 tree value;
1359 FIXED_VALUE_TYPE fixed;
1360 char *copy;
1361 size_t copylen;
1363 copylen = token->val.str.len;
1365 if (flags & CPP_N_FRACT) /* _Fract. */
1367 if (flags & CPP_N_UNSIGNED) /* Unsigned _Fract. */
1369 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
1371 type = unsigned_long_long_fract_type_node;
1372 copylen -= 4;
1374 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
1376 type = unsigned_long_fract_type_node;
1377 copylen -= 3;
1379 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
1381 type = unsigned_short_fract_type_node;
1382 copylen -= 3;
1384 else
1386 type = unsigned_fract_type_node;
1387 copylen -= 2;
1390 else /* Signed _Fract. */
1392 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
1394 type = long_long_fract_type_node;
1395 copylen -= 3;
1397 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
1399 type = long_fract_type_node;
1400 copylen -= 2;
1402 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
1404 type = short_fract_type_node;
1405 copylen -= 2;
1407 else
1409 type = fract_type_node;
1410 copylen --;
1414 else /* _Accum. */
1416 if (flags & CPP_N_UNSIGNED) /* Unsigned _Accum. */
1418 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
1420 type = unsigned_long_long_accum_type_node;
1421 copylen -= 4;
1423 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
1425 type = unsigned_long_accum_type_node;
1426 copylen -= 3;
1428 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
1430 type = unsigned_short_accum_type_node;
1431 copylen -= 3;
1433 else
1435 type = unsigned_accum_type_node;
1436 copylen -= 2;
1439 else /* Signed _Accum. */
1441 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
1443 type = long_long_accum_type_node;
1444 copylen -= 3;
1446 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
1448 type = long_accum_type_node;
1449 copylen -= 2;
1451 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
1453 type = short_accum_type_node;
1454 copylen -= 2;
1456 else
1458 type = accum_type_node;
1459 copylen --;
1464 copy = (char *) alloca (copylen + 1);
1465 memcpy (copy, token->val.str.text, copylen);
1466 copy[copylen] = '\0';
1468 fixed_from_string (&fixed, copy, SCALAR_TYPE_MODE (type));
1470 /* Create a node with determined type and value. */
1471 value = build_fixed (type, fixed);
1473 return value;
1476 /* Convert a series of STRING, WSTRING, STRING16, STRING32 and/or
1477 UTF8STRING tokens into a tree, performing string constant
1478 concatenation. TOK is the first of these. VALP is the location to
1479 write the string into. OBJC_STRING indicates whether an '@' token
1480 preceded the incoming token (in that case, the strings can either
1481 be ObjC strings, preceded by a single '@', or normal strings, not
1482 preceded by '@'. The result will be a CPP_OBJC_STRING). Returns
1483 the CPP token type of the result (CPP_STRING, CPP_WSTRING,
1484 CPP_STRING32, CPP_STRING16, CPP_UTF8STRING, or CPP_OBJC_STRING).
1486 This is unfortunately more work than it should be. If any of the
1487 strings in the series has an L prefix, the result is a wide string
1488 (6.4.5p4). Whether or not the result is a wide string affects the
1489 meaning of octal and hexadecimal escapes (6.4.4.4p6,9). But escape
1490 sequences do not continue across the boundary between two strings in
1491 a series (6.4.5p7), so we must not lose the boundaries. Therefore
1492 cpp_interpret_string takes a vector of cpp_string structures, which
1493 we must arrange to provide. */
1495 static enum cpp_ttype
1496 lex_string (const cpp_token *tok, tree *valp, bool objc_string, bool translate)
1498 tree value;
1499 size_t concats = 0;
1500 struct obstack str_ob;
1501 struct obstack loc_ob;
1502 cpp_string istr;
1503 enum cpp_ttype type = tok->type;
1505 /* Try to avoid the overhead of creating and destroying an obstack
1506 for the common case of just one string. */
1507 cpp_string str = tok->val.str;
1508 location_t init_loc = tok->src_loc;
1509 cpp_string *strs = &str;
1510 location_t *locs = NULL;
1512 /* objc_at_sign_was_seen is only used when doing Objective-C string
1513 concatenation. It is 'true' if we have seen an '@' before the
1514 current string, and 'false' if not. We must see exactly one or
1515 zero '@' before each string. */
1516 bool objc_at_sign_was_seen = false;
1518 retry:
1519 tok = get_token (parse_in);
1520 switch (tok->type)
1522 case CPP_PADDING:
1523 goto retry;
1524 case CPP_ATSIGN:
1525 if (objc_string)
1527 if (objc_at_sign_was_seen)
1528 error ("repeated %<@%> before Objective-C string");
1530 objc_at_sign_was_seen = true;
1531 goto retry;
1533 /* FALLTHROUGH */
1535 default:
1536 break;
1538 case CPP_WSTRING:
1539 case CPP_STRING16:
1540 case CPP_STRING32:
1541 case CPP_UTF8STRING:
1542 if (type != tok->type)
1544 if (type == CPP_STRING)
1545 type = tok->type;
1546 else
1547 error ("unsupported non-standard concatenation of string literals");
1549 /* FALLTHROUGH */
1551 case CPP_STRING:
1552 if (!concats)
1554 gcc_obstack_init (&str_ob);
1555 gcc_obstack_init (&loc_ob);
1556 obstack_grow (&str_ob, &str, sizeof (cpp_string));
1557 obstack_grow (&loc_ob, &init_loc, sizeof (location_t));
1560 concats++;
1561 obstack_grow (&str_ob, &tok->val.str, sizeof (cpp_string));
1562 obstack_grow (&loc_ob, &tok->src_loc, sizeof (location_t));
1564 if (objc_string)
1565 objc_at_sign_was_seen = false;
1566 goto retry;
1569 /* It is an error if we saw a '@' with no following string. */
1570 if (objc_at_sign_was_seen)
1571 error ("stray %<@%> in program");
1573 /* We have read one more token than we want. */
1574 _cpp_backup_tokens (parse_in, 1);
1575 if (concats)
1577 strs = XOBFINISH (&str_ob, cpp_string *);
1578 locs = XOBFINISH (&loc_ob, location_t *);
1581 if (concats && !objc_string && !in_system_header_at (input_location))
1582 warning (OPT_Wtraditional,
1583 "traditional C rejects string constant concatenation");
1585 if ((translate
1586 ? cpp_interpret_string : cpp_interpret_string_notranslate)
1587 (parse_in, strs, concats + 1, &istr, type))
1589 value = build_string (istr.len, (const char *) istr.text);
1590 free (CONST_CAST (unsigned char *, istr.text));
1591 if (concats)
1593 gcc_assert (locs);
1594 gcc_assert (g_string_concat_db);
1595 g_string_concat_db->record_string_concatenation (concats + 1, locs);
1598 else
1600 /* Callers cannot generally handle error_mark_node in this context,
1601 so return the empty string instead. cpp_interpret_string has
1602 issued an error. */
1603 switch (type)
1605 default:
1606 case CPP_STRING:
1607 case CPP_UTF8STRING:
1608 if (type == CPP_UTF8STRING && flag_char8_t)
1610 value = build_string (TYPE_PRECISION (char8_type_node)
1611 / TYPE_PRECISION (char_type_node),
1612 ""); /* char8_t is 8 bits */
1614 else
1615 value = build_string (1, "");
1616 break;
1617 case CPP_STRING16:
1618 value = build_string (TYPE_PRECISION (char16_type_node)
1619 / TYPE_PRECISION (char_type_node),
1620 "\0"); /* char16_t is 16 bits */
1621 break;
1622 case CPP_STRING32:
1623 value = build_string (TYPE_PRECISION (char32_type_node)
1624 / TYPE_PRECISION (char_type_node),
1625 "\0\0\0"); /* char32_t is 32 bits */
1626 break;
1627 case CPP_WSTRING:
1628 value = build_string (TYPE_PRECISION (wchar_type_node)
1629 / TYPE_PRECISION (char_type_node),
1630 "\0\0\0"); /* widest supported wchar_t
1631 is 32 bits */
1632 break;
1636 switch (type)
1638 default:
1639 case CPP_STRING:
1640 TREE_TYPE (value) = char_array_type_node;
1641 break;
1642 case CPP_UTF8STRING:
1643 if (flag_char8_t)
1644 TREE_TYPE (value) = char8_array_type_node;
1645 else
1646 TREE_TYPE (value) = char_array_type_node;
1647 break;
1648 case CPP_STRING16:
1649 TREE_TYPE (value) = char16_array_type_node;
1650 break;
1651 case CPP_STRING32:
1652 TREE_TYPE (value) = char32_array_type_node;
1653 break;
1654 case CPP_WSTRING:
1655 TREE_TYPE (value) = wchar_array_type_node;
1657 *valp = fix_string_type (value);
1659 if (concats)
1661 obstack_free (&str_ob, 0);
1662 obstack_free (&loc_ob, 0);
1665 return objc_string ? CPP_OBJC_STRING : type;
1668 /* Converts a (possibly wide) character constant token into a tree. */
1669 static tree
1670 lex_charconst (const cpp_token *token)
1672 cppchar_t result;
1673 tree type, value;
1674 unsigned int chars_seen;
1675 int unsignedp = 0;
1677 result = cpp_interpret_charconst (parse_in, token,
1678 &chars_seen, &unsignedp);
1680 if (token->type == CPP_WCHAR)
1681 type = wchar_type_node;
1682 else if (token->type == CPP_CHAR32)
1683 type = char32_type_node;
1684 else if (token->type == CPP_CHAR16)
1685 type = char16_type_node;
1686 else if (token->type == CPP_UTF8CHAR)
1688 if (flag_char8_t)
1689 type = char8_type_node;
1690 else
1691 type = char_type_node;
1693 /* In C, a character constant has type 'int'.
1694 In C++ 'char', but multi-char charconsts have type 'int'. */
1695 else if (!c_dialect_cxx () || chars_seen > 1)
1696 type = integer_type_node;
1697 else
1698 type = char_type_node;
1700 /* Cast to cppchar_signed_t to get correct sign-extension of RESULT
1701 before possibly widening to HOST_WIDE_INT for build_int_cst. */
1702 if (unsignedp || (cppchar_signed_t) result >= 0)
1703 value = build_int_cst (type, result);
1704 else
1705 value = build_int_cst (type, (cppchar_signed_t) result);
1707 return value;
1710 /* Helper function for c_parser_peek_conflict_marker
1711 and cp_lexer_peek_conflict_marker.
1712 Given a possible conflict marker token of kind TOK1_KIND
1713 consisting of a pair of characters, get the token kind for the
1714 standalone final character. */
1716 enum cpp_ttype
1717 conflict_marker_get_final_tok_kind (enum cpp_ttype tok1_kind)
1719 switch (tok1_kind)
1721 default: gcc_unreachable ();
1722 case CPP_LSHIFT:
1723 /* "<<" and '<' */
1724 return CPP_LESS;
1726 case CPP_EQ_EQ:
1727 /* "==" and '=' */
1728 return CPP_EQ;
1730 case CPP_RSHIFT:
1731 /* ">>" and '>' */
1732 return CPP_GREATER;