Fix warning with -Wsign-compare -Wsystem-headers
[official-gcc.git] / gcc / c-family / c-lex.c
blob ac58335cf3ad908509c321556402cb98b378826e
1 /* Mainly the interface between cpplib and the C front ends.
2 Copyright (C) 1987-2018 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify it under
7 the terms of the GNU General Public License as published by the Free
8 Software Foundation; either version 3, or (at your option) any later
9 version.
11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
13 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
14 for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "target.h"
24 #include "c-common.h"
25 #include "timevar.h"
26 #include "stringpool.h"
27 #include "stor-layout.h"
28 #include "c-pragma.h"
29 #include "debug.h"
30 #include "file-prefix-map.h" /* remap_macro_filename() */
32 #include "attribs.h"
34 /* We may keep statistics about how long which files took to compile. */
/* header_time and body_time hold get_run_time () based values; they are
   only updated when flag_detailed_statistics is set (see init_c_lex and
   update_header_times).  */
35 static int header_time, body_time;
/* Tree of per-file c_fileinfo records keyed by file name; created on
   first use by get_fileinfo.  */
36 static splay_tree file_info_tree;
38 int pending_lang_change; /* If we need to switch languages - C++ only */
39 int c_header_level; /* depth in C headers - C++ only */
/* Forward declarations of the file-local helpers and cpplib callbacks
   defined later in this file.  */
41 static tree interpret_integer (const cpp_token *, unsigned int,
42 enum overflow_type *);
43 static tree interpret_float (const cpp_token *, unsigned int, const char *,
44 enum overflow_type *);
45 static tree interpret_fixed (const cpp_token *, unsigned int);
46 static enum integer_type_kind narrowest_unsigned_type
47 (const widest_int &, unsigned int);
48 static enum integer_type_kind narrowest_signed_type
49 (const widest_int &, unsigned int);
50 static enum cpp_ttype lex_string (const cpp_token *, tree *, bool, bool);
51 static tree lex_charconst (const cpp_token *);
52 static void update_header_times (const char *);
53 static int dump_one_header (splay_tree_node, void *);
54 static void cb_line_change (cpp_reader *, const cpp_token *, int);
55 static void cb_ident (cpp_reader *, unsigned int, const cpp_string *);
56 static void cb_def_pragma (cpp_reader *, unsigned int);
57 static void cb_define (cpp_reader *, unsigned int, cpp_hashnode *);
58 static void cb_undef (cpp_reader *, unsigned int, cpp_hashnode *);
60 void
61 init_c_lex (void)
63 struct cpp_callbacks *cb;
64 struct c_fileinfo *toplevel;
66 /* The get_fileinfo data structure must be initialized before
67 cpp_read_main_file is called. */
68 toplevel = get_fileinfo ("<top level>");
69 if (flag_detailed_statistics)
71 header_time = 0;
72 body_time = get_run_time ();
73 toplevel->time = body_time;
76 cb = cpp_get_callbacks (parse_in);
78 cb->line_change = cb_line_change;
79 cb->ident = cb_ident;
80 cb->def_pragma = cb_def_pragma;
81 cb->valid_pch = c_common_valid_pch;
82 cb->read_pch = c_common_read_pch;
83 cb->has_attribute = c_common_has_attribute;
84 cb->get_source_date_epoch = cb_get_source_date_epoch;
85 cb->get_suggestion = cb_get_suggestion;
86 cb->remap_filename = remap_macro_filename;
88 /* Set the debug callbacks if we can use them. */
89 if ((debug_info_level == DINFO_LEVEL_VERBOSE
90 && (write_symbols == DWARF2_DEBUG
91 || write_symbols == VMS_AND_DWARF2_DEBUG))
92 || flag_dump_go_spec != NULL)
94 cb->define = cb_define;
95 cb->undef = cb_undef;
99 struct c_fileinfo *
100 get_fileinfo (const char *name)
102 splay_tree_node n;
103 struct c_fileinfo *fi;
105 if (!file_info_tree)
106 file_info_tree = splay_tree_new (splay_tree_compare_strings,
108 splay_tree_delete_pointers);
110 n = splay_tree_lookup (file_info_tree, (splay_tree_key) name);
111 if (n)
112 return (struct c_fileinfo *) n->value;
114 fi = XNEW (struct c_fileinfo);
115 fi->time = 0;
116 fi->interface_only = 0;
117 fi->interface_unknown = 1;
118 splay_tree_insert (file_info_tree, (splay_tree_key) name,
119 (splay_tree_value) fi);
120 return fi;
123 static void
124 update_header_times (const char *name)
126 /* Changing files again. This means currently collected time
127 is charged against header time, and body time starts back at 0. */
128 if (flag_detailed_statistics)
130 int this_time = get_run_time ();
131 struct c_fileinfo *file = get_fileinfo (name);
132 header_time += this_time - body_time;
133 file->time += this_time - body_time;
134 body_time = this_time;
138 static int
139 dump_one_header (splay_tree_node n, void * ARG_UNUSED (dummy))
141 print_time ((const char *) n->key,
142 ((struct c_fileinfo *) n->value)->time);
143 return 0;
146 void
147 dump_time_statistics (void)
149 struct c_fileinfo *file = get_fileinfo (LOCATION_FILE (input_location));
150 int this_time = get_run_time ();
151 file->time += this_time - body_time;
153 fprintf (stderr, "\n******\n");
154 print_time ("header files (total)", header_time);
155 print_time ("main file (total)", this_time - body_time);
156 fprintf (stderr, "ratio = %g : 1\n",
157 (double) header_time / (double) (this_time - body_time));
158 fprintf (stderr, "\n******\n");
160 splay_tree_foreach (file_info_tree, dump_one_header, 0);
163 static void
164 cb_ident (cpp_reader * ARG_UNUSED (pfile),
165 unsigned int ARG_UNUSED (line),
166 const cpp_string * ARG_UNUSED (str))
168 if (!flag_no_ident)
170 /* Convert escapes in the string. */
171 cpp_string cstr = { 0, 0 };
172 if (cpp_interpret_string (pfile, str, 1, &cstr, CPP_STRING))
174 targetm.asm_out.output_ident ((const char *) cstr.text);
175 free (CONST_CAST (unsigned char *, cstr.text));
180 /* Called at the start of every non-empty line. TOKEN is the first
181 lexed token on the line. Used for diagnostic line numbers. */
182 static void
183 cb_line_change (cpp_reader * ARG_UNUSED (pfile), const cpp_token *token,
184 int parsing_args)
186 if (token->type != CPP_EOF && !parsing_args)
187 input_location = token->src_loc;
/* React to a change of the current line map to NEW_MAP.  A NULL map is
   ignored.  On LC_ENTER of a non-main file the debug hooks are told
   that a source file starts; on LC_LEAVE they are told that one ends.
   In every non-NULL case the header timing is updated for NEW_MAP's
   file and input_location is set to the start of NEW_MAP.  */
190 void
191 fe_file_change (const line_map_ordinary *new_map)
193 if (new_map == NULL)
194 return;
196 if (new_map->reason == LC_ENTER)
198 /* Don't stack the main buffer on the input stack;
199 we already did in compile_file. */
200 if (!MAIN_FILE_P (new_map))
/* LINE is the line of the inclusion point, looked up in the map just
   before NEW_MAP; it stays 0 when the inclusion location is not beyond
   BUILTINS_LOCATION.  */
202 location_t included_at = linemap_included_from (new_map);
203 int line = 0;
204 if (included_at > BUILTINS_LOCATION)
205 line = SOURCE_LINE (new_map - 1, included_at);
207 input_location = new_map->start_location;
208 (*debug_hooks->start_source_file) (line, LINEMAP_FILE (new_map));
/* With SYSTEM_IMPLICIT_EXTERN_C, track the nesting depth of C headers
   and request a language change when the first one is entered.  */
209 #ifdef SYSTEM_IMPLICIT_EXTERN_C
210 if (c_header_level)
211 ++c_header_level;
212 else if (LINEMAP_SYSP (new_map) == 2)
214 c_header_level = 1;
215 ++pending_lang_change;
217 #endif
220 else if (new_map->reason == LC_LEAVE)
/* Undo the bookkeeping above when the outermost C header is left.  */
222 #ifdef SYSTEM_IMPLICIT_EXTERN_C
223 if (c_header_level && --c_header_level == 0)
225 if (LINEMAP_SYSP (new_map) == 2)
226 warning (0, "badly nested C headers from preprocessor");
227 --pending_lang_change;
229 #endif
230 input_location = new_map->start_location;
232 (*debug_hooks->end_source_file) (LINEMAP_LINE (new_map));
235 update_header_times (LINEMAP_FILE (new_map));
236 input_location = new_map->start_location;
239 static void
240 cb_def_pragma (cpp_reader *pfile, source_location loc)
242 /* Issue a warning message if we have been asked to do so. Ignore
243 unknown pragmas in system headers unless an explicit
244 -Wunknown-pragmas has been given. */
245 if (warn_unknown_pragmas > in_system_header_at (input_location))
247 const unsigned char *space, *name;
248 const cpp_token *s;
249 location_t fe_loc = loc;
251 space = name = (const unsigned char *) "";
252 s = cpp_get_token (pfile);
253 if (s->type != CPP_EOF)
255 space = cpp_token_as_text (pfile, s);
256 s = cpp_get_token (pfile);
257 if (s->type == CPP_NAME)
258 name = cpp_token_as_text (pfile, s);
261 warning_at (fe_loc, OPT_Wunknown_pragmas, "ignoring #pragma %s %s",
262 space, name);
266 /* #define callback for DWARF and DWARF2 debug info. */
267 static void
268 cb_define (cpp_reader *pfile, source_location loc, cpp_hashnode *node)
270 const struct line_map *map = linemap_lookup (line_table, loc);
271 (*debug_hooks->define) (SOURCE_LINE (linemap_check_ordinary (map), loc),
272 (const char *) cpp_macro_definition (pfile, node));
275 /* #undef callback for DWARF and DWARF2 debug info. */
276 static void
277 cb_undef (cpp_reader * ARG_UNUSED (pfile), source_location loc,
278 cpp_hashnode *node)
280 const struct line_map *map = linemap_lookup (line_table, loc);
281 (*debug_hooks->undef) (SOURCE_LINE (linemap_check_ordinary (map), loc),
282 (const char *) NODE_NAME (node));
285 /* Wrapper around cpp_get_token to skip CPP_PADDING tokens
286 and not consume CPP_EOF. */
287 static const cpp_token *
288 get_token_no_padding (cpp_reader *pfile)
290 for (;;)
292 const cpp_token *ret = cpp_peek_token (pfile, 0);
293 if (ret->type == CPP_EOF)
294 return ret;
295 ret = cpp_get_token (pfile);
296 if (ret->type != CPP_PADDING)
297 return ret;
301 /* Callback for has_attribute. */
/* Reads "( name )" (or, for C++, "( ns :: name )") from PFILE and
   returns the value the operator evaluates to: 0 when the syntax is
   wrong or the attribute is unknown, one of the date-like constants
   below for the specially handled unscoped attributes in C++, and 1
   when lookup_attribute_spec finds the attribute.  Errors are reported
   through cpp_error.  */
303 c_common_has_attribute (cpp_reader *pfile)
305 int result = 0;
306 tree attr_name = NULL_TREE;
307 const cpp_token *token;
309 token = get_token_no_padding (pfile);
310 if (token->type != CPP_OPEN_PAREN)
312 cpp_error (pfile, CPP_DL_ERROR,
313 "missing '(' after \"__has_attribute\"");
314 return 0;
316 token = get_token_no_padding (pfile);
317 if (token->type == CPP_NAME)
319 attr_name = get_identifier ((const char *)
320 cpp_token_as_text (pfile, token));
321 attr_name = canonicalize_attr_name (attr_name);
322 if (c_dialect_cxx ())
/* Peek past any padding, without consuming it, to see whether a scope
   token follows the first identifier.  */
324 int idx = 0;
325 const cpp_token *nxt_token;
327 nxt_token = cpp_peek_token (pfile, idx++);
328 while (nxt_token->type == CPP_PADDING);
329 if (nxt_token->type == CPP_SCOPE)
331 get_token_no_padding (pfile); // Eat scope.
332 nxt_token = get_token_no_padding (pfile);
333 if (nxt_token->type == CPP_NAME)
/* Scoped attribute: ATTR_NAME becomes a tree list pairing the
   namespace identifier with the attribute identifier.  */
335 tree attr_ns = attr_name;
336 tree attr_id
337 = get_identifier ((const char *)
338 cpp_token_as_text (pfile, nxt_token));
339 attr_name = build_tree_list (attr_ns, attr_id);
341 else
343 cpp_error (pfile, CPP_DL_ERROR,
344 "attribute identifier required after scope");
345 attr_name = NULL_TREE;
348 else
350 /* Some standard attributes need special handling. */
351 if (is_attribute_p ("noreturn", attr_name))
352 result = 200809;
353 else if (is_attribute_p ("deprecated", attr_name))
354 result = 201309;
355 else if (is_attribute_p ("maybe_unused", attr_name)
356 || is_attribute_p ("nodiscard", attr_name)
357 || is_attribute_p ("fallthrough", attr_name))
358 result = 201603;
/* A special-cased attribute already has its result; clearing ATTR_NAME
   skips the generic lookup below.  */
359 if (result)
360 attr_name = NULL_TREE;
363 if (attr_name)
365 init_attributes ();
366 const struct attribute_spec *attr = lookup_attribute_spec (attr_name);
367 if (attr)
368 result = 1;
371 else
373 cpp_error (pfile, CPP_DL_ERROR,
374 "macro \"__has_attribute\" requires an identifier");
375 return 0;
/* A missing closing parenthesis is diagnosed, but RESULT is still
   returned.  */
378 if (get_token_no_padding (pfile)->type != CPP_CLOSE_PAREN)
379 cpp_error (pfile, CPP_DL_ERROR,
380 "missing ')' after \"__has_attribute\"");
382 return result;
385 /* Read a token and return its type. Fill *VALUE with its value, if
386 applicable. Fill *CPP_FLAGS with the token's flags, if it is
387 non-NULL. */
/* *LOC receives the location of the token read from parse_in.
   LEX_FLAGS is tested for C_LEX_STRING_NO_JOIN (return a string token
   as is instead of going through lex_string) and
   C_LEX_STRING_NO_TRANSLATE (passed on, inverted, as lex_string's
   TRANSLATE argument).  Padding tokens, stray characters (after an
   error) and ordinary comments are skipped by jumping back to the
   retry label.  The whole function is timed under TV_CPP.  */
389 enum cpp_ttype
390 c_lex_with_flags (tree *value, location_t *loc, unsigned char *cpp_flags,
391 int lex_flags)
393 static bool no_more_pch;
394 const cpp_token *tok;
395 enum cpp_ttype type;
396 unsigned char add_flags = 0;
397 enum overflow_type overflow = OT_NONE;
399 timevar_push (TV_CPP);
400 retry:
401 tok = cpp_get_token_with_location (parse_in, loc);
402 type = tok->type;
/* Re-entry point for a token that has already been fetched (after a
   stray '@' or after skipping a FALLTHROUGH comment).  */
404 retry_after_at:
405 switch (type)
407 case CPP_PADDING:
408 goto retry;
410 case CPP_NAME:
411 *value = HT_IDENT_TO_GCC_IDENT (HT_NODE (tok->val.node.node));
412 break;
414 case CPP_NUMBER:
416 const char *suffix = NULL;
417 unsigned int flags = cpp_classify_number (parse_in, tok, &suffix, *loc);
419 switch (flags & CPP_N_CATEGORY)
421 case CPP_N_INVALID:
422 /* cpplib has issued an error. */
423 *value = error_mark_node;
424 break;
426 case CPP_N_INTEGER:
427 /* C++ uses '0' to mark virtual functions as pure.
428 Set PURE_ZERO to pass this information to the C++ parser. */
429 if (tok->val.str.len == 1 && *tok->val.str.text == '0')
430 add_flags = PURE_ZERO;
431 *value = interpret_integer (tok, flags, &overflow);
432 break;
434 case CPP_N_FLOATING:
435 *value = interpret_float (tok, flags, suffix, &overflow);
436 break;
438 default:
439 gcc_unreachable ();
/* For a user-defined literal, wrap the numeric value together with the
   suffix identifier, the overflow status and the spelling of the number
   without its suffix.  */
442 if (flags & CPP_N_USERDEF)
444 char *str;
445 tree literal;
446 tree suffix_id = get_identifier (suffix);
447 int len = tok->val.str.len - strlen (suffix);
448 /* If this is going to be used as a C string to pass to a
449 raw literal operator, we need to add a trailing NUL. */
450 tree num_string = build_string (len + 1,
451 (const char *) tok->val.str.text);
452 TREE_TYPE (num_string) = char_array_type_node;
453 num_string = fix_string_type (num_string);
454 str = CONST_CAST (char *, TREE_STRING_POINTER (num_string));
455 str[len] = '\0';
456 literal = build_userdef_literal (suffix_id, *value, overflow,
457 num_string);
458 *value = literal;
461 break;
463 case CPP_ATSIGN:
464 /* An @ may give the next token special significance in Objective-C. */
465 if (c_dialect_objc ())
467 location_t atloc = *loc;
468 location_t newloc;
470 retry_at:
471 tok = cpp_get_token_with_location (parse_in, &newloc);
472 type = tok->type;
473 switch (type)
475 case CPP_PADDING:
476 goto retry_at;
478 case CPP_STRING:
479 case CPP_WSTRING:
480 case CPP_STRING16:
481 case CPP_STRING32:
482 case CPP_UTF8STRING:
483 type = lex_string (tok, value, true, true);
484 break;
486 case CPP_NAME:
487 *value = HT_IDENT_TO_GCC_IDENT (HT_NODE (tok->val.node.node));
488 if (OBJC_IS_AT_KEYWORD (C_RID_CODE (*value))
489 || OBJC_IS_CXX_KEYWORD (C_RID_CODE (*value)))
491 type = CPP_AT_NAME;
492 /* Note the complication: if we found an OBJC_CXX
493 keyword, for example, 'class', we will be
494 returning a token of type CPP_AT_NAME and rid
495 code RID_CLASS (not RID_AT_CLASS). The language
496 parser needs to convert that to RID_AT_CLASS.
498 break;
500 /* FALLTHROUGH */
502 default:
503 /* ... or not. */
504 error_at (atloc, "stray %<@%> in program");
505 *loc = newloc;
506 goto retry_after_at;
508 break;
511 /* FALLTHROUGH */
512 case CPP_HASH:
513 case CPP_PASTE:
/* Spell the stray token into NAME and NUL-terminate it at the position
   cpp_spell_token returns, for use in the diagnostic.  */
515 unsigned char name[8];
517 *cpp_spell_token (parse_in, tok, name, true) = 0;
519 error_at (*loc, "stray %qs in program", name);
522 goto retry;
524 case CPP_OTHER:
526 cppchar_t c = tok->val.str.text[0];
528 if (c == '"' || c == '\'')
529 error_at (*loc, "missing terminating %c character", (int) c);
530 else if (ISGRAPH (c))
531 error_at (*loc, "stray %qc in program", (int) c);
532 else
533 error_at (*loc, "stray %<\\%o%> in program", (int) c);
535 goto retry;
537 case CPP_CHAR_USERDEF:
538 case CPP_WCHAR_USERDEF:
539 case CPP_CHAR16_USERDEF:
540 case CPP_CHAR32_USERDEF:
541 case CPP_UTF8CHAR_USERDEF:
/* Lex the character constant from a copy of the token whose length
   excludes the user-defined suffix and whose type is the plain
   character type.  */
543 tree literal;
544 cpp_token temp_tok = *tok;
545 const char *suffix = cpp_get_userdef_suffix (tok);
546 temp_tok.val.str.len -= strlen (suffix);
547 temp_tok.type = cpp_userdef_char_remove_type (type);
548 literal = build_userdef_literal (get_identifier (suffix),
549 lex_charconst (&temp_tok),
550 OT_NONE, NULL_TREE);
551 *value = literal;
553 break;
555 case CPP_CHAR:
556 case CPP_WCHAR:
557 case CPP_CHAR16:
558 case CPP_CHAR32:
559 case CPP_UTF8CHAR:
560 *value = lex_charconst (tok);
561 break;
563 case CPP_STRING_USERDEF:
564 case CPP_WSTRING_USERDEF:
565 case CPP_STRING16_USERDEF:
566 case CPP_STRING32_USERDEF:
567 case CPP_UTF8STRING_USERDEF:
569 tree literal, string;
570 const char *suffix = cpp_get_userdef_suffix (tok);
571 string = build_string (tok->val.str.len - strlen (suffix),
572 (const char *) tok->val.str.text);
573 literal = build_userdef_literal (get_identifier (suffix),
574 string, OT_NONE, NULL_TREE);
575 *value = literal;
577 break;
579 case CPP_STRING:
580 case CPP_WSTRING:
581 case CPP_STRING16:
582 case CPP_STRING32:
583 case CPP_UTF8STRING:
584 if ((lex_flags & C_LEX_STRING_NO_JOIN) == 0)
586 type = lex_string (tok, value, false,
587 (lex_flags & C_LEX_STRING_NO_TRANSLATE) == 0);
588 break;
590 *value = build_string (tok->val.str.len, (const char *) tok->val.str.text);
591 break;
593 case CPP_PRAGMA:
594 *value = build_int_cst (integer_type_node, tok->val.pragma);
595 break;
597 /* These tokens should not be visible outside cpplib. */
598 case CPP_HEADER_NAME:
599 case CPP_MACRO_ARG:
600 gcc_unreachable ();
602 /* CPP_COMMENT will appear when compiling with -C. Ignore, except
603 when it is a FALLTHROUGH comment, in that case set
604 PREV_FALLTHROUGH flag on the next non-comment token. */
605 case CPP_COMMENT:
606 if (tok->flags & PREV_FALLTHROUGH)
610 tok = cpp_get_token_with_location (parse_in, loc);
611 type = tok->type;
613 while (type == CPP_PADDING || type == CPP_COMMENT);
614 add_flags |= PREV_FALLTHROUGH;
615 goto retry_after_at;
617 goto retry;
619 default:
620 *value = NULL_TREE;
621 break;
624 if (cpp_flags)
625 *cpp_flags = tok->flags | add_flags;
/* c_common_no_more_pch is called once only, on the first call that gets
   this far.  */
627 if (!no_more_pch)
629 no_more_pch = true;
630 c_common_no_more_pch ();
633 timevar_pop (TV_CPP);
635 return type;
638 /* Returns the narrowest C-visible unsigned type, starting with the
639 minimum specified by FLAGS, that can fit HIGH:LOW, or itk_none if
640 there isn't one. */
642 static enum integer_type_kind
643 narrowest_unsigned_type (const widest_int &val, unsigned int flags)
645 int itk;
647 if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
648 itk = itk_unsigned_int;
649 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
650 itk = itk_unsigned_long;
651 else
652 itk = itk_unsigned_long_long;
654 for (; itk < itk_none; itk += 2 /* skip unsigned types */)
656 tree upper;
658 if (integer_types[itk] == NULL_TREE)
659 continue;
660 upper = TYPE_MAX_VALUE (integer_types[itk]);
662 if (wi::geu_p (wi::to_widest (upper), val))
663 return (enum integer_type_kind) itk;
666 return itk_none;
669 /* Ditto, but narrowest signed type. */
670 static enum integer_type_kind
671 narrowest_signed_type (const widest_int &val, unsigned int flags)
673 int itk;
675 if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
676 itk = itk_int;
677 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
678 itk = itk_long;
679 else
680 itk = itk_long_long;
682 for (; itk < itk_none; itk += 2 /* skip signed types */)
684 tree upper;
686 if (integer_types[itk] == NULL_TREE)
687 continue;
688 upper = TYPE_MAX_VALUE (integer_types[itk]);
690 if (wi::geu_p (wi::to_widest (upper), val))
691 return (enum integer_type_kind) itk;
694 return itk_none;
697 /* Interpret TOKEN, an integer with FLAGS as classified by cpplib. */
/* Returns an integer constant tree (wrapped in a complex constant with
   a zero real part when FLAGS has CPP_N_IMAGINARY).  *OVERFLOW is set
   to OT_OVERFLOW when cpplib reports that the value overflowed and to
   OT_NONE otherwise.  */
698 static tree
699 interpret_integer (const cpp_token *token, unsigned int flags,
700 enum overflow_type *overflow)
702 tree value, type;
703 enum integer_type_kind itk;
704 cpp_num integer;
705 HOST_WIDE_INT ival[3];
707 *overflow = OT_NONE;
709 integer = cpp_interpret_integer (parse_in, token, flags);
710 if (integer.overflow)
711 *overflow = OT_OVERFLOW;
/* Build a widest_int from the low and high halves of the cpp_num; the
   third element is zero.  */
713 ival[0] = integer.low;
714 ival[1] = integer.high;
715 ival[2] = 0;
716 widest_int wval = widest_int::from_array (ival, 3);
718 /* The type of a constant with a U suffix is straightforward. */
719 if (flags & CPP_N_UNSIGNED)
720 itk = narrowest_unsigned_type (wval, flags);
721 else
723 /* The type of a potentially-signed integer constant varies
724 depending on the base it's in, the standard in use, and the
725 length suffixes. */
726 enum integer_type_kind itk_u
727 = narrowest_unsigned_type (wval, flags);
728 enum integer_type_kind itk_s
729 = narrowest_signed_type (wval, flags);
731 /* In both C89 and C99, octal and hex constants may be signed or
732 unsigned, whichever fits tighter. We do not warn about this
733 choice differing from the traditional choice, as the constant
734 is probably a bit pattern and either way will work. */
735 if ((flags & CPP_N_RADIX) != CPP_N_DECIMAL)
736 itk = MIN (itk_u, itk_s);
737 else
739 /* In C99, decimal constants are always signed.
740 In C89, decimal constants that don't fit in long have
741 undefined behavior; we try to make them unsigned long.
742 In GCC's extended C89, that last is true of decimal
743 constants that don't fit in long long, too. */
745 itk = itk_s;
746 if (itk_s > itk_u && itk_s > itk_long)
748 if (!flag_isoc99)
750 if (itk_u < itk_unsigned_long)
751 itk_u = itk_unsigned_long;
752 itk = itk_u;
753 warning (0, "this decimal constant is unsigned only in ISO C90");
755 else
756 warning (OPT_Wtraditional,
757 "this decimal constant would be unsigned in ISO C90");
762 if (itk == itk_none)
763 /* cpplib has already issued a warning for overflow. */
764 type = ((flags & CPP_N_UNSIGNED)
765 ? widest_unsigned_literal_type_node
766 : widest_integer_literal_type_node);
767 else
/* Diagnose a constant that needed a kind beyond unsigned long although
   its suffix did not ask for the large width; it is a pedwarn for
   C++98 or pre-C99 C and a plain warning otherwise.  */
769 type = integer_types[itk];
770 if (itk > itk_unsigned_long
771 && (flags & CPP_N_WIDTH) != CPP_N_LARGE)
772 emit_diagnostic
773 ((c_dialect_cxx () ? cxx_dialect == cxx98 : !flag_isoc99)
774 ? DK_PEDWARN : DK_WARNING,
775 input_location, OPT_Wlong_long,
776 (flags & CPP_N_UNSIGNED)
777 ? "integer constant is too large for %<unsigned long%> type"
778 : "integer constant is too large for %<long%> type");
781 value = wide_int_to_tree (type, wval);
783 /* Convert imaginary to a complex type. */
784 if (flags & CPP_N_IMAGINARY)
785 value = build_complex (NULL_TREE, build_int_cst (type, 0), value);
787 return value;
790 /* Interpret TOKEN, a floating point number with FLAGS as classified
791 by cpplib. For C++11 SUFFIX may contain a user-defined literal suffix. */
/* Returns a real (or complex, for CPP_N_IMAGINARY) constant tree,
   wrapped in an EXCESS_PRECISION_EXPR when the constant is evaluated in
   a type other than its semantic type, or error_mark_node for an
   unsupported suffix.  Fixed-point constants are delegated to
   interpret_fixed.  *OVERFLOW is set to OT_NONE, OT_OVERFLOW or
   OT_UNDERFLOW.  */
792 static tree
793 interpret_float (const cpp_token *token, unsigned int flags,
794 const char *suffix, enum overflow_type *overflow)
796 tree type;
797 tree const_type;
798 tree value;
799 REAL_VALUE_TYPE real;
800 REAL_VALUE_TYPE real_trunc;
801 char *copy;
802 size_t copylen;
804 *overflow = OT_NONE;
806 /* Default (no suffix) depends on whether the FLOAT_CONST_DECIMAL64
807 pragma has been used and is either double or _Decimal64. Types
808 that are not allowed with decimal float default to double. */
809 if (flags & CPP_N_DEFAULT)
811 flags ^= CPP_N_DEFAULT;
812 flags |= CPP_N_MEDIUM;
814 if (((flags & CPP_N_HEX) == 0) && ((flags & CPP_N_IMAGINARY) == 0))
816 warning (OPT_Wunsuffixed_float_constants,
817 "unsuffixed float constant");
818 if (float_const_decimal64_p ())
819 flags |= CPP_N_DFLOAT;
823 /* Decode _Fract and _Accum. */
824 if (flags & CPP_N_FRACT || flags & CPP_N_ACCUM)
825 return interpret_fixed (token, flags);
827 /* Decode type based on width and properties. */
828 if (flags & CPP_N_DFLOAT)
829 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
830 type = dfloat128_type_node;
831 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
832 type = dfloat32_type_node;
833 else
834 type = dfloat64_type_node;
835 else
836 if (flags & CPP_N_WIDTH_MD)
/* NOTE(review): this local SUFFIX shadows the SUFFIX parameter for the
   rest of this block; it holds the machine-dependent suffix letter
   handed to the target hook.  */
838 char suffix;
839 machine_mode mode;
841 if ((flags & CPP_N_WIDTH_MD) == CPP_N_MD_W)
842 suffix = 'w';
843 else
844 suffix = 'q';
846 mode = targetm.c.mode_for_suffix (suffix);
847 if (mode == VOIDmode)
849 error ("unsupported non-standard suffix on floating constant");
851 return error_mark_node;
853 else
854 pedwarn (input_location, OPT_Wpedantic, "non-standard suffix on floating constant");
856 type = c_common_type_for_mode (mode, 0);
857 gcc_assert (type);
859 else if ((flags & (CPP_N_FLOATN | CPP_N_FLOATNX)) != 0)
/* Look up the _FloatN / _FloatNx type whose width N and "extended"
   property match what is encoded in FLAGS.  */
861 unsigned int n = (flags & CPP_N_WIDTH_FLOATN_NX) >> CPP_FLOATN_SHIFT;
862 bool extended = (flags & CPP_N_FLOATNX) != 0;
863 type = NULL_TREE;
864 for (int i = 0; i < NUM_FLOATN_NX_TYPES; i++)
865 if (floatn_nx_types[i].n == (int) n
866 && floatn_nx_types[i].extended == extended)
868 type = FLOATN_NX_TYPE_NODE (i);
869 break;
871 if (type == NULL_TREE)
873 error ("unsupported non-standard suffix on floating constant");
874 return error_mark_node;
876 else
877 pedwarn (input_location, OPT_Wpedantic, "non-standard suffix on floating constant");
879 else if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
880 type = long_double_type_node;
881 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL
882 || flag_single_precision_constant)
883 type = float_type_node;
884 else
885 type = double_type_node;
/* CONST_TYPE is the type the constant is evaluated in: the excess
   precision type for TYPE if there is one, else TYPE itself.  */
887 const_type = excess_precision_type (type);
888 if (!const_type)
889 const_type = type;
891 /* Copy the constant to a nul-terminated buffer. If the constant
892 has any suffixes, cut them off; REAL_VALUE_ATOF/ REAL_VALUE_HTOF
893 can't handle them. */
894 copylen = token->val.str.len;
895 if (flags & CPP_N_USERDEF)
896 copylen -= strlen (suffix);
897 else if (flags & CPP_N_DFLOAT)
898 copylen -= 2;
899 else
901 if ((flags & CPP_N_WIDTH) != CPP_N_MEDIUM)
902 /* Must be an F or L or machine defined suffix. */
903 copylen--;
904 if (flags & CPP_N_IMAGINARY)
905 /* I or J suffix. */
906 copylen--;
907 if (flags & CPP_N_FLOATNX)
908 copylen--;
909 if (flags & (CPP_N_FLOATN | CPP_N_FLOATNX))
/* Drop one character per decimal digit of N.  */
911 unsigned int n = (flags & CPP_N_WIDTH_FLOATN_NX) >> CPP_FLOATN_SHIFT;
912 while (n > 0)
914 copylen--;
915 n /= 10;
920 copy = (char *) alloca (copylen + 1);
/* When the dialect is newer than C++11, apostrophes are left out while
   copying; otherwise the spelling is copied verbatim.  */
921 if (cxx_dialect > cxx11)
923 size_t maxlen = 0;
924 for (size_t i = 0; i < copylen; ++i)
925 if (token->val.str.text[i] != '\'')
926 copy[maxlen++] = token->val.str.text[i];
927 copy[maxlen] = '\0';
929 else
931 memcpy (copy, token->val.str.text, copylen);
932 copy[copylen] = '\0';
935 real_from_string3 (&real, copy, TYPE_MODE (const_type));
936 if (const_type != type)
937 /* Diagnosing if the result of converting the value with excess
938 precision to the semantic type would overflow (with associated
939 double rounding) is more appropriate than diagnosing if the
940 result of converting the string directly to the semantic type
941 would overflow. */
942 real_convert (&real_trunc, TYPE_MODE (type), &real);
944 /* Both C and C++ require a diagnostic for a floating constant
945 outside the range of representable values of its type. Since we
946 have __builtin_inf* to produce an infinity, this is now a
947 mandatory pedwarn if the target does not support infinities. */
/* REAL_TRUNC is only set, and only read, when CONST_TYPE differs from
   TYPE.  */
948 if (REAL_VALUE_ISINF (real)
949 || (const_type != type && REAL_VALUE_ISINF (real_trunc)))
951 *overflow = OT_OVERFLOW;
952 if (!(flags & CPP_N_USERDEF))
954 if (!MODE_HAS_INFINITIES (TYPE_MODE (type)))
955 pedwarn (input_location, 0,
956 "floating constant exceeds range of %qT", type);
957 else
958 warning (OPT_Woverflow,
959 "floating constant exceeds range of %qT", type);
962 /* We also give a warning if the value underflows. */
963 else if (real_equal (&real, &dconst0)
964 || (const_type != type
965 && real_equal (&real_trunc, &dconst0)))
/* Re-read the string without a target mode to tell a literal zero from
   a value that was truncated to zero.  */
967 REAL_VALUE_TYPE realvoidmode;
968 int oflow = real_from_string (&realvoidmode, copy);
969 *overflow = (oflow == 0 ? OT_NONE
970 : (oflow < 0 ? OT_UNDERFLOW : OT_OVERFLOW));
971 if (!(flags & CPP_N_USERDEF))
973 if (oflow < 0 || !real_equal (&realvoidmode, &dconst0))
974 warning (OPT_Woverflow, "floating constant truncated to zero");
978 /* Create a node with determined type and value. */
979 value = build_real (const_type, real);
980 if (flags & CPP_N_IMAGINARY)
982 value = build_complex (NULL_TREE,
983 fold_convert (const_type,
984 integer_zero_node), value);
985 if (type != const_type)
987 const_type = TREE_TYPE (value);
988 type = build_complex_type (type);
992 if (type != const_type)
993 value = build1_loc (token->src_loc, EXCESS_PRECISION_EXPR, type, value);
995 return value;
998 /* Interpret TOKEN, a fixed-point number with FLAGS as classified
999 by cpplib. */
/* The CPP_N_FRACT / CPP_N_UNSIGNED / width bits of FLAGS select the
   type node.  Each branch also shortens COPYLEN by between one and four
   characters (presumably the length of the corresponding suffix), so
   that only the leading part of the spelling is handed to
   fixed_from_string.  Returns the constant built by build_fixed.  */
1001 static tree
1002 interpret_fixed (const cpp_token *token, unsigned int flags)
1004 tree type;
1005 tree value;
1006 FIXED_VALUE_TYPE fixed;
1007 char *copy;
1008 size_t copylen;
1010 copylen = token->val.str.len;
1012 if (flags & CPP_N_FRACT) /* _Fract. */
1014 if (flags & CPP_N_UNSIGNED) /* Unsigned _Fract. */
1016 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
1018 type = unsigned_long_long_fract_type_node;
1019 copylen -= 4;
1021 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
1023 type = unsigned_long_fract_type_node;
1024 copylen -= 3;
1026 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
1028 type = unsigned_short_fract_type_node;
1029 copylen -= 3;
1031 else
1033 type = unsigned_fract_type_node;
1034 copylen -= 2;
1037 else /* Signed _Fract. */
1039 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
1041 type = long_long_fract_type_node;
1042 copylen -= 3;
1044 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
1046 type = long_fract_type_node;
1047 copylen -= 2;
1049 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
1051 type = short_fract_type_node;
1052 copylen -= 2;
1054 else
1056 type = fract_type_node;
1057 copylen --;
1061 else /* _Accum. */
1063 if (flags & CPP_N_UNSIGNED) /* Unsigned _Accum. */
1065 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
1067 type = unsigned_long_long_accum_type_node;
1068 copylen -= 4;
1070 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
1072 type = unsigned_long_accum_type_node;
1073 copylen -= 3;
1075 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
1077 type = unsigned_short_accum_type_node;
1078 copylen -= 3;
1080 else
1082 type = unsigned_accum_type_node;
1083 copylen -= 2;
1086 else /* Signed _Accum. */
1088 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
1090 type = long_long_accum_type_node;
1091 copylen -= 3;
1093 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
1095 type = long_accum_type_node;
1096 copylen -= 2;
1098 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
1100 type = short_accum_type_node;
1101 copylen -= 2;
1103 else
1105 type = accum_type_node;
1106 copylen --;
/* Copy the first COPYLEN characters of the spelling into a
   NUL-terminated stack buffer and convert it in TYPE's scalar mode.  */
1111 copy = (char *) alloca (copylen + 1);
1112 memcpy (copy, token->val.str.text, copylen);
1113 copy[copylen] = '\0';
1115 fixed_from_string (&fixed, copy, SCALAR_TYPE_MODE (type));
1117 /* Create a node with determined type and value. */
1118 value = build_fixed (type, fixed);
1120 return value;
1123 /* Convert a series of STRING, WSTRING, STRING16, STRING32 and/or
1124 UTF8STRING tokens into a tree, performing string constant
1125 concatenation. TOK is the first of these. VALP is the location to
1126 write the string into. OBJC_STRING indicates whether an '@' token
1127 preceded the incoming token (in that case, the strings can either
1128 be ObjC strings, preceded by a single '@', or normal strings, not
1129 preceded by '@'. The result will be a CPP_OBJC_STRING). Returns
1130 the CPP token type of the result (CPP_STRING, CPP_WSTRING,
1131 CPP_STRING32, CPP_STRING16, CPP_UTF8STRING, or CPP_OBJC_STRING).
1133 This is unfortunately more work than it should be. If any of the
1134 strings in the series has an L prefix, the result is a wide string
1135 (6.4.5p4). Whether or not the result is a wide string affects the
1136 meaning of octal and hexadecimal escapes (6.4.4.4p6,9). But escape
1137 sequences do not continue across the boundary between two strings in
1138 a series (6.4.5p7), so we must not lose the boundaries. Therefore
1139 cpp_interpret_string takes a vector of cpp_string structures, which
1140 we must arrange to provide. */
1142 static enum cpp_ttype
1143 lex_string (const cpp_token *tok, tree *valp, bool objc_string, bool translate)
1145 tree value;
1146 size_t concats = 0;
1147 struct obstack str_ob;
1148 struct obstack loc_ob;
1149 cpp_string istr;
1150 enum cpp_ttype type = tok->type;
1152 /* Try to avoid the overhead of creating and destroying an obstack
1153 for the common case of just one string. */
1154 cpp_string str = tok->val.str;
1155 location_t init_loc = tok->src_loc;
1156 cpp_string *strs = &str;
1157 location_t *locs = NULL;
1159 /* objc_at_sign_was_seen is only used when doing Objective-C string
1160 concatenation. It is 'true' if we have seen an '@' before the
1161 current string, and 'false' if not. We must see exactly one or
1162 zero '@' before each string. */
1163 bool objc_at_sign_was_seen = false;
1165 retry:
1166 tok = cpp_get_token (parse_in);
1167 switch (tok->type)
1169 case CPP_PADDING:
1170 goto retry;
1171 case CPP_ATSIGN:
1172 if (objc_string)
1174 if (objc_at_sign_was_seen)
1175 error ("repeated %<@%> before Objective-C string");
1177 objc_at_sign_was_seen = true;
1178 goto retry;
1180 /* FALLTHROUGH */
1182 default:
1183 break;
1185 case CPP_WSTRING:
1186 case CPP_STRING16:
1187 case CPP_STRING32:
1188 case CPP_UTF8STRING:
1189 if (type != tok->type)
1191 if (type == CPP_STRING)
1192 type = tok->type;
1193 else
1194 error ("unsupported non-standard concatenation of string literals");
1196 /* FALLTHROUGH */
1198 case CPP_STRING:
1199 if (!concats)
1201 gcc_obstack_init (&str_ob);
1202 gcc_obstack_init (&loc_ob);
1203 obstack_grow (&str_ob, &str, sizeof (cpp_string));
1204 obstack_grow (&loc_ob, &init_loc, sizeof (location_t));
1207 concats++;
1208 obstack_grow (&str_ob, &tok->val.str, sizeof (cpp_string));
1209 obstack_grow (&loc_ob, &tok->src_loc, sizeof (location_t));
1211 if (objc_string)
1212 objc_at_sign_was_seen = false;
1213 goto retry;
1216 /* It is an error if we saw a '@' with no following string. */
1217 if (objc_at_sign_was_seen)
1218 error ("stray %<@%> in program");
1220 /* We have read one more token than we want. */
1221 _cpp_backup_tokens (parse_in, 1);
1222 if (concats)
1224 strs = XOBFINISH (&str_ob, cpp_string *);
1225 locs = XOBFINISH (&loc_ob, location_t *);
1228 if (concats && !objc_string && !in_system_header_at (input_location))
1229 warning (OPT_Wtraditional,
1230 "traditional C rejects string constant concatenation");
1232 if ((translate
1233 ? cpp_interpret_string : cpp_interpret_string_notranslate)
1234 (parse_in, strs, concats + 1, &istr, type))
1236 value = build_string (istr.len, (const char *) istr.text);
1237 free (CONST_CAST (unsigned char *, istr.text));
1238 if (concats)
1240 gcc_assert (locs);
1241 gcc_assert (g_string_concat_db);
1242 g_string_concat_db->record_string_concatenation (concats + 1, locs);
1245 else
1247 /* Callers cannot generally handle error_mark_node in this context,
1248 so return the empty string instead. cpp_interpret_string has
1249 issued an error. */
1250 switch (type)
1252 default:
1253 case CPP_STRING:
1254 case CPP_UTF8STRING:
1255 value = build_string (1, "");
1256 break;
1257 case CPP_STRING16:
1258 value = build_string (TYPE_PRECISION (char16_type_node)
1259 / TYPE_PRECISION (char_type_node),
1260 "\0"); /* char16_t is 16 bits */
1261 break;
1262 case CPP_STRING32:
1263 value = build_string (TYPE_PRECISION (char32_type_node)
1264 / TYPE_PRECISION (char_type_node),
1265 "\0\0\0"); /* char32_t is 32 bits */
1266 break;
1267 case CPP_WSTRING:
1268 value = build_string (TYPE_PRECISION (wchar_type_node)
1269 / TYPE_PRECISION (char_type_node),
1270 "\0\0\0"); /* widest supported wchar_t
1271 is 32 bits */
1272 break;
1276 switch (type)
1278 default:
1279 case CPP_STRING:
1280 case CPP_UTF8STRING:
1281 TREE_TYPE (value) = char_array_type_node;
1282 break;
1283 case CPP_STRING16:
1284 TREE_TYPE (value) = char16_array_type_node;
1285 break;
1286 case CPP_STRING32:
1287 TREE_TYPE (value) = char32_array_type_node;
1288 break;
1289 case CPP_WSTRING:
1290 TREE_TYPE (value) = wchar_array_type_node;
1292 *valp = fix_string_type (value);
1294 if (concats)
1296 obstack_free (&str_ob, 0);
1297 obstack_free (&loc_ob, 0);
1300 return objc_string ? CPP_OBJC_STRING : type;
1303 /* Converts a (possibly wide) character constant token into a tree. */
1304 static tree
1305 lex_charconst (const cpp_token *token)
1307 cppchar_t result;
1308 tree type, value;
1309 unsigned int chars_seen;
1310 int unsignedp = 0;
1312 result = cpp_interpret_charconst (parse_in, token,
1313 &chars_seen, &unsignedp);
1315 if (token->type == CPP_WCHAR)
1316 type = wchar_type_node;
1317 else if (token->type == CPP_CHAR32)
1318 type = char32_type_node;
1319 else if (token->type == CPP_CHAR16)
1320 type = char16_type_node;
1321 else if (token->type == CPP_UTF8CHAR)
1322 type = char_type_node;
1323 /* In C, a character constant has type 'int'.
1324 In C++ 'char', but multi-char charconsts have type 'int'. */
1325 else if (!c_dialect_cxx () || chars_seen > 1)
1326 type = integer_type_node;
1327 else
1328 type = char_type_node;
1330 /* Cast to cppchar_signed_t to get correct sign-extension of RESULT
1331 before possibly widening to HOST_WIDE_INT for build_int_cst. */
1332 if (unsignedp || (cppchar_signed_t) result >= 0)
1333 value = build_int_cst (type, result);
1334 else
1335 value = build_int_cst (type, (cppchar_signed_t) result);
1337 return value;
1340 /* Helper function for c_parser_peek_conflict_marker
1341 and cp_lexer_peek_conflict_marker.
1342 Given a possible conflict marker token of kind TOK1_KIND
1343 consisting of a pair of characters, get the token kind for the
1344 standalone final character. */
1346 enum cpp_ttype
1347 conflict_marker_get_final_tok_kind (enum cpp_ttype tok1_kind)
1349 switch (tok1_kind)
1351 default: gcc_unreachable ();
1352 case CPP_LSHIFT:
1353 /* "<<" and '<' */
1354 return CPP_LESS;
1356 case CPP_EQ_EQ:
1357 /* "==" and '=' */
1358 return CPP_EQ;
1360 case CPP_RSHIFT:
1361 /* ">>" and '>' */
1362 return CPP_GREATER;