2015-06-25 Zhouyi Zhou <yizhouzhou@ict.ac.cn>
[official-gcc.git] / gcc / c-family / c-lex.c
blob9c56832219b273ce4aaf98d072b686850b77a4de
1 /* Mainly the interface between cpplib and the C front ends.
2 Copyright (C) 1987-2015 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify it under
7 the terms of the GNU General Public License as published by the Free
8 Software Foundation; either version 3, or (at your option) any later
9 version.
11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
13 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
14 for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "tm.h"
24 #include "alias.h"
25 #include "symtab.h"
26 #include "tree.h"
27 #include "stringpool.h"
28 #include "stor-layout.h"
29 #include "c-common.h"
30 #include "flags.h"
31 #include "timevar.h"
32 #include "cpplib.h"
33 #include "c-pragma.h"
34 #include "intl.h"
35 #include "splay-tree.h"
36 #include "debug.h"
37 #include "target.h"
39 #include "attribs.h"
41 /* We may keep statistics about how long which files took to compile. */
42 static int header_time, body_time;
43 static splay_tree file_info_tree;
45 int pending_lang_change; /* If we need to switch languages - C++ only */
46 int c_header_level; /* depth in C headers - C++ only */
48 static tree interpret_integer (const cpp_token *, unsigned int,
49 enum overflow_type *);
50 static tree interpret_float (const cpp_token *, unsigned int, const char *,
51 enum overflow_type *);
52 static tree interpret_fixed (const cpp_token *, unsigned int);
53 static enum integer_type_kind narrowest_unsigned_type
54 (const widest_int &, unsigned int);
55 static enum integer_type_kind narrowest_signed_type
56 (const widest_int &, unsigned int);
57 static enum cpp_ttype lex_string (const cpp_token *, tree *, bool, bool);
58 static tree lex_charconst (const cpp_token *);
59 static void update_header_times (const char *);
60 static int dump_one_header (splay_tree_node, void *);
61 static void cb_line_change (cpp_reader *, const cpp_token *, int);
62 static void cb_ident (cpp_reader *, unsigned int, const cpp_string *);
63 static void cb_def_pragma (cpp_reader *, unsigned int);
64 static void cb_define (cpp_reader *, unsigned int, cpp_hashnode *);
65 static void cb_undef (cpp_reader *, unsigned int, cpp_hashnode *);
67 void
68 init_c_lex (void)
70 struct cpp_callbacks *cb;
71 struct c_fileinfo *toplevel;
73 /* The get_fileinfo data structure must be initialized before
74 cpp_read_main_file is called. */
75 toplevel = get_fileinfo ("<top level>");
76 if (flag_detailed_statistics)
78 header_time = 0;
79 body_time = get_run_time ();
80 toplevel->time = body_time;
83 cb = cpp_get_callbacks (parse_in);
85 cb->line_change = cb_line_change;
86 cb->ident = cb_ident;
87 cb->def_pragma = cb_def_pragma;
88 cb->valid_pch = c_common_valid_pch;
89 cb->read_pch = c_common_read_pch;
90 cb->has_attribute = c_common_has_attribute;
92 /* Set the debug callbacks if we can use them. */
93 if ((debug_info_level == DINFO_LEVEL_VERBOSE
94 && (write_symbols == DWARF2_DEBUG
95 || write_symbols == VMS_AND_DWARF2_DEBUG))
96 || flag_dump_go_spec != NULL)
98 cb->define = cb_define;
99 cb->undef = cb_undef;
103 struct c_fileinfo *
104 get_fileinfo (const char *name)
106 splay_tree_node n;
107 struct c_fileinfo *fi;
109 if (!file_info_tree)
110 file_info_tree = splay_tree_new ((splay_tree_compare_fn) strcmp,
112 (splay_tree_delete_value_fn) free);
114 n = splay_tree_lookup (file_info_tree, (splay_tree_key) name);
115 if (n)
116 return (struct c_fileinfo *) n->value;
118 fi = XNEW (struct c_fileinfo);
119 fi->time = 0;
120 fi->interface_only = 0;
121 fi->interface_unknown = 1;
122 splay_tree_insert (file_info_tree, (splay_tree_key) name,
123 (splay_tree_value) fi);
124 return fi;
127 static void
128 update_header_times (const char *name)
130 /* Changing files again. This means currently collected time
131 is charged against header time, and body time starts back at 0. */
132 if (flag_detailed_statistics)
134 int this_time = get_run_time ();
135 struct c_fileinfo *file = get_fileinfo (name);
136 header_time += this_time - body_time;
137 file->time += this_time - body_time;
138 body_time = this_time;
142 static int
143 dump_one_header (splay_tree_node n, void * ARG_UNUSED (dummy))
145 print_time ((const char *) n->key,
146 ((struct c_fileinfo *) n->value)->time);
147 return 0;
150 void
151 dump_time_statistics (void)
153 struct c_fileinfo *file = get_fileinfo (LOCATION_FILE (input_location));
154 int this_time = get_run_time ();
155 file->time += this_time - body_time;
157 fprintf (stderr, "\n******\n");
158 print_time ("header files (total)", header_time);
159 print_time ("main file (total)", this_time - body_time);
160 fprintf (stderr, "ratio = %g : 1\n",
161 (double) header_time / (double) (this_time - body_time));
162 fprintf (stderr, "\n******\n");
164 splay_tree_foreach (file_info_tree, dump_one_header, 0);
167 static void
168 cb_ident (cpp_reader * ARG_UNUSED (pfile),
169 unsigned int ARG_UNUSED (line),
170 const cpp_string * ARG_UNUSED (str))
172 if (!flag_no_ident)
174 /* Convert escapes in the string. */
175 cpp_string cstr = { 0, 0 };
176 if (cpp_interpret_string (pfile, str, 1, &cstr, CPP_STRING))
178 targetm.asm_out.output_ident ((const char *) cstr.text);
179 free (CONST_CAST (unsigned char *, cstr.text));
184 /* Called at the start of every non-empty line. TOKEN is the first
185 lexed token on the line. Used for diagnostic line numbers. */
186 static void
187 cb_line_change (cpp_reader * ARG_UNUSED (pfile), const cpp_token *token,
188 int parsing_args)
190 if (token->type != CPP_EOF && !parsing_args)
191 input_location = token->src_loc;
194 void
195 fe_file_change (const line_map_ordinary *new_map)
197 if (new_map == NULL)
198 return;
200 if (new_map->reason == LC_ENTER)
202 /* Don't stack the main buffer on the input stack;
203 we already did in compile_file. */
204 if (!MAIN_FILE_P (new_map))
206 unsigned int included_at = LAST_SOURCE_LINE_LOCATION (new_map - 1);
207 int line = 0;
208 if (included_at > BUILTINS_LOCATION)
209 line = SOURCE_LINE (new_map - 1, included_at);
211 input_location = new_map->start_location;
212 (*debug_hooks->start_source_file) (line, LINEMAP_FILE (new_map));
213 #ifndef NO_IMPLICIT_EXTERN_C
214 if (c_header_level)
215 ++c_header_level;
216 else if (LINEMAP_SYSP (new_map) == 2)
218 c_header_level = 1;
219 ++pending_lang_change;
221 #endif
224 else if (new_map->reason == LC_LEAVE)
226 #ifndef NO_IMPLICIT_EXTERN_C
227 if (c_header_level && --c_header_level == 0)
229 if (LINEMAP_SYSP (new_map) == 2)
230 warning (0, "badly nested C headers from preprocessor");
231 --pending_lang_change;
233 #endif
234 input_location = new_map->start_location;
236 (*debug_hooks->end_source_file) (LINEMAP_LINE (new_map));
239 update_header_times (LINEMAP_FILE (new_map));
240 input_location = new_map->start_location;
243 static void
244 cb_def_pragma (cpp_reader *pfile, source_location loc)
246 /* Issue a warning message if we have been asked to do so. Ignore
247 unknown pragmas in system headers unless an explicit
248 -Wunknown-pragmas has been given. */
249 if (warn_unknown_pragmas > in_system_header_at (input_location))
251 const unsigned char *space, *name;
252 const cpp_token *s;
253 location_t fe_loc = loc;
255 space = name = (const unsigned char *) "";
256 s = cpp_get_token (pfile);
257 if (s->type != CPP_EOF)
259 space = cpp_token_as_text (pfile, s);
260 s = cpp_get_token (pfile);
261 if (s->type == CPP_NAME)
262 name = cpp_token_as_text (pfile, s);
265 warning_at (fe_loc, OPT_Wunknown_pragmas, "ignoring #pragma %s %s",
266 space, name);
270 /* #define callback for DWARF and DWARF2 debug info. */
271 static void
272 cb_define (cpp_reader *pfile, source_location loc, cpp_hashnode *node)
274 const struct line_map *map = linemap_lookup (line_table, loc);
275 (*debug_hooks->define) (SOURCE_LINE (linemap_check_ordinary (map), loc),
276 (const char *) cpp_macro_definition (pfile, node));
279 /* #undef callback for DWARF and DWARF2 debug info. */
280 static void
281 cb_undef (cpp_reader * ARG_UNUSED (pfile), source_location loc,
282 cpp_hashnode *node)
284 const struct line_map *map = linemap_lookup (line_table, loc);
285 (*debug_hooks->undef) (SOURCE_LINE (linemap_check_ordinary (map), loc),
286 (const char *) NODE_NAME (node));
289 /* Wrapper around cpp_get_token to skip CPP_PADDING tokens
290 and not consume CPP_EOF. */
291 static const cpp_token *
292 get_token_no_padding (cpp_reader *pfile)
294 for (;;)
296 const cpp_token *ret = cpp_peek_token (pfile, 0);
297 if (ret->type == CPP_EOF)
298 return ret;
299 ret = cpp_get_token (pfile);
300 if (ret->type != CPP_PADDING)
301 return ret;
305 /* Callback for has_attribute. */
307 c_common_has_attribute (cpp_reader *pfile)
309 int result = 0;
310 tree attr_name = NULL_TREE;
311 const cpp_token *token;
313 token = get_token_no_padding (pfile);
314 if (token->type != CPP_OPEN_PAREN)
316 cpp_error (pfile, CPP_DL_ERROR,
317 "missing '(' after \"__has_attribute\"");
318 return 0;
320 token = get_token_no_padding (pfile);
321 if (token->type == CPP_NAME)
323 attr_name = get_identifier ((const char *)
324 cpp_token_as_text (pfile, token));
325 if (c_dialect_cxx ())
327 int idx = 0;
328 const cpp_token *nxt_token;
330 nxt_token = cpp_peek_token (pfile, idx++);
331 while (nxt_token->type == CPP_PADDING);
332 if (nxt_token->type == CPP_SCOPE)
334 get_token_no_padding (pfile); // Eat scope.
335 nxt_token = get_token_no_padding (pfile);
336 if (nxt_token->type == CPP_NAME)
338 tree attr_ns = attr_name;
339 tree attr_id
340 = get_identifier ((const char *)
341 cpp_token_as_text (pfile, nxt_token));
342 attr_name = build_tree_list (attr_ns, attr_id);
344 else
346 cpp_error (pfile, CPP_DL_ERROR,
347 "attribute identifier required after scope");
348 attr_name = NULL_TREE;
352 if (attr_name)
354 init_attributes ();
355 const struct attribute_spec *attr = lookup_attribute_spec (attr_name);
356 if (attr)
358 if (TREE_CODE (attr_name) == TREE_LIST)
359 attr_name = TREE_VALUE (attr_name);
360 if (is_attribute_p ("noreturn", attr_name))
361 result = 200809;
362 else if (is_attribute_p ("deprecated", attr_name))
363 result = 201309;
364 else
365 result = 1;
369 else
371 cpp_error (pfile, CPP_DL_ERROR,
372 "macro \"__has_attribute\" requires an identifier");
373 return 0;
376 if (get_token_no_padding (pfile)->type != CPP_CLOSE_PAREN)
377 cpp_error (pfile, CPP_DL_ERROR,
378 "missing ')' after \"__has_attribute\"");
380 return result;
383 /* Read a token and return its type. Fill *VALUE with its value, if
384 applicable. Fill *CPP_FLAGS with the token's flags, if it is
385 non-NULL. */
387 enum cpp_ttype
388 c_lex_with_flags (tree *value, location_t *loc, unsigned char *cpp_flags,
389 int lex_flags)
391 static bool no_more_pch;
392 const cpp_token *tok;
393 enum cpp_ttype type;
394 unsigned char add_flags = 0;
395 enum overflow_type overflow = OT_NONE;
397 timevar_push (TV_CPP);
398 retry:
399 tok = cpp_get_token_with_location (parse_in, loc);
400 type = tok->type;
402 retry_after_at:
403 switch (type)
405 case CPP_PADDING:
406 goto retry;
408 case CPP_NAME:
409 *value = HT_IDENT_TO_GCC_IDENT (HT_NODE (tok->val.node.node));
410 break;
412 case CPP_NUMBER:
414 const char *suffix = NULL;
415 unsigned int flags = cpp_classify_number (parse_in, tok, &suffix, *loc);
417 switch (flags & CPP_N_CATEGORY)
419 case CPP_N_INVALID:
420 /* cpplib has issued an error. */
421 *value = error_mark_node;
422 break;
424 case CPP_N_INTEGER:
425 /* C++ uses '0' to mark virtual functions as pure.
426 Set PURE_ZERO to pass this information to the C++ parser. */
427 if (tok->val.str.len == 1 && *tok->val.str.text == '0')
428 add_flags = PURE_ZERO;
429 *value = interpret_integer (tok, flags, &overflow);
430 break;
432 case CPP_N_FLOATING:
433 *value = interpret_float (tok, flags, suffix, &overflow);
434 break;
436 default:
437 gcc_unreachable ();
440 if (flags & CPP_N_USERDEF)
442 char *str;
443 tree literal;
444 tree suffix_id = get_identifier (suffix);
445 int len = tok->val.str.len - strlen (suffix);
446 /* If this is going to be used as a C string to pass to a
447 raw literal operator, we need to add a trailing NUL. */
448 tree num_string = build_string (len + 1,
449 (const char *) tok->val.str.text);
450 TREE_TYPE (num_string) = char_array_type_node;
451 num_string = fix_string_type (num_string);
452 str = CONST_CAST (char *, TREE_STRING_POINTER (num_string));
453 str[len] = '\0';
454 literal = build_userdef_literal (suffix_id, *value, overflow,
455 num_string);
456 *value = literal;
459 break;
461 case CPP_ATSIGN:
462 /* An @ may give the next token special significance in Objective-C. */
463 if (c_dialect_objc ())
465 location_t atloc = *loc;
466 location_t newloc;
468 retry_at:
469 tok = cpp_get_token_with_location (parse_in, &newloc);
470 type = tok->type;
471 switch (type)
473 case CPP_PADDING:
474 goto retry_at;
476 case CPP_STRING:
477 case CPP_WSTRING:
478 case CPP_STRING16:
479 case CPP_STRING32:
480 case CPP_UTF8STRING:
481 type = lex_string (tok, value, true, true);
482 break;
484 case CPP_NAME:
485 *value = HT_IDENT_TO_GCC_IDENT (HT_NODE (tok->val.node.node));
486 if (OBJC_IS_AT_KEYWORD (C_RID_CODE (*value))
487 || OBJC_IS_CXX_KEYWORD (C_RID_CODE (*value)))
489 type = CPP_AT_NAME;
490 /* Note the complication: if we found an OBJC_CXX
491 keyword, for example, 'class', we will be
492 returning a token of type CPP_AT_NAME and rid
493 code RID_CLASS (not RID_AT_CLASS). The language
494 parser needs to convert that to RID_AT_CLASS.
496 break;
498 /* FALLTHROUGH */
500 default:
501 /* ... or not. */
502 error_at (atloc, "stray %<@%> in program");
503 *loc = newloc;
504 goto retry_after_at;
506 break;
509 /* FALLTHROUGH */
510 case CPP_HASH:
511 case CPP_PASTE:
513 unsigned char name[8];
515 *cpp_spell_token (parse_in, tok, name, true) = 0;
517 error_at (*loc, "stray %qs in program", name);
520 goto retry;
522 case CPP_OTHER:
524 cppchar_t c = tok->val.str.text[0];
526 if (c == '"' || c == '\'')
527 error ("missing terminating %c character", (int) c);
528 else if (ISGRAPH (c))
529 error ("stray %qc in program", (int) c);
530 else
531 error ("stray %<\\%o%> in program", (int) c);
533 goto retry;
535 case CPP_CHAR_USERDEF:
536 case CPP_WCHAR_USERDEF:
537 case CPP_CHAR16_USERDEF:
538 case CPP_CHAR32_USERDEF:
540 tree literal;
541 cpp_token temp_tok = *tok;
542 const char *suffix = cpp_get_userdef_suffix (tok);
543 temp_tok.val.str.len -= strlen (suffix);
544 temp_tok.type = cpp_userdef_char_remove_type (type);
545 literal = build_userdef_literal (get_identifier (suffix),
546 lex_charconst (&temp_tok),
547 OT_NONE, NULL_TREE);
548 *value = literal;
550 break;
552 case CPP_CHAR:
553 case CPP_WCHAR:
554 case CPP_CHAR16:
555 case CPP_CHAR32:
556 *value = lex_charconst (tok);
557 break;
559 case CPP_STRING_USERDEF:
560 case CPP_WSTRING_USERDEF:
561 case CPP_STRING16_USERDEF:
562 case CPP_STRING32_USERDEF:
563 case CPP_UTF8STRING_USERDEF:
565 tree literal, string;
566 const char *suffix = cpp_get_userdef_suffix (tok);
567 string = build_string (tok->val.str.len - strlen (suffix),
568 (const char *) tok->val.str.text);
569 literal = build_userdef_literal (get_identifier (suffix),
570 string, OT_NONE, NULL_TREE);
571 *value = literal;
573 break;
575 case CPP_STRING:
576 case CPP_WSTRING:
577 case CPP_STRING16:
578 case CPP_STRING32:
579 case CPP_UTF8STRING:
580 if ((lex_flags & C_LEX_STRING_NO_JOIN) == 0)
582 type = lex_string (tok, value, false,
583 (lex_flags & C_LEX_STRING_NO_TRANSLATE) == 0);
584 break;
586 *value = build_string (tok->val.str.len, (const char *) tok->val.str.text);
587 break;
589 case CPP_PRAGMA:
590 *value = build_int_cst (integer_type_node, tok->val.pragma);
591 break;
593 /* These tokens should not be visible outside cpplib. */
594 case CPP_HEADER_NAME:
595 case CPP_MACRO_ARG:
596 gcc_unreachable ();
598 /* CPP_COMMENT will appear when compiling with -C and should be
599 ignored. */
600 case CPP_COMMENT:
601 goto retry;
603 default:
604 *value = NULL_TREE;
605 break;
608 if (cpp_flags)
609 *cpp_flags = tok->flags | add_flags;
611 if (!no_more_pch)
613 no_more_pch = true;
614 c_common_no_more_pch ();
617 timevar_pop (TV_CPP);
619 return type;
622 /* Returns the narrowest C-visible unsigned type, starting with the
623 minimum specified by FLAGS, that can fit HIGH:LOW, or itk_none if
624 there isn't one. */
626 static enum integer_type_kind
627 narrowest_unsigned_type (const widest_int &val, unsigned int flags)
629 int itk;
631 if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
632 itk = itk_unsigned_int;
633 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
634 itk = itk_unsigned_long;
635 else
636 itk = itk_unsigned_long_long;
638 for (; itk < itk_none; itk += 2 /* skip unsigned types */)
640 tree upper;
642 if (integer_types[itk] == NULL_TREE)
643 continue;
644 upper = TYPE_MAX_VALUE (integer_types[itk]);
646 if (wi::geu_p (wi::to_widest (upper), val))
647 return (enum integer_type_kind) itk;
650 return itk_none;
653 /* Ditto, but narrowest signed type. */
654 static enum integer_type_kind
655 narrowest_signed_type (const widest_int &val, unsigned int flags)
657 int itk;
659 if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
660 itk = itk_int;
661 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
662 itk = itk_long;
663 else
664 itk = itk_long_long;
666 for (; itk < itk_none; itk += 2 /* skip signed types */)
668 tree upper;
670 if (integer_types[itk] == NULL_TREE)
671 continue;
672 upper = TYPE_MAX_VALUE (integer_types[itk]);
674 if (wi::geu_p (wi::to_widest (upper), val))
675 return (enum integer_type_kind) itk;
678 return itk_none;
681 /* Interpret TOKEN, an integer with FLAGS as classified by cpplib. */
682 static tree
683 interpret_integer (const cpp_token *token, unsigned int flags,
684 enum overflow_type *overflow)
686 tree value, type;
687 enum integer_type_kind itk;
688 cpp_num integer;
689 HOST_WIDE_INT ival[3];
691 *overflow = OT_NONE;
693 integer = cpp_interpret_integer (parse_in, token, flags);
694 if (integer.overflow)
695 *overflow = OT_OVERFLOW;
697 ival[0] = integer.low;
698 ival[1] = integer.high;
699 ival[2] = 0;
700 widest_int wval = widest_int::from_array (ival, 3);
702 /* The type of a constant with a U suffix is straightforward. */
703 if (flags & CPP_N_UNSIGNED)
704 itk = narrowest_unsigned_type (wval, flags);
705 else
707 /* The type of a potentially-signed integer constant varies
708 depending on the base it's in, the standard in use, and the
709 length suffixes. */
710 enum integer_type_kind itk_u
711 = narrowest_unsigned_type (wval, flags);
712 enum integer_type_kind itk_s
713 = narrowest_signed_type (wval, flags);
715 /* In both C89 and C99, octal and hex constants may be signed or
716 unsigned, whichever fits tighter. We do not warn about this
717 choice differing from the traditional choice, as the constant
718 is probably a bit pattern and either way will work. */
719 if ((flags & CPP_N_RADIX) != CPP_N_DECIMAL)
720 itk = MIN (itk_u, itk_s);
721 else
723 /* In C99, decimal constants are always signed.
724 In C89, decimal constants that don't fit in long have
725 undefined behavior; we try to make them unsigned long.
726 In GCC's extended C89, that last is true of decimal
727 constants that don't fit in long long, too. */
729 itk = itk_s;
730 if (itk_s > itk_u && itk_s > itk_long)
732 if (!flag_isoc99)
734 if (itk_u < itk_unsigned_long)
735 itk_u = itk_unsigned_long;
736 itk = itk_u;
737 warning (0, "this decimal constant is unsigned only in ISO C90");
739 else
740 warning (OPT_Wtraditional,
741 "this decimal constant would be unsigned in ISO C90");
746 if (itk == itk_none)
747 /* cpplib has already issued a warning for overflow. */
748 type = ((flags & CPP_N_UNSIGNED)
749 ? widest_unsigned_literal_type_node
750 : widest_integer_literal_type_node);
751 else
753 type = integer_types[itk];
754 if (itk > itk_unsigned_long
755 && (flags & CPP_N_WIDTH) != CPP_N_LARGE)
756 emit_diagnostic
757 ((c_dialect_cxx () ? cxx_dialect == cxx98 : !flag_isoc99)
758 ? DK_PEDWARN : DK_WARNING,
759 input_location, OPT_Wlong_long,
760 (flags & CPP_N_UNSIGNED)
761 ? "integer constant is too large for %<unsigned long%> type"
762 : "integer constant is too large for %<long%> type");
765 value = wide_int_to_tree (type, wval);
767 /* Convert imaginary to a complex type. */
768 if (flags & CPP_N_IMAGINARY)
769 value = build_complex (NULL_TREE, build_int_cst (type, 0), value);
771 return value;
774 /* Interpret TOKEN, a floating point number with FLAGS as classified
775 by cpplib. For C++0X SUFFIX may contain a user-defined literal suffix. */
776 static tree
777 interpret_float (const cpp_token *token, unsigned int flags,
778 const char *suffix, enum overflow_type *overflow)
780 tree type;
781 tree const_type;
782 tree value;
783 REAL_VALUE_TYPE real;
784 REAL_VALUE_TYPE real_trunc;
785 char *copy;
786 size_t copylen;
788 *overflow = OT_NONE;
790 /* Default (no suffix) depends on whether the FLOAT_CONST_DECIMAL64
791 pragma has been used and is either double or _Decimal64. Types
792 that are not allowed with decimal float default to double. */
793 if (flags & CPP_N_DEFAULT)
795 flags ^= CPP_N_DEFAULT;
796 flags |= CPP_N_MEDIUM;
798 if (((flags & CPP_N_HEX) == 0) && ((flags & CPP_N_IMAGINARY) == 0))
800 warning (OPT_Wunsuffixed_float_constants,
801 "unsuffixed float constant");
802 if (float_const_decimal64_p ())
803 flags |= CPP_N_DFLOAT;
807 /* Decode _Fract and _Accum. */
808 if (flags & CPP_N_FRACT || flags & CPP_N_ACCUM)
809 return interpret_fixed (token, flags);
811 /* Decode type based on width and properties. */
812 if (flags & CPP_N_DFLOAT)
813 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
814 type = dfloat128_type_node;
815 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
816 type = dfloat32_type_node;
817 else
818 type = dfloat64_type_node;
819 else
820 if (flags & CPP_N_WIDTH_MD)
822 char suffix;
823 machine_mode mode;
825 if ((flags & CPP_N_WIDTH_MD) == CPP_N_MD_W)
826 suffix = 'w';
827 else
828 suffix = 'q';
830 mode = targetm.c.mode_for_suffix (suffix);
831 if (mode == VOIDmode)
833 error ("unsupported non-standard suffix on floating constant");
835 return error_mark_node;
837 else
838 pedwarn (input_location, OPT_Wpedantic, "non-standard suffix on floating constant");
840 type = c_common_type_for_mode (mode, 0);
841 gcc_assert (type);
843 else if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
844 type = long_double_type_node;
845 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL
846 || flag_single_precision_constant)
847 type = float_type_node;
848 else
849 type = double_type_node;
851 const_type = excess_precision_type (type);
852 if (!const_type)
853 const_type = type;
855 /* Copy the constant to a nul-terminated buffer. If the constant
856 has any suffixes, cut them off; REAL_VALUE_ATOF/ REAL_VALUE_HTOF
857 can't handle them. */
858 copylen = token->val.str.len;
859 if (flags & CPP_N_USERDEF)
860 copylen -= strlen (suffix);
861 else if (flags & CPP_N_DFLOAT)
862 copylen -= 2;
863 else
865 if ((flags & CPP_N_WIDTH) != CPP_N_MEDIUM)
866 /* Must be an F or L or machine defined suffix. */
867 copylen--;
868 if (flags & CPP_N_IMAGINARY)
869 /* I or J suffix. */
870 copylen--;
873 copy = (char *) alloca (copylen + 1);
874 if (cxx_dialect > cxx11)
876 size_t maxlen = 0;
877 for (size_t i = 0; i < copylen; ++i)
878 if (token->val.str.text[i] != '\'')
879 copy[maxlen++] = token->val.str.text[i];
880 copy[maxlen] = '\0';
882 else
884 memcpy (copy, token->val.str.text, copylen);
885 copy[copylen] = '\0';
888 real_from_string3 (&real, copy, TYPE_MODE (const_type));
889 if (const_type != type)
890 /* Diagnosing if the result of converting the value with excess
891 precision to the semantic type would overflow (with associated
892 double rounding) is more appropriate than diagnosing if the
893 result of converting the string directly to the semantic type
894 would overflow. */
895 real_convert (&real_trunc, TYPE_MODE (type), &real);
897 /* Both C and C++ require a diagnostic for a floating constant
898 outside the range of representable values of its type. Since we
899 have __builtin_inf* to produce an infinity, this is now a
900 mandatory pedwarn if the target does not support infinities. */
901 if (REAL_VALUE_ISINF (real)
902 || (const_type != type && REAL_VALUE_ISINF (real_trunc)))
904 *overflow = OT_OVERFLOW;
905 if (!(flags & CPP_N_USERDEF))
907 if (!MODE_HAS_INFINITIES (TYPE_MODE (type)))
908 pedwarn (input_location, 0,
909 "floating constant exceeds range of %qT", type);
910 else
911 warning (OPT_Woverflow,
912 "floating constant exceeds range of %qT", type);
915 /* We also give a warning if the value underflows. */
916 else if (REAL_VALUES_EQUAL (real, dconst0)
917 || (const_type != type
918 && REAL_VALUES_EQUAL (real_trunc, dconst0)))
920 REAL_VALUE_TYPE realvoidmode;
921 int oflow = real_from_string (&realvoidmode, copy);
922 *overflow = (oflow == 0 ? OT_NONE
923 : (oflow < 0 ? OT_UNDERFLOW : OT_OVERFLOW));
924 if (!(flags & CPP_N_USERDEF))
926 if (oflow < 0 || !REAL_VALUES_EQUAL (realvoidmode, dconst0))
927 warning (OPT_Woverflow, "floating constant truncated to zero");
931 /* Create a node with determined type and value. */
932 value = build_real (const_type, real);
933 if (flags & CPP_N_IMAGINARY)
935 value = build_complex (NULL_TREE, convert (const_type,
936 integer_zero_node), value);
937 if (type != const_type)
939 const_type = TREE_TYPE (value);
940 type = build_complex_type (type);
944 if (type != const_type)
945 value = build1 (EXCESS_PRECISION_EXPR, type, value);
947 return value;
950 /* Interpret TOKEN, a fixed-point number with FLAGS as classified
951 by cpplib. */
953 static tree
954 interpret_fixed (const cpp_token *token, unsigned int flags)
956 tree type;
957 tree value;
958 FIXED_VALUE_TYPE fixed;
959 char *copy;
960 size_t copylen;
962 copylen = token->val.str.len;
964 if (flags & CPP_N_FRACT) /* _Fract. */
966 if (flags & CPP_N_UNSIGNED) /* Unsigned _Fract. */
968 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
970 type = unsigned_long_long_fract_type_node;
971 copylen -= 4;
973 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
975 type = unsigned_long_fract_type_node;
976 copylen -= 3;
978 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
980 type = unsigned_short_fract_type_node;
981 copylen -= 3;
983 else
985 type = unsigned_fract_type_node;
986 copylen -= 2;
989 else /* Signed _Fract. */
991 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
993 type = long_long_fract_type_node;
994 copylen -= 3;
996 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
998 type = long_fract_type_node;
999 copylen -= 2;
1001 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
1003 type = short_fract_type_node;
1004 copylen -= 2;
1006 else
1008 type = fract_type_node;
1009 copylen --;
1013 else /* _Accum. */
1015 if (flags & CPP_N_UNSIGNED) /* Unsigned _Accum. */
1017 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
1019 type = unsigned_long_long_accum_type_node;
1020 copylen -= 4;
1022 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
1024 type = unsigned_long_accum_type_node;
1025 copylen -= 3;
1027 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
1029 type = unsigned_short_accum_type_node;
1030 copylen -= 3;
1032 else
1034 type = unsigned_accum_type_node;
1035 copylen -= 2;
1038 else /* Signed _Accum. */
1040 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
1042 type = long_long_accum_type_node;
1043 copylen -= 3;
1045 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
1047 type = long_accum_type_node;
1048 copylen -= 2;
1050 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
1052 type = short_accum_type_node;
1053 copylen -= 2;
1055 else
1057 type = accum_type_node;
1058 copylen --;
1063 copy = (char *) alloca (copylen + 1);
1064 memcpy (copy, token->val.str.text, copylen);
1065 copy[copylen] = '\0';
1067 fixed_from_string (&fixed, copy, TYPE_MODE (type));
1069 /* Create a node with determined type and value. */
1070 value = build_fixed (type, fixed);
1072 return value;
1075 /* Convert a series of STRING, WSTRING, STRING16, STRING32 and/or
1076 UTF8STRING tokens into a tree, performing string constant
1077 concatenation. TOK is the first of these. VALP is the location to
1078 write the string into. OBJC_STRING indicates whether an '@' token
1079 preceded the incoming token (in that case, the strings can either
1080 be ObjC strings, preceded by a single '@', or normal strings, not
1081 preceded by '@'. The result will be a CPP_OBJC_STRING). Returns
1082 the CPP token type of the result (CPP_STRING, CPP_WSTRING,
1083 CPP_STRING32, CPP_STRING16, CPP_UTF8STRING, or CPP_OBJC_STRING).
1085 This is unfortunately more work than it should be. If any of the
1086 strings in the series has an L prefix, the result is a wide string
1087 (6.4.5p4). Whether or not the result is a wide string affects the
1088 meaning of octal and hexadecimal escapes (6.4.4.4p6,9). But escape
1089 sequences do not continue across the boundary between two strings in
1090 a series (6.4.5p7), so we must not lose the boundaries. Therefore
1091 cpp_interpret_string takes a vector of cpp_string structures, which
1092 we must arrange to provide. */
1094 static enum cpp_ttype
1095 lex_string (const cpp_token *tok, tree *valp, bool objc_string, bool translate)
1097 tree value;
1098 size_t concats = 0;
1099 struct obstack str_ob;
1100 cpp_string istr;
1101 enum cpp_ttype type = tok->type;
1103 /* Try to avoid the overhead of creating and destroying an obstack
1104 for the common case of just one string. */
1105 cpp_string str = tok->val.str;
1106 cpp_string *strs = &str;
1108 /* objc_at_sign_was_seen is only used when doing Objective-C string
1109 concatenation. It is 'true' if we have seen an '@' before the
1110 current string, and 'false' if not. We must see exactly one or
1111 zero '@' before each string. */
1112 bool objc_at_sign_was_seen = false;
1114 retry:
1115 tok = cpp_get_token (parse_in);
1116 switch (tok->type)
1118 case CPP_PADDING:
1119 goto retry;
1120 case CPP_ATSIGN:
1121 if (objc_string)
1123 if (objc_at_sign_was_seen)
1124 error ("repeated %<@%> before Objective-C string");
1126 objc_at_sign_was_seen = true;
1127 goto retry;
1129 /* FALLTHROUGH */
1131 default:
1132 break;
1134 case CPP_WSTRING:
1135 case CPP_STRING16:
1136 case CPP_STRING32:
1137 case CPP_UTF8STRING:
1138 if (type != tok->type)
1140 if (type == CPP_STRING)
1141 type = tok->type;
1142 else
1143 error ("unsupported non-standard concatenation of string literals");
1146 case CPP_STRING:
1147 if (!concats)
1149 gcc_obstack_init (&str_ob);
1150 obstack_grow (&str_ob, &str, sizeof (cpp_string));
1153 concats++;
1154 obstack_grow (&str_ob, &tok->val.str, sizeof (cpp_string));
1155 if (objc_string)
1156 objc_at_sign_was_seen = false;
1157 goto retry;
1160 /* It is an error if we saw a '@' with no following string. */
1161 if (objc_at_sign_was_seen)
1162 error ("stray %<@%> in program");
1164 /* We have read one more token than we want. */
1165 _cpp_backup_tokens (parse_in, 1);
1166 if (concats)
1167 strs = XOBFINISH (&str_ob, cpp_string *);
1169 if (concats && !objc_string && !in_system_header_at (input_location))
1170 warning (OPT_Wtraditional,
1171 "traditional C rejects string constant concatenation");
1173 if ((translate
1174 ? cpp_interpret_string : cpp_interpret_string_notranslate)
1175 (parse_in, strs, concats + 1, &istr, type))
1177 value = build_string (istr.len, (const char *) istr.text);
1178 free (CONST_CAST (unsigned char *, istr.text));
1180 else
1182 /* Callers cannot generally handle error_mark_node in this context,
1183 so return the empty string instead. cpp_interpret_string has
1184 issued an error. */
1185 switch (type)
1187 default:
1188 case CPP_STRING:
1189 case CPP_UTF8STRING:
1190 value = build_string (1, "");
1191 break;
1192 case CPP_STRING16:
1193 value = build_string (TYPE_PRECISION (char16_type_node)
1194 / TYPE_PRECISION (char_type_node),
1195 "\0"); /* char16_t is 16 bits */
1196 break;
1197 case CPP_STRING32:
1198 value = build_string (TYPE_PRECISION (char32_type_node)
1199 / TYPE_PRECISION (char_type_node),
1200 "\0\0\0"); /* char32_t is 32 bits */
1201 break;
1202 case CPP_WSTRING:
1203 value = build_string (TYPE_PRECISION (wchar_type_node)
1204 / TYPE_PRECISION (char_type_node),
1205 "\0\0\0"); /* widest supported wchar_t
1206 is 32 bits */
1207 break;
1211 switch (type)
1213 default:
1214 case CPP_STRING:
1215 case CPP_UTF8STRING:
1216 TREE_TYPE (value) = char_array_type_node;
1217 break;
1218 case CPP_STRING16:
1219 TREE_TYPE (value) = char16_array_type_node;
1220 break;
1221 case CPP_STRING32:
1222 TREE_TYPE (value) = char32_array_type_node;
1223 break;
1224 case CPP_WSTRING:
1225 TREE_TYPE (value) = wchar_array_type_node;
1227 *valp = fix_string_type (value);
1229 if (concats)
1230 obstack_free (&str_ob, 0);
1232 return objc_string ? CPP_OBJC_STRING : type;
1235 /* Converts a (possibly wide) character constant token into a tree. */
1236 static tree
1237 lex_charconst (const cpp_token *token)
1239 cppchar_t result;
1240 tree type, value;
1241 unsigned int chars_seen;
1242 int unsignedp = 0;
1244 result = cpp_interpret_charconst (parse_in, token,
1245 &chars_seen, &unsignedp);
1247 if (token->type == CPP_WCHAR)
1248 type = wchar_type_node;
1249 else if (token->type == CPP_CHAR32)
1250 type = char32_type_node;
1251 else if (token->type == CPP_CHAR16)
1252 type = char16_type_node;
1253 /* In C, a character constant has type 'int'.
1254 In C++ 'char', but multi-char charconsts have type 'int'. */
1255 else if (!c_dialect_cxx () || chars_seen > 1)
1256 type = integer_type_node;
1257 else
1258 type = char_type_node;
1260 /* Cast to cppchar_signed_t to get correct sign-extension of RESULT
1261 before possibly widening to HOST_WIDE_INT for build_int_cst. */
1262 if (unsignedp || (cppchar_signed_t) result >= 0)
1263 value = build_int_cst (type, result);
1264 else
1265 value = build_int_cst (type, (cppchar_signed_t) result);
1267 return value;