2014-09-12 Marc Glisse <marc.glisse@inria.fr>
[official-gcc.git] / gcc / c-family / c-lex.c
blobea24bfc2a2e42915543faaa244052c30a42bf4c0
/* Mainly the interface between cpplib and the C front ends.
   Copyright (C) 1987-2014 Free Software Foundation, Inc.

This file is part of GCC.

GCC is free software; you can redistribute it and/or modify it under
the terms of the GNU General Public License as published by the Free
Software Foundation; either version 3, or (at your option) any later
version.

GCC is distributed in the hope that it will be useful, but WITHOUT ANY
WARRANTY; without even the implied warranty of MERCHANTABILITY or
FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
for more details.

You should have received a copy of the GNU General Public License
along with GCC; see the file COPYING3.  If not see
<http://www.gnu.org/licenses/>.  */
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "tm.h"
25 #include "tree.h"
26 #include "stringpool.h"
27 #include "stor-layout.h"
28 #include "input.h"
29 #include "c-common.h"
30 #include "flags.h"
31 #include "timevar.h"
32 #include "cpplib.h"
33 #include "c-pragma.h"
34 #include "intl.h"
35 #include "splay-tree.h"
36 #include "debug.h"
37 #include "target.h"
38 #include "wide-int.h"
40 /* We may keep statistics about how long which files took to compile. */
41 static int header_time, body_time;
42 static splay_tree file_info_tree;
44 int pending_lang_change; /* If we need to switch languages - C++ only */
45 int c_header_level; /* depth in C headers - C++ only */
47 static tree interpret_integer (const cpp_token *, unsigned int,
48 enum overflow_type *);
49 static tree interpret_float (const cpp_token *, unsigned int, const char *,
50 enum overflow_type *);
51 static tree interpret_fixed (const cpp_token *, unsigned int);
52 static enum integer_type_kind narrowest_unsigned_type
53 (const widest_int &, unsigned int);
54 static enum integer_type_kind narrowest_signed_type
55 (const widest_int &, unsigned int);
56 static enum cpp_ttype lex_string (const cpp_token *, tree *, bool, bool);
57 static tree lex_charconst (const cpp_token *);
58 static void update_header_times (const char *);
59 static int dump_one_header (splay_tree_node, void *);
60 static void cb_line_change (cpp_reader *, const cpp_token *, int);
61 static void cb_ident (cpp_reader *, unsigned int, const cpp_string *);
62 static void cb_def_pragma (cpp_reader *, unsigned int);
63 static void cb_define (cpp_reader *, unsigned int, cpp_hashnode *);
64 static void cb_undef (cpp_reader *, unsigned int, cpp_hashnode *);
66 void
67 init_c_lex (void)
69 struct cpp_callbacks *cb;
70 struct c_fileinfo *toplevel;
72 /* The get_fileinfo data structure must be initialized before
73 cpp_read_main_file is called. */
74 toplevel = get_fileinfo ("<top level>");
75 if (flag_detailed_statistics)
77 header_time = 0;
78 body_time = get_run_time ();
79 toplevel->time = body_time;
82 cb = cpp_get_callbacks (parse_in);
84 cb->line_change = cb_line_change;
85 cb->ident = cb_ident;
86 cb->def_pragma = cb_def_pragma;
87 cb->valid_pch = c_common_valid_pch;
88 cb->read_pch = c_common_read_pch;
90 /* Set the debug callbacks if we can use them. */
91 if ((debug_info_level == DINFO_LEVEL_VERBOSE
92 && (write_symbols == DWARF2_DEBUG
93 || write_symbols == VMS_AND_DWARF2_DEBUG))
94 || flag_dump_go_spec != NULL)
96 cb->define = cb_define;
97 cb->undef = cb_undef;
101 struct c_fileinfo *
102 get_fileinfo (const char *name)
104 splay_tree_node n;
105 struct c_fileinfo *fi;
107 if (!file_info_tree)
108 file_info_tree = splay_tree_new ((splay_tree_compare_fn) strcmp,
110 (splay_tree_delete_value_fn) free);
112 n = splay_tree_lookup (file_info_tree, (splay_tree_key) name);
113 if (n)
114 return (struct c_fileinfo *) n->value;
116 fi = XNEW (struct c_fileinfo);
117 fi->time = 0;
118 fi->interface_only = 0;
119 fi->interface_unknown = 1;
120 splay_tree_insert (file_info_tree, (splay_tree_key) name,
121 (splay_tree_value) fi);
122 return fi;
125 static void
126 update_header_times (const char *name)
128 /* Changing files again. This means currently collected time
129 is charged against header time, and body time starts back at 0. */
130 if (flag_detailed_statistics)
132 int this_time = get_run_time ();
133 struct c_fileinfo *file = get_fileinfo (name);
134 header_time += this_time - body_time;
135 file->time += this_time - body_time;
136 body_time = this_time;
140 static int
141 dump_one_header (splay_tree_node n, void * ARG_UNUSED (dummy))
143 print_time ((const char *) n->key,
144 ((struct c_fileinfo *) n->value)->time);
145 return 0;
148 void
149 dump_time_statistics (void)
151 struct c_fileinfo *file = get_fileinfo (LOCATION_FILE (input_location));
152 int this_time = get_run_time ();
153 file->time += this_time - body_time;
155 fprintf (stderr, "\n******\n");
156 print_time ("header files (total)", header_time);
157 print_time ("main file (total)", this_time - body_time);
158 fprintf (stderr, "ratio = %g : 1\n",
159 (double) header_time / (double) (this_time - body_time));
160 fprintf (stderr, "\n******\n");
162 splay_tree_foreach (file_info_tree, dump_one_header, 0);
165 static void
166 cb_ident (cpp_reader * ARG_UNUSED (pfile),
167 unsigned int ARG_UNUSED (line),
168 const cpp_string * ARG_UNUSED (str))
170 if (!flag_no_ident)
172 /* Convert escapes in the string. */
173 cpp_string cstr = { 0, 0 };
174 if (cpp_interpret_string (pfile, str, 1, &cstr, CPP_STRING))
176 targetm.asm_out.output_ident ((const char *) cstr.text);
177 free (CONST_CAST (unsigned char *, cstr.text));
182 /* Called at the start of every non-empty line. TOKEN is the first
183 lexed token on the line. Used for diagnostic line numbers. */
184 static void
185 cb_line_change (cpp_reader * ARG_UNUSED (pfile), const cpp_token *token,
186 int parsing_args)
188 if (token->type != CPP_EOF && !parsing_args)
189 input_location = token->src_loc;
192 void
193 fe_file_change (const struct line_map *new_map)
195 if (new_map == NULL)
196 return;
198 if (new_map->reason == LC_ENTER)
200 /* Don't stack the main buffer on the input stack;
201 we already did in compile_file. */
202 if (!MAIN_FILE_P (new_map))
204 unsigned int included_at = LAST_SOURCE_LINE_LOCATION (new_map - 1);
205 int line = 0;
206 if (included_at > BUILTINS_LOCATION)
207 line = SOURCE_LINE (new_map - 1, included_at);
209 input_location = new_map->start_location;
210 (*debug_hooks->start_source_file) (line, LINEMAP_FILE (new_map));
211 #ifndef NO_IMPLICIT_EXTERN_C
212 if (c_header_level)
213 ++c_header_level;
214 else if (LINEMAP_SYSP (new_map) == 2)
216 c_header_level = 1;
217 ++pending_lang_change;
219 #endif
222 else if (new_map->reason == LC_LEAVE)
224 #ifndef NO_IMPLICIT_EXTERN_C
225 if (c_header_level && --c_header_level == 0)
227 if (LINEMAP_SYSP (new_map) == 2)
228 warning (0, "badly nested C headers from preprocessor");
229 --pending_lang_change;
231 #endif
232 input_location = new_map->start_location;
234 (*debug_hooks->end_source_file) (LINEMAP_LINE (new_map));
237 update_header_times (LINEMAP_FILE (new_map));
238 input_location = new_map->start_location;
241 static void
242 cb_def_pragma (cpp_reader *pfile, source_location loc)
244 /* Issue a warning message if we have been asked to do so. Ignore
245 unknown pragmas in system headers unless an explicit
246 -Wunknown-pragmas has been given. */
247 if (warn_unknown_pragmas > in_system_header_at (input_location))
249 const unsigned char *space, *name;
250 const cpp_token *s;
251 location_t fe_loc = loc;
253 space = name = (const unsigned char *) "";
254 s = cpp_get_token (pfile);
255 if (s->type != CPP_EOF)
257 space = cpp_token_as_text (pfile, s);
258 s = cpp_get_token (pfile);
259 if (s->type == CPP_NAME)
260 name = cpp_token_as_text (pfile, s);
263 warning_at (fe_loc, OPT_Wunknown_pragmas, "ignoring #pragma %s %s",
264 space, name);
268 /* #define callback for DWARF and DWARF2 debug info. */
269 static void
270 cb_define (cpp_reader *pfile, source_location loc, cpp_hashnode *node)
272 const struct line_map *map = linemap_lookup (line_table, loc);
273 (*debug_hooks->define) (SOURCE_LINE (map, loc),
274 (const char *) cpp_macro_definition (pfile, node));
277 /* #undef callback for DWARF and DWARF2 debug info. */
278 static void
279 cb_undef (cpp_reader * ARG_UNUSED (pfile), source_location loc,
280 cpp_hashnode *node)
282 const struct line_map *map = linemap_lookup (line_table, loc);
283 (*debug_hooks->undef) (SOURCE_LINE (map, loc),
284 (const char *) NODE_NAME (node));
287 /* Read a token and return its type. Fill *VALUE with its value, if
288 applicable. Fill *CPP_FLAGS with the token's flags, if it is
289 non-NULL. */
291 enum cpp_ttype
292 c_lex_with_flags (tree *value, location_t *loc, unsigned char *cpp_flags,
293 int lex_flags)
295 static bool no_more_pch;
296 const cpp_token *tok;
297 enum cpp_ttype type;
298 unsigned char add_flags = 0;
299 enum overflow_type overflow = OT_NONE;
301 timevar_push (TV_CPP);
302 retry:
303 tok = cpp_get_token_with_location (parse_in, loc);
304 type = tok->type;
306 retry_after_at:
307 switch (type)
309 case CPP_PADDING:
310 goto retry;
312 case CPP_NAME:
313 *value = HT_IDENT_TO_GCC_IDENT (HT_NODE (tok->val.node.node));
314 break;
316 case CPP_NUMBER:
318 const char *suffix = NULL;
319 unsigned int flags = cpp_classify_number (parse_in, tok, &suffix, *loc);
321 switch (flags & CPP_N_CATEGORY)
323 case CPP_N_INVALID:
324 /* cpplib has issued an error. */
325 *value = error_mark_node;
326 break;
328 case CPP_N_INTEGER:
329 /* C++ uses '0' to mark virtual functions as pure.
330 Set PURE_ZERO to pass this information to the C++ parser. */
331 if (tok->val.str.len == 1 && *tok->val.str.text == '0')
332 add_flags = PURE_ZERO;
333 *value = interpret_integer (tok, flags, &overflow);
334 break;
336 case CPP_N_FLOATING:
337 *value = interpret_float (tok, flags, suffix, &overflow);
338 break;
340 default:
341 gcc_unreachable ();
344 if (flags & CPP_N_USERDEF)
346 char *str;
347 tree literal;
348 tree suffix_id = get_identifier (suffix);
349 int len = tok->val.str.len - strlen (suffix);
350 /* If this is going to be used as a C string to pass to a
351 raw literal operator, we need to add a trailing NUL. */
352 tree num_string = build_string (len + 1,
353 (const char *) tok->val.str.text);
354 TREE_TYPE (num_string) = char_array_type_node;
355 num_string = fix_string_type (num_string);
356 str = CONST_CAST (char *, TREE_STRING_POINTER (num_string));
357 str[len] = '\0';
358 literal = build_userdef_literal (suffix_id, *value, overflow,
359 num_string);
360 *value = literal;
363 break;
365 case CPP_ATSIGN:
366 /* An @ may give the next token special significance in Objective-C. */
367 if (c_dialect_objc ())
369 location_t atloc = *loc;
370 location_t newloc;
372 retry_at:
373 tok = cpp_get_token_with_location (parse_in, &newloc);
374 type = tok->type;
375 switch (type)
377 case CPP_PADDING:
378 goto retry_at;
380 case CPP_STRING:
381 case CPP_WSTRING:
382 case CPP_STRING16:
383 case CPP_STRING32:
384 case CPP_UTF8STRING:
385 type = lex_string (tok, value, true, true);
386 break;
388 case CPP_NAME:
389 *value = HT_IDENT_TO_GCC_IDENT (HT_NODE (tok->val.node.node));
390 if (OBJC_IS_AT_KEYWORD (C_RID_CODE (*value))
391 || OBJC_IS_CXX_KEYWORD (C_RID_CODE (*value)))
393 type = CPP_AT_NAME;
394 /* Note the complication: if we found an OBJC_CXX
395 keyword, for example, 'class', we will be
396 returning a token of type CPP_AT_NAME and rid
397 code RID_CLASS (not RID_AT_CLASS). The language
398 parser needs to convert that to RID_AT_CLASS.
400 break;
402 /* FALLTHROUGH */
404 default:
405 /* ... or not. */
406 error_at (atloc, "stray %<@%> in program");
407 *loc = newloc;
408 goto retry_after_at;
410 break;
413 /* FALLTHROUGH */
414 case CPP_HASH:
415 case CPP_PASTE:
417 unsigned char name[8];
419 *cpp_spell_token (parse_in, tok, name, true) = 0;
421 error_at (*loc, "stray %qs in program", name);
424 goto retry;
426 case CPP_OTHER:
428 cppchar_t c = tok->val.str.text[0];
430 if (c == '"' || c == '\'')
431 error ("missing terminating %c character", (int) c);
432 else if (ISGRAPH (c))
433 error ("stray %qc in program", (int) c);
434 else
435 error ("stray %<\\%o%> in program", (int) c);
437 goto retry;
439 case CPP_CHAR_USERDEF:
440 case CPP_WCHAR_USERDEF:
441 case CPP_CHAR16_USERDEF:
442 case CPP_CHAR32_USERDEF:
444 tree literal;
445 cpp_token temp_tok = *tok;
446 const char *suffix = cpp_get_userdef_suffix (tok);
447 temp_tok.val.str.len -= strlen (suffix);
448 temp_tok.type = cpp_userdef_char_remove_type (type);
449 literal = build_userdef_literal (get_identifier (suffix),
450 lex_charconst (&temp_tok),
451 OT_NONE, NULL_TREE);
452 *value = literal;
454 break;
456 case CPP_CHAR:
457 case CPP_WCHAR:
458 case CPP_CHAR16:
459 case CPP_CHAR32:
460 *value = lex_charconst (tok);
461 break;
463 case CPP_STRING_USERDEF:
464 case CPP_WSTRING_USERDEF:
465 case CPP_STRING16_USERDEF:
466 case CPP_STRING32_USERDEF:
467 case CPP_UTF8STRING_USERDEF:
469 tree literal, string;
470 const char *suffix = cpp_get_userdef_suffix (tok);
471 string = build_string (tok->val.str.len - strlen (suffix),
472 (const char *) tok->val.str.text);
473 literal = build_userdef_literal (get_identifier (suffix),
474 string, OT_NONE, NULL_TREE);
475 *value = literal;
477 break;
479 case CPP_STRING:
480 case CPP_WSTRING:
481 case CPP_STRING16:
482 case CPP_STRING32:
483 case CPP_UTF8STRING:
484 if ((lex_flags & C_LEX_STRING_NO_JOIN) == 0)
486 type = lex_string (tok, value, false,
487 (lex_flags & C_LEX_STRING_NO_TRANSLATE) == 0);
488 break;
490 *value = build_string (tok->val.str.len, (const char *) tok->val.str.text);
491 break;
493 case CPP_PRAGMA:
494 *value = build_int_cst (integer_type_node, tok->val.pragma);
495 break;
497 /* These tokens should not be visible outside cpplib. */
498 case CPP_HEADER_NAME:
499 case CPP_MACRO_ARG:
500 gcc_unreachable ();
502 /* CPP_COMMENT will appear when compiling with -C and should be
503 ignored. */
504 case CPP_COMMENT:
505 goto retry;
507 default:
508 *value = NULL_TREE;
509 break;
512 if (cpp_flags)
513 *cpp_flags = tok->flags | add_flags;
515 if (!no_more_pch)
517 no_more_pch = true;
518 c_common_no_more_pch ();
521 timevar_pop (TV_CPP);
523 return type;
526 /* Returns the narrowest C-visible unsigned type, starting with the
527 minimum specified by FLAGS, that can fit HIGH:LOW, or itk_none if
528 there isn't one. */
530 static enum integer_type_kind
531 narrowest_unsigned_type (const widest_int &val, unsigned int flags)
533 int itk;
535 if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
536 itk = itk_unsigned_int;
537 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
538 itk = itk_unsigned_long;
539 else
540 itk = itk_unsigned_long_long;
542 for (; itk < itk_none; itk += 2 /* skip unsigned types */)
544 tree upper;
546 if (integer_types[itk] == NULL_TREE)
547 continue;
548 upper = TYPE_MAX_VALUE (integer_types[itk]);
550 if (wi::geu_p (wi::to_widest (upper), val))
551 return (enum integer_type_kind) itk;
554 return itk_none;
557 /* Ditto, but narrowest signed type. */
558 static enum integer_type_kind
559 narrowest_signed_type (const widest_int &val, unsigned int flags)
561 int itk;
563 if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
564 itk = itk_int;
565 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
566 itk = itk_long;
567 else
568 itk = itk_long_long;
570 for (; itk < itk_none; itk += 2 /* skip signed types */)
572 tree upper;
574 if (integer_types[itk] == NULL_TREE)
575 continue;
576 upper = TYPE_MAX_VALUE (integer_types[itk]);
578 if (wi::geu_p (wi::to_widest (upper), val))
579 return (enum integer_type_kind) itk;
582 return itk_none;
585 /* Interpret TOKEN, an integer with FLAGS as classified by cpplib. */
586 static tree
587 interpret_integer (const cpp_token *token, unsigned int flags,
588 enum overflow_type *overflow)
590 tree value, type;
591 enum integer_type_kind itk;
592 cpp_num integer;
593 HOST_WIDE_INT ival[3];
595 *overflow = OT_NONE;
597 integer = cpp_interpret_integer (parse_in, token, flags);
598 if (integer.overflow)
599 *overflow = OT_OVERFLOW;
601 ival[0] = integer.low;
602 ival[1] = integer.high;
603 ival[2] = 0;
604 widest_int wval = widest_int::from_array (ival, 3);
606 /* The type of a constant with a U suffix is straightforward. */
607 if (flags & CPP_N_UNSIGNED)
608 itk = narrowest_unsigned_type (wval, flags);
609 else
611 /* The type of a potentially-signed integer constant varies
612 depending on the base it's in, the standard in use, and the
613 length suffixes. */
614 enum integer_type_kind itk_u
615 = narrowest_unsigned_type (wval, flags);
616 enum integer_type_kind itk_s
617 = narrowest_signed_type (wval, flags);
619 /* In both C89 and C99, octal and hex constants may be signed or
620 unsigned, whichever fits tighter. We do not warn about this
621 choice differing from the traditional choice, as the constant
622 is probably a bit pattern and either way will work. */
623 if ((flags & CPP_N_RADIX) != CPP_N_DECIMAL)
624 itk = MIN (itk_u, itk_s);
625 else
627 /* In C99, decimal constants are always signed.
628 In C89, decimal constants that don't fit in long have
629 undefined behavior; we try to make them unsigned long.
630 In GCC's extended C89, that last is true of decimal
631 constants that don't fit in long long, too. */
633 itk = itk_s;
634 if (itk_s > itk_u && itk_s > itk_long)
636 if (!flag_isoc99)
638 if (itk_u < itk_unsigned_long)
639 itk_u = itk_unsigned_long;
640 itk = itk_u;
641 warning (0, "this decimal constant is unsigned only in ISO C90");
643 else
644 warning (OPT_Wtraditional,
645 "this decimal constant would be unsigned in ISO C90");
650 if (itk == itk_none)
651 /* cpplib has already issued a warning for overflow. */
652 type = ((flags & CPP_N_UNSIGNED)
653 ? widest_unsigned_literal_type_node
654 : widest_integer_literal_type_node);
655 else
657 type = integer_types[itk];
658 if (itk > itk_unsigned_long
659 && (flags & CPP_N_WIDTH) != CPP_N_LARGE)
660 emit_diagnostic
661 ((c_dialect_cxx () ? cxx_dialect == cxx98 : !flag_isoc99)
662 ? DK_PEDWARN : DK_WARNING,
663 input_location, OPT_Wlong_long,
664 (flags & CPP_N_UNSIGNED)
665 ? "integer constant is too large for %<unsigned long%> type"
666 : "integer constant is too large for %<long%> type");
669 value = wide_int_to_tree (type, wval);
671 /* Convert imaginary to a complex type. */
672 if (flags & CPP_N_IMAGINARY)
673 value = build_complex (NULL_TREE, build_int_cst (type, 0), value);
675 return value;
678 /* Interpret TOKEN, a floating point number with FLAGS as classified
679 by cpplib. For C++0X SUFFIX may contain a user-defined literal suffix. */
680 static tree
681 interpret_float (const cpp_token *token, unsigned int flags,
682 const char *suffix, enum overflow_type *overflow)
684 tree type;
685 tree const_type;
686 tree value;
687 REAL_VALUE_TYPE real;
688 REAL_VALUE_TYPE real_trunc;
689 char *copy;
690 size_t copylen;
692 *overflow = OT_NONE;
694 /* Default (no suffix) depends on whether the FLOAT_CONST_DECIMAL64
695 pragma has been used and is either double or _Decimal64. Types
696 that are not allowed with decimal float default to double. */
697 if (flags & CPP_N_DEFAULT)
699 flags ^= CPP_N_DEFAULT;
700 flags |= CPP_N_MEDIUM;
702 if (((flags & CPP_N_HEX) == 0) && ((flags & CPP_N_IMAGINARY) == 0))
704 warning (OPT_Wunsuffixed_float_constants,
705 "unsuffixed float constant");
706 if (float_const_decimal64_p ())
707 flags |= CPP_N_DFLOAT;
711 /* Decode _Fract and _Accum. */
712 if (flags & CPP_N_FRACT || flags & CPP_N_ACCUM)
713 return interpret_fixed (token, flags);
715 /* Decode type based on width and properties. */
716 if (flags & CPP_N_DFLOAT)
717 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
718 type = dfloat128_type_node;
719 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
720 type = dfloat32_type_node;
721 else
722 type = dfloat64_type_node;
723 else
724 if (flags & CPP_N_WIDTH_MD)
726 char suffix;
727 enum machine_mode mode;
729 if ((flags & CPP_N_WIDTH_MD) == CPP_N_MD_W)
730 suffix = 'w';
731 else
732 suffix = 'q';
734 mode = targetm.c.mode_for_suffix (suffix);
735 if (mode == VOIDmode)
737 error ("unsupported non-standard suffix on floating constant");
739 return error_mark_node;
741 else
742 pedwarn (input_location, OPT_Wpedantic, "non-standard suffix on floating constant");
744 type = c_common_type_for_mode (mode, 0);
745 gcc_assert (type);
747 else if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
748 type = long_double_type_node;
749 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL
750 || flag_single_precision_constant)
751 type = float_type_node;
752 else
753 type = double_type_node;
755 const_type = excess_precision_type (type);
756 if (!const_type)
757 const_type = type;
759 /* Copy the constant to a nul-terminated buffer. If the constant
760 has any suffixes, cut them off; REAL_VALUE_ATOF/ REAL_VALUE_HTOF
761 can't handle them. */
762 copylen = token->val.str.len;
763 if (flags & CPP_N_USERDEF)
764 copylen -= strlen (suffix);
765 else if (flags & CPP_N_DFLOAT)
766 copylen -= 2;
767 else
769 if ((flags & CPP_N_WIDTH) != CPP_N_MEDIUM)
770 /* Must be an F or L or machine defined suffix. */
771 copylen--;
772 if (flags & CPP_N_IMAGINARY)
773 /* I or J suffix. */
774 copylen--;
777 copy = (char *) alloca (copylen + 1);
778 if (cxx_dialect > cxx11)
780 size_t maxlen = 0;
781 for (size_t i = 0; i < copylen; ++i)
782 if (token->val.str.text[i] != '\'')
783 copy[maxlen++] = token->val.str.text[i];
784 copy[maxlen] = '\0';
786 else
788 memcpy (copy, token->val.str.text, copylen);
789 copy[copylen] = '\0';
792 real_from_string3 (&real, copy, TYPE_MODE (const_type));
793 if (const_type != type)
794 /* Diagnosing if the result of converting the value with excess
795 precision to the semantic type would overflow (with associated
796 double rounding) is more appropriate than diagnosing if the
797 result of converting the string directly to the semantic type
798 would overflow. */
799 real_convert (&real_trunc, TYPE_MODE (type), &real);
801 /* Both C and C++ require a diagnostic for a floating constant
802 outside the range of representable values of its type. Since we
803 have __builtin_inf* to produce an infinity, this is now a
804 mandatory pedwarn if the target does not support infinities. */
805 if (REAL_VALUE_ISINF (real)
806 || (const_type != type && REAL_VALUE_ISINF (real_trunc)))
808 *overflow = OT_OVERFLOW;
809 if (!(flags & CPP_N_USERDEF))
811 if (!MODE_HAS_INFINITIES (TYPE_MODE (type)))
812 pedwarn (input_location, 0,
813 "floating constant exceeds range of %qT", type);
814 else
815 warning (OPT_Woverflow,
816 "floating constant exceeds range of %qT", type);
819 /* We also give a warning if the value underflows. */
820 else if (REAL_VALUES_EQUAL (real, dconst0)
821 || (const_type != type
822 && REAL_VALUES_EQUAL (real_trunc, dconst0)))
824 REAL_VALUE_TYPE realvoidmode;
825 int oflow = real_from_string (&realvoidmode, copy);
826 *overflow = (oflow == 0 ? OT_NONE
827 : (oflow < 0 ? OT_UNDERFLOW : OT_OVERFLOW));
828 if (!(flags & CPP_N_USERDEF))
830 if (oflow < 0 || !REAL_VALUES_EQUAL (realvoidmode, dconst0))
831 warning (OPT_Woverflow, "floating constant truncated to zero");
835 /* Create a node with determined type and value. */
836 value = build_real (const_type, real);
837 if (flags & CPP_N_IMAGINARY)
839 value = build_complex (NULL_TREE, convert (const_type,
840 integer_zero_node), value);
841 if (type != const_type)
843 const_type = TREE_TYPE (value);
844 type = build_complex_type (type);
848 if (type != const_type)
849 value = build1 (EXCESS_PRECISION_EXPR, type, value);
851 return value;
854 /* Interpret TOKEN, a fixed-point number with FLAGS as classified
855 by cpplib. */
857 static tree
858 interpret_fixed (const cpp_token *token, unsigned int flags)
860 tree type;
861 tree value;
862 FIXED_VALUE_TYPE fixed;
863 char *copy;
864 size_t copylen;
866 copylen = token->val.str.len;
868 if (flags & CPP_N_FRACT) /* _Fract. */
870 if (flags & CPP_N_UNSIGNED) /* Unsigned _Fract. */
872 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
874 type = unsigned_long_long_fract_type_node;
875 copylen -= 4;
877 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
879 type = unsigned_long_fract_type_node;
880 copylen -= 3;
882 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
884 type = unsigned_short_fract_type_node;
885 copylen -= 3;
887 else
889 type = unsigned_fract_type_node;
890 copylen -= 2;
893 else /* Signed _Fract. */
895 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
897 type = long_long_fract_type_node;
898 copylen -= 3;
900 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
902 type = long_fract_type_node;
903 copylen -= 2;
905 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
907 type = short_fract_type_node;
908 copylen -= 2;
910 else
912 type = fract_type_node;
913 copylen --;
917 else /* _Accum. */
919 if (flags & CPP_N_UNSIGNED) /* Unsigned _Accum. */
921 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
923 type = unsigned_long_long_accum_type_node;
924 copylen -= 4;
926 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
928 type = unsigned_long_accum_type_node;
929 copylen -= 3;
931 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
933 type = unsigned_short_accum_type_node;
934 copylen -= 3;
936 else
938 type = unsigned_accum_type_node;
939 copylen -= 2;
942 else /* Signed _Accum. */
944 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
946 type = long_long_accum_type_node;
947 copylen -= 3;
949 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
951 type = long_accum_type_node;
952 copylen -= 2;
954 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
956 type = short_accum_type_node;
957 copylen -= 2;
959 else
961 type = accum_type_node;
962 copylen --;
967 copy = (char *) alloca (copylen + 1);
968 memcpy (copy, token->val.str.text, copylen);
969 copy[copylen] = '\0';
971 fixed_from_string (&fixed, copy, TYPE_MODE (type));
973 /* Create a node with determined type and value. */
974 value = build_fixed (type, fixed);
976 return value;
979 /* Convert a series of STRING, WSTRING, STRING16, STRING32 and/or
980 UTF8STRING tokens into a tree, performing string constant
981 concatenation. TOK is the first of these. VALP is the location to
982 write the string into. OBJC_STRING indicates whether an '@' token
983 preceded the incoming token (in that case, the strings can either
984 be ObjC strings, preceded by a single '@', or normal strings, not
985 preceded by '@'. The result will be a CPP_OBJC_STRING). Returns
986 the CPP token type of the result (CPP_STRING, CPP_WSTRING,
987 CPP_STRING32, CPP_STRING16, CPP_UTF8STRING, or CPP_OBJC_STRING).
989 This is unfortunately more work than it should be. If any of the
990 strings in the series has an L prefix, the result is a wide string
991 (6.4.5p4). Whether or not the result is a wide string affects the
992 meaning of octal and hexadecimal escapes (6.4.4.4p6,9). But escape
993 sequences do not continue across the boundary between two strings in
994 a series (6.4.5p7), so we must not lose the boundaries. Therefore
995 cpp_interpret_string takes a vector of cpp_string structures, which
996 we must arrange to provide. */
998 static enum cpp_ttype
999 lex_string (const cpp_token *tok, tree *valp, bool objc_string, bool translate)
1001 tree value;
1002 size_t concats = 0;
1003 struct obstack str_ob;
1004 cpp_string istr;
1005 enum cpp_ttype type = tok->type;
1007 /* Try to avoid the overhead of creating and destroying an obstack
1008 for the common case of just one string. */
1009 cpp_string str = tok->val.str;
1010 cpp_string *strs = &str;
1012 /* objc_at_sign_was_seen is only used when doing Objective-C string
1013 concatenation. It is 'true' if we have seen an '@' before the
1014 current string, and 'false' if not. We must see exactly one or
1015 zero '@' before each string. */
1016 bool objc_at_sign_was_seen = false;
1018 retry:
1019 tok = cpp_get_token (parse_in);
1020 switch (tok->type)
1022 case CPP_PADDING:
1023 goto retry;
1024 case CPP_ATSIGN:
1025 if (objc_string)
1027 if (objc_at_sign_was_seen)
1028 error ("repeated %<@%> before Objective-C string");
1030 objc_at_sign_was_seen = true;
1031 goto retry;
1033 /* FALLTHROUGH */
1035 default:
1036 break;
1038 case CPP_WSTRING:
1039 case CPP_STRING16:
1040 case CPP_STRING32:
1041 case CPP_UTF8STRING:
1042 if (type != tok->type)
1044 if (type == CPP_STRING)
1045 type = tok->type;
1046 else
1047 error ("unsupported non-standard concatenation of string literals");
1050 case CPP_STRING:
1051 if (!concats)
1053 gcc_obstack_init (&str_ob);
1054 obstack_grow (&str_ob, &str, sizeof (cpp_string));
1057 concats++;
1058 obstack_grow (&str_ob, &tok->val.str, sizeof (cpp_string));
1059 if (objc_string)
1060 objc_at_sign_was_seen = false;
1061 goto retry;
1064 /* It is an error if we saw a '@' with no following string. */
1065 if (objc_at_sign_was_seen)
1066 error ("stray %<@%> in program");
1068 /* We have read one more token than we want. */
1069 _cpp_backup_tokens (parse_in, 1);
1070 if (concats)
1071 strs = XOBFINISH (&str_ob, cpp_string *);
1073 if (concats && !objc_string && !in_system_header_at (input_location))
1074 warning (OPT_Wtraditional,
1075 "traditional C rejects string constant concatenation");
1077 if ((translate
1078 ? cpp_interpret_string : cpp_interpret_string_notranslate)
1079 (parse_in, strs, concats + 1, &istr, type))
1081 value = build_string (istr.len, (const char *) istr.text);
1082 free (CONST_CAST (unsigned char *, istr.text));
1084 else
1086 /* Callers cannot generally handle error_mark_node in this context,
1087 so return the empty string instead. cpp_interpret_string has
1088 issued an error. */
1089 switch (type)
1091 default:
1092 case CPP_STRING:
1093 case CPP_UTF8STRING:
1094 value = build_string (1, "");
1095 break;
1096 case CPP_STRING16:
1097 value = build_string (TYPE_PRECISION (char16_type_node)
1098 / TYPE_PRECISION (char_type_node),
1099 "\0"); /* char16_t is 16 bits */
1100 break;
1101 case CPP_STRING32:
1102 value = build_string (TYPE_PRECISION (char32_type_node)
1103 / TYPE_PRECISION (char_type_node),
1104 "\0\0\0"); /* char32_t is 32 bits */
1105 break;
1106 case CPP_WSTRING:
1107 value = build_string (TYPE_PRECISION (wchar_type_node)
1108 / TYPE_PRECISION (char_type_node),
1109 "\0\0\0"); /* widest supported wchar_t
1110 is 32 bits */
1111 break;
1115 switch (type)
1117 default:
1118 case CPP_STRING:
1119 case CPP_UTF8STRING:
1120 TREE_TYPE (value) = char_array_type_node;
1121 break;
1122 case CPP_STRING16:
1123 TREE_TYPE (value) = char16_array_type_node;
1124 break;
1125 case CPP_STRING32:
1126 TREE_TYPE (value) = char32_array_type_node;
1127 break;
1128 case CPP_WSTRING:
1129 TREE_TYPE (value) = wchar_array_type_node;
1131 *valp = fix_string_type (value);
1133 if (concats)
1134 obstack_free (&str_ob, 0);
1136 return objc_string ? CPP_OBJC_STRING : type;
1139 /* Converts a (possibly wide) character constant token into a tree. */
1140 static tree
1141 lex_charconst (const cpp_token *token)
1143 cppchar_t result;
1144 tree type, value;
1145 unsigned int chars_seen;
1146 int unsignedp = 0;
1148 result = cpp_interpret_charconst (parse_in, token,
1149 &chars_seen, &unsignedp);
1151 if (token->type == CPP_WCHAR)
1152 type = wchar_type_node;
1153 else if (token->type == CPP_CHAR32)
1154 type = char32_type_node;
1155 else if (token->type == CPP_CHAR16)
1156 type = char16_type_node;
1157 /* In C, a character constant has type 'int'.
1158 In C++ 'char', but multi-char charconsts have type 'int'. */
1159 else if (!c_dialect_cxx () || chars_seen > 1)
1160 type = integer_type_node;
1161 else
1162 type = char_type_node;
1164 /* Cast to cppchar_signed_t to get correct sign-extension of RESULT
1165 before possibly widening to HOST_WIDE_INT for build_int_cst. */
1166 if (unsignedp || (cppchar_signed_t) result >= 0)
1167 value = build_int_cst (type, result);
1168 else
1169 value = build_int_cst (type, (cppchar_signed_t) result);
1171 return value;