2010-05-28 Segher Boessenkool <segher@kernel.crashing.org>
[official-gcc.git] / gcc / c-lex.c
blob5d77e093fb80e334e63c0cf5771d7dbbea535b09
1 /* Mainly the interface between cpplib and the C front ends.
2 Copyright (C) 1987, 1988, 1989, 1992, 1994, 1995, 1996, 1997
3 1998, 1999, 2000, 2001, 2002, 2003, 2004, 2005, 2007, 2008, 2009, 2010
4 Free Software Foundation, Inc.
6 This file is part of GCC.
8 GCC is free software; you can redistribute it and/or modify it under
9 the terms of the GNU General Public License as published by the Free
10 Software Foundation; either version 3, or (at your option) any later
11 version.
13 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
14 WARRANTY; without even the implied warranty of MERCHANTABILITY or
15 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
16 for more details.
18 You should have received a copy of the GNU General Public License
19 along with GCC; see the file COPYING3. If not see
20 <http://www.gnu.org/licenses/>. */
22 #include "config.h"
23 #include "system.h"
24 #include "coretypes.h"
25 #include "tm.h"
27 #include "tree.h"
28 #include "input.h"
29 #include "output.h"
30 #include "c-tree.h"
31 #include "c-common.h"
32 #include "flags.h"
33 #include "timevar.h"
34 #include "cpplib.h"
35 #include "c-pragma.h"
36 #include "toplev.h"
37 #include "intl.h"
38 #include "splay-tree.h"
39 #include "debug.h"
40 #include "target.h"
42 /* We may keep statistics about how long which files took to compile. */
43 static int header_time, body_time;
44 static splay_tree file_info_tree;
46 int pending_lang_change; /* If we need to switch languages - C++ only */
47 int c_header_level; /* depth in C headers - C++ only */
49 static tree interpret_integer (const cpp_token *, unsigned int);
50 static tree interpret_float (const cpp_token *, unsigned int);
51 static tree interpret_fixed (const cpp_token *, unsigned int);
52 static enum integer_type_kind narrowest_unsigned_type
53 (unsigned HOST_WIDE_INT, unsigned HOST_WIDE_INT, unsigned int);
54 static enum integer_type_kind narrowest_signed_type
55 (unsigned HOST_WIDE_INT, unsigned HOST_WIDE_INT, unsigned int);
56 static enum cpp_ttype lex_string (const cpp_token *, tree *, bool, bool);
57 static tree lex_charconst (const cpp_token *);
58 static void update_header_times (const char *);
59 static int dump_one_header (splay_tree_node, void *);
60 static void cb_line_change (cpp_reader *, const cpp_token *, int);
61 static void cb_ident (cpp_reader *, unsigned int, const cpp_string *);
62 static void cb_def_pragma (cpp_reader *, unsigned int);
63 static void cb_define (cpp_reader *, unsigned int, cpp_hashnode *);
64 static void cb_undef (cpp_reader *, unsigned int, cpp_hashnode *);
66 void
67 init_c_lex (void)
69 struct cpp_callbacks *cb;
70 struct c_fileinfo *toplevel;
72 /* The get_fileinfo data structure must be initialized before
73 cpp_read_main_file is called. */
74 toplevel = get_fileinfo ("<top level>");
75 if (flag_detailed_statistics)
77 header_time = 0;
78 body_time = get_run_time ();
79 toplevel->time = body_time;
82 cb = cpp_get_callbacks (parse_in);
84 cb->line_change = cb_line_change;
85 cb->ident = cb_ident;
86 cb->def_pragma = cb_def_pragma;
87 cb->valid_pch = c_common_valid_pch;
88 cb->read_pch = c_common_read_pch;
90 /* Set the debug callbacks if we can use them. */
91 if (debug_info_level == DINFO_LEVEL_VERBOSE
92 && (write_symbols == DWARF2_DEBUG
93 || write_symbols == VMS_AND_DWARF2_DEBUG))
95 cb->define = cb_define;
96 cb->undef = cb_undef;
100 struct c_fileinfo *
101 get_fileinfo (const char *name)
103 splay_tree_node n;
104 struct c_fileinfo *fi;
106 if (!file_info_tree)
107 file_info_tree = splay_tree_new ((splay_tree_compare_fn) strcmp,
109 (splay_tree_delete_value_fn) free);
111 n = splay_tree_lookup (file_info_tree, (splay_tree_key) name);
112 if (n)
113 return (struct c_fileinfo *) n->value;
115 fi = XNEW (struct c_fileinfo);
116 fi->time = 0;
117 fi->interface_only = 0;
118 fi->interface_unknown = 1;
119 splay_tree_insert (file_info_tree, (splay_tree_key) name,
120 (splay_tree_value) fi);
121 return fi;
124 static void
125 update_header_times (const char *name)
127 /* Changing files again. This means currently collected time
128 is charged against header time, and body time starts back at 0. */
129 if (flag_detailed_statistics)
131 int this_time = get_run_time ();
132 struct c_fileinfo *file = get_fileinfo (name);
133 header_time += this_time - body_time;
134 file->time += this_time - body_time;
135 body_time = this_time;
139 static int
140 dump_one_header (splay_tree_node n, void * ARG_UNUSED (dummy))
142 print_time ((const char *) n->key,
143 ((struct c_fileinfo *) n->value)->time);
144 return 0;
147 void
148 dump_time_statistics (void)
150 struct c_fileinfo *file = get_fileinfo (input_filename);
151 int this_time = get_run_time ();
152 file->time += this_time - body_time;
154 fprintf (stderr, "\n******\n");
155 print_time ("header files (total)", header_time);
156 print_time ("main file (total)", this_time - body_time);
157 fprintf (stderr, "ratio = %g : 1\n",
158 (double) header_time / (double) (this_time - body_time));
159 fprintf (stderr, "\n******\n");
161 splay_tree_foreach (file_info_tree, dump_one_header, 0);
164 static void
165 cb_ident (cpp_reader * ARG_UNUSED (pfile),
166 unsigned int ARG_UNUSED (line),
167 const cpp_string * ARG_UNUSED (str))
169 #ifdef ASM_OUTPUT_IDENT
170 if (!flag_no_ident)
172 /* Convert escapes in the string. */
173 cpp_string cstr = { 0, 0 };
174 if (cpp_interpret_string (pfile, str, 1, &cstr, CPP_STRING))
176 ASM_OUTPUT_IDENT (asm_out_file, (const char *) cstr.text);
177 free (CONST_CAST (unsigned char *, cstr.text));
180 #endif
183 /* Called at the start of every non-empty line. TOKEN is the first
184 lexed token on the line. Used for diagnostic line numbers. */
185 static void
186 cb_line_change (cpp_reader * ARG_UNUSED (pfile), const cpp_token *token,
187 int parsing_args)
189 if (token->type != CPP_EOF && !parsing_args)
190 input_location = token->src_loc;
193 void
194 fe_file_change (const struct line_map *new_map)
196 if (new_map == NULL)
197 return;
199 if (new_map->reason == LC_ENTER)
201 /* Don't stack the main buffer on the input stack;
202 we already did in compile_file. */
203 if (!MAIN_FILE_P (new_map))
205 unsigned int included_at = LAST_SOURCE_LINE_LOCATION (new_map - 1);
206 int line = 0;
207 if (included_at > BUILTINS_LOCATION)
208 line = SOURCE_LINE (new_map - 1, included_at);
210 input_location = new_map->start_location;
211 (*debug_hooks->start_source_file) (line, new_map->to_file);
212 #ifndef NO_IMPLICIT_EXTERN_C
213 if (c_header_level)
214 ++c_header_level;
215 else if (new_map->sysp == 2)
217 c_header_level = 1;
218 ++pending_lang_change;
220 #endif
223 else if (new_map->reason == LC_LEAVE)
225 #ifndef NO_IMPLICIT_EXTERN_C
226 if (c_header_level && --c_header_level == 0)
228 if (new_map->sysp == 2)
229 warning (0, "badly nested C headers from preprocessor");
230 --pending_lang_change;
232 #endif
233 input_location = new_map->start_location;
235 (*debug_hooks->end_source_file) (new_map->to_line);
238 update_header_times (new_map->to_file);
239 input_location = new_map->start_location;
242 static void
243 cb_def_pragma (cpp_reader *pfile, source_location loc)
245 /* Issue a warning message if we have been asked to do so. Ignore
246 unknown pragmas in system headers unless an explicit
247 -Wunknown-pragmas has been given. */
248 if (warn_unknown_pragmas > in_system_header)
250 const unsigned char *space, *name;
251 const cpp_token *s;
252 location_t fe_loc = loc;
254 space = name = (const unsigned char *) "";
255 s = cpp_get_token (pfile);
256 if (s->type != CPP_EOF)
258 space = cpp_token_as_text (pfile, s);
259 s = cpp_get_token (pfile);
260 if (s->type == CPP_NAME)
261 name = cpp_token_as_text (pfile, s);
264 warning_at (fe_loc, OPT_Wunknown_pragmas, "ignoring #pragma %s %s",
265 space, name);
269 /* #define callback for DWARF and DWARF2 debug info. */
270 static void
271 cb_define (cpp_reader *pfile, source_location loc, cpp_hashnode *node)
273 const struct line_map *map = linemap_lookup (line_table, loc);
274 (*debug_hooks->define) (SOURCE_LINE (map, loc),
275 (const char *) cpp_macro_definition (pfile, node));
278 /* #undef callback for DWARF and DWARF2 debug info. */
279 static void
280 cb_undef (cpp_reader * ARG_UNUSED (pfile), source_location loc,
281 cpp_hashnode *node)
283 const struct line_map *map = linemap_lookup (line_table, loc);
284 (*debug_hooks->undef) (SOURCE_LINE (map, loc),
285 (const char *) NODE_NAME (node));
288 /* Read a token and return its type. Fill *VALUE with its value, if
289 applicable. Fill *CPP_FLAGS with the token's flags, if it is
290 non-NULL. */
292 enum cpp_ttype
293 c_lex_with_flags (tree *value, location_t *loc, unsigned char *cpp_flags,
294 int lex_flags)
296 static bool no_more_pch;
297 const cpp_token *tok;
298 enum cpp_ttype type;
299 unsigned char add_flags = 0;
301 timevar_push (TV_CPP);
302 retry:
303 tok = cpp_get_token_with_location (parse_in, loc);
304 type = tok->type;
306 retry_after_at:
307 switch (type)
309 case CPP_PADDING:
310 goto retry;
312 case CPP_NAME:
313 *value = HT_IDENT_TO_GCC_IDENT (HT_NODE (tok->val.node.node));
314 break;
316 case CPP_NUMBER:
318 unsigned int flags = cpp_classify_number (parse_in, tok);
320 switch (flags & CPP_N_CATEGORY)
322 case CPP_N_INVALID:
323 /* cpplib has issued an error. */
324 *value = error_mark_node;
325 break;
327 case CPP_N_INTEGER:
328 /* C++ uses '0' to mark virtual functions as pure.
329 Set PURE_ZERO to pass this information to the C++ parser. */
330 if (tok->val.str.len == 1 && *tok->val.str.text == '0')
331 add_flags = PURE_ZERO;
332 *value = interpret_integer (tok, flags);
333 break;
335 case CPP_N_FLOATING:
336 *value = interpret_float (tok, flags);
337 break;
339 default:
340 gcc_unreachable ();
343 break;
345 case CPP_ATSIGN:
346 /* An @ may give the next token special significance in Objective-C. */
347 if (c_dialect_objc ())
349 location_t atloc = *loc;
350 location_t newloc;
352 retry_at:
353 tok = cpp_get_token_with_location (parse_in, &newloc);
354 type = tok->type;
355 switch (type)
357 case CPP_PADDING:
358 goto retry_at;
360 case CPP_STRING:
361 case CPP_WSTRING:
362 case CPP_STRING16:
363 case CPP_STRING32:
364 case CPP_UTF8STRING:
365 type = lex_string (tok, value, true, true);
366 break;
368 case CPP_NAME:
369 *value = HT_IDENT_TO_GCC_IDENT (HT_NODE (tok->val.node.node));
370 if (objc_is_reserved_word (*value))
372 type = CPP_AT_NAME;
373 break;
375 /* FALLTHROUGH */
377 default:
378 /* ... or not. */
379 error_at (atloc, "stray %<@%> in program");
380 *loc = newloc;
381 goto retry_after_at;
383 break;
386 /* FALLTHROUGH */
387 case CPP_HASH:
388 case CPP_PASTE:
390 unsigned char name[8];
392 *cpp_spell_token (parse_in, tok, name, true) = 0;
394 error ("stray %qs in program", name);
397 goto retry;
399 case CPP_OTHER:
401 cppchar_t c = tok->val.str.text[0];
403 if (c == '"' || c == '\'')
404 error ("missing terminating %c character", (int) c);
405 else if (ISGRAPH (c))
406 error ("stray %qc in program", (int) c);
407 else
408 error ("stray %<\\%o%> in program", (int) c);
410 goto retry;
412 case CPP_CHAR:
413 case CPP_WCHAR:
414 case CPP_CHAR16:
415 case CPP_CHAR32:
416 *value = lex_charconst (tok);
417 break;
419 case CPP_STRING:
420 case CPP_WSTRING:
421 case CPP_STRING16:
422 case CPP_STRING32:
423 case CPP_UTF8STRING:
424 if ((lex_flags & C_LEX_STRING_NO_JOIN) == 0)
426 type = lex_string (tok, value, false,
427 (lex_flags & C_LEX_STRING_NO_TRANSLATE) == 0);
428 break;
430 *value = build_string (tok->val.str.len, (const char *) tok->val.str.text);
431 break;
433 case CPP_PRAGMA:
434 *value = build_int_cst (NULL, tok->val.pragma);
435 break;
437 /* These tokens should not be visible outside cpplib. */
438 case CPP_HEADER_NAME:
439 case CPP_COMMENT:
440 case CPP_MACRO_ARG:
441 gcc_unreachable ();
443 default:
444 *value = NULL_TREE;
445 break;
448 if (cpp_flags)
449 *cpp_flags = tok->flags | add_flags;
451 if (!no_more_pch)
453 no_more_pch = true;
454 c_common_no_more_pch ();
457 timevar_pop (TV_CPP);
459 return type;
462 /* Returns the narrowest C-visible unsigned type, starting with the
463 minimum specified by FLAGS, that can fit HIGH:LOW, or itk_none if
464 there isn't one. */
466 static enum integer_type_kind
467 narrowest_unsigned_type (unsigned HOST_WIDE_INT low,
468 unsigned HOST_WIDE_INT high,
469 unsigned int flags)
471 int itk;
473 if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
474 itk = itk_unsigned_int;
475 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
476 itk = itk_unsigned_long;
477 else
478 itk = itk_unsigned_long_long;
480 for (; itk < itk_none; itk += 2 /* skip unsigned types */)
482 tree upper;
484 if (integer_types[itk] == NULL_TREE)
485 continue;
486 upper = TYPE_MAX_VALUE (integer_types[itk]);
488 if ((unsigned HOST_WIDE_INT) TREE_INT_CST_HIGH (upper) > high
489 || ((unsigned HOST_WIDE_INT) TREE_INT_CST_HIGH (upper) == high
490 && TREE_INT_CST_LOW (upper) >= low))
491 return (enum integer_type_kind) itk;
494 return itk_none;
497 /* Ditto, but narrowest signed type. */
498 static enum integer_type_kind
499 narrowest_signed_type (unsigned HOST_WIDE_INT low,
500 unsigned HOST_WIDE_INT high, unsigned int flags)
502 int itk;
504 if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
505 itk = itk_int;
506 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
507 itk = itk_long;
508 else
509 itk = itk_long_long;
512 for (; itk < itk_none; itk += 2 /* skip signed types */)
514 tree upper;
516 if (integer_types[itk] == NULL_TREE)
517 continue;
518 upper = TYPE_MAX_VALUE (integer_types[itk]);
520 if ((unsigned HOST_WIDE_INT) TREE_INT_CST_HIGH (upper) > high
521 || ((unsigned HOST_WIDE_INT) TREE_INT_CST_HIGH (upper) == high
522 && TREE_INT_CST_LOW (upper) >= low))
523 return (enum integer_type_kind) itk;
526 return itk_none;
529 /* Interpret TOKEN, an integer with FLAGS as classified by cpplib. */
530 static tree
531 interpret_integer (const cpp_token *token, unsigned int flags)
533 tree value, type;
534 enum integer_type_kind itk;
535 cpp_num integer;
536 cpp_options *options = cpp_get_options (parse_in);
538 integer = cpp_interpret_integer (parse_in, token, flags);
539 integer = cpp_num_sign_extend (integer, options->precision);
541 /* The type of a constant with a U suffix is straightforward. */
542 if (flags & CPP_N_UNSIGNED)
543 itk = narrowest_unsigned_type (integer.low, integer.high, flags);
544 else
546 /* The type of a potentially-signed integer constant varies
547 depending on the base it's in, the standard in use, and the
548 length suffixes. */
549 enum integer_type_kind itk_u
550 = narrowest_unsigned_type (integer.low, integer.high, flags);
551 enum integer_type_kind itk_s
552 = narrowest_signed_type (integer.low, integer.high, flags);
554 /* In both C89 and C99, octal and hex constants may be signed or
555 unsigned, whichever fits tighter. We do not warn about this
556 choice differing from the traditional choice, as the constant
557 is probably a bit pattern and either way will work. */
558 if ((flags & CPP_N_RADIX) != CPP_N_DECIMAL)
559 itk = MIN (itk_u, itk_s);
560 else
562 /* In C99, decimal constants are always signed.
563 In C89, decimal constants that don't fit in long have
564 undefined behavior; we try to make them unsigned long.
565 In GCC's extended C89, that last is true of decimal
566 constants that don't fit in long long, too. */
568 itk = itk_s;
569 if (itk_s > itk_u && itk_s > itk_long)
571 if (!flag_isoc99)
573 if (itk_u < itk_unsigned_long)
574 itk_u = itk_unsigned_long;
575 itk = itk_u;
576 warning (0, "this decimal constant is unsigned only in ISO C90");
578 else
579 warning (OPT_Wtraditional,
580 "this decimal constant would be unsigned in ISO C90");
585 if (itk == itk_none)
586 /* cpplib has already issued a warning for overflow. */
587 type = ((flags & CPP_N_UNSIGNED)
588 ? widest_unsigned_literal_type_node
589 : widest_integer_literal_type_node);
590 else
592 type = integer_types[itk];
593 if (itk > itk_unsigned_long
594 && (flags & CPP_N_WIDTH) != CPP_N_LARGE)
595 emit_diagnostic
596 ((c_dialect_cxx () ? cxx_dialect == cxx98 : !flag_isoc99)
597 ? DK_PEDWARN : DK_WARNING,
598 input_location, OPT_Wlong_long,
599 (flags & CPP_N_UNSIGNED)
600 ? "integer constant is too large for %<unsigned long%> type"
601 : "integer constant is too large for %<long%> type");
604 value = build_int_cst_wide (type, integer.low, integer.high);
606 /* Convert imaginary to a complex type. */
607 if (flags & CPP_N_IMAGINARY)
608 value = build_complex (NULL_TREE, build_int_cst (type, 0), value);
610 return value;
613 /* Interpret TOKEN, a floating point number with FLAGS as classified
614 by cpplib. */
615 static tree
616 interpret_float (const cpp_token *token, unsigned int flags)
618 tree type;
619 tree const_type;
620 tree value;
621 REAL_VALUE_TYPE real;
622 REAL_VALUE_TYPE real_trunc;
623 char *copy;
624 size_t copylen;
626 /* Default (no suffix) depends on whether the FLOAT_CONST_DECIMAL64
627 pragma has been used and is either double or _Decimal64. Types
628 that are not allowed with decimal float default to double. */
629 if (flags & CPP_N_DEFAULT)
631 flags ^= CPP_N_DEFAULT;
632 flags |= CPP_N_MEDIUM;
634 if (((flags & CPP_N_HEX) == 0) && ((flags & CPP_N_IMAGINARY) == 0))
636 warning (OPT_Wunsuffixed_float_constants,
637 "unsuffixed float constant");
638 if (float_const_decimal64_p ())
639 flags |= CPP_N_DFLOAT;
643 /* Decode _Fract and _Accum. */
644 if (flags & CPP_N_FRACT || flags & CPP_N_ACCUM)
645 return interpret_fixed (token, flags);
647 /* Decode type based on width and properties. */
648 if (flags & CPP_N_DFLOAT)
649 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
650 type = dfloat128_type_node;
651 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
652 type = dfloat32_type_node;
653 else
654 type = dfloat64_type_node;
655 else
656 if (flags & CPP_N_WIDTH_MD)
658 char suffix;
659 enum machine_mode mode;
661 if ((flags & CPP_N_WIDTH_MD) == CPP_N_MD_W)
662 suffix = 'w';
663 else
664 suffix = 'q';
666 mode = targetm.c.mode_for_suffix (suffix);
667 if (mode == VOIDmode)
669 error ("unsupported non-standard suffix on floating constant");
671 return error_mark_node;
673 else
674 pedwarn (input_location, OPT_pedantic, "non-standard suffix on floating constant");
676 type = c_common_type_for_mode (mode, 0);
677 gcc_assert (type);
679 else if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
680 type = long_double_type_node;
681 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL
682 || flag_single_precision_constant)
683 type = float_type_node;
684 else
685 type = double_type_node;
687 const_type = excess_precision_type (type);
688 if (!const_type)
689 const_type = type;
691 /* Copy the constant to a nul-terminated buffer. If the constant
692 has any suffixes, cut them off; REAL_VALUE_ATOF/ REAL_VALUE_HTOF
693 can't handle them. */
694 copylen = token->val.str.len;
695 if (flags & CPP_N_DFLOAT)
696 copylen -= 2;
697 else
699 if ((flags & CPP_N_WIDTH) != CPP_N_MEDIUM)
700 /* Must be an F or L or machine defined suffix. */
701 copylen--;
702 if (flags & CPP_N_IMAGINARY)
703 /* I or J suffix. */
704 copylen--;
707 copy = (char *) alloca (copylen + 1);
708 memcpy (copy, token->val.str.text, copylen);
709 copy[copylen] = '\0';
711 real_from_string3 (&real, copy, TYPE_MODE (const_type));
712 if (const_type != type)
713 /* Diagnosing if the result of converting the value with excess
714 precision to the semantic type would overflow (with associated
715 double rounding) is more appropriate than diagnosing if the
716 result of converting the string directly to the semantic type
717 would overflow. */
718 real_convert (&real_trunc, TYPE_MODE (type), &real);
720 /* Both C and C++ require a diagnostic for a floating constant
721 outside the range of representable values of its type. Since we
722 have __builtin_inf* to produce an infinity, this is now a
723 mandatory pedwarn if the target does not support infinities. */
724 if (REAL_VALUE_ISINF (real)
725 || (const_type != type && REAL_VALUE_ISINF (real_trunc)))
727 if (!MODE_HAS_INFINITIES (TYPE_MODE (type)))
728 pedwarn (input_location, 0, "floating constant exceeds range of %qT", type);
729 else
730 warning (OPT_Woverflow, "floating constant exceeds range of %qT", type);
732 /* We also give a warning if the value underflows. */
733 else if (REAL_VALUES_EQUAL (real, dconst0)
734 || (const_type != type && REAL_VALUES_EQUAL (real_trunc, dconst0)))
736 REAL_VALUE_TYPE realvoidmode;
737 int overflow = real_from_string (&realvoidmode, copy);
738 if (overflow < 0 || !REAL_VALUES_EQUAL (realvoidmode, dconst0))
739 warning (OPT_Woverflow, "floating constant truncated to zero");
742 /* Create a node with determined type and value. */
743 value = build_real (const_type, real);
744 if (flags & CPP_N_IMAGINARY)
745 value = build_complex (NULL_TREE, convert (const_type, integer_zero_node),
746 value);
748 if (type != const_type)
749 value = build1 (EXCESS_PRECISION_EXPR, type, value);
751 return value;
754 /* Interpret TOKEN, a fixed-point number with FLAGS as classified
755 by cpplib. */
757 static tree
758 interpret_fixed (const cpp_token *token, unsigned int flags)
760 tree type;
761 tree value;
762 FIXED_VALUE_TYPE fixed;
763 char *copy;
764 size_t copylen;
766 copylen = token->val.str.len;
768 if (flags & CPP_N_FRACT) /* _Fract. */
770 if (flags & CPP_N_UNSIGNED) /* Unsigned _Fract. */
772 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
774 type = unsigned_long_long_fract_type_node;
775 copylen -= 4;
777 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
779 type = unsigned_long_fract_type_node;
780 copylen -= 3;
782 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
784 type = unsigned_short_fract_type_node;
785 copylen -= 3;
787 else
789 type = unsigned_fract_type_node;
790 copylen -= 2;
793 else /* Signed _Fract. */
795 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
797 type = long_long_fract_type_node;
798 copylen -= 3;
800 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
802 type = long_fract_type_node;
803 copylen -= 2;
805 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
807 type = short_fract_type_node;
808 copylen -= 2;
810 else
812 type = fract_type_node;
813 copylen --;
817 else /* _Accum. */
819 if (flags & CPP_N_UNSIGNED) /* Unsigned _Accum. */
821 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
823 type = unsigned_long_long_accum_type_node;
824 copylen -= 4;
826 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
828 type = unsigned_long_accum_type_node;
829 copylen -= 3;
831 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
833 type = unsigned_short_accum_type_node;
834 copylen -= 3;
836 else
838 type = unsigned_accum_type_node;
839 copylen -= 2;
842 else /* Signed _Accum. */
844 if ((flags & CPP_N_WIDTH) == CPP_N_LARGE)
846 type = long_long_accum_type_node;
847 copylen -= 3;
849 else if ((flags & CPP_N_WIDTH) == CPP_N_MEDIUM)
851 type = long_accum_type_node;
852 copylen -= 2;
854 else if ((flags & CPP_N_WIDTH) == CPP_N_SMALL)
856 type = short_accum_type_node;
857 copylen -= 2;
859 else
861 type = accum_type_node;
862 copylen --;
867 copy = (char *) alloca (copylen + 1);
868 memcpy (copy, token->val.str.text, copylen);
869 copy[copylen] = '\0';
871 fixed_from_string (&fixed, copy, TYPE_MODE (type));
873 /* Create a node with determined type and value. */
874 value = build_fixed (type, fixed);
876 return value;
879 /* Convert a series of STRING, WSTRING, STRING16, STRING32 and/or
880 UTF8STRING tokens into a tree, performing string constant
881 concatenation. TOK is the first of these. VALP is the location
882 to write the string into. OBJC_STRING indicates whether an '@' token
883 preceded the incoming token.
884 Returns the CPP token type of the result (CPP_STRING, CPP_WSTRING,
885 CPP_STRING32, CPP_STRING16, CPP_UTF8STRING, or CPP_OBJC_STRING).
887 This is unfortunately more work than it should be. If any of the
888 strings in the series has an L prefix, the result is a wide string
889 (6.4.5p4). Whether or not the result is a wide string affects the
890 meaning of octal and hexadecimal escapes (6.4.4.4p6,9). But escape
891 sequences do not continue across the boundary between two strings in
892 a series (6.4.5p7), so we must not lose the boundaries. Therefore
893 cpp_interpret_string takes a vector of cpp_string structures, which
894 we must arrange to provide. */
896 static enum cpp_ttype
897 lex_string (const cpp_token *tok, tree *valp, bool objc_string, bool translate)
899 tree value;
900 size_t concats = 0;
901 struct obstack str_ob;
902 cpp_string istr;
903 enum cpp_ttype type = tok->type;
905 /* Try to avoid the overhead of creating and destroying an obstack
906 for the common case of just one string. */
907 cpp_string str = tok->val.str;
908 cpp_string *strs = &str;
910 retry:
911 tok = cpp_get_token (parse_in);
912 switch (tok->type)
914 case CPP_PADDING:
915 goto retry;
916 case CPP_ATSIGN:
917 if (c_dialect_objc ())
919 objc_string = true;
920 goto retry;
922 /* FALLTHROUGH */
924 default:
925 break;
927 case CPP_WSTRING:
928 case CPP_STRING16:
929 case CPP_STRING32:
930 case CPP_UTF8STRING:
931 if (type != tok->type)
933 if (type == CPP_STRING)
934 type = tok->type;
935 else
936 error ("unsupported non-standard concatenation of string literals");
939 case CPP_STRING:
940 if (!concats)
942 gcc_obstack_init (&str_ob);
943 obstack_grow (&str_ob, &str, sizeof (cpp_string));
946 concats++;
947 obstack_grow (&str_ob, &tok->val.str, sizeof (cpp_string));
948 goto retry;
951 /* We have read one more token than we want. */
952 _cpp_backup_tokens (parse_in, 1);
953 if (concats)
954 strs = XOBFINISH (&str_ob, cpp_string *);
956 if (concats && !objc_string && !in_system_header)
957 warning (OPT_Wtraditional,
958 "traditional C rejects string constant concatenation");
960 if ((translate
961 ? cpp_interpret_string : cpp_interpret_string_notranslate)
962 (parse_in, strs, concats + 1, &istr, type))
964 value = build_string (istr.len, (const char *) istr.text);
965 free (CONST_CAST (unsigned char *, istr.text));
967 else
969 /* Callers cannot generally handle error_mark_node in this context,
970 so return the empty string instead. cpp_interpret_string has
971 issued an error. */
972 switch (type)
974 default:
975 case CPP_STRING:
976 case CPP_UTF8STRING:
977 value = build_string (1, "");
978 break;
979 case CPP_STRING16:
980 value = build_string (TYPE_PRECISION (char16_type_node)
981 / TYPE_PRECISION (char_type_node),
982 "\0"); /* char16_t is 16 bits */
983 break;
984 case CPP_STRING32:
985 value = build_string (TYPE_PRECISION (char32_type_node)
986 / TYPE_PRECISION (char_type_node),
987 "\0\0\0"); /* char32_t is 32 bits */
988 break;
989 case CPP_WSTRING:
990 value = build_string (TYPE_PRECISION (wchar_type_node)
991 / TYPE_PRECISION (char_type_node),
992 "\0\0\0"); /* widest supported wchar_t
993 is 32 bits */
994 break;
998 switch (type)
1000 default:
1001 case CPP_STRING:
1002 case CPP_UTF8STRING:
1003 TREE_TYPE (value) = char_array_type_node;
1004 break;
1005 case CPP_STRING16:
1006 TREE_TYPE (value) = char16_array_type_node;
1007 break;
1008 case CPP_STRING32:
1009 TREE_TYPE (value) = char32_array_type_node;
1010 break;
1011 case CPP_WSTRING:
1012 TREE_TYPE (value) = wchar_array_type_node;
1014 *valp = fix_string_type (value);
1016 if (concats)
1017 obstack_free (&str_ob, 0);
1019 return objc_string ? CPP_OBJC_STRING : type;
1022 /* Converts a (possibly wide) character constant token into a tree. */
1023 static tree
1024 lex_charconst (const cpp_token *token)
1026 cppchar_t result;
1027 tree type, value;
1028 unsigned int chars_seen;
1029 int unsignedp = 0;
1031 result = cpp_interpret_charconst (parse_in, token,
1032 &chars_seen, &unsignedp);
1034 if (token->type == CPP_WCHAR)
1035 type = wchar_type_node;
1036 else if (token->type == CPP_CHAR32)
1037 type = char32_type_node;
1038 else if (token->type == CPP_CHAR16)
1039 type = char16_type_node;
1040 /* In C, a character constant has type 'int'.
1041 In C++ 'char', but multi-char charconsts have type 'int'. */
1042 else if (!c_dialect_cxx () || chars_seen > 1)
1043 type = integer_type_node;
1044 else
1045 type = char_type_node;
1047 /* Cast to cppchar_signed_t to get correct sign-extension of RESULT
1048 before possibly widening to HOST_WIDE_INT for build_int_cst. */
1049 if (unsignedp || (cppchar_signed_t) result >= 0)
1050 value = build_int_cst_wide (type, result, 0);
1051 else
1052 value = build_int_cst_wide (type, (cppchar_signed_t) result, -1);
1054 return value;