PR c++/79143
[official-gcc.git] / gcc / pretty-print.c
blobbcb1a70ac033b9f2dcd9c5d1bafd35a8d9930b6e
1 /* Various declarations for language-independent pretty-print subroutines.
2 Copyright (C) 2003-2017 Free Software Foundation, Inc.
3 Contributed by Gabriel Dos Reis <gdr@integrable-solutions.net>
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 3, or (at your option) any later
10 version.
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
15 for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
21 #include "config.h"
22 #include "system.h"
23 #include "coretypes.h"
24 #include "intl.h"
25 #include "pretty-print.h"
26 #include "diagnostic-color.h"
27 #include "selftest.h"
29 #if HAVE_ICONV
30 #include <iconv.h>
31 #endif
33 static void pp_quoted_string (pretty_printer *, const char *, size_t = -1);
35 /* Overwrite the given location/range within this text_info's rich_location.
36 For use e.g. when implementing "+" in client format decoders. */
38 void
39 text_info::set_location (unsigned int idx, location_t loc, bool show_caret_p)
41 gcc_checking_assert (m_richloc);
42 m_richloc->set_range (line_table, idx, loc, show_caret_p);
45 location_t
46 text_info::get_location (unsigned int index_of_location) const
48 gcc_checking_assert (m_richloc);
50 if (index_of_location == 0)
51 return m_richloc->get_loc ();
52 else
53 return UNKNOWN_LOCATION;
56 // Default construct an output buffer.
58 output_buffer::output_buffer ()
59 : formatted_obstack (),
60 chunk_obstack (),
61 obstack (&formatted_obstack),
62 cur_chunk_array (),
63 stream (stderr),
64 line_length (),
65 digit_buffer (),
66 flush_p (true)
68 obstack_init (&formatted_obstack);
69 obstack_init (&chunk_obstack);
72 // Release resources owned by an output buffer at the end of lifetime.
74 output_buffer::~output_buffer ()
76 obstack_free (&chunk_obstack, NULL);
77 obstack_free (&formatted_obstack, NULL);
81 /* Format an integer given by va_arg (ARG, type-specifier T) where
82 type-specifier is a precision modifier as indicated by PREC. F is
83 a string used to construct the appropriate format-specifier. */
84 #define pp_integer_with_precision(PP, ARG, PREC, T, F) \
85 do \
86 switch (PREC) \
87 { \
88 case 0: \
89 pp_scalar (PP, "%" F, va_arg (ARG, T)); \
90 break; \
92 case 1: \
93 pp_scalar (PP, "%l" F, va_arg (ARG, long T)); \
94 break; \
96 case 2: \
97 pp_scalar (PP, "%" HOST_LONG_LONG_FORMAT F, va_arg (ARG, long long T)); \
98 break; \
100 default: \
101 break; \
103 while (0)
106 /* Subroutine of pp_set_maximum_length. Set up PRETTY-PRINTER's
107 internal maximum characters per line. */
108 static void
109 pp_set_real_maximum_length (pretty_printer *pp)
111 /* If we're told not to wrap lines then do the obvious thing. In case
112 we'll emit prefix only once per message, it is appropriate
113 not to increase unnecessarily the line-length cut-off. */
114 if (!pp_is_wrapping_line (pp)
115 || pp_prefixing_rule (pp) == DIAGNOSTICS_SHOW_PREFIX_ONCE
116 || pp_prefixing_rule (pp) == DIAGNOSTICS_SHOW_PREFIX_NEVER)
117 pp->maximum_length = pp_line_cutoff (pp);
118 else
120 int prefix_length = pp->prefix ? strlen (pp->prefix) : 0;
121 /* If the prefix is ridiculously too long, output at least
122 32 characters. */
123 if (pp_line_cutoff (pp) - prefix_length < 32)
124 pp->maximum_length = pp_line_cutoff (pp) + 32;
125 else
126 pp->maximum_length = pp_line_cutoff (pp);
130 /* Clear PRETTY-PRINTER's output state. */
131 static inline void
132 pp_clear_state (pretty_printer *pp)
134 pp->emitted_prefix = false;
135 pp_indentation (pp) = 0;
138 /* Flush the formatted text of PRETTY-PRINTER onto the attached stream. */
139 void
140 pp_write_text_to_stream (pretty_printer *pp)
142 const char *text = pp_formatted_text (pp);
143 fputs (text, pp_buffer (pp)->stream);
144 pp_clear_output_area (pp);
147 /* As pp_write_text_to_stream, but for GraphViz label output.
149 Flush the formatted text of pretty-printer PP onto the attached stream.
150 Replace characters in PPF that have special meaning in a GraphViz .dot
151 file.
153 This routine is not very fast, but it doesn't have to be as this is only
154 be used by routines dumping intermediate representations in graph form. */
156 void
157 pp_write_text_as_dot_label_to_stream (pretty_printer *pp, bool for_record)
159 const char *text = pp_formatted_text (pp);
160 const char *p = text;
161 FILE *fp = pp_buffer (pp)->stream;
163 for (;*p; p++)
165 bool escape_char;
166 switch (*p)
168 /* Print newlines as a left-aligned newline. */
169 case '\n':
170 fputs ("\\l", fp);
171 escape_char = true;
172 break;
174 /* The following characters are only special for record-shape nodes. */
175 case '|':
176 case '{':
177 case '}':
178 case '<':
179 case '>':
180 case ' ':
181 escape_char = for_record;
182 break;
184 /* The following characters always have to be escaped
185 for use in labels. */
186 case '\\':
187 /* There is a bug in some (f.i. 2.36.0) versions of graphiz
188 ( http://www.graphviz.org/mantisbt/view.php?id=2524 ) related to
189 backslash as last char in label. Let's avoid triggering it. */
190 gcc_assert (*(p + 1) != '\0');
191 /* Fall through. */
192 case '"':
193 escape_char = true;
194 break;
196 default:
197 escape_char = false;
198 break;
201 if (escape_char)
202 fputc ('\\', fp);
204 fputc (*p, fp);
207 pp_clear_output_area (pp);
210 /* Wrap a text delimited by START and END into PRETTY-PRINTER. */
211 static void
212 pp_wrap_text (pretty_printer *pp, const char *start, const char *end)
214 bool wrapping_line = pp_is_wrapping_line (pp);
216 while (start != end)
218 /* Dump anything bordered by whitespaces. */
220 const char *p = start;
221 while (p != end && !ISBLANK (*p) && *p != '\n')
222 ++p;
223 if (wrapping_line
224 && p - start >= pp_remaining_character_count_for_line (pp))
225 pp_newline (pp);
226 pp_append_text (pp, start, p);
227 start = p;
230 if (start != end && ISBLANK (*start))
232 pp_space (pp);
233 ++start;
235 if (start != end && *start == '\n')
237 pp_newline (pp);
238 ++start;
243 /* Same as pp_wrap_text but wrap text only when in line-wrapping mode. */
244 static inline void
245 pp_maybe_wrap_text (pretty_printer *pp, const char *start, const char *end)
247 if (pp_is_wrapping_line (pp))
248 pp_wrap_text (pp, start, end);
249 else
250 pp_append_text (pp, start, end);
253 /* Append to the output area of PRETTY-PRINTER a string specified by its
254 STARTing character and LENGTH. */
255 static inline void
256 pp_append_r (pretty_printer *pp, const char *start, int length)
258 output_buffer_append_r (pp_buffer (pp), start, length);
261 /* Insert enough spaces into the output area of PRETTY-PRINTER to bring
262 the column position to the current indentation level, assuming that a
263 newline has just been written to the buffer. */
264 void
265 pp_indent (pretty_printer *pp)
267 int n = pp_indentation (pp);
268 int i;
270 for (i = 0; i < n; ++i)
271 pp_space (pp);
274 /* The following format specifiers are recognized as being client independent:
275 %d, %i: (signed) integer in base ten.
276 %u: unsigned integer in base ten.
277 %o: unsigned integer in base eight.
278 %x: unsigned integer in base sixteen.
279 %ld, %li, %lo, %lu, %lx: long versions of the above.
280 %lld, %lli, %llo, %llu, %llx: long long versions.
281 %wd, %wi, %wo, %wu, %wx: HOST_WIDE_INT versions.
282 %c: character.
283 %s: string.
284 %p: pointer (printed in a host-dependent manner).
285 %r: if pp_show_color(pp), switch to color identified by const char *.
286 %R: if pp_show_color(pp), reset color.
287 %m: strerror(text->err_no) - does not consume a value from args_ptr.
288 %%: '%'.
289 %<: opening quote.
290 %>: closing quote.
291 %': apostrophe (should only be used in untranslated messages;
292 translations should use appropriate punctuation directly).
293 %.*s: a substring the length of which is specified by an argument
294 integer.
295 %Ns: likewise, but length specified as constant in the format string.
296 Flag 'q': quote formatted text (must come immediately after '%').
297 %Z: Requires two arguments - array of int, and len. Prints elements
298 of the array.
300 Arguments can be used sequentially, or through %N$ resp. *N$
301 notation Nth argument after the format string. If %N$ / *N$
302 notation is used, it must be used for all arguments, except %m, %%,
303 %<, %> and %', which may not have a number, as they do not consume
304 an argument. When %M$.*N$s is used, M must be N + 1. (This may
305 also be written %M$.*s, provided N is not otherwise used.) The
306 format string must have conversion specifiers with argument numbers
307 1 up to highest argument; each argument may only be used once.
308 A format string can have at most 30 arguments. */
310 /* Formatting phases 1 and 2: render TEXT->format_spec plus
311 TEXT->args_ptr into a series of chunks in pp_buffer (PP)->args[].
312 Phase 3 is in pp_output_formatted_text. */
314 void
315 pp_format (pretty_printer *pp, text_info *text)
317 output_buffer *buffer = pp_buffer (pp);
318 const char *p;
319 const char **args;
320 struct chunk_info *new_chunk_array;
322 unsigned int curarg = 0, chunk = 0, argno;
323 pp_wrapping_mode_t old_wrapping_mode;
324 bool any_unnumbered = false, any_numbered = false;
325 const char **formatters[PP_NL_ARGMAX];
327 /* Allocate a new chunk structure. */
328 new_chunk_array = XOBNEW (&buffer->chunk_obstack, struct chunk_info);
329 new_chunk_array->prev = buffer->cur_chunk_array;
330 buffer->cur_chunk_array = new_chunk_array;
331 args = new_chunk_array->args;
333 /* Formatting phase 1: split up TEXT->format_spec into chunks in
334 pp_buffer (PP)->args[]. Even-numbered chunks are to be output
335 verbatim, odd-numbered chunks are format specifiers.
336 %m, %%, %<, %>, and %' are replaced with the appropriate text at
337 this point. */
339 memset (formatters, 0, sizeof formatters);
341 for (p = text->format_spec; *p; )
343 while (*p != '\0' && *p != '%')
345 obstack_1grow (&buffer->chunk_obstack, *p);
346 p++;
349 if (*p == '\0')
350 break;
352 switch (*++p)
354 case '\0':
355 gcc_unreachable ();
357 case '%':
358 obstack_1grow (&buffer->chunk_obstack, '%');
359 p++;
360 continue;
362 case '<':
364 obstack_grow (&buffer->chunk_obstack,
365 open_quote, strlen (open_quote));
366 const char *colorstr
367 = colorize_start (pp_show_color (pp), "quote");
368 obstack_grow (&buffer->chunk_obstack, colorstr, strlen (colorstr));
369 p++;
370 continue;
373 case '>':
375 const char *colorstr = colorize_stop (pp_show_color (pp));
376 obstack_grow (&buffer->chunk_obstack, colorstr, strlen (colorstr));
378 /* FALLTHRU */
379 case '\'':
380 obstack_grow (&buffer->chunk_obstack,
381 close_quote, strlen (close_quote));
382 p++;
383 continue;
385 case 'R':
387 const char *colorstr = colorize_stop (pp_show_color (pp));
388 obstack_grow (&buffer->chunk_obstack, colorstr,
389 strlen (colorstr));
390 p++;
391 continue;
394 case 'm':
396 const char *errstr = xstrerror (text->err_no);
397 obstack_grow (&buffer->chunk_obstack, errstr, strlen (errstr));
399 p++;
400 continue;
402 default:
403 /* Handled in phase 2. Terminate the plain chunk here. */
404 obstack_1grow (&buffer->chunk_obstack, '\0');
405 gcc_assert (chunk < PP_NL_ARGMAX * 2);
406 args[chunk++] = XOBFINISH (&buffer->chunk_obstack, const char *);
407 break;
410 if (ISDIGIT (*p))
412 char *end;
413 argno = strtoul (p, &end, 10) - 1;
414 p = end;
415 gcc_assert (*p == '$');
416 p++;
418 any_numbered = true;
419 gcc_assert (!any_unnumbered);
421 else
423 argno = curarg++;
424 any_unnumbered = true;
425 gcc_assert (!any_numbered);
427 gcc_assert (argno < PP_NL_ARGMAX);
428 gcc_assert (!formatters[argno]);
429 formatters[argno] = &args[chunk];
432 obstack_1grow (&buffer->chunk_obstack, *p);
433 p++;
435 while (strchr ("qwl+#", p[-1]));
437 if (p[-1] == '.')
439 /* We handle '%.Ns' and '%.*s' or '%M$.*N$s'
440 (where M == N + 1). */
441 if (ISDIGIT (*p))
445 obstack_1grow (&buffer->chunk_obstack, *p);
446 p++;
448 while (ISDIGIT (p[-1]));
449 gcc_assert (p[-1] == 's');
451 else
453 gcc_assert (*p == '*');
454 obstack_1grow (&buffer->chunk_obstack, '*');
455 p++;
457 if (ISDIGIT (*p))
459 char *end;
460 unsigned int argno2 = strtoul (p, &end, 10) - 1;
461 p = end;
462 gcc_assert (argno2 == argno - 1);
463 gcc_assert (!any_unnumbered);
464 gcc_assert (*p == '$');
466 p++;
467 formatters[argno2] = formatters[argno];
469 else
471 gcc_assert (!any_numbered);
472 formatters[argno+1] = formatters[argno];
473 curarg++;
475 gcc_assert (*p == 's');
476 obstack_1grow (&buffer->chunk_obstack, 's');
477 p++;
480 if (*p == '\0')
481 break;
483 obstack_1grow (&buffer->chunk_obstack, '\0');
484 gcc_assert (chunk < PP_NL_ARGMAX * 2);
485 args[chunk++] = XOBFINISH (&buffer->chunk_obstack, const char *);
488 obstack_1grow (&buffer->chunk_obstack, '\0');
489 gcc_assert (chunk < PP_NL_ARGMAX * 2);
490 args[chunk++] = XOBFINISH (&buffer->chunk_obstack, const char *);
491 args[chunk] = 0;
493 /* Set output to the argument obstack, and switch line-wrapping and
494 prefixing off. */
495 buffer->obstack = &buffer->chunk_obstack;
496 old_wrapping_mode = pp_set_verbatim_wrapping (pp);
498 /* Second phase. Replace each formatter with the formatted text it
499 corresponds to. */
501 for (argno = 0; formatters[argno]; argno++)
503 int precision = 0;
504 bool wide = false;
505 bool plus = false;
506 bool hash = false;
507 bool quote = false;
509 /* We do not attempt to enforce any ordering on the modifier
510 characters. */
512 for (p = *formatters[argno];; p++)
514 switch (*p)
516 case 'q':
517 gcc_assert (!quote);
518 quote = true;
519 continue;
521 case '+':
522 gcc_assert (!plus);
523 plus = true;
524 continue;
526 case '#':
527 gcc_assert (!hash);
528 hash = true;
529 continue;
531 case 'w':
532 gcc_assert (!wide);
533 wide = true;
534 continue;
536 case 'l':
537 /* We don't support precision beyond that of "long long". */
538 gcc_assert (precision < 2);
539 precision++;
540 continue;
542 break;
545 gcc_assert (!wide || precision == 0);
547 if (quote)
549 pp_string (pp, open_quote);
550 pp_string (pp, colorize_start (pp_show_color (pp), "quote"));
553 switch (*p)
555 case 'r':
556 pp_string (pp, colorize_start (pp_show_color (pp),
557 va_arg (*text->args_ptr,
558 const char *)));
559 break;
561 case 'c':
563 /* When quoting, print alphanumeric, punctuation, and the space
564 character unchanged, and all others in hexadecimal with the
565 "\x" prefix. Otherwise print them all unchanged. */
566 int chr = va_arg (*text->args_ptr, int);
567 if (ISPRINT (chr) || !quote)
568 pp_character (pp, chr);
569 else
571 const char str [2] = { chr, '\0' };
572 pp_quoted_string (pp, str, 1);
574 break;
577 case 'd':
578 case 'i':
579 if (wide)
580 pp_wide_integer (pp, va_arg (*text->args_ptr, HOST_WIDE_INT));
581 else
582 pp_integer_with_precision
583 (pp, *text->args_ptr, precision, int, "d");
584 break;
586 case 'o':
587 if (wide)
588 pp_scalar (pp, "%" HOST_WIDE_INT_PRINT "o",
589 va_arg (*text->args_ptr, unsigned HOST_WIDE_INT));
590 else
591 pp_integer_with_precision
592 (pp, *text->args_ptr, precision, unsigned, "o");
593 break;
595 case 's':
596 if (quote)
597 pp_quoted_string (pp, va_arg (*text->args_ptr, const char *));
598 else
599 pp_string (pp, va_arg (*text->args_ptr, const char *));
600 break;
602 case 'p':
603 pp_pointer (pp, va_arg (*text->args_ptr, void *));
604 break;
606 case 'u':
607 if (wide)
608 pp_scalar (pp, HOST_WIDE_INT_PRINT_UNSIGNED,
609 va_arg (*text->args_ptr, unsigned HOST_WIDE_INT));
610 else
611 pp_integer_with_precision
612 (pp, *text->args_ptr, precision, unsigned, "u");
613 break;
615 case 'Z':
617 int *v = va_arg (*text->args_ptr, int *);
618 unsigned len = va_arg (*text->args_ptr, unsigned);
620 for (unsigned i = 0; i < len; ++i)
622 pp_scalar (pp, "%i", v[i]);
623 if (i < len - 1)
625 pp_comma (pp);
626 pp_space (pp);
629 break;
632 case 'x':
633 if (wide)
634 pp_scalar (pp, HOST_WIDE_INT_PRINT_HEX,
635 va_arg (*text->args_ptr, unsigned HOST_WIDE_INT));
636 else
637 pp_integer_with_precision
638 (pp, *text->args_ptr, precision, unsigned, "x");
639 break;
641 case '.':
643 int n;
644 const char *s;
646 /* We handle '%.Ns' and '%.*s' or '%M$.*N$s'
647 (where M == N + 1). The format string should be verified
648 already from the first phase. */
649 p++;
650 if (ISDIGIT (*p))
652 char *end;
653 n = strtoul (p, &end, 10);
654 p = end;
655 gcc_assert (*p == 's');
657 else
659 gcc_assert (*p == '*');
660 p++;
661 gcc_assert (*p == 's');
662 n = va_arg (*text->args_ptr, int);
664 /* This consumes a second entry in the formatters array. */
665 gcc_assert (formatters[argno] == formatters[argno+1]);
666 argno++;
669 s = va_arg (*text->args_ptr, const char *);
670 pp_append_text (pp, s, s + n);
672 break;
674 default:
676 bool ok;
678 gcc_assert (pp_format_decoder (pp));
679 ok = pp_format_decoder (pp) (pp, text, p,
680 precision, wide, plus, hash);
681 gcc_assert (ok);
685 if (quote)
687 pp_string (pp, colorize_stop (pp_show_color (pp)));
688 pp_string (pp, close_quote);
691 obstack_1grow (&buffer->chunk_obstack, '\0');
692 *formatters[argno] = XOBFINISH (&buffer->chunk_obstack, const char *);
695 if (CHECKING_P)
696 for (; argno < PP_NL_ARGMAX; argno++)
697 gcc_assert (!formatters[argno]);
699 /* Revert to normal obstack and wrapping mode. */
700 buffer->obstack = &buffer->formatted_obstack;
701 buffer->line_length = 0;
702 pp_wrapping_mode (pp) = old_wrapping_mode;
703 pp_clear_state (pp);
706 /* Format of a message pointed to by TEXT. */
707 void
708 pp_output_formatted_text (pretty_printer *pp)
710 unsigned int chunk;
711 output_buffer *buffer = pp_buffer (pp);
712 struct chunk_info *chunk_array = buffer->cur_chunk_array;
713 const char **args = chunk_array->args;
715 gcc_assert (buffer->obstack == &buffer->formatted_obstack);
716 gcc_assert (buffer->line_length == 0);
718 /* This is a third phase, first 2 phases done in pp_format_args.
719 Now we actually print it. */
720 for (chunk = 0; args[chunk]; chunk++)
721 pp_string (pp, args[chunk]);
723 /* Deallocate the chunk structure and everything after it (i.e. the
724 associated series of formatted strings). */
725 buffer->cur_chunk_array = chunk_array->prev;
726 obstack_free (&buffer->chunk_obstack, chunk_array);
729 /* Helper subroutine of output_verbatim and verbatim. Do the appropriate
730 settings needed by BUFFER for a verbatim formatting. */
731 void
732 pp_format_verbatim (pretty_printer *pp, text_info *text)
734 /* Set verbatim mode. */
735 pp_wrapping_mode_t oldmode = pp_set_verbatim_wrapping (pp);
737 /* Do the actual formatting. */
738 pp_format (pp, text);
739 pp_output_formatted_text (pp);
741 /* Restore previous settings. */
742 pp_wrapping_mode (pp) = oldmode;
745 /* Flush the content of BUFFER onto the attached stream. This
746 function does nothing unless pp->output_buffer->flush_p. */
747 void
748 pp_flush (pretty_printer *pp)
750 pp_clear_state (pp);
751 if (!pp->buffer->flush_p)
752 return;
753 pp_write_text_to_stream (pp);
754 fflush (pp_buffer (pp)->stream);
757 /* Flush the content of BUFFER onto the attached stream independently
758 of the value of pp->output_buffer->flush_p. */
759 void
760 pp_really_flush (pretty_printer *pp)
762 pp_clear_state (pp);
763 pp_write_text_to_stream (pp);
764 fflush (pp_buffer (pp)->stream);
767 /* Sets the number of maximum characters per line PRETTY-PRINTER can
768 output in line-wrapping mode. A LENGTH value 0 suppresses
769 line-wrapping. */
770 void
771 pp_set_line_maximum_length (pretty_printer *pp, int length)
773 pp_line_cutoff (pp) = length;
774 pp_set_real_maximum_length (pp);
777 /* Clear PRETTY-PRINTER output area text info. */
778 void
779 pp_clear_output_area (pretty_printer *pp)
781 obstack_free (pp_buffer (pp)->obstack,
782 obstack_base (pp_buffer (pp)->obstack));
783 pp_buffer (pp)->line_length = 0;
786 /* Set PREFIX for PRETTY-PRINTER. */
787 void
788 pp_set_prefix (pretty_printer *pp, const char *prefix)
790 pp->prefix = prefix;
791 pp_set_real_maximum_length (pp);
792 pp->emitted_prefix = false;
793 pp_indentation (pp) = 0;
796 /* Free PRETTY-PRINTER's prefix, a previously malloc()'d string. */
797 void
798 pp_destroy_prefix (pretty_printer *pp)
800 if (pp->prefix != NULL)
802 free (CONST_CAST (char *, pp->prefix));
803 pp->prefix = NULL;
807 /* Write out PRETTY-PRINTER's prefix. */
808 void
809 pp_emit_prefix (pretty_printer *pp)
811 if (pp->prefix != NULL)
813 switch (pp_prefixing_rule (pp))
815 default:
816 case DIAGNOSTICS_SHOW_PREFIX_NEVER:
817 break;
819 case DIAGNOSTICS_SHOW_PREFIX_ONCE:
820 if (pp->emitted_prefix)
822 pp_indent (pp);
823 break;
825 pp_indentation (pp) += 3;
826 /* Fall through. */
828 case DIAGNOSTICS_SHOW_PREFIX_EVERY_LINE:
830 int prefix_length = strlen (pp->prefix);
831 pp_append_r (pp, pp->prefix, prefix_length);
832 pp->emitted_prefix = true;
834 break;
839 /* Construct a PRETTY-PRINTER with PREFIX and of MAXIMUM_LENGTH
840 characters per line. */
842 pretty_printer::pretty_printer (const char *p, int l)
843 : buffer (new (XCNEW (output_buffer)) output_buffer ()),
844 prefix (),
845 padding (pp_none),
846 maximum_length (),
847 indent_skip (),
848 wrapping (),
849 format_decoder (),
850 emitted_prefix (),
851 need_newline (),
852 translate_identifiers (true),
853 show_color ()
855 pp_line_cutoff (this) = l;
856 /* By default, we emit prefixes once per message. */
857 pp_prefixing_rule (this) = DIAGNOSTICS_SHOW_PREFIX_ONCE;
858 pp_set_prefix (this, p);
861 pretty_printer::~pretty_printer ()
863 buffer->~output_buffer ();
864 XDELETE (buffer);
867 /* Append a string delimited by START and END to the output area of
868 PRETTY-PRINTER. No line wrapping is done. However, if beginning a
869 new line then emit PRETTY-PRINTER's prefix and skip any leading
870 whitespace if appropriate. The caller must ensure that it is
871 safe to do so. */
872 void
873 pp_append_text (pretty_printer *pp, const char *start, const char *end)
875 /* Emit prefix and skip whitespace if we're starting a new line. */
876 if (pp_buffer (pp)->line_length == 0)
878 pp_emit_prefix (pp);
879 if (pp_is_wrapping_line (pp))
880 while (start != end && *start == ' ')
881 ++start;
883 pp_append_r (pp, start, end - start);
886 /* Finishes constructing a NULL-terminated character string representing
887 the PRETTY-PRINTED text. */
888 const char *
889 pp_formatted_text (pretty_printer *pp)
891 return output_buffer_formatted_text (pp_buffer (pp));
894 /* Return a pointer to the last character emitted in PRETTY-PRINTER's
895 output area. A NULL pointer means no character available. */
896 const char *
897 pp_last_position_in_text (const pretty_printer *pp)
899 return output_buffer_last_position_in_text (pp_buffer (pp));
902 /* Return the amount of characters PRETTY-PRINTER can accept to
903 make a full line. Meaningful only in line-wrapping mode. */
905 pp_remaining_character_count_for_line (pretty_printer *pp)
907 return pp->maximum_length - pp_buffer (pp)->line_length;
911 /* Format a message into BUFFER a la printf. */
912 void
913 pp_printf (pretty_printer *pp, const char *msg, ...)
915 text_info text;
916 va_list ap;
918 va_start (ap, msg);
919 text.err_no = errno;
920 text.args_ptr = &ap;
921 text.format_spec = msg;
922 pp_format (pp, &text);
923 pp_output_formatted_text (pp);
924 va_end (ap);
928 /* Output MESSAGE verbatim into BUFFER. */
929 void
930 pp_verbatim (pretty_printer *pp, const char *msg, ...)
932 text_info text;
933 va_list ap;
935 va_start (ap, msg);
936 text.err_no = errno;
937 text.args_ptr = &ap;
938 text.format_spec = msg;
939 pp_format_verbatim (pp, &text);
940 va_end (ap);
945 /* Have PRETTY-PRINTER start a new line. */
946 void
947 pp_newline (pretty_printer *pp)
949 obstack_1grow (pp_buffer (pp)->obstack, '\n');
950 pp_needs_newline (pp) = false;
951 pp_buffer (pp)->line_length = 0;
954 /* Have PRETTY-PRINTER add a CHARACTER. */
955 void
956 pp_character (pretty_printer *pp, int c)
958 if (pp_is_wrapping_line (pp)
959 && pp_remaining_character_count_for_line (pp) <= 0)
961 pp_newline (pp);
962 if (ISSPACE (c))
963 return;
965 obstack_1grow (pp_buffer (pp)->obstack, c);
966 ++pp_buffer (pp)->line_length;
969 /* Append a STRING to the output area of PRETTY-PRINTER; the STRING may
970 be line-wrapped if in appropriate mode. */
971 void
972 pp_string (pretty_printer *pp, const char *str)
974 gcc_checking_assert (str);
975 pp_maybe_wrap_text (pp, str, str + strlen (str));
978 /* Append the leading N characters of STRING to the output area of
979 PRETTY-PRINTER, quoting in hexadecimal non-printable characters.
980 Setting N = -1 is as if N were set to strlen (STRING). The STRING
981 may be line-wrapped if in appropriate mode. */
982 static void
983 pp_quoted_string (pretty_printer *pp, const char *str, size_t n /* = -1 */)
985 gcc_checking_assert (str);
987 const char *last = str;
988 const char *ps;
990 /* Compute the length if not specified. */
991 if (n == (size_t) -1)
992 n = strlen (str);
994 for (ps = str; n; ++ps, --n)
996 if (ISPRINT (*ps))
997 continue;
999 if (last < ps)
1000 pp_maybe_wrap_text (pp, last, ps - 1);
1002 /* Append the hexadecimal value of the character. Allocate a buffer
1003 that's large enough for a 32-bit char plus the hex prefix. */
1004 char buf [11];
1005 int n = sprintf (buf, "\\x%02x", (unsigned char)*ps);
1006 pp_maybe_wrap_text (pp, buf, buf + n);
1007 last = ps + 1;
1010 pp_maybe_wrap_text (pp, last, ps);
1013 /* Maybe print out a whitespace if needed. */
1015 void
1016 pp_maybe_space (pretty_printer *pp)
1018 if (pp->padding != pp_none)
1020 pp_space (pp);
1021 pp->padding = pp_none;
1025 // Add a newline to the pretty printer PP and flush formatted text.
1027 void
1028 pp_newline_and_flush (pretty_printer *pp)
1030 pp_newline (pp);
1031 pp_flush (pp);
1032 pp_needs_newline (pp) = false;
1035 // Add a newline to the pretty printer PP, followed by indentation.
1037 void
1038 pp_newline_and_indent (pretty_printer *pp, int n)
1040 pp_indentation (pp) += n;
1041 pp_newline (pp);
1042 pp_indent (pp);
1043 pp_needs_newline (pp) = false;
1046 // Add separator C, followed by a single whitespace.
1048 void
1049 pp_separate_with (pretty_printer *pp, char c)
1051 pp_character (pp, c);
1052 pp_space (pp);
1056 /* The string starting at P has LEN (at least 1) bytes left; if they
1057 start with a valid UTF-8 sequence, return the length of that
1058 sequence and set *VALUE to the value of that sequence, and
1059 otherwise return 0 and set *VALUE to (unsigned int) -1. */
1061 static int
1062 decode_utf8_char (const unsigned char *p, size_t len, unsigned int *value)
1064 unsigned int t = *p;
1066 if (len == 0)
1067 abort ();
1068 if (t & 0x80)
1070 size_t utf8_len = 0;
1071 unsigned int ch;
1072 size_t i;
1073 for (t = *p; t & 0x80; t <<= 1)
1074 utf8_len++;
1076 if (utf8_len > len || utf8_len < 2 || utf8_len > 6)
1078 *value = (unsigned int) -1;
1079 return 0;
1081 ch = *p & ((1 << (7 - utf8_len)) - 1);
1082 for (i = 1; i < utf8_len; i++)
1084 unsigned int u = p[i];
1085 if ((u & 0xC0) != 0x80)
1087 *value = (unsigned int) -1;
1088 return 0;
1090 ch = (ch << 6) | (u & 0x3F);
1092 if ( (ch <= 0x7F && utf8_len > 1)
1093 || (ch <= 0x7FF && utf8_len > 2)
1094 || (ch <= 0xFFFF && utf8_len > 3)
1095 || (ch <= 0x1FFFFF && utf8_len > 4)
1096 || (ch <= 0x3FFFFFF && utf8_len > 5)
1097 || (ch >= 0xD800 && ch <= 0xDFFF))
1099 *value = (unsigned int) -1;
1100 return 0;
1102 *value = ch;
1103 return utf8_len;
1105 else
1107 *value = t;
1108 return 1;
1112 /* Allocator for identifier_to_locale and corresponding function to
1113 free memory. */
1115 void *(*identifier_to_locale_alloc) (size_t) = xmalloc;
1116 void (*identifier_to_locale_free) (void *) = free;
1118 /* Given IDENT, an identifier in the internal encoding, return a
1119 version of IDENT suitable for diagnostics in the locale character
1120 set: either IDENT itself, or a string, allocated using
1121 identifier_to_locale_alloc, converted to the locale character set
1122 and using escape sequences if not representable in the locale
1123 character set or containing control characters or invalid byte
1124 sequences. Existing backslashes in IDENT are not doubled, so the
1125 result may not uniquely specify the contents of an arbitrary byte
1126 sequence identifier. */
1128 const char *
1129 identifier_to_locale (const char *ident)
1131 const unsigned char *uid = (const unsigned char *) ident;
1132 size_t idlen = strlen (ident);
1133 bool valid_printable_utf8 = true;
1134 bool all_ascii = true;
1135 size_t i;
1137 for (i = 0; i < idlen;)
1139 unsigned int c;
1140 size_t utf8_len = decode_utf8_char (&uid[i], idlen - i, &c);
1141 if (utf8_len == 0 || c <= 0x1F || (c >= 0x7F && c <= 0x9F))
1143 valid_printable_utf8 = false;
1144 break;
1146 if (utf8_len > 1)
1147 all_ascii = false;
1148 i += utf8_len;
1151 /* If IDENT contains invalid UTF-8 sequences (which may occur with
1152 attributes putting arbitrary byte sequences in identifiers), or
1153 control characters, we use octal escape sequences for all bytes
1154 outside printable ASCII. */
1155 if (!valid_printable_utf8)
1157 char *ret = (char *) identifier_to_locale_alloc (4 * idlen + 1);
1158 char *p = ret;
1159 for (i = 0; i < idlen; i++)
1161 if (uid[i] > 0x1F && uid[i] < 0x7F)
1162 *p++ = uid[i];
1163 else
1165 sprintf (p, "\\%03o", uid[i]);
1166 p += 4;
1169 *p = 0;
1170 return ret;
1173 /* Otherwise, if it is valid printable ASCII, or printable UTF-8
1174 with the locale character set being UTF-8, IDENT is used. */
1175 if (all_ascii || locale_utf8)
1176 return ident;
1178 /* Otherwise IDENT is converted to the locale character set if
1179 possible. */
1180 #if defined ENABLE_NLS && defined HAVE_LANGINFO_CODESET && HAVE_ICONV
1181 if (locale_encoding != NULL)
1183 iconv_t cd = iconv_open (locale_encoding, "UTF-8");
1184 bool conversion_ok = true;
1185 char *ret = NULL;
1186 if (cd != (iconv_t) -1)
1188 size_t ret_alloc = 4 * idlen + 1;
1189 for (;;)
1191 /* Repeat the whole conversion process as needed with
1192 larger buffers so non-reversible transformations can
1193 always be detected. */
1194 ICONV_CONST char *inbuf = CONST_CAST (char *, ident);
1195 char *outbuf;
1196 size_t inbytesleft = idlen;
1197 size_t outbytesleft = ret_alloc - 1;
1198 size_t iconv_ret;
1200 ret = (char *) identifier_to_locale_alloc (ret_alloc);
1201 outbuf = ret;
1203 if (iconv (cd, 0, 0, 0, 0) == (size_t) -1)
1205 conversion_ok = false;
1206 break;
1209 iconv_ret = iconv (cd, &inbuf, &inbytesleft,
1210 &outbuf, &outbytesleft);
1211 if (iconv_ret == (size_t) -1 || inbytesleft != 0)
1213 if (errno == E2BIG)
1215 ret_alloc *= 2;
1216 identifier_to_locale_free (ret);
1217 ret = NULL;
1218 continue;
1220 else
1222 conversion_ok = false;
1223 break;
1226 else if (iconv_ret != 0)
1228 conversion_ok = false;
1229 break;
1231 /* Return to initial shift state. */
1232 if (iconv (cd, 0, 0, &outbuf, &outbytesleft) == (size_t) -1)
1234 if (errno == E2BIG)
1236 ret_alloc *= 2;
1237 identifier_to_locale_free (ret);
1238 ret = NULL;
1239 continue;
1241 else
1243 conversion_ok = false;
1244 break;
1247 *outbuf = 0;
1248 break;
1250 iconv_close (cd);
1251 if (conversion_ok)
1252 return ret;
1255 #endif
1257 /* Otherwise, convert non-ASCII characters in IDENT to UCNs. */
1259 char *ret = (char *) identifier_to_locale_alloc (10 * idlen + 1);
1260 char *p = ret;
1261 for (i = 0; i < idlen;)
1263 unsigned int c;
1264 size_t utf8_len = decode_utf8_char (&uid[i], idlen - i, &c);
1265 if (utf8_len == 1)
1266 *p++ = uid[i];
1267 else
1269 sprintf (p, "\\U%08x", c);
1270 p += 10;
1272 i += utf8_len;
1274 *p = 0;
1275 return ret;
1279 #if CHECKING_P
1281 namespace selftest {
1283 /* Smoketest for pretty_printer. */
1285 static void
1286 test_basic_printing ()
1288 pretty_printer pp;
1289 pp_string (&pp, "hello");
1290 pp_space (&pp);
1291 pp_string (&pp, "world");
1293 ASSERT_STREQ ("hello world", pp_formatted_text (&pp));
1296 /* Helper function for testing pp_format.
1297 Verify that pp_format (FMT, ...) followed by pp_output_formatted_text
1298 prints EXPECTED, assuming that pp_show_color is SHOW_COLOR. */
1300 static void
1301 assert_pp_format_va (const location &loc, const char *expected,
1302 bool show_color, const char *fmt, va_list *ap)
1304 pretty_printer pp;
1305 text_info ti;
1306 rich_location rich_loc (line_table, UNKNOWN_LOCATION);
1308 ti.format_spec = fmt;
1309 ti.args_ptr = ap;
1310 ti.err_no = 0;
1311 ti.x_data = NULL;
1312 ti.m_richloc = &rich_loc;
1314 pp_show_color (&pp) = show_color;
1315 pp_format (&pp, &ti);
1316 pp_output_formatted_text (&pp);
1317 ASSERT_STREQ_AT (loc, expected, pp_formatted_text (&pp));
1320 /* Verify that pp_format (FMT, ...) followed by pp_output_formatted_text
1321 prints EXPECTED, with show_color disabled. */
1323 static void
1324 assert_pp_format (const location &loc, const char *expected,
1325 const char *fmt, ...)
1327 va_list ap;
1329 va_start (ap, fmt);
1330 assert_pp_format_va (loc, expected, false, fmt, &ap);
1331 va_end (ap);
1334 /* As above, but with colorization enabled. */
1336 static void
1337 assert_pp_format_colored (const location &loc, const char *expected,
1338 const char *fmt, ...)
1340 /* The tests of colorization assume the default color scheme.
1341 If GCC_COLORS is set, then the colors have potentially been
1342 overridden; skip the test. */
1343 if (getenv ("GCC_COLORS"))
1344 return;
1346 va_list ap;
1348 va_start (ap, fmt);
1349 assert_pp_format_va (loc, expected, true, fmt, &ap);
1350 va_end (ap);
1353 /* Helper function for calling testing pp_format,
1354 by calling assert_pp_format with various numbers of arguments.
1355 These exist mostly to avoid having to write SELFTEST_LOCATION
1356 throughout test_pp_format. */
1358 #define ASSERT_PP_FORMAT_1(EXPECTED, FMT, ARG1) \
1359 SELFTEST_BEGIN_STMT \
1360 assert_pp_format ((SELFTEST_LOCATION), (EXPECTED), (FMT), \
1361 (ARG1)); \
1362 SELFTEST_END_STMT
1364 #define ASSERT_PP_FORMAT_2(EXPECTED, FMT, ARG1, ARG2) \
1365 SELFTEST_BEGIN_STMT \
1366 assert_pp_format ((SELFTEST_LOCATION), (EXPECTED), (FMT), \
1367 (ARG1), (ARG2)); \
1368 SELFTEST_END_STMT
1370 #define ASSERT_PP_FORMAT_3(EXPECTED, FMT, ARG1, ARG2, ARG3) \
1371 SELFTEST_BEGIN_STMT \
1372 assert_pp_format ((SELFTEST_LOCATION), (EXPECTED), (FMT), \
1373 (ARG1), (ARG2), (ARG3)); \
1374 SELFTEST_END_STMT
1376 /* Verify that pp_format works, for various format codes. */
1378 static void
1379 test_pp_format ()
1381 /* Avoid introducing locale-specific differences in the results
1382 by hardcoding open_quote and close_quote. */
1383 const char *old_open_quote = open_quote;
1384 const char *old_close_quote = close_quote;
1385 open_quote = "`";
1386 close_quote = "'";
1388 /* Verify that plain text is passed through unchanged. */
1389 assert_pp_format (SELFTEST_LOCATION, "unformatted", "unformatted");
1391 /* Verify various individual format codes, in the order listed in the
1392 comment for pp_format above. For each code, we append a second
1393 argument with a known bit pattern (0x12345678), to ensure that we
1394 are consuming arguments correctly. */
1395 ASSERT_PP_FORMAT_2 ("-27 12345678", "%d %x", -27, 0x12345678);
1396 ASSERT_PP_FORMAT_2 ("-5 12345678", "%i %x", -5, 0x12345678);
1397 ASSERT_PP_FORMAT_2 ("10 12345678", "%u %x", 10, 0x12345678);
1398 ASSERT_PP_FORMAT_2 ("17 12345678", "%o %x", 15, 0x12345678);
1399 ASSERT_PP_FORMAT_2 ("cafebabe 12345678", "%x %x", 0xcafebabe, 0x12345678);
1400 ASSERT_PP_FORMAT_2 ("-27 12345678", "%ld %x", (long)-27, 0x12345678);
1401 ASSERT_PP_FORMAT_2 ("-5 12345678", "%li %x", (long)-5, 0x12345678);
1402 ASSERT_PP_FORMAT_2 ("10 12345678", "%lu %x", (long)10, 0x12345678);
1403 ASSERT_PP_FORMAT_2 ("17 12345678", "%lo %x", (long)15, 0x12345678);
1404 ASSERT_PP_FORMAT_2 ("cafebabe 12345678", "%lx %x", (long)0xcafebabe,
1405 0x12345678);
1406 ASSERT_PP_FORMAT_2 ("-27 12345678", "%lld %x", (long long)-27, 0x12345678);
1407 ASSERT_PP_FORMAT_2 ("-5 12345678", "%lli %x", (long long)-5, 0x12345678);
1408 ASSERT_PP_FORMAT_2 ("10 12345678", "%llu %x", (long long)10, 0x12345678);
1409 ASSERT_PP_FORMAT_2 ("17 12345678", "%llo %x", (long long)15, 0x12345678);
1410 ASSERT_PP_FORMAT_2 ("cafebabe 12345678", "%llx %x", (long long)0xcafebabe,
1411 0x12345678);
1412 ASSERT_PP_FORMAT_2 ("-27 12345678", "%wd %x", (HOST_WIDE_INT)-27, 0x12345678);
1413 ASSERT_PP_FORMAT_2 ("-5 12345678", "%wi %x", (HOST_WIDE_INT)-5, 0x12345678);
1414 ASSERT_PP_FORMAT_2 ("10 12345678", "%wu %x", (unsigned HOST_WIDE_INT)10,
1415 0x12345678);
1416 ASSERT_PP_FORMAT_2 ("17 12345678", "%wo %x", (HOST_WIDE_INT)15, 0x12345678);
1417 ASSERT_PP_FORMAT_2 ("0xcafebabe 12345678", "%wx %x", (HOST_WIDE_INT)0xcafebabe,
1418 0x12345678);
1419 ASSERT_PP_FORMAT_2 ("A 12345678", "%c %x", 'A', 0x12345678);
1420 ASSERT_PP_FORMAT_2 ("hello world 12345678", "%s %x", "hello world",
1421 0x12345678);
1422 /* We can't test for %p; the pointer is printed in an implementation-defined
1423 manner. */
1424 ASSERT_PP_FORMAT_2 ("normal colored normal 12345678",
1425 "normal %rcolored%R normal %x",
1426 "error", 0x12345678);
1427 assert_pp_format_colored
1428 (SELFTEST_LOCATION,
1429 "normal \33[01;31m\33[Kcolored\33[m\33[K normal 12345678",
1430 "normal %rcolored%R normal %x", "error", 0x12345678);
1431 /* TODO:
1432 %m: strerror(text->err_no) - does not consume a value from args_ptr. */
1433 ASSERT_PP_FORMAT_1 ("% 12345678", "%% %x", 0x12345678);
1434 ASSERT_PP_FORMAT_1 ("` 12345678", "%< %x", 0x12345678);
1435 ASSERT_PP_FORMAT_1 ("' 12345678", "%> %x", 0x12345678);
1436 ASSERT_PP_FORMAT_1 ("' 12345678", "%' %x", 0x12345678);
1437 ASSERT_PP_FORMAT_3 ("abc 12345678", "%.*s %x", 3, "abcdef", 0x12345678);
1438 ASSERT_PP_FORMAT_2 ("abc 12345678", "%.3s %x", "abcdef", 0x12345678);
1440 /* Verify flag 'q'. */
1441 ASSERT_PP_FORMAT_2 ("`foo' 12345678", "%qs %x", "foo", 0x12345678);
1442 assert_pp_format_colored (SELFTEST_LOCATION,
1443 "`\33[01m\33[Kfoo\33[m\33[K' 12345678", "%qs %x",
1444 "foo", 0x12345678);
1446 /* Verify %Z. */
1447 int v[] = { 1, 2, 3 };
1448 ASSERT_PP_FORMAT_3 ("1, 2, 3 12345678", "%Z %x", v, 3, 0x12345678);
1450 int v2[] = { 0 };
1451 ASSERT_PP_FORMAT_3 ("0 12345678", "%Z %x", v2, 1, 0x12345678);
1453 /* Verify that combinations work, along with unformatted text. */
1454 assert_pp_format (SELFTEST_LOCATION,
1455 "the quick brown fox jumps over the lazy dog",
1456 "the %s %s %s jumps over the %s %s",
1457 "quick", "brown", "fox", "lazy", "dog");
1458 assert_pp_format (SELFTEST_LOCATION, "item 3 of 7", "item %i of %i", 3, 7);
1459 assert_pp_format (SELFTEST_LOCATION, "problem with `bar' at line 10",
1460 "problem with %qs at line %i", "bar", 10);
1462 /* Restore old values of open_quote and close_quote. */
1463 open_quote = old_open_quote;
1464 close_quote = old_close_quote;
1467 /* Run all of the selftests within this file. */
1469 void
1470 pretty_print_c_tests ()
1472 test_basic_printing ();
1473 test_pp_format ();
1476 } // namespace selftest
1478 #endif /* CHECKING_P */