libgo: Update to Go 1.3 release.
[official-gcc.git] / libgo / go / go / printer / printer.go
blob280c697a0dd7caced68425182c1c11a4da0c9074
1 // Copyright 2009 The Go Authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style
3 // license that can be found in the LICENSE file.
5 // Package printer implements printing of AST nodes.
6 package printer
8 import (
9 "fmt"
10 "go/ast"
11 "go/token"
12 "io"
13 "os"
14 "strconv"
15 "strings"
16 "text/tabwriter"
17 "unicode"
20 const (
21 maxNewlines = 2 // max. number of newlines between source text
22 debug = false // enable for debugging
23 infinity = 1 << 30
26 type whiteSpace byte
28 const (
29 ignore = whiteSpace(0)
30 blank = whiteSpace(' ')
31 vtab = whiteSpace('\v')
32 newline = whiteSpace('\n')
33 formfeed = whiteSpace('\f')
34 indent = whiteSpace('>')
35 unindent = whiteSpace('<')
38 // A pmode value represents the current printer mode.
39 type pmode int
41 const (
42 noExtraBlank pmode = 1 << iota // disables extra blank after /*-style comment
43 noExtraLinebreak // disables extra line break after /*-style comment
46 type commentInfo struct {
47 cindex int // current comment index
48 comment *ast.CommentGroup // = printer.comments[cindex]; or nil
49 commentOffset int // = printer.posFor(printer.comments[cindex].List[0].Pos()).Offset; or infinity
50 commentNewline bool // true if the comment group contains newlines
53 type printer struct {
54 // Configuration (does not change after initialization)
55 Config
56 fset *token.FileSet
58 // Current state
59 output []byte // raw printer result
60 indent int // current indentation
61 mode pmode // current printer mode
62 impliedSemi bool // if set, a linebreak implies a semicolon
63 lastTok token.Token // last token printed (token.ILLEGAL if it's whitespace)
64 prevOpen token.Token // previous non-brace "open" token (, [, or token.ILLEGAL
65 wsbuf []whiteSpace // delayed white space
67 // Positions
68 // The out position differs from the pos position when the result
69 // formatting differs from the source formatting (in the amount of
70 // white space). If there's a difference and SourcePos is set in
71 // ConfigMode, //line comments are used in the output to restore
72 // original source positions for a reader.
73 pos token.Position // current position in AST (source) space
74 out token.Position // current position in output space
75 last token.Position // value of pos after calling writeString
76 linePtr *int // if set, record out.Line for the next token in *linePtr
78 // The list of all source comments, in order of appearance.
79 comments []*ast.CommentGroup // may be nil
80 useNodeComments bool // if not set, ignore lead and line comments of nodes
82 // Information about p.comments[p.cindex]; set up by nextComment.
83 commentInfo
85 // Cache of already computed node sizes.
86 nodeSizes map[ast.Node]int
88 // Cache of most recently computed line position.
89 cachedPos token.Pos
90 cachedLine int // line corresponding to cachedPos
93 func (p *printer) init(cfg *Config, fset *token.FileSet, nodeSizes map[ast.Node]int) {
94 p.Config = *cfg
95 p.fset = fset
96 p.pos = token.Position{Line: 1, Column: 1}
97 p.out = token.Position{Line: 1, Column: 1}
98 p.wsbuf = make([]whiteSpace, 0, 16) // whitespace sequences are short
99 p.nodeSizes = nodeSizes
100 p.cachedPos = -1
103 func (p *printer) internalError(msg ...interface{}) {
104 if debug {
105 fmt.Print(p.pos.String() + ": ")
106 fmt.Println(msg...)
107 panic("go/printer")
111 // commentsHaveNewline reports whether a list of comments belonging to
112 // an *ast.CommentGroup contains newlines. Because the position information
113 // may only be partially correct, we also have to read the comment text.
114 func (p *printer) commentsHaveNewline(list []*ast.Comment) bool {
115 // len(list) > 0
116 line := p.lineFor(list[0].Pos())
117 for i, c := range list {
118 if i > 0 && p.lineFor(list[i].Pos()) != line {
119 // not all comments on the same line
120 return true
122 if t := c.Text; len(t) >= 2 && (t[1] == '/' || strings.Contains(t, "\n")) {
123 return true
126 _ = line
127 return false
130 func (p *printer) nextComment() {
131 for p.cindex < len(p.comments) {
132 c := p.comments[p.cindex]
133 p.cindex++
134 if list := c.List; len(list) > 0 {
135 p.comment = c
136 p.commentOffset = p.posFor(list[0].Pos()).Offset
137 p.commentNewline = p.commentsHaveNewline(list)
138 return
140 // we should not reach here (correct ASTs don't have empty
141 // ast.CommentGroup nodes), but be conservative and try again
143 // no more comments
144 p.commentOffset = infinity
147 // commentBefore returns true iff the current comment group occurs
148 // before the next position in the source code and printing it does
149 // not introduce implicit semicolons.
151 func (p *printer) commentBefore(next token.Position) bool {
152 return p.commentOffset < next.Offset && (!p.impliedSemi || !p.commentNewline)
155 // commentSizeBefore returns the estimated size of the
156 // comments on the same line before the next position.
158 func (p *printer) commentSizeBefore(next token.Position) int {
159 // save/restore current p.commentInfo (p.nextComment() modifies it)
160 defer func(info commentInfo) {
161 p.commentInfo = info
162 }(p.commentInfo)
164 size := 0
165 for p.commentBefore(next) {
166 for _, c := range p.comment.List {
167 size += len(c.Text)
169 p.nextComment()
171 return size
174 // recordLine records the output line number for the next non-whitespace
175 // token in *linePtr. It is used to compute an accurate line number for a
176 // formatted construct, independent of pending (not yet emitted) whitespace
177 // or comments.
179 func (p *printer) recordLine(linePtr *int) {
180 p.linePtr = linePtr
183 // linesFrom returns the number of output lines between the current
184 // output line and the line argument, ignoring any pending (not yet
185 // emitted) whitespace or comments. It is used to compute an accurate
186 // size (in number of lines) for a formatted construct.
188 func (p *printer) linesFrom(line int) int {
189 return p.out.Line - line
192 func (p *printer) posFor(pos token.Pos) token.Position {
193 // not used frequently enough to cache entire token.Position
194 return p.fset.Position(pos)
197 func (p *printer) lineFor(pos token.Pos) int {
198 if pos != p.cachedPos {
199 p.cachedPos = pos
200 p.cachedLine = p.fset.Position(pos).Line
202 return p.cachedLine
205 // atLineBegin emits a //line comment if necessary and prints indentation.
206 func (p *printer) atLineBegin(pos token.Position) {
207 // write a //line comment if necessary
208 if p.Config.Mode&SourcePos != 0 && pos.IsValid() && (p.out.Line != pos.Line || p.out.Filename != pos.Filename) {
209 p.output = append(p.output, tabwriter.Escape) // protect '\n' in //line from tabwriter interpretation
210 p.output = append(p.output, fmt.Sprintf("//line %s:%d\n", pos.Filename, pos.Line)...)
211 p.output = append(p.output, tabwriter.Escape)
212 // p.out must match the //line comment
213 p.out.Filename = pos.Filename
214 p.out.Line = pos.Line
217 // write indentation
218 // use "hard" htabs - indentation columns
219 // must not be discarded by the tabwriter
220 n := p.Config.Indent + p.indent // include base indentation
221 for i := 0; i < n; i++ {
222 p.output = append(p.output, '\t')
225 // update positions
226 p.pos.Offset += n
227 p.pos.Column += n
228 p.out.Column += n
231 // writeByte writes ch n times to p.output and updates p.pos.
232 func (p *printer) writeByte(ch byte, n int) {
233 if p.out.Column == 1 {
234 p.atLineBegin(p.pos)
237 for i := 0; i < n; i++ {
238 p.output = append(p.output, ch)
241 // update positions
242 p.pos.Offset += n
243 if ch == '\n' || ch == '\f' {
244 p.pos.Line += n
245 p.out.Line += n
246 p.pos.Column = 1
247 p.out.Column = 1
248 return
250 p.pos.Column += n
251 p.out.Column += n
254 // writeString writes the string s to p.output and updates p.pos, p.out,
255 // and p.last. If isLit is set, s is escaped w/ tabwriter.Escape characters
256 // to protect s from being interpreted by the tabwriter.
258 // Note: writeString is only used to write Go tokens, literals, and
259 // comments, all of which must be written literally. Thus, it is correct
260 // to always set isLit = true. However, setting it explicitly only when
261 // needed (i.e., when we don't know that s contains no tabs or line breaks)
262 // avoids processing extra escape characters and reduces run time of the
263 // printer benchmark by up to 10%.
265 func (p *printer) writeString(pos token.Position, s string, isLit bool) {
266 if p.out.Column == 1 {
267 p.atLineBegin(pos)
270 if pos.IsValid() {
271 // update p.pos (if pos is invalid, continue with existing p.pos)
272 // Note: Must do this after handling line beginnings because
273 // atLineBegin updates p.pos if there's indentation, but p.pos
274 // is the position of s.
275 p.pos = pos
278 if isLit {
279 // Protect s such that is passes through the tabwriter
280 // unchanged. Note that valid Go programs cannot contain
281 // tabwriter.Escape bytes since they do not appear in legal
282 // UTF-8 sequences.
283 p.output = append(p.output, tabwriter.Escape)
286 if debug {
287 p.output = append(p.output, fmt.Sprintf("/*%s*/", pos)...) // do not update p.pos!
289 p.output = append(p.output, s...)
291 // update positions
292 nlines := 0
293 var li int // index of last newline; valid if nlines > 0
294 for i := 0; i < len(s); i++ {
295 // Go tokens cannot contain '\f' - no need to look for it
296 if s[i] == '\n' {
297 nlines++
298 li = i
301 p.pos.Offset += len(s)
302 if nlines > 0 {
303 p.pos.Line += nlines
304 p.out.Line += nlines
305 c := len(s) - li
306 p.pos.Column = c
307 p.out.Column = c
308 } else {
309 p.pos.Column += len(s)
310 p.out.Column += len(s)
313 if isLit {
314 p.output = append(p.output, tabwriter.Escape)
317 p.last = p.pos
320 // writeCommentPrefix writes the whitespace before a comment.
321 // If there is any pending whitespace, it consumes as much of
322 // it as is likely to help position the comment nicely.
323 // pos is the comment position, next the position of the item
324 // after all pending comments, prev is the previous comment in
325 // a group of comments (or nil), and tok is the next token.
327 func (p *printer) writeCommentPrefix(pos, next token.Position, prev, comment *ast.Comment, tok token.Token) {
328 if len(p.output) == 0 {
329 // the comment is the first item to be printed - don't write any whitespace
330 return
333 if pos.IsValid() && pos.Filename != p.last.Filename {
334 // comment in a different file - separate with newlines
335 p.writeByte('\f', maxNewlines)
336 return
339 if pos.Line == p.last.Line && (prev == nil || prev.Text[1] != '/') {
340 // comment on the same line as last item:
341 // separate with at least one separator
342 hasSep := false
343 if prev == nil {
344 // first comment of a comment group
345 j := 0
346 for i, ch := range p.wsbuf {
347 switch ch {
348 case blank:
349 // ignore any blanks before a comment
350 p.wsbuf[i] = ignore
351 continue
352 case vtab:
353 // respect existing tabs - important
354 // for proper formatting of commented structs
355 hasSep = true
356 continue
357 case indent:
358 // apply pending indentation
359 continue
361 j = i
362 break
364 p.writeWhitespace(j)
366 // make sure there is at least one separator
367 if !hasSep {
368 sep := byte('\t')
369 if pos.Line == next.Line {
370 // next item is on the same line as the comment
371 // (which must be a /*-style comment): separate
372 // with a blank instead of a tab
373 sep = ' '
375 p.writeByte(sep, 1)
378 } else {
379 // comment on a different line:
380 // separate with at least one line break
381 droppedLinebreak := false
382 j := 0
383 for i, ch := range p.wsbuf {
384 switch ch {
385 case blank, vtab:
386 // ignore any horizontal whitespace before line breaks
387 p.wsbuf[i] = ignore
388 continue
389 case indent:
390 // apply pending indentation
391 continue
392 case unindent:
393 // if this is not the last unindent, apply it
394 // as it is (likely) belonging to the last
395 // construct (e.g., a multi-line expression list)
396 // and is not part of closing a block
397 if i+1 < len(p.wsbuf) && p.wsbuf[i+1] == unindent {
398 continue
400 // if the next token is not a closing }, apply the unindent
401 // if it appears that the comment is aligned with the
402 // token; otherwise assume the unindent is part of a
403 // closing block and stop (this scenario appears with
404 // comments before a case label where the comments
405 // apply to the next case instead of the current one)
406 if tok != token.RBRACE && pos.Column == next.Column {
407 continue
409 case newline, formfeed:
410 p.wsbuf[i] = ignore
411 droppedLinebreak = prev == nil // record only if first comment of a group
413 j = i
414 break
416 p.writeWhitespace(j)
418 // determine number of linebreaks before the comment
419 n := 0
420 if pos.IsValid() && p.last.IsValid() {
421 n = pos.Line - p.last.Line
422 if n < 0 { // should never happen
423 n = 0
427 // at the package scope level only (p.indent == 0),
428 // add an extra newline if we dropped one before:
429 // this preserves a blank line before documentation
430 // comments at the package scope level (issue 2570)
431 if p.indent == 0 && droppedLinebreak {
435 // make sure there is at least one line break
436 // if the previous comment was a line comment
437 if n == 0 && prev != nil && prev.Text[1] == '/' {
438 n = 1
441 if n > 0 {
442 // use formfeeds to break columns before a comment;
443 // this is analogous to using formfeeds to separate
444 // individual lines of /*-style comments
445 p.writeByte('\f', nlimit(n))
450 // Returns true if s contains only white space
451 // (only tabs and blanks can appear in the printer's context).
453 func isBlank(s string) bool {
454 for i := 0; i < len(s); i++ {
455 if s[i] > ' ' {
456 return false
459 return true
462 // commonPrefix returns the common prefix of a and b.
463 func commonPrefix(a, b string) string {
464 i := 0
465 for i < len(a) && i < len(b) && a[i] == b[i] && (a[i] <= ' ' || a[i] == '*') {
468 return a[0:i]
471 // trimRight returns s with trailing whitespace removed.
472 func trimRight(s string) string {
473 return strings.TrimRightFunc(s, unicode.IsSpace)
476 // stripCommonPrefix removes a common prefix from /*-style comment lines (unless no
477 // comment line is indented, all but the first line have some form of space prefix).
478 // The prefix is computed using heuristics such that is likely that the comment
479 // contents are nicely laid out after re-printing each line using the printer's
480 // current indentation.
482 func stripCommonPrefix(lines []string) {
483 if len(lines) <= 1 {
484 return // at most one line - nothing to do
486 // len(lines) > 1
488 // The heuristic in this function tries to handle a few
489 // common patterns of /*-style comments: Comments where
490 // the opening /* and closing */ are aligned and the
491 // rest of the comment text is aligned and indented with
492 // blanks or tabs, cases with a vertical "line of stars"
493 // on the left, and cases where the closing */ is on the
494 // same line as the last comment text.
496 // Compute maximum common white prefix of all but the first,
497 // last, and blank lines, and replace blank lines with empty
498 // lines (the first line starts with /* and has no prefix).
499 // In case of two-line comments, consider the last line for
500 // the prefix computation since otherwise the prefix would
501 // be empty.
503 // Note that the first and last line are never empty (they
504 // contain the opening /* and closing */ respectively) and
505 // thus they can be ignored by the blank line check.
506 var prefix string
507 if len(lines) > 2 {
508 first := true
509 for i, line := range lines[1 : len(lines)-1] {
510 switch {
511 case isBlank(line):
512 lines[1+i] = "" // range starts with lines[1]
513 case first:
514 prefix = commonPrefix(line, line)
515 first = false
516 default:
517 prefix = commonPrefix(prefix, line)
520 } else { // len(lines) == 2, lines cannot be blank (contain /* and */)
521 line := lines[1]
522 prefix = commonPrefix(line, line)
526 * Check for vertical "line of stars" and correct prefix accordingly.
528 lineOfStars := false
529 if i := strings.Index(prefix, "*"); i >= 0 {
530 // Line of stars present.
531 if i > 0 && prefix[i-1] == ' ' {
532 i-- // remove trailing blank from prefix so stars remain aligned
534 prefix = prefix[0:i]
535 lineOfStars = true
536 } else {
537 // No line of stars present.
538 // Determine the white space on the first line after the /*
539 // and before the beginning of the comment text, assume two
540 // blanks instead of the /* unless the first character after
541 // the /* is a tab. If the first comment line is empty but
542 // for the opening /*, assume up to 3 blanks or a tab. This
543 // whitespace may be found as suffix in the common prefix.
544 first := lines[0]
545 if isBlank(first[2:]) {
546 // no comment text on the first line:
547 // reduce prefix by up to 3 blanks or a tab
548 // if present - this keeps comment text indented
549 // relative to the /* and */'s if it was indented
550 // in the first place
551 i := len(prefix)
552 for n := 0; n < 3 && i > 0 && prefix[i-1] == ' '; n++ {
555 if i == len(prefix) && i > 0 && prefix[i-1] == '\t' {
558 prefix = prefix[0:i]
559 } else {
560 // comment text on the first line
561 suffix := make([]byte, len(first))
562 n := 2 // start after opening /*
563 for n < len(first) && first[n] <= ' ' {
564 suffix[n] = first[n]
567 if n > 2 && suffix[2] == '\t' {
568 // assume the '\t' compensates for the /*
569 suffix = suffix[2:n]
570 } else {
571 // otherwise assume two blanks
572 suffix[0], suffix[1] = ' ', ' '
573 suffix = suffix[0:n]
575 // Shorten the computed common prefix by the length of
576 // suffix, if it is found as suffix of the prefix.
577 prefix = strings.TrimSuffix(prefix, string(suffix))
581 // Handle last line: If it only contains a closing */, align it
582 // with the opening /*, otherwise align the text with the other
583 // lines.
584 last := lines[len(lines)-1]
585 closing := "*/"
586 i := strings.Index(last, closing) // i >= 0 (closing is always present)
587 if isBlank(last[0:i]) {
588 // last line only contains closing */
589 if lineOfStars {
590 closing = " */" // add blank to align final star
592 lines[len(lines)-1] = prefix + closing
593 } else {
594 // last line contains more comment text - assume
595 // it is aligned like the other lines and include
596 // in prefix computation
597 prefix = commonPrefix(prefix, last)
600 // Remove the common prefix from all but the first and empty lines.
601 for i, line := range lines {
602 if i > 0 && line != "" {
603 lines[i] = line[len(prefix):]
608 func (p *printer) writeComment(comment *ast.Comment) {
609 text := comment.Text
610 pos := p.posFor(comment.Pos())
612 const linePrefix = "//line "
613 if strings.HasPrefix(text, linePrefix) && (!pos.IsValid() || pos.Column == 1) {
614 // possibly a line directive
615 ldir := strings.TrimSpace(text[len(linePrefix):])
616 if i := strings.LastIndex(ldir, ":"); i >= 0 {
617 if line, err := strconv.Atoi(ldir[i+1:]); err == nil && line > 0 {
618 // The line directive we are about to print changed
619 // the Filename and Line number used for subsequent
620 // tokens. We have to update our AST-space position
621 // accordingly and suspend indentation temporarily.
622 indent := p.indent
623 p.indent = 0
624 defer func() {
625 p.pos.Filename = ldir[:i]
626 p.pos.Line = line
627 p.pos.Column = 1
628 p.indent = indent
634 // shortcut common case of //-style comments
635 if text[1] == '/' {
636 p.writeString(pos, trimRight(text), true)
637 return
640 // for /*-style comments, print line by line and let the
641 // write function take care of the proper indentation
642 lines := strings.Split(text, "\n")
644 // The comment started in the first column but is going
645 // to be indented. For an idempotent result, add indentation
646 // to all lines such that they look like they were indented
647 // before - this will make sure the common prefix computation
648 // is the same independent of how many times formatting is
649 // applied (was issue 1835).
650 if pos.IsValid() && pos.Column == 1 && p.indent > 0 {
651 for i, line := range lines[1:] {
652 lines[1+i] = " " + line
656 stripCommonPrefix(lines)
658 // write comment lines, separated by formfeed,
659 // without a line break after the last line
660 for i, line := range lines {
661 if i > 0 {
662 p.writeByte('\f', 1)
663 pos = p.pos
665 if len(line) > 0 {
666 p.writeString(pos, trimRight(line), true)
671 // writeCommentSuffix writes a line break after a comment if indicated
672 // and processes any leftover indentation information. If a line break
673 // is needed, the kind of break (newline vs formfeed) depends on the
674 // pending whitespace. The writeCommentSuffix result indicates if a
675 // newline was written or if a formfeed was dropped from the whitespace
676 // buffer.
678 func (p *printer) writeCommentSuffix(needsLinebreak bool) (wroteNewline, droppedFF bool) {
679 for i, ch := range p.wsbuf {
680 switch ch {
681 case blank, vtab:
682 // ignore trailing whitespace
683 p.wsbuf[i] = ignore
684 case indent, unindent:
685 // don't lose indentation information
686 case newline, formfeed:
687 // if we need a line break, keep exactly one
688 // but remember if we dropped any formfeeds
689 if needsLinebreak {
690 needsLinebreak = false
691 wroteNewline = true
692 } else {
693 if ch == formfeed {
694 droppedFF = true
696 p.wsbuf[i] = ignore
700 p.writeWhitespace(len(p.wsbuf))
702 // make sure we have a line break
703 if needsLinebreak {
704 p.writeByte('\n', 1)
705 wroteNewline = true
708 return
711 // intersperseComments consumes all comments that appear before the next token
712 // tok and prints it together with the buffered whitespace (i.e., the whitespace
713 // that needs to be written before the next token). A heuristic is used to mix
714 // the comments and whitespace. The intersperseComments result indicates if a
715 // newline was written or if a formfeed was dropped from the whitespace buffer.
717 func (p *printer) intersperseComments(next token.Position, tok token.Token) (wroteNewline, droppedFF bool) {
718 var last *ast.Comment
719 for p.commentBefore(next) {
720 for _, c := range p.comment.List {
721 p.writeCommentPrefix(p.posFor(c.Pos()), next, last, c, tok)
722 p.writeComment(c)
723 last = c
725 p.nextComment()
728 if last != nil {
729 // if the last comment is a /*-style comment and the next item
730 // follows on the same line but is not a comma, and not a "closing"
731 // token immediately following its corresponding "opening" token,
732 // add an extra blank for separation unless explicitly disabled
733 if p.mode&noExtraBlank == 0 &&
734 last.Text[1] == '*' && p.lineFor(last.Pos()) == next.Line &&
735 tok != token.COMMA &&
736 (tok != token.RPAREN || p.prevOpen == token.LPAREN) &&
737 (tok != token.RBRACK || p.prevOpen == token.LBRACK) {
738 p.writeByte(' ', 1)
740 // ensure that there is a line break after a //-style comment,
741 // before a closing '}' unless explicitly disabled, or at eof
742 needsLinebreak :=
743 last.Text[1] == '/' ||
744 tok == token.RBRACE && p.mode&noExtraLinebreak == 0 ||
745 tok == token.EOF
746 return p.writeCommentSuffix(needsLinebreak)
749 // no comment was written - we should never reach here since
750 // intersperseComments should not be called in that case
751 p.internalError("intersperseComments called without pending comments")
752 return
755 // whiteWhitespace writes the first n whitespace entries.
756 func (p *printer) writeWhitespace(n int) {
757 // write entries
758 for i := 0; i < n; i++ {
759 switch ch := p.wsbuf[i]; ch {
760 case ignore:
761 // ignore!
762 case indent:
763 p.indent++
764 case unindent:
765 p.indent--
766 if p.indent < 0 {
767 p.internalError("negative indentation:", p.indent)
768 p.indent = 0
770 case newline, formfeed:
771 // A line break immediately followed by a "correcting"
772 // unindent is swapped with the unindent - this permits
773 // proper label positioning. If a comment is between
774 // the line break and the label, the unindent is not
775 // part of the comment whitespace prefix and the comment
776 // will be positioned correctly indented.
777 if i+1 < n && p.wsbuf[i+1] == unindent {
778 // Use a formfeed to terminate the current section.
779 // Otherwise, a long label name on the next line leading
780 // to a wide column may increase the indentation column
781 // of lines before the label; effectively leading to wrong
782 // indentation.
783 p.wsbuf[i], p.wsbuf[i+1] = unindent, formfeed
784 i-- // do it again
785 continue
787 fallthrough
788 default:
789 p.writeByte(byte(ch), 1)
793 // shift remaining entries down
794 l := copy(p.wsbuf, p.wsbuf[n:])
795 p.wsbuf = p.wsbuf[:l]
798 // ----------------------------------------------------------------------------
799 // Printing interface
801 // nlines limits n to maxNewlines.
802 func nlimit(n int) int {
803 if n > maxNewlines {
804 n = maxNewlines
806 return n
809 func mayCombine(prev token.Token, next byte) (b bool) {
810 switch prev {
811 case token.INT:
812 b = next == '.' // 1.
813 case token.ADD:
814 b = next == '+' // ++
815 case token.SUB:
816 b = next == '-' // --
817 case token.QUO:
818 b = next == '*' // /*
819 case token.LSS:
820 b = next == '-' || next == '<' // <- or <<
821 case token.AND:
822 b = next == '&' || next == '^' // && or &^
824 return
827 // print prints a list of "items" (roughly corresponding to syntactic
828 // tokens, but also including whitespace and formatting information).
829 // It is the only print function that should be called directly from
830 // any of the AST printing functions in nodes.go.
832 // Whitespace is accumulated until a non-whitespace token appears. Any
833 // comments that need to appear before that token are printed first,
834 // taking into account the amount and structure of any pending white-
835 // space for best comment placement. Then, any leftover whitespace is
836 // printed, followed by the actual token.
838 func (p *printer) print(args ...interface{}) {
839 for _, arg := range args {
840 // information about the current arg
841 var data string
842 var isLit bool
843 var impliedSemi bool // value for p.impliedSemi after this arg
845 // record previous opening token, if any
846 switch p.lastTok {
847 case token.ILLEGAL:
848 // ignore (white space)
849 case token.LPAREN, token.LBRACK:
850 p.prevOpen = p.lastTok
851 default:
852 // other tokens followed any opening token
853 p.prevOpen = token.ILLEGAL
856 switch x := arg.(type) {
857 case pmode:
858 // toggle printer mode
859 p.mode ^= x
860 continue
862 case whiteSpace:
863 if x == ignore {
864 // don't add ignore's to the buffer; they
865 // may screw up "correcting" unindents (see
866 // LabeledStmt)
867 continue
869 i := len(p.wsbuf)
870 if i == cap(p.wsbuf) {
871 // Whitespace sequences are very short so this should
872 // never happen. Handle gracefully (but possibly with
873 // bad comment placement) if it does happen.
874 p.writeWhitespace(i)
875 i = 0
877 p.wsbuf = p.wsbuf[0 : i+1]
878 p.wsbuf[i] = x
879 if x == newline || x == formfeed {
880 // newlines affect the current state (p.impliedSemi)
881 // and not the state after printing arg (impliedSemi)
882 // because comments can be interspersed before the arg
883 // in this case
884 p.impliedSemi = false
886 p.lastTok = token.ILLEGAL
887 continue
889 case *ast.Ident:
890 data = x.Name
891 impliedSemi = true
892 p.lastTok = token.IDENT
894 case *ast.BasicLit:
895 data = x.Value
896 isLit = true
897 impliedSemi = true
898 p.lastTok = x.Kind
900 case token.Token:
901 s := x.String()
902 if mayCombine(p.lastTok, s[0]) {
903 // the previous and the current token must be
904 // separated by a blank otherwise they combine
905 // into a different incorrect token sequence
906 // (except for token.INT followed by a '.' this
907 // should never happen because it is taken care
908 // of via binary expression formatting)
909 if len(p.wsbuf) != 0 {
910 p.internalError("whitespace buffer not empty")
912 p.wsbuf = p.wsbuf[0:1]
913 p.wsbuf[0] = ' '
915 data = s
916 // some keywords followed by a newline imply a semicolon
917 switch x {
918 case token.BREAK, token.CONTINUE, token.FALLTHROUGH, token.RETURN,
919 token.INC, token.DEC, token.RPAREN, token.RBRACK, token.RBRACE:
920 impliedSemi = true
922 p.lastTok = x
924 case token.Pos:
925 if x.IsValid() {
926 p.pos = p.posFor(x) // accurate position of next item
928 continue
930 case string:
931 // incorrect AST - print error message
932 data = x
933 isLit = true
934 impliedSemi = true
935 p.lastTok = token.STRING
937 default:
938 fmt.Fprintf(os.Stderr, "print: unsupported argument %v (%T)\n", arg, arg)
939 panic("go/printer type")
941 // data != ""
943 next := p.pos // estimated/accurate position of next item
944 wroteNewline, droppedFF := p.flush(next, p.lastTok)
946 // intersperse extra newlines if present in the source and
947 // if they don't cause extra semicolons (don't do this in
948 // flush as it will cause extra newlines at the end of a file)
949 if !p.impliedSemi {
950 n := nlimit(next.Line - p.pos.Line)
951 // don't exceed maxNewlines if we already wrote one
952 if wroteNewline && n == maxNewlines {
953 n = maxNewlines - 1
955 if n > 0 {
956 ch := byte('\n')
957 if droppedFF {
958 ch = '\f' // use formfeed since we dropped one before
960 p.writeByte(ch, n)
961 impliedSemi = false
965 // the next token starts now - record its line number if requested
966 if p.linePtr != nil {
967 *p.linePtr = p.out.Line
968 p.linePtr = nil
971 p.writeString(next, data, isLit)
972 p.impliedSemi = impliedSemi
976 // flush prints any pending comments and whitespace occurring textually
977 // before the position of the next token tok. The flush result indicates
978 // if a newline was written or if a formfeed was dropped from the whitespace
979 // buffer.
981 func (p *printer) flush(next token.Position, tok token.Token) (wroteNewline, droppedFF bool) {
982 if p.commentBefore(next) {
983 // if there are comments before the next item, intersperse them
984 wroteNewline, droppedFF = p.intersperseComments(next, tok)
985 } else {
986 // otherwise, write any leftover whitespace
987 p.writeWhitespace(len(p.wsbuf))
989 return
992 // getNode returns the ast.CommentGroup associated with n, if any.
993 func getDoc(n ast.Node) *ast.CommentGroup {
994 switch n := n.(type) {
995 case *ast.Field:
996 return n.Doc
997 case *ast.ImportSpec:
998 return n.Doc
999 case *ast.ValueSpec:
1000 return n.Doc
1001 case *ast.TypeSpec:
1002 return n.Doc
1003 case *ast.GenDecl:
1004 return n.Doc
1005 case *ast.FuncDecl:
1006 return n.Doc
1007 case *ast.File:
1008 return n.Doc
1010 return nil
1013 func (p *printer) printNode(node interface{}) error {
1014 // unpack *CommentedNode, if any
1015 var comments []*ast.CommentGroup
1016 if cnode, ok := node.(*CommentedNode); ok {
1017 node = cnode.Node
1018 comments = cnode.Comments
1021 if comments != nil {
1022 // commented node - restrict comment list to relevant range
1023 n, ok := node.(ast.Node)
1024 if !ok {
1025 goto unsupported
1027 beg := n.Pos()
1028 end := n.End()
1029 // if the node has associated documentation,
1030 // include that commentgroup in the range
1031 // (the comment list is sorted in the order
1032 // of the comment appearance in the source code)
1033 if doc := getDoc(n); doc != nil {
1034 beg = doc.Pos()
1036 // token.Pos values are global offsets, we can
1037 // compare them directly
1038 i := 0
1039 for i < len(comments) && comments[i].End() < beg {
1042 j := i
1043 for j < len(comments) && comments[j].Pos() < end {
1046 if i < j {
1047 p.comments = comments[i:j]
1049 } else if n, ok := node.(*ast.File); ok {
1050 // use ast.File comments, if any
1051 p.comments = n.Comments
1054 // if there are no comments, use node comments
1055 p.useNodeComments = p.comments == nil
1057 // get comments ready for use
1058 p.nextComment()
1060 // format node
1061 switch n := node.(type) {
1062 case ast.Expr:
1063 p.expr(n)
1064 case ast.Stmt:
1065 // A labeled statement will un-indent to position the label.
1066 // Set p.indent to 1 so we don't get indent "underflow".
1067 if _, ok := n.(*ast.LabeledStmt); ok {
1068 p.indent = 1
1070 p.stmt(n, false)
1071 case ast.Decl:
1072 p.decl(n)
1073 case ast.Spec:
1074 p.spec(n, 1, false)
1075 case []ast.Stmt:
1076 // A labeled statement will un-indent to position the label.
1077 // Set p.indent to 1 so we don't get indent "underflow".
1078 for _, s := range n {
1079 if _, ok := s.(*ast.LabeledStmt); ok {
1080 p.indent = 1
1083 p.stmtList(n, 0, false)
1084 case []ast.Decl:
1085 p.declList(n)
1086 case *ast.File:
1087 p.file(n)
1088 default:
1089 goto unsupported
1092 return nil
1094 unsupported:
1095 return fmt.Errorf("go/printer: unsupported node type %T", node)
1098 // ----------------------------------------------------------------------------
1099 // Trimmer
1101 // A trimmer is an io.Writer filter for stripping tabwriter.Escape
1102 // characters, trailing blanks and tabs, and for converting formfeed
1103 // and vtab characters into newlines and htabs (in case no tabwriter
1104 // is used). Text bracketed by tabwriter.Escape characters is passed
1105 // through unchanged.
1107 type trimmer struct {
1108 output io.Writer
1109 state int
1110 space []byte
1113 // trimmer is implemented as a state machine.
1114 // It can be in one of the following states:
1115 const (
1116 inSpace = iota // inside space
1117 inEscape // inside text bracketed by tabwriter.Escapes
1118 inText // inside text
1121 func (p *trimmer) resetSpace() {
1122 p.state = inSpace
1123 p.space = p.space[0:0]
1126 // Design note: It is tempting to eliminate extra blanks occurring in
1127 // whitespace in this function as it could simplify some
1128 // of the blanks logic in the node printing functions.
1129 // However, this would mess up any formatting done by
1130 // the tabwriter.
1132 var aNewline = []byte("\n")
1134 func (p *trimmer) Write(data []byte) (n int, err error) {
1135 // invariants:
1136 // p.state == inSpace:
1137 // p.space is unwritten
1138 // p.state == inEscape, inText:
1139 // data[m:n] is unwritten
1140 m := 0
1141 var b byte
1142 for n, b = range data {
1143 if b == '\v' {
1144 b = '\t' // convert to htab
1146 switch p.state {
1147 case inSpace:
1148 switch b {
1149 case '\t', ' ':
1150 p.space = append(p.space, b)
1151 case '\n', '\f':
1152 p.resetSpace() // discard trailing space
1153 _, err = p.output.Write(aNewline)
1154 case tabwriter.Escape:
1155 _, err = p.output.Write(p.space)
1156 p.state = inEscape
1157 m = n + 1 // +1: skip tabwriter.Escape
1158 default:
1159 _, err = p.output.Write(p.space)
1160 p.state = inText
1161 m = n
1163 case inEscape:
1164 if b == tabwriter.Escape {
1165 _, err = p.output.Write(data[m:n])
1166 p.resetSpace()
1168 case inText:
1169 switch b {
1170 case '\t', ' ':
1171 _, err = p.output.Write(data[m:n])
1172 p.resetSpace()
1173 p.space = append(p.space, b)
1174 case '\n', '\f':
1175 _, err = p.output.Write(data[m:n])
1176 p.resetSpace()
1177 _, err = p.output.Write(aNewline)
1178 case tabwriter.Escape:
1179 _, err = p.output.Write(data[m:n])
1180 p.state = inEscape
1181 m = n + 1 // +1: skip tabwriter.Escape
1183 default:
1184 panic("unreachable")
1186 if err != nil {
1187 return
1190 n = len(data)
1192 switch p.state {
1193 case inEscape, inText:
1194 _, err = p.output.Write(data[m:n])
1195 p.resetSpace()
1198 return
1201 // ----------------------------------------------------------------------------
1202 // Public interface
1204 // A Mode value is a set of flags (or 0). They control printing.
1205 type Mode uint
1207 const (
1208 RawFormat Mode = 1 << iota // do not use a tabwriter; if set, UseSpaces is ignored
1209 TabIndent // use tabs for indentation independent of UseSpaces
1210 UseSpaces // use spaces instead of tabs for alignment
1211 SourcePos // emit //line comments to preserve original source positions
1214 // A Config node controls the output of Fprint.
1215 type Config struct {
1216 Mode Mode // default: 0
1217 Tabwidth int // default: 8
1218 Indent int // default: 0 (all code is indented at least by this much)
1221 // fprint implements Fprint and takes a nodesSizes map for setting up the printer state.
1222 func (cfg *Config) fprint(output io.Writer, fset *token.FileSet, node interface{}, nodeSizes map[ast.Node]int) (err error) {
1223 // print node
1224 var p printer
1225 p.init(cfg, fset, nodeSizes)
1226 if err = p.printNode(node); err != nil {
1227 return
1229 // print outstanding comments
1230 p.impliedSemi = false // EOF acts like a newline
1231 p.flush(token.Position{Offset: infinity, Line: infinity}, token.EOF)
1233 // redirect output through a trimmer to eliminate trailing whitespace
1234 // (Input to a tabwriter must be untrimmed since trailing tabs provide
1235 // formatting information. The tabwriter could provide trimming
1236 // functionality but no tabwriter is used when RawFormat is set.)
1237 output = &trimmer{output: output}
1239 // redirect output through a tabwriter if necessary
1240 if cfg.Mode&RawFormat == 0 {
1241 minwidth := cfg.Tabwidth
1243 padchar := byte('\t')
1244 if cfg.Mode&UseSpaces != 0 {
1245 padchar = ' '
1248 twmode := tabwriter.DiscardEmptyColumns
1249 if cfg.Mode&TabIndent != 0 {
1250 minwidth = 0
1251 twmode |= tabwriter.TabIndent
1254 output = tabwriter.NewWriter(output, minwidth, cfg.Tabwidth, 1, padchar, twmode)
1257 // write printer result via tabwriter/trimmer to output
1258 if _, err = output.Write(p.output); err != nil {
1259 return
1262 // flush tabwriter, if any
1263 if tw, _ := output.(*tabwriter.Writer); tw != nil {
1264 err = tw.Flush()
1267 return
1270 // A CommentedNode bundles an AST node and corresponding comments.
1271 // It may be provided as argument to any of the Fprint functions.
1273 type CommentedNode struct {
1274 Node interface{} // *ast.File, or ast.Expr, ast.Decl, ast.Spec, or ast.Stmt
1275 Comments []*ast.CommentGroup
1278 // Fprint "pretty-prints" an AST node to output for a given configuration cfg.
1279 // Position information is interpreted relative to the file set fset.
1280 // The node type must be *ast.File, *CommentedNode, []ast.Decl, []ast.Stmt,
1281 // or assignment-compatible to ast.Expr, ast.Decl, ast.Spec, or ast.Stmt.
1283 func (cfg *Config) Fprint(output io.Writer, fset *token.FileSet, node interface{}) error {
1284 return cfg.fprint(output, fset, node, make(map[ast.Node]int))
1287 // Fprint "pretty-prints" an AST node to output.
1288 // It calls Config.Fprint with default settings.
1290 func Fprint(output io.Writer, fset *token.FileSet, node interface{}) error {
1291 return (&Config{Tabwidth: 8}).Fprint(output, fset, node)