libgo/go/go/printer/printer.go

   1 // Copyright 2009 The Go Authors. All rights reserved.
   2 // Use of this source code is governed by a BSD-style
   3 // license that can be found in the LICENSE file.
   4
   5 // Package printer implements printing of AST nodes.
   6 package printer
   7
   8 import (
   9         "fmt"
  10         "go/ast"
  11         "go/token"
  12         "io"
  13         "os"
  14         "strconv"
  15         "strings"
  16         "text/tabwriter"
  17         "unicode"
  18 )
  19
const (
	maxNewlines = 2       // max. number of newlines between source text
	debug       = false   // enable for debugging
	infinity    = 1 << 30 // comment offset used when there are no more comments
)
  25
// whiteSpace is the element type of the printer's delayed white space
// buffer (printer.wsbuf). A value is either a literal white space byte
// or one of the non-printing markers ignore, indent, and unindent.
type whiteSpace byte

const (
	ignore   = whiteSpace(0)    // cancelled entry; buffered white space is overwritten with ignore to drop it
	blank    = whiteSpace(' ')  // blank
	vtab     = whiteSpace('\v') // vertical tab; counts as an existing separator before a comment
	newline  = whiteSpace('\n') // line break
	formfeed = whiteSpace('\f') // line break; also used to break columns before comments
	indent   = whiteSpace('>')  // pending indentation
	unindent = whiteSpace('<')  // pending unindentation
)
  37
// A pmode value represents the current printer mode.
// The individual modes are bit flags: they are kept in printer.mode
// and tested with a bitwise AND (for instance p.mode&noExtraBlank).
type pmode int

const (
	noExtraBlank     pmode = 1 << iota // disables extra blank after /*-style comment
	noExtraLinebreak                   // disables extra line break after /*-style comment
)
  45
// commentInfo describes the comment group the printer is currently
// looking at. It is embedded in printer, set up by nextComment, and
// saved/restored as a unit by commentSizeBefore.
type commentInfo struct {
	cindex         int               // current comment index
	comment        *ast.CommentGroup // = printer.comments[cindex]; or nil
	commentOffset  int               // = printer.posFor(printer.comments[cindex].List[0].Pos()).Offset; or infinity
	commentNewline bool              // true if the comment group contains newlines
}
  52
// printer holds the configuration and the mutable state used while
// printing: the raw output produced so far, pending white space, the
// source and output positions, and the comments still to be printed.
type printer struct {
	// Configuration (does not change after initialization)
	Config
	fset *token.FileSet

	// Current state
	output      []byte       // raw printer result
	indent      int          // current indentation
	mode        pmode        // current printer mode
	impliedSemi bool         // if set, a linebreak implies a semicolon
	lastTok     token.Token  // last token printed (token.ILLEGAL if it's whitespace)
	prevOpen    token.Token  // previous non-brace "open" token: (, [, or token.ILLEGAL
	wsbuf       []whiteSpace // delayed white space

	// Positions
	// The out position differs from the pos position when the result
	// formatting differs from the source formatting (in the amount of
	// white space). If there's a difference and SourcePos is set in
	// Config.Mode, //line comments are used in the output to restore
	// original source positions for a reader.
	pos     token.Position // current position in AST (source) space
	out     token.Position // current position in output space
	last    token.Position // value of pos after calling writeString
	linePtr *int           // if set, record out.Line for the next token in *linePtr

	// The list of all source comments, in order of appearance.
	comments        []*ast.CommentGroup // may be nil
	useNodeComments bool                // if not set, ignore lead and line comments of nodes

	// Information about p.comments[p.cindex]; set up by nextComment.
	commentInfo

	// Cache of already computed node sizes.
	nodeSizes map[ast.Node]int

	// Cache of most recently computed line position.
	cachedPos  token.Pos // position of the last lineFor lookup; init sets it to -1
	cachedLine int       // line corresponding to cachedPos
}
  92
  93 func (p *printer) init(cfg *Config, fset *token.FileSet, nodeSizes map[ast.Node]int) {
  94         p.Config = *cfg
  95         p.fset = fset
  96         p.pos = token.Position{Line: 1, Column: 1}
  97         p.out = token.Position{Line: 1, Column: 1}
  98         p.wsbuf = make([]whiteSpace, 0, 16) // whitespace sequences are short
  99         p.nodeSizes = nodeSizes
 100         p.cachedPos = -1
 101 }
 102
 103 func (p *printer) internalError(msg ...interface{}) {
 104         if debug {
 105                 fmt.Print(p.pos.String() + ": ")
 106                 fmt.Println(msg...)
 107                 panic("go/printer")
 108         }
 109 }
 110
 111 // commentsHaveNewline reports whether a list of comments belonging to
 112 // an *ast.CommentGroup contains newlines. Because the position information
 113 // may only be partially correct, we also have to read the comment text.
 114 func (p *printer) commentsHaveNewline(list []*ast.Comment) bool {
 115         // len(list) > 0
 116         line := p.lineFor(list[0].Pos())
 117         for i, c := range list {
 118                 if i > 0 && p.lineFor(list[i].Pos()) != line {
 119                         // not all comments on the same line
 120                         return true
 121                 }
 122                 if t := c.Text; len(t) >= 2 && (t[1] == '/' || strings.Contains(t, "\n")) {
 123                         return true
 124                 }
 125         }
 126         _ = line
 127         return false
 128 }
 129
 130 func (p *printer) nextComment() {
 131         for p.cindex < len(p.comments) {
 132                 c := p.comments[p.cindex]
 133                 p.cindex++
 134                 if list := c.List; len(list) > 0 {
 135                         p.comment = c
 136                         p.commentOffset = p.posFor(list[0].Pos()).Offset
 137                         p.commentNewline = p.commentsHaveNewline(list)
 138                         return
 139                 }
 140                 // we should not reach here (correct ASTs don't have empty
 141                 // ast.CommentGroup nodes), but be conservative and try again
 142         }
 143         // no more comments
 144         p.commentOffset = infinity
 145 }
 146
 147 // commentBefore returns true iff the current comment group occurs
 148 // before the next position in the source code and printing it does
 149 // not introduce implicit semicolons.
 150 //
 151 func (p *printer) commentBefore(next token.Position) bool {
 152         return p.commentOffset < next.Offset && (!p.impliedSemi || !p.commentNewline)
 153 }
 154
 155 // commentSizeBefore returns the estimated size of the
 156 // comments on the same line before the next position.
 157 //
 158 func (p *printer) commentSizeBefore(next token.Position) int {
 159         // save/restore current p.commentInfo (p.nextComment() modifies it)
 160         defer func(info commentInfo) {
 161                 p.commentInfo = info
 162         }(p.commentInfo)
 163
 164         size := 0
 165         for p.commentBefore(next) {
 166                 for _, c := range p.comment.List {
 167                         size += len(c.Text)
 168                 }
 169                 p.nextComment()
 170         }
 171         return size
 172 }
 173
// recordLine records the output line number for the next non-whitespace
// token in *linePtr. It is used to compute an accurate line number for a
// formatted construct, independent of pending (not yet emitted) whitespace
// or comments.
//
// This function only stores linePtr in p.linePtr; the line number itself
// is written later by code outside this function.
//
func (p *printer) recordLine(linePtr *int) {
	p.linePtr = linePtr
}
 182
// linesFrom returns the number of output lines between the current
// output line and the line argument, ignoring any pending (not yet
// emitted) whitespace or comments. It is used to compute an accurate
// size (in number of lines) for a formatted construct.
//
// The result is p.out.Line - line.
//
func (p *printer) linesFrom(line int) int {
	return p.out.Line - line
}
 191
// posFor returns the token.Position that the printer's file set
// reports for pos. The result is not cached (see lineFor for a
// cached line lookup).
func (p *printer) posFor(pos token.Pos) token.Position {
	// not used frequently enough to cache entire token.Position
	return p.fset.Position(pos)
}
 196
 197 func (p *printer) lineFor(pos token.Pos) int {
 198         if pos != p.cachedPos {
 199                 p.cachedPos = pos
 200                 p.cachedLine = p.fset.Position(pos).Line
 201         }
 202         return p.cachedLine
 203 }
 204
 205 // atLineBegin emits a //line comment if necessary and prints indentation.
 206 func (p *printer) atLineBegin(pos token.Position) {
 207         // write a //line comment if necessary
 208         if p.Config.Mode&SourcePos != 0 && pos.IsValid() && (p.out.Line != pos.Line || p.out.Filename != pos.Filename) {
 209                 p.output = append(p.output, tabwriter.Escape) // protect '\n' in //line from tabwriter interpretation
 210                 p.output = append(p.output, fmt.Sprintf("//line %s:%d\n", pos.Filename, pos.Line)...)
 211                 p.output = append(p.output, tabwriter.Escape)
 212                 // p.out must match the //line comment
 213                 p.out.Filename = pos.Filename
 214                 p.out.Line = pos.Line
 215         }
 216
 217         // write indentation
 218         // use "hard" htabs - indentation columns
 219         // must not be discarded by the tabwriter
 220         n := p.Config.Indent + p.indent // include base indentation
 221         for i := 0; i < n; i++ {
 222                 p.output = append(p.output, '\t')
 223         }
 224
 225         // update positions
 226         p.pos.Offset += n
 227         p.pos.Column += n
 228         p.out.Column += n
 229 }
 230
 231 // writeByte writes ch n times to p.output and updates p.pos.
 232 func (p *printer) writeByte(ch byte, n int) {
 233         if p.out.Column == 1 {
 234                 p.atLineBegin(p.pos)
 235         }
 236
 237         for i := 0; i < n; i++ {
 238                 p.output = append(p.output, ch)
 239         }
 240
 241         // update positions
 242         p.pos.Offset += n
 243         if ch == '\n' || ch == '\f' {
 244                 p.pos.Line += n
 245                 p.out.Line += n
 246                 p.pos.Column = 1
 247                 p.out.Column = 1
 248                 return
 249         }
 250         p.pos.Column += n
 251         p.out.Column += n
 252 }
 253
 254 // writeString writes the string s to p.output and updates p.pos, p.out,
 255 // and p.last. If isLit is set, s is escaped w/ tabwriter.Escape characters
 256 // to protect s from being interpreted by the tabwriter.
 257 //
 258 // Note: writeString is only used to write Go tokens, literals, and
 259 // comments, all of which must be written literally. Thus, it is correct
 260 // to always set isLit = true. However, setting it explicitly only when
 261 // needed (i.e., when we don't know that s contains no tabs or line breaks)
 262 // avoids processing extra escape characters and reduces run time of the
 263 // printer benchmark by up to 10%.
 264 //
 265 func (p *printer) writeString(pos token.Position, s string, isLit bool) {
 266         if p.out.Column == 1 {
 267                 p.atLineBegin(pos)
 268         }
 269
 270         if pos.IsValid() {
 271                 // update p.pos (if pos is invalid, continue with existing p.pos)
 272                 // Note: Must do this after handling line beginnings because
 273                 // atLineBegin updates p.pos if there's indentation, but p.pos
 274                 // is the position of s.
 275                 p.pos = pos
 276         }
 277
 278         if isLit {
 279                 // Protect s such that is passes through the tabwriter
 280                 // unchanged. Note that valid Go programs cannot contain
 281                 // tabwriter.Escape bytes since they do not appear in legal
 282                 // UTF-8 sequences.
 283                 p.output = append(p.output, tabwriter.Escape)
 284         }
 285
 286         if debug {
 287                 p.output = append(p.output, fmt.Sprintf("/*%s*/", pos)...) // do not update p.pos!
 288         }
 289         p.output = append(p.output, s...)
 290
 291         // update positions
 292         nlines := 0
 293         var li int // index of last newline; valid if nlines > 0
 294         for i := 0; i < len(s); i++ {
 295                 // Go tokens cannot contain '\f' - no need to look for it
 296                 if s[i] == '\n' {
 297                         nlines++
 298                         li = i
 299                 }
 300         }
 301         p.pos.Offset += len(s)
 302         if nlines > 0 {
 303                 p.pos.Line += nlines
 304                 p.out.Line += nlines
 305                 c := len(s) - li
 306                 p.pos.Column = c
 307                 p.out.Column = c
 308         } else {
 309                 p.pos.Column += len(s)
 310                 p.out.Column += len(s)
 311         }
 312
 313         if isLit {
 314                 p.output = append(p.output, tabwriter.Escape)
 315         }
 316
 317         p.last = p.pos
 318 }
 319
// writeCommentPrefix writes the whitespace before a comment.
// If there is any pending whitespace, it consumes as much of
// it as is likely to help position the comment nicely.
// pos is the comment position, next the position of the item
// after all pending comments, prev is the previous comment in
// a group of comments (or nil), and tok is the next token.
// The comment parameter is not read by this function.
//
// Two cases are distinguished: the comment continues the line of the
// last written item (it is then separated by a tab or a blank), or it
// starts on a different line (it is then separated by line breaks).
//
func (p *printer) writeCommentPrefix(pos, next token.Position, prev, comment *ast.Comment, tok token.Token) {
	if len(p.output) == 0 {
		// the comment is the first item to be printed - don't write any whitespace
		return
	}

	if pos.IsValid() && pos.Filename != p.last.Filename {
		// comment in a different file - separate with newlines
		p.writeByte('\f', maxNewlines)
		return
	}

	if pos.Line == p.last.Line && (prev == nil || prev.Text[1] != '/') {
		// comment on the same line as last item:
		// separate with at least one separator
		hasSep := false
		if prev == nil {
			// first comment of a comment group
			//
			// Scan the pending whitespace: entries handled by a case
			// below "continue" the loop; the first entry not handled
			// ends the scan (the break after the switch leaves the
			// for loop) and j is set to its index.
			j := 0
			for i, ch := range p.wsbuf {
				switch ch {
				case blank:
					// ignore any blanks before a comment
					p.wsbuf[i] = ignore
					continue
				case vtab:
					// respect existing tabs - important
					// for proper formatting of commented structs
					hasSep = true
					continue
				case indent:
					// apply pending indentation
					continue
				}
				j = i
				break
			}
			p.writeWhitespace(j)
		}
		// make sure there is at least one separator
		if !hasSep {
			sep := byte('\t')
			if pos.Line == next.Line {
				// next item is on the same line as the comment
				// (which must be a /*-style comment): separate
				// with a blank instead of a tab
				sep = ' '
			}
			p.writeByte(sep, 1)
		}

	} else {
		// comment on a different line:
		// separate with at least one line break
		droppedLinebreak := false
		// Same scanning scheme as in the same-line case: "continue"
		// keeps scanning, falling out of the switch stops at index i.
		j := 0
		for i, ch := range p.wsbuf {
			switch ch {
			case blank, vtab:
				// ignore any horizontal whitespace before line breaks
				p.wsbuf[i] = ignore
				continue
			case indent:
				// apply pending indentation
				continue
			case unindent:
				// if this is not the last unindent, apply it
				// as it is (likely) belonging to the last
				// construct (e.g., a multi-line expression list)
				// and is not part of closing a block
				if i+1 < len(p.wsbuf) && p.wsbuf[i+1] == unindent {
					continue
				}
				// if the next token is not a closing }, apply the unindent
				// if it appears that the comment is aligned with the
				// token; otherwise assume the unindent is part of a
				// closing block and stop (this scenario appears with
				// comments before a case label where the comments
				// apply to the next case instead of the current one)
				if tok != token.RBRACE && pos.Column == next.Column {
					continue
				}
			case newline, formfeed:
				// drop the first pending line break; the number of
				// line breaks to write is computed from the positions below
				p.wsbuf[i] = ignore
				droppedLinebreak = prev == nil // record only if first comment of a group
			}
			j = i
			break
		}
		p.writeWhitespace(j)

		// determine number of linebreaks before the comment
		n := 0
		if pos.IsValid() && p.last.IsValid() {
			n = pos.Line - p.last.Line
			if n < 0 { // should never happen
				n = 0
			}
		}

		// at the package scope level only (p.indent == 0),
		// add an extra newline if we dropped one before:
		// this preserves a blank line before documentation
		// comments at the package scope level (issue 2570)
		if p.indent == 0 && droppedLinebreak {
			n++
		}

		// make sure there is at least one line break
		// if the previous comment was a line comment
		if n == 0 && prev != nil && prev.Text[1] == '/' {
			n = 1
		}

		if n > 0 {
			// use formfeeds to break columns before a comment;
			// this is analogous to using formfeeds to separate
			// individual lines of /*-style comments
			// NOTE(review): nlimit is defined outside this view;
			// presumably it caps n at maxNewlines - confirm.
			p.writeByte('\f', nlimit(n))
		}
	}
}
 449
 450 // Returns true if s contains only white space
 451 // (only tabs and blanks can appear in the printer's context).
 452 //
 453 func isBlank(s string) bool {
 454         for i := 0; i < len(s); i++ {
 455                 if s[i] > ' ' {
 456                         return false
 457                 }
 458         }
 459         return true
 460 }
 461
 462 // commonPrefix returns the common prefix of a and b.
 463 func commonPrefix(a, b string) string {
 464         i := 0
 465         for i < len(a) && i < len(b) && a[i] == b[i] && (a[i] <= ' ' || a[i] == '*') {
 466                 i++
 467         }
 468         return a[0:i]
 469 }
 470
// trimRight returns s with trailing whitespace removed.
// Whitespace is whatever unicode.IsSpace reports as space.
func trimRight(s string) string {
	return strings.TrimRightFunc(s, unicode.IsSpace)
}
 475
// stripCommonPrefix removes a common prefix from /*-style comment lines (unless no
// comment line is indented, all but the first line have some form of space prefix).
// The prefix is computed using heuristics such that it is likely that the comment
// contents are nicely laid out after re-printing each line using the printer's
// current indentation.
//
// lines holds the comment text split into lines and is modified in place:
// blank interior lines are replaced by empty strings, the prefix is cut off
// all non-empty lines but the first, and a last line that holds only the
// closing */ is rewritten so that it aligns with the opening /*.
//
func stripCommonPrefix(lines []string) {
	if len(lines) <= 1 {
		return // at most one line - nothing to do
	}
	// len(lines) > 1

	// The heuristic in this function tries to handle a few
	// common patterns of /*-style comments: Comments where
	// the opening /* and closing */ are aligned and the
	// rest of the comment text is aligned and indented with
	// blanks or tabs, cases with a vertical "line of stars"
	// on the left, and cases where the closing */ is on the
	// same line as the last comment text.

	// Compute maximum common white prefix of all but the first,
	// last, and blank lines, and replace blank lines with empty
	// lines (the first line starts with /* and has no prefix).
	// In case of two-line comments, consider the last line for
	// the prefix computation since otherwise the prefix would
	// be empty.
	//
	// Note that the first and last line are never empty (they
	// contain the opening /* and closing */ respectively) and
	// thus they can be ignored by the blank line check.
	var prefix string
	if len(lines) > 2 {
		first := true
		for i, line := range lines[1 : len(lines)-1] {
			switch {
			case isBlank(line):
				lines[1+i] = "" // range starts with lines[1]
			case first:
				// commonPrefix(line, line) yields the leading run of
				// white space and '*' characters of line
				prefix = commonPrefix(line, line)
				first = false
			default:
				prefix = commonPrefix(prefix, line)
			}
		}
	} else { // len(lines) == 2, lines cannot be blank (contain /* and */)
		line := lines[1]
		prefix = commonPrefix(line, line)
	}

	/*
	 * Check for vertical "line of stars" and correct prefix accordingly.
	 */
	lineOfStars := false
	if i := strings.Index(prefix, "*"); i >= 0 {
		// Line of stars present.
		if i > 0 && prefix[i-1] == ' ' {
			i-- // remove trailing blank from prefix so stars remain aligned
		}
		prefix = prefix[0:i]
		lineOfStars = true
	} else {
		// No line of stars present.
		// Determine the white space on the first line after the /*
		// and before the beginning of the comment text, assume two
		// blanks instead of the /* unless the first character after
		// the /* is a tab. If the first comment line is empty but
		// for the opening /*, assume up to 3 blanks or a tab. This
		// whitespace may be found as suffix in the common prefix.
		first := lines[0]
		if isBlank(first[2:]) {
			// no comment text on the first line:
			// reduce prefix by up to 3 blanks or a tab
			// if present - this keeps comment text indented
			// relative to the /* and */'s if it was indented
			// in the first place
			i := len(prefix)
			for n := 0; n < 3 && i > 0 && prefix[i-1] == ' '; n++ {
				i--
			}
			// only if no blank was removed above, try to remove a tab
			if i == len(prefix) && i > 0 && prefix[i-1] == '\t' {
				i--
			}
			prefix = prefix[0:i]
		} else {
			// comment text on the first line
			suffix := make([]byte, len(first))
			n := 2 // start after opening /*
			// copy the white space that follows the /* into suffix,
			// keeping it at the same indices as in first
			for n < len(first) && first[n] <= ' ' {
				suffix[n] = first[n]
				n++
			}
			if n > 2 && suffix[2] == '\t' {
				// assume the '\t' compensates for the /*
				suffix = suffix[2:n]
			} else {
				// otherwise assume two blanks
				suffix[0], suffix[1] = ' ', ' '
				suffix = suffix[0:n]
			}
			// Shorten the computed common prefix by the length of
			// suffix, if it is found as suffix of the prefix.
			prefix = strings.TrimSuffix(prefix, string(suffix))
		}
	}

	// Handle last line: If it only contains a closing */, align it
	// with the opening /*, otherwise align the text with the other
	// lines.
	last := lines[len(lines)-1]
	closing := "*/"
	i := strings.Index(last, closing) // i >= 0 (closing is always present)
	if isBlank(last[0:i]) {
		// last line only contains closing */
		if lineOfStars {
			closing = " */" // add blank to align final star
		}
		// prefix is prepended here because the loop below strips it again
		lines[len(lines)-1] = prefix + closing
	} else {
		// last line contains more comment text - assume
		// it is aligned like the other lines and include
		// in prefix computation
		prefix = commonPrefix(prefix, last)
	}

	// Remove the common prefix from all but the first and empty lines.
	for i, line := range lines {
		if i > 0 && line != "" {
			lines[i] = line[len(prefix):]
		}
	}
}
 607
// writeComment writes the text of comment. A //-style comment is
// written as a single string with trailing whitespace removed. A
// /*-style comment is split into lines, a common prefix is stripped
// from them (see stripCommonPrefix), and the lines are written one
// by one, separated by formfeeds. If the comment looks like a
// //line directive, indentation is suspended while it is written and
// the source position is updated afterwards to what the directive says.
func (p *printer) writeComment(comment *ast.Comment) {
	text := comment.Text
	pos := p.posFor(comment.Pos())

	const linePrefix = "//line "
	if strings.HasPrefix(text, linePrefix) && (!pos.IsValid() || pos.Column == 1) {
		// possibly a line directive
		ldir := strings.TrimSpace(text[len(linePrefix):])
		if i := strings.LastIndex(ldir, ":"); i >= 0 {
			if line, err := strconv.Atoi(ldir[i+1:]); err == nil && line > 0 {
				// The line directive we are about to print changed
				// the Filename and Line number used for subsequent
				// tokens. We have to update our AST-space position
				// accordingly and suspend indentation temporarily.
				indent := p.indent
				p.indent = 0
				// the deferred function runs when writeComment returns,
				// i.e., after the directive has been written
				defer func() {
					p.pos.Filename = ldir[:i]
					p.pos.Line = line
					p.pos.Column = 1
					p.indent = indent
				}()
			}
		}
	}

	// shortcut common case of //-style comments
	if text[1] == '/' {
		p.writeString(pos, trimRight(text), true)
		return
	}

	// for /*-style comments, print line by line and let the
	// write function take care of the proper indentation
	lines := strings.Split(text, "\n")

	// The comment started in the first column but is going
	// to be indented. For an idempotent result, add indentation
	// to all lines such that they look like they were indented
	// before - this will make sure the common prefix computation
	// is the same independent of how many times formatting is
	// applied (was issue 1835).
	if pos.IsValid() && pos.Column == 1 && p.indent > 0 {
		for i, line := range lines[1:] {
			lines[1+i] = "   " + line
		}
	}

	stripCommonPrefix(lines)

	// write comment lines, separated by formfeed,
	// without a line break after the last line
	for i, line := range lines {
		if i > 0 {
			p.writeByte('\f', 1)
			// lines after the first are written at the printer's
			// current position
			pos = p.pos
		}
		if len(line) > 0 {
			p.writeString(pos, trimRight(line), true)
		}
	}
}
 670
 671 // writeCommentSuffix writes a line break after a comment if indicated
 672 // and processes any leftover indentation information. If a line break
 673 // is needed, the kind of break (newline vs formfeed) depends on the
 674 // pending whitespace. The writeCommentSuffix result indicates if a
 675 // newline was written or if a formfeed was dropped from the whitespace
 676 // buffer.
 677 //
 678 func (p *printer) writeCommentSuffix(needsLinebreak bool) (wroteNewline, droppedFF bool) {
 679         for i, ch := range p.wsbuf {
 680                 switch ch {
 681                 case blank, vtab:
 682                         // ignore trailing whitespace
 683                         p.wsbuf[i] = ignore
 684                 case indent, unindent:
 685                         // don't lose indentation information
 686                 case newline, formfeed:
 687                         // if we need a line break, keep exactly one
 688                         // but remember if we dropped any formfeeds
 689                         if needsLinebreak {
 690                                 needsLinebreak = false
 691                                 wroteNewline = true
 692                         } else {
 693                                 if ch == formfeed {
 694                                         droppedFF = true
 695                                 }
 696                                 p.wsbuf[i] = ignore
 697                         }
 698                 }
 699         }
 700         p.writeWhitespace(len(p.wsbuf))
 701
 702         // make sure we have a line break
 703         if needsLinebreak {
 704                 p.writeByte('\n', 1)
 705                 wroteNewline = true
 706         }
 707
 708         return
 709 }
 710
 711 // intersperseComments consumes all comments that appear before the next token
 712 // tok and prints it together with the buffered whitespace (i.e., the whitespace
 713 // that needs to be written before the next token). A heuristic is used to mix
 714 // the comments and whitespace. The intersperseComments result indicates if a
 715 // newline was written or if a formfeed was dropped from the whitespace buffer.
 716 //
 717 func (p *printer) intersperseComments(next token.Position, tok token.Token) (wroteNewline, droppedFF bool) {
 718         var last *ast.Comment
 719         for p.commentBefore(next) {
 720                 for _, c := range p.comment.List {
 721                         p.writeCommentPrefix(p.posFor(c.Pos()), next, last, c, tok)
 722                         p.writeComment(c)
 723                         last = c
 724                 }
 725                 p.nextComment()
 726         }
 727
 728         if last != nil {
 729                 // if the last comment is a /*-style comment and the next item
 730                 // follows on the same line but is not a comma, and not a "closing"
 731                 // token immediately following its corresponding "opening" token,
 732                 // add an extra blank for separation unless explicitly disabled
 733                 if p.mode&noExtraBlank == 0 &&
 734                         last.Text[1] == '*' && p.lineFor(last.Pos()) == next.Line &&
 735                         tok != token.COMMA &&
 736                         (tok != token.RPAREN || p.prevOpen == token.LPAREN) &&
 737                         (tok != token.RBRACK || p.prevOpen == token.LBRACK) {
 738                         p.writeByte(' ', 1)
 739                 }
 740                 // ensure that there is a line break after a //-style comment,
 741                 // before a closing '}' unless explicitly disabled, or at eof
 742                 needsLinebreak :=
 743                         last.Text[1] == '/' ||
 744                                 tok == token.RBRACE && p.mode&noExtraLinebreak == 0 ||
 745                                 tok == token.EOF
 746                 return p.writeCommentSuffix(needsLinebreak)
 747         }
 748
 749         // no comment was written - we should never reach here since
 750         // intersperseComments should not be called in that case
 751         p.internalError("intersperseComments called without pending comments")
 752         return
 753 }
 754
 755 // whiteWhitespace writes the first n whitespace entries.
 756 func (p *printer) writeWhitespace(n int) {
 757         // write entries
 758         for i := 0; i < n; i++ {
 759                 switch ch := p.wsbuf[i]; ch {
 760                 case ignore:
 761                         // ignore!
 762                 case indent:
 763                         p.indent++
 764                 case unindent:
 765                         p.indent--
 766                         if p.indent < 0 {
 767                                 p.internalError("negative indentation:", p.indent)
 768                                 p.indent = 0
 769                         }
 770                 case newline, formfeed:
 771                         // A line break immediately followed by a "correcting"
 772                         // unindent is swapped with the unindent - this permits
 773                         // proper label positioning. If a comment is between
 774                         // the line break and the label, the unindent is not
 775                         // part of the comment whitespace prefix and the comment
 776                         // will be positioned correctly indented.
 777                         if i+1 < n && p.wsbuf[i+1] == unindent {
 778                                 // Use a formfeed to terminate the current section.
 779                                 // Otherwise, a long label name on the next line leading
 780                                 // to a wide column may increase the indentation column
 781                                 // of lines before the label; effectively leading to wrong
 782                                 // indentation.
 783                                 p.wsbuf[i], p.wsbuf[i+1] = unindent, formfeed
 784                                 i-- // do it again
 785                                 continue
 786                         }
 787                         fallthrough
 788                 default:
 789                         p.writeByte(byte(ch), 1)
 790                 }
 791         }
 792
 793         // shift remaining entries down
 794         l := copy(p.wsbuf, p.wsbuf[n:])
 795         p.wsbuf = p.wsbuf[:l]
 796 }
 797
 798 // ----------------------------------------------------------------------------
 799 // Printing interface
 800
 801 // nlines limits n to maxNewlines.
 802 func nlimit(n int) int {
 803         if n > maxNewlines {
 804                 n = maxNewlines
 805         }
 806         return n
 807 }
 808
 809 func mayCombine(prev token.Token, next byte) (b bool) {
 810         switch prev {
 811         case token.INT:
 812                 b = next == '.' // 1.
 813         case token.ADD:
 814                 b = next == '+' // ++
 815         case token.SUB:
 816                 b = next == '-' // --
 817         case token.QUO:
 818                 b = next == '*' // /*
 819         case token.LSS:
 820                 b = next == '-' || next == '<' // <- or <<
 821         case token.AND:
 822                 b = next == '&' || next == '^' // && or &^
 823         }
 824         return
 825 }
 826
// print prints a list of "items" (roughly corresponding to syntactic
// tokens, but also including whitespace and formatting information).
// It is the only print function that should be called directly from
// any of the AST printing functions in nodes.go.
//
// Whitespace is accumulated until a non-whitespace token appears. Any
// comments that need to appear before that token are printed first,
// taking into account the amount and structure of any pending white-
// space for best comment placement. Then, any leftover whitespace is
// printed, followed by the actual token.
//
// Each argument is handled according to its dynamic type:
//
//	pmode        toggles the given printer mode bits; prints nothing
//	whiteSpace   is appended to the whitespace buffer (ignore is dropped)
//	token.Pos    if valid, becomes the position of the next item
//	*ast.Ident, *ast.BasicLit, token.Token, string
//	             are printed as text, preceded by pending comments
//	             and whitespace
//
// An argument of any other type is reported on os.Stderr and causes a
// panic.
func (p *printer) print(args ...interface{}) {
	for _, arg := range args {
		// information about the current arg
		var data string      // text to print for this arg
		var isLit bool       // passed through to writeString
		var impliedSemi bool // value for p.impliedSemi after this arg

		// record previous opening token, if any
		// (p.prevOpen is consulted when deciding whether to separate a
		// /*-style comment from a following ')' or ']')
		switch p.lastTok {
		case token.ILLEGAL:
			// ignore (white space)
		case token.LPAREN, token.LBRACK:
			p.prevOpen = p.lastTok
		default:
			// other tokens followed any opening token
			p.prevOpen = token.ILLEGAL
		}

		switch x := arg.(type) {
		case pmode:
			// toggle printer mode
			p.mode ^= x
			continue

		case whiteSpace:
			if x == ignore {
				// don't add ignore's to the buffer; they
				// may screw up "correcting" unindents (see
				// LabeledStmt)
				continue
			}
			i := len(p.wsbuf)
			if i == cap(p.wsbuf) {
				// Whitespace sequences are very short so this should
				// never happen. Handle gracefully (but possibly with
				// bad comment placement) if it does happen.
				// Writing all i entries empties the buffer, so the
				// new entry goes to index 0.
				p.writeWhitespace(i)
				i = 0
			}
			p.wsbuf = p.wsbuf[0 : i+1]
			p.wsbuf[i] = x
			if x == newline || x == formfeed {
				// newlines affect the current state (p.impliedSemi)
				// and not the state after printing arg (impliedSemi)
				// because comments can be interspersed before the arg
				// in this case
				p.impliedSemi = false
			}
			// whitespace is recorded as token.ILLEGAL so that the
			// prevOpen bookkeeping above skips over it
			p.lastTok = token.ILLEGAL
			continue

		case *ast.Ident:
			data = x.Name
			impliedSemi = true
			p.lastTok = token.IDENT

		case *ast.BasicLit:
			data = x.Value
			isLit = true
			impliedSemi = true
			p.lastTok = x.Kind

		case token.Token:
			s := x.String()
			if mayCombine(p.lastTok, s[0]) {
				// the previous and the current token must be
				// separated by a blank otherwise they combine
				// into a different incorrect token sequence
				// (except for token.INT followed by a '.' this
				// should never happen because it is taken care
				// of via binary expression formatting)
				if len(p.wsbuf) != 0 {
					p.internalError("whitespace buffer not empty")
				}
				// the buffer now holds exactly one blank
				p.wsbuf = p.wsbuf[0:1]
				p.wsbuf[0] = ' '
			}
			data = s
			// some keywords followed by a newline imply a semicolon
			switch x {
			case token.BREAK, token.CONTINUE, token.FALLTHROUGH, token.RETURN,
				token.INC, token.DEC, token.RPAREN, token.RBRACK, token.RBRACE:
				impliedSemi = true
			}
			p.lastTok = x

		case token.Pos:
			if x.IsValid() {
				p.pos = p.posFor(x) // accurate position of next item
			}
			continue

		case string:
			// incorrect AST - print error message
			data = x
			isLit = true
			impliedSemi = true
			p.lastTok = token.STRING

		default:
			fmt.Fprintf(os.Stderr, "print: unsupported argument %v (%T)\n", arg, arg)
			panic("go/printer type")
		}
		// only the cases that set data reach this point;
		// data is expected to be non-empty here

		next := p.pos // estimated/accurate position of next item
		wroteNewline, droppedFF := p.flush(next, p.lastTok)

		// intersperse extra newlines if present in the source and
		// if they don't cause extra semicolons (don't do this in
		// flush as it will cause extra newlines at the end of a file)
		if !p.impliedSemi {
			// next was captured before the flush; the difference to the
			// current p.pos is the number of source lines still to be
			// bridged. NOTE(review): this relies on the flush advancing
			// p.pos as it writes - confirm against writeByte/writeString.
			n := nlimit(next.Line - p.pos.Line)
			// don't exceed maxNewlines if we already wrote one
			if wroteNewline && n == maxNewlines {
				n = maxNewlines - 1
			}
			if n > 0 {
				ch := byte('\n')
				if droppedFF {
					ch = '\f' // use formfeed since we dropped one before
				}
				p.writeByte(ch, n)
				impliedSemi = false
			}
		}

		// the next token starts now - record its line number if requested
		// (the request is one-shot: the pointer is cleared after use)
		if p.linePtr != nil {
			*p.linePtr = p.out.Line
			p.linePtr = nil
		}

		p.writeString(next, data, isLit)
		p.impliedSemi = impliedSemi
	}
}
 975
 976 // flush prints any pending comments and whitespace occurring textually
 977 // before the position of the next token tok. The flush result indicates
 978 // if a newline was written or if a formfeed was dropped from the whitespace
 979 // buffer.
 980 //
 981 func (p *printer) flush(next token.Position, tok token.Token) (wroteNewline, droppedFF bool) {
 982         if p.commentBefore(next) {
 983                 // if there are comments before the next item, intersperse them
 984                 wroteNewline, droppedFF = p.intersperseComments(next, tok)
 985         } else {
 986                 // otherwise, write any leftover whitespace
 987                 p.writeWhitespace(len(p.wsbuf))
 988         }
 989         return
 990 }
 991
 992 // getNode returns the ast.CommentGroup associated with n, if any.
 993 func getDoc(n ast.Node) *ast.CommentGroup {
 994         switch n := n.(type) {
 995         case *ast.Field:
 996                 return n.Doc
 997         case *ast.ImportSpec:
 998                 return n.Doc
 999         case *ast.ValueSpec:
1000                 return n.Doc
1001         case *ast.TypeSpec:
1002                 return n.Doc
1003         case *ast.GenDecl:
1004                 return n.Doc
1005         case *ast.FuncDecl:
1006                 return n.Doc
1007         case *ast.File:
1008                 return n.Doc
1009         }
1010         return nil
1011 }
1012
1013 func (p *printer) printNode(node interface{}) error {
1014         // unpack *CommentedNode, if any
1015         var comments []*ast.CommentGroup
1016         if cnode, ok := node.(*CommentedNode); ok {
1017                 node = cnode.Node
1018                 comments = cnode.Comments
1019         }
1020
1021         if comments != nil {
1022                 // commented node - restrict comment list to relevant range
1023                 n, ok := node.(ast.Node)
1024                 if !ok {
1025                         goto unsupported
1026                 }
1027                 beg := n.Pos()
1028                 end := n.End()
1029                 // if the node has associated documentation,
1030                 // include that commentgroup in the range
1031                 // (the comment list is sorted in the order
1032                 // of the comment appearance in the source code)
1033                 if doc := getDoc(n); doc != nil {
1034                         beg = doc.Pos()
1035                 }
1036                 // token.Pos values are global offsets, we can
1037                 // compare them directly
1038                 i := 0
1039                 for i < len(comments) && comments[i].End() < beg {
1040                         i++
1041                 }
1042                 j := i
1043                 for j < len(comments) && comments[j].Pos() < end {
1044                         j++
1045                 }
1046                 if i < j {
1047                         p.comments = comments[i:j]
1048                 }
1049         } else if n, ok := node.(*ast.File); ok {
1050                 // use ast.File comments, if any
1051                 p.comments = n.Comments
1052         }
1053
1054         // if there are no comments, use node comments
1055         p.useNodeComments = p.comments == nil
1056
1057         // get comments ready for use
1058         p.nextComment()
1059
1060         // format node
1061         switch n := node.(type) {
1062         case ast.Expr:
1063                 p.expr(n)
1064         case ast.Stmt:
1065                 // A labeled statement will un-indent to position the label.
1066                 // Set p.indent to 1 so we don't get indent "underflow".
1067                 if _, ok := n.(*ast.LabeledStmt); ok {
1068                         p.indent = 1
1069                 }
1070                 p.stmt(n, false)
1071         case ast.Decl:
1072                 p.decl(n)
1073         case ast.Spec:
1074                 p.spec(n, 1, false)
1075         case []ast.Stmt:
1076                 // A labeled statement will un-indent to position the label.
1077                 // Set p.indent to 1 so we don't get indent "underflow".
1078                 for _, s := range n {
1079                         if _, ok := s.(*ast.LabeledStmt); ok {
1080                                 p.indent = 1
1081                         }
1082                 }
1083                 p.stmtList(n, 0, false)
1084         case []ast.Decl:
1085                 p.declList(n)
1086         case *ast.File:
1087                 p.file(n)
1088         default:
1089                 goto unsupported
1090         }
1091
1092         return nil
1093
1094 unsupported:
1095         return fmt.Errorf("go/printer: unsupported node type %T", node)
1096 }
1097
1098 // ----------------------------------------------------------------------------
1099 // Trimmer
1100
// A trimmer is an io.Writer filter for stripping tabwriter.Escape
// characters, trailing blanks and tabs, and for converting formfeed
// and vtab characters into newlines and htabs (in case no tabwriter
// is used). Text bracketed by tabwriter.Escape characters is passed
// through unchanged.
type trimmer struct {
	output io.Writer // destination of the filtered bytes
	state  int       // inSpace, inEscape, or inText
	space  []byte    // blanks and tabs collected while inSpace; dropped if a line break follows
}

// trimmer is implemented as a state machine.
// It can be in one of the following states:
const (
	inSpace  = iota // inside space
	inEscape        // inside text bracketed by tabwriter.Escapes
	inText          // inside text
)

// resetSpace puts the trimmer into the inSpace state and discards any
// collected whitespace (the backing array of p.space is reused).
func (p *trimmer) resetSpace() {
	p.state = inSpace
	p.space = p.space[0:0]
}

// Design note: It is tempting to eliminate extra blanks occurring in
//              whitespace in this function as it could simplify some
//              of the blanks logic in the node printing functions.
//              However, this would mess up any formatting done by
//              the tabwriter.

// aNewline is the line terminator written for both '\n' and '\f'.
var aNewline = []byte("\n")

// Write filters data and forwards the result to p.output.
//
// Blanks and tabs (vtabs count as tabs) are held back in p.space and
// only written once more text follows on the same line; a '\n' or '\f'
// discards them and is written as a single newline. Text between two
// tabwriter.Escape bytes is copied verbatim, without the Escape bytes.
//
// On success Write returns len(data). If a write to p.output fails,
// processing stops and Write returns the index of the byte that was
// being processed together with the error.
//
// Text or an escaped section still open at the end of data is written
// out and the state is reset to inSpace.
func (p *trimmer) Write(data []byte) (n int, err error) {
	// invariants:
	// p.state == inSpace:
	//	p.space is unwritten
	// p.state == inEscape, inText:
	//	data[m:n] is unwritten
	m := 0
	var b byte
	for n, b = range data {
		if b == '\v' {
			b = '\t' // convert to htab
		}
		switch p.state {
		case inSpace:
			switch b {
			case '\t', ' ':
				p.space = append(p.space, b)
			case '\n', '\f':
				p.resetSpace() // discard trailing space
				_, err = p.output.Write(aNewline)
			case tabwriter.Escape:
				_, err = p.output.Write(p.space)
				p.state = inEscape
				m = n + 1 // +1: skip tabwriter.Escape
			default:
				_, err = p.output.Write(p.space)
				p.state = inText
				m = n
			}
		case inEscape:
			if b == tabwriter.Escape {
				_, err = p.output.Write(data[m:n])
				p.resetSpace()
			}
		case inText:
			switch b {
			case '\t', ' ':
				_, err = p.output.Write(data[m:n])
				p.resetSpace()
				p.space = append(p.space, b)
			case '\n', '\f':
				_, err = p.output.Write(data[m:n])
				p.resetSpace()
				// Only write the newline if the text went out; otherwise
				// the second write would overwrite (and thereby hide)
				// the error of the first one.
				if err == nil {
					_, err = p.output.Write(aNewline)
				}
			case tabwriter.Escape:
				_, err = p.output.Write(data[m:n])
				p.state = inEscape
				m = n + 1 // +1: skip tabwriter.Escape
			}
		default:
			panic("unreachable")
		}
		if err != nil {
			return
		}
	}
	n = len(data)

	// write whatever text is still pending
	switch p.state {
	case inEscape, inText:
		_, err = p.output.Write(data[m:n])
		p.resetSpace()
	}

	return
}
1200
1201 // ----------------------------------------------------------------------------
1202 // Public interface
1203
// A Mode value is a set of flags (or 0). They control printing.
type Mode uint

// Printing flags. Each flag occupies its own bit so that flags can be
// combined in a single Mode value.
const (
	RawFormat Mode = 1 << iota // do not use a tabwriter; if set, UseSpaces is ignored
	TabIndent                  // use tabs for indentation independent of UseSpaces
	UseSpaces                  // use spaces instead of tabs for alignment
	SourcePos                  // emit //line comments to preserve original source positions
)
1213
// A Config controls the output of Fprint.
type Config struct {
	Mode     Mode // printing flags; default: 0
	Tabwidth int  // tab width handed to the tabwriter; default: 8
	Indent   int  // default: 0 (all code is indented at least by this much)
}
1220
1221 // fprint implements Fprint and takes a nodesSizes map for setting up the printer state.
1222 func (cfg *Config) fprint(output io.Writer, fset *token.FileSet, node interface{}, nodeSizes map[ast.Node]int) (err error) {
1223         // print node
1224         var p printer
1225         p.init(cfg, fset, nodeSizes)
1226         if err = p.printNode(node); err != nil {
1227                 return
1228         }
1229         // print outstanding comments
1230         p.impliedSemi = false // EOF acts like a newline
1231         p.flush(token.Position{Offset: infinity, Line: infinity}, token.EOF)
1232
1233         // redirect output through a trimmer to eliminate trailing whitespace
1234         // (Input to a tabwriter must be untrimmed since trailing tabs provide
1235         // formatting information. The tabwriter could provide trimming
1236         // functionality but no tabwriter is used when RawFormat is set.)
1237         output = &trimmer{output: output}
1238
1239         // redirect output through a tabwriter if necessary
1240         if cfg.Mode&RawFormat == 0 {
1241                 minwidth := cfg.Tabwidth
1242
1243                 padchar := byte('\t')
1244                 if cfg.Mode&UseSpaces != 0 {
1245                         padchar = ' '
1246                 }
1247
1248                 twmode := tabwriter.DiscardEmptyColumns
1249                 if cfg.Mode&TabIndent != 0 {
1250                         minwidth = 0
1251                         twmode |= tabwriter.TabIndent
1252                 }
1253
1254                 output = tabwriter.NewWriter(output, minwidth, cfg.Tabwidth, 1, padchar, twmode)
1255         }
1256
1257         // write printer result via tabwriter/trimmer to output
1258         if _, err = output.Write(p.output); err != nil {
1259                 return
1260         }
1261
1262         // flush tabwriter, if any
1263         if tw, _ := output.(*tabwriter.Writer); tw != nil {
1264                 err = tw.Flush()
1265         }
1266
1267         return
1268 }
1269
// A CommentedNode bundles an AST node and corresponding comments.
// It may be provided as argument to any of the Fprint functions.
// If Comments is non-nil, Node must implement ast.Node; otherwise
// printing reports an unsupported node type.
type CommentedNode struct {
	Node     interface{} // *ast.File, or ast.Expr, ast.Decl, ast.Spec, or ast.Stmt
	Comments []*ast.CommentGroup
}
1277
1278 // Fprint "pretty-prints" an AST node to output for a given configuration cfg.
1279 // Position information is interpreted relative to the file set fset.
1280 // The node type must be *ast.File, *CommentedNode, []ast.Decl, []ast.Stmt,
1281 // or assignment-compatible to ast.Expr, ast.Decl, ast.Spec, or ast.Stmt.
1282 //
1283 func (cfg *Config) Fprint(output io.Writer, fset *token.FileSet, node interface{}) error {
1284         return cfg.fprint(output, fset, node, make(map[ast.Node]int))
1285 }
1286
1287 // Fprint "pretty-prints" an AST node to output.
1288 // It calls Config.Fprint with default settings.
1289 //
1290 func Fprint(output io.Writer, fset *token.FileSet, node interface{}) error {
1291         return (&Config{Tabwidth: 8}).Fprint(output, fset, node)
1292 }