print.go 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719
  1. /*
  2. Copyright 2016 Google Inc. All Rights Reserved.
  3. Licensed under the Apache License, Version 2.0 (the "License");
  4. you may not use this file except in compliance with the License.
  5. You may obtain a copy of the License at
  6. http://www.apache.org/licenses/LICENSE-2.0
  7. Unless required by applicable law or agreed to in writing, software
  8. distributed under the License is distributed on an "AS IS" BASIS,
  9. WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  10. See the License for the specific language governing permissions and
  11. limitations under the License.
  12. */
  13. // Printing of syntax trees.
  14. package build
  15. import (
  16. "bytes"
  17. "fmt"
  18. "strings"
  19. )
  20. const nestedIndentation = 2 // Indentation of nested blocks
  21. const listIndentation = 4 // Indentation of multiline expressions
  22. // Format returns the formatted form of the given BUILD file.
  23. func Format(f *File) []byte {
  24. pr := &printer{}
  25. pr.file(f)
  26. return pr.Bytes()
  27. }
  28. // FormatString returns the string form of the given expression.
  29. func FormatString(x Expr) string {
  30. pr := &printer{}
  31. switch x := x.(type) {
  32. case *File:
  33. pr.file(x)
  34. default:
  35. pr.expr(x, precLow)
  36. }
  37. return pr.String()
  38. }
  39. // A printer collects the state during printing of a file or expression.
  40. type printer struct {
  41. bytes.Buffer // output buffer
  42. comment []Comment // pending end-of-line comments
  43. margin int // left margin (indent), a number of spaces
  44. depth int // nesting depth inside ( ) [ ] { }
  45. }
  46. // printf prints to the buffer.
  47. func (p *printer) printf(format string, args ...interface{}) {
  48. fmt.Fprintf(p, format, args...)
  49. }
  50. // indent returns the position on the current line, in bytes, 0-indexed.
  51. func (p *printer) indent() int {
  52. b := p.Bytes()
  53. n := 0
  54. for n < len(b) && b[len(b)-1-n] != '\n' {
  55. n++
  56. }
  57. return n
  58. }
  59. // newline ends the current line, flushing end-of-line comments.
  60. // It must only be called when printing a newline is known to be safe:
  61. // when not inside an expression or when p.depth > 0.
  62. // To break a line inside an expression that might not be enclosed
  63. // in brackets of some kind, use breakline instead.
  64. func (p *printer) newline() {
  65. if len(p.comment) > 0 {
  66. p.printf(" ")
  67. for i, com := range p.comment {
  68. if i > 0 {
  69. p.trim()
  70. p.printf("\n%*s", p.margin, "")
  71. }
  72. p.printf("%s", strings.TrimSpace(com.Token))
  73. }
  74. p.comment = p.comment[:0]
  75. }
  76. p.trim()
  77. p.printf("\n%*s", p.margin, "")
  78. }
  79. // breakline breaks the current line, inserting a continuation \ if needed.
  80. // If no continuation \ is needed, breakline flushes end-of-line comments.
  81. func (p *printer) breakline() {
  82. if p.depth == 0 {
  83. // Cannot have both final \ and comments.
  84. p.printf(" \\\n%*s", p.margin, "")
  85. return
  86. }
  87. // Safe to use newline.
  88. p.newline()
  89. }
  90. // trim removes trailing spaces from the current line.
  91. func (p *printer) trim() {
  92. // Remove trailing space from line we're about to end.
  93. b := p.Bytes()
  94. n := len(b)
  95. for n > 0 && b[n-1] == ' ' {
  96. n--
  97. }
  98. p.Truncate(n)
  99. }
  100. // file formats the given file into the print buffer.
  101. func (p *printer) file(f *File) {
  102. for _, com := range f.Before {
  103. p.printf("%s", strings.TrimSpace(com.Token))
  104. p.newline()
  105. }
  106. p.statements(f.Stmt)
  107. for _, com := range f.After {
  108. p.printf("%s", strings.TrimSpace(com.Token))
  109. p.newline()
  110. }
  111. // If the last expression is in an indented code block there can be spaces in the last line.
  112. p.trim()
  113. }
  114. func (p *printer) statements(stmts []Expr) {
  115. for i, stmt := range stmts {
  116. switch stmt := stmt.(type) {
  117. case *CommentBlock:
  118. // comments already handled
  119. case *PythonBlock:
  120. for _, com := range stmt.Before {
  121. p.printf("%s", strings.TrimSpace(com.Token))
  122. p.newline()
  123. }
  124. p.printf("%s", stmt.Token)
  125. p.newline()
  126. default:
  127. p.expr(stmt, precLow)
  128. // Print an empty line break after the expression unless it's a code block.
  129. // For a code block, the line break is generated by its last statement.
  130. if !isCodeBlock(stmt) {
  131. p.newline()
  132. }
  133. }
  134. for _, com := range stmt.Comment().After {
  135. p.printf("%s", strings.TrimSpace(com.Token))
  136. p.newline()
  137. }
  138. if i+1 < len(stmts) && !compactStmt(stmt, stmts[i+1], p.margin == 0) {
  139. p.newline()
  140. }
  141. }
  142. }
  143. // compactStmt reports whether the pair of statements s1, s2
  144. // should be printed without an intervening blank line.
  145. // We omit the blank line when both are subinclude statements
  146. // and the second one has no leading comments.
  147. func compactStmt(s1, s2 Expr, isTopLevel bool) bool {
  148. if len(s2.Comment().Before) > 0 {
  149. return false
  150. }
  151. if isTopLevel {
  152. return isCall(s1, "load") && isCall(s2, "load")
  153. } else {
  154. return !(isCodeBlock(s1) || isCodeBlock(s2))
  155. }
  156. }
  157. // isCall reports whether x is a call to a function with the given name.
  158. func isCall(x Expr, name string) bool {
  159. c, ok := x.(*CallExpr)
  160. if !ok {
  161. return false
  162. }
  163. nam, ok := c.X.(*LiteralExpr)
  164. if !ok {
  165. return false
  166. }
  167. return nam.Token == name
  168. }
  169. // isCodeBlock checks if the statement is a code block (def, if, for, etc.)
  170. func isCodeBlock(x Expr) bool {
  171. switch x.(type) {
  172. case *FuncDef:
  173. return true
  174. case *ForLoop:
  175. return true
  176. case *IfElse:
  177. return true
  178. default:
  179. return false
  180. }
  181. }
  182. // Expression formatting.
  183. // The expression formatter must introduce parentheses to force the
  184. // meaning described by the parse tree. We preserve parentheses in the
  185. // input, so extra parentheses are only needed if we have edited the tree.
  186. //
  187. // For example consider these expressions:
  188. // (1) "x" "y" % foo
  189. // (2) "x" + "y" % foo
  190. // (3) "x" + ("y" % foo)
  191. // (4) ("x" + "y") % foo
  192. // When we parse (1), we represent the concatenation as an addition.
  193. // However, if we print the addition back out without additional parens,
  194. // as in (2), it has the same meaning as (3), which is not the original
  195. // meaning. To preserve the original meaning we must add parens as in (4).
  196. //
  197. // To allow arbitrary rewrites to be formatted properly, we track full
  198. // operator precedence while printing instead of just handling this one
  199. // case of string concatenation.
  200. //
  201. // The precedences are assigned values low to high. A larger number
  202. // binds tighter than a smaller number. All binary operators bind
  203. // left-to-right.
  204. const (
  205. precLow = iota
  206. precAssign
  207. precComma
  208. precColon
  209. precIn
  210. precOr
  211. precAnd
  212. precCmp
  213. precAdd
  214. precMultiply
  215. precSuffix
  216. precUnary
  217. precConcat
  218. )
  219. // opPrec gives the precedence for operators found in a BinaryExpr.
  220. var opPrec = map[string]int{
  221. "=": precAssign,
  222. "+=": precAssign,
  223. "-=": precAssign,
  224. "*=": precAssign,
  225. "/=": precAssign,
  226. "//=": precAssign,
  227. "%=": precAssign,
  228. "or": precOr,
  229. "and": precAnd,
  230. "<": precCmp,
  231. ">": precCmp,
  232. "==": precCmp,
  233. "!=": precCmp,
  234. "<=": precCmp,
  235. ">=": precCmp,
  236. "+": precAdd,
  237. "-": precAdd,
  238. "*": precMultiply,
  239. "/": precMultiply,
  240. "//": precMultiply,
  241. "%": precMultiply,
  242. }
  243. // expr prints the expression v to the print buffer.
  244. // The value outerPrec gives the precedence of the operator
  245. // outside expr. If that operator binds tighter than v's operator,
  246. // expr must introduce parentheses to preserve the meaning
  247. // of the parse tree (see above).
  248. func (p *printer) expr(v Expr, outerPrec int) {
  249. // Emit line-comments preceding this expression.
  250. // If we are in the middle of an expression but not inside ( ) [ ] { }
  251. // then we cannot just break the line: we'd have to end it with a \.
  252. // However, even then we can't emit line comments since that would
  253. // end the expression. This is only a concern if we have rewritten
  254. // the parse tree. If comments were okay before this expression in
  255. // the original input they're still okay now, in the absense of rewrites.
  256. //
  257. // TODO(bazel-team): Check whether it is valid to emit comments right now,
  258. // and if not, insert them earlier in the output instead, at the most
  259. // recent \n not following a \ line.
  260. if before := v.Comment().Before; len(before) > 0 {
  261. // Want to print a line comment.
  262. // Line comments must be at the current margin.
  263. p.trim()
  264. if p.indent() > 0 {
  265. // There's other text on the line. Start a new line.
  266. p.printf("\n")
  267. }
  268. // Re-indent to margin.
  269. p.printf("%*s", p.margin, "")
  270. for _, com := range before {
  271. p.printf("%s", strings.TrimSpace(com.Token))
  272. p.newline()
  273. }
  274. }
  275. // Do we introduce parentheses?
  276. // The result depends on the kind of expression.
  277. // Each expression type that might need parentheses
  278. // calls addParen with its own precedence.
  279. // If parentheses are necessary, addParen prints the
  280. // opening parenthesis and sets parenthesized so that
  281. // the code after the switch can print the closing one.
  282. parenthesized := false
  283. addParen := func(prec int) {
  284. if prec < outerPrec {
  285. p.printf("(")
  286. p.depth++
  287. parenthesized = true
  288. }
  289. }
  290. switch v := v.(type) {
  291. default:
  292. panic(fmt.Errorf("printer: unexpected type %T", v))
  293. case *LiteralExpr:
  294. p.printf("%s", v.Token)
  295. case *StringExpr:
  296. // If the Token is a correct quoting of Value, use it.
  297. // This preserves the specific escaping choices that
  298. // BUILD authors have made, and it also works around
  299. // b/7272572.
  300. if strings.HasPrefix(v.Token, `"`) {
  301. s, triple, err := unquote(v.Token)
  302. if s == v.Value && triple == v.TripleQuote && err == nil {
  303. p.printf("%s", v.Token)
  304. break
  305. }
  306. }
  307. p.printf("%s", quote(v.Value, v.TripleQuote))
  308. case *DotExpr:
  309. addParen(precSuffix)
  310. p.expr(v.X, precSuffix)
  311. p.printf(".%s", v.Name)
  312. case *IndexExpr:
  313. addParen(precSuffix)
  314. p.expr(v.X, precSuffix)
  315. p.printf("[")
  316. p.expr(v.Y, precLow)
  317. p.printf("]")
  318. case *KeyValueExpr:
  319. p.expr(v.Key, precLow)
  320. p.printf(": ")
  321. p.expr(v.Value, precLow)
  322. case *SliceExpr:
  323. addParen(precSuffix)
  324. p.expr(v.X, precSuffix)
  325. p.printf("[")
  326. if v.From != nil {
  327. p.expr(v.From, precLow)
  328. }
  329. p.printf(":")
  330. if v.To != nil {
  331. p.expr(v.To, precLow)
  332. }
  333. if v.SecondColon.Byte != 0 {
  334. p.printf(":")
  335. if v.Step != nil {
  336. p.expr(v.Step, precLow)
  337. }
  338. }
  339. p.printf("]")
  340. case *UnaryExpr:
  341. addParen(precUnary)
  342. if v.Op == "not" {
  343. p.printf("not ") // Requires a space after it.
  344. } else {
  345. p.printf("%s", v.Op)
  346. }
  347. p.expr(v.X, precUnary)
  348. case *LambdaExpr:
  349. addParen(precColon)
  350. p.printf("lambda ")
  351. for i, name := range v.Var {
  352. if i > 0 {
  353. p.printf(", ")
  354. }
  355. p.expr(name, precLow)
  356. }
  357. p.printf(": ")
  358. p.expr(v.Expr, precColon)
  359. case *BinaryExpr:
  360. // Precedence: use the precedence of the operator.
  361. // Since all binary expressions format left-to-right,
  362. // it is okay for the left side to reuse the same operator
  363. // without parentheses, so we use prec for v.X.
  364. // For the same reason, the right side cannot reuse the same
  365. // operator, or else a parse tree for a + (b + c), where the ( ) are
  366. // not present in the source, will format as a + b + c, which
  367. // means (a + b) + c. Treat the right expression as appearing
  368. // in a context one precedence level higher: use prec+1 for v.Y.
  369. //
  370. // Line breaks: if we are to break the line immediately after
  371. // the operator, introduce a margin at the current column,
  372. // so that the second operand lines up with the first one and
  373. // also so that neither operand can use space to the left.
  374. // If the operator is an =, indent the right side another 4 spaces.
  375. prec := opPrec[v.Op]
  376. addParen(prec)
  377. m := p.margin
  378. if v.LineBreak {
  379. p.margin = p.indent()
  380. if v.Op == "=" {
  381. p.margin += listIndentation
  382. }
  383. }
  384. p.expr(v.X, prec)
  385. p.printf(" %s", v.Op)
  386. if v.LineBreak {
  387. p.breakline()
  388. } else {
  389. p.printf(" ")
  390. }
  391. p.expr(v.Y, prec+1)
  392. p.margin = m
  393. case *ParenExpr:
  394. p.seq("()", []Expr{v.X}, &v.End, modeParen, false, v.ForceMultiLine)
  395. case *CallExpr:
  396. addParen(precSuffix)
  397. p.expr(v.X, precSuffix)
  398. p.seq("()", v.List, &v.End, modeCall, v.ForceCompact, v.ForceMultiLine)
  399. case *ListExpr:
  400. p.seq("[]", v.List, &v.End, modeList, false, v.ForceMultiLine)
  401. case *SetExpr:
  402. p.seq("{}", v.List, &v.End, modeList, false, v.ForceMultiLine)
  403. case *TupleExpr:
  404. p.seq("()", v.List, &v.End, modeTuple, v.ForceCompact, v.ForceMultiLine)
  405. case *DictExpr:
  406. var list []Expr
  407. for _, x := range v.List {
  408. list = append(list, x)
  409. }
  410. p.seq("{}", list, &v.End, modeDict, false, v.ForceMultiLine)
  411. case *ListForExpr:
  412. p.listFor(v)
  413. case *ConditionalExpr:
  414. addParen(precSuffix)
  415. p.expr(v.Then, precSuffix)
  416. p.printf(" if ")
  417. p.expr(v.Test, precSuffix)
  418. p.printf(" else ")
  419. p.expr(v.Else, precSuffix)
  420. case *ReturnExpr:
  421. p.printf("return")
  422. if v.X != nil {
  423. p.printf(" ")
  424. p.expr(v.X, precSuffix)
  425. }
  426. case *FuncDef:
  427. p.printf("def ")
  428. p.printf(v.Name)
  429. p.seq("()", v.Args, &v.End, modeCall, v.ForceCompact, v.ForceMultiLine)
  430. p.printf(":")
  431. p.margin += nestedIndentation
  432. p.newline()
  433. p.statements(v.Body.Statements)
  434. p.margin -= nestedIndentation
  435. case *ForLoop:
  436. p.printf("for ")
  437. for i, loopVar := range v.LoopVars {
  438. if i > 0 {
  439. p.printf(", ")
  440. }
  441. p.expr(loopVar, precLow)
  442. }
  443. p.printf(" in ")
  444. p.expr(v.Iterable, precLow)
  445. p.printf(":")
  446. p.margin += nestedIndentation
  447. p.newline()
  448. p.statements(v.Body.Statements)
  449. p.margin -= nestedIndentation
  450. case *IfElse:
  451. for i, block := range v.Conditions {
  452. if i == 0 {
  453. p.printf("if ")
  454. } else if block.If == nil {
  455. p.newline()
  456. p.printf("else")
  457. } else {
  458. p.newline()
  459. p.printf("elif ")
  460. }
  461. if block.If != nil {
  462. p.expr(block.If, precLow)
  463. }
  464. p.printf(":")
  465. p.margin += nestedIndentation
  466. p.newline()
  467. p.statements(block.Then.Statements)
  468. p.margin -= nestedIndentation
  469. }
  470. }
  471. // Add closing parenthesis if needed.
  472. if parenthesized {
  473. p.depth--
  474. p.printf(")")
  475. }
  476. // Queue end-of-line comments for printing when we
  477. // reach the end of the line.
  478. p.comment = append(p.comment, v.Comment().Suffix...)
  479. }
  480. // A seqMode describes a formatting mode for a sequence of values,
  481. // like a list or call arguments.
  482. type seqMode int
  483. const (
  484. _ seqMode = iota
  485. modeCall // f(x)
  486. modeList // [x]
  487. modeTuple // (x,)
  488. modeParen // (x)
  489. modeDict // {x:y}
  490. modeSeq // x, y
  491. )
  492. // seq formats a list of values inside a given bracket pair (brack = "()", "[]", "{}").
  493. // The end node holds any trailing comments to be printed just before the
  494. // closing bracket.
  495. // The mode parameter specifies the sequence mode (see above).
  496. // If multiLine is true, seq avoids the compact form even
  497. // for 0- and 1-element sequences.
  498. func (p *printer) seq(brack string, list []Expr, end *End, mode seqMode, forceCompact, forceMultiLine bool) {
  499. p.printf("%s", brack[:1])
  500. p.depth++
  501. // If there are line comments, force multiline
  502. // so we can print the comments before the closing bracket.
  503. for _, x := range list {
  504. if len(x.Comment().Before) > 0 {
  505. forceMultiLine = true
  506. }
  507. }
  508. if len(end.Before) > 0 {
  509. forceMultiLine = true
  510. }
  511. // Resolve possibly ambiguous call arguments explicitly
  512. // instead of depending on implicit resolution in logic below.
  513. if forceMultiLine {
  514. forceCompact = false
  515. }
  516. switch {
  517. case len(list) == 0 && !forceMultiLine:
  518. // Compact form: print nothing.
  519. case len(list) == 1 && !forceMultiLine:
  520. // Compact form.
  521. p.expr(list[0], precLow)
  522. // Tuple must end with comma, to mark it as a tuple.
  523. if mode == modeTuple {
  524. p.printf(",")
  525. }
  526. case forceCompact:
  527. // Compact form but multiple elements.
  528. for i, x := range list {
  529. if i > 0 {
  530. p.printf(", ")
  531. }
  532. p.expr(x, precLow)
  533. }
  534. default:
  535. // Multi-line form.
  536. p.margin += listIndentation
  537. for i, x := range list {
  538. // If we are about to break the line before the first
  539. // element and there are trailing end-of-line comments
  540. // waiting to be printed, delay them and print them as
  541. // whole-line comments preceding that element.
  542. // Do this by printing a newline ourselves and positioning
  543. // so that the end-of-line comment, with the two spaces added,
  544. // will line up with the current margin.
  545. if i == 0 && len(p.comment) > 0 {
  546. p.printf("\n%*s", p.margin-2, "")
  547. }
  548. p.newline()
  549. p.expr(x, precLow)
  550. if mode != modeParen || i+1 < len(list) {
  551. p.printf(",")
  552. }
  553. }
  554. // Final comments.
  555. for _, com := range end.Before {
  556. p.newline()
  557. p.printf("%s", strings.TrimSpace(com.Token))
  558. }
  559. p.margin -= listIndentation
  560. p.newline()
  561. }
  562. p.depth--
  563. p.printf("%s", brack[1:])
  564. }
  565. // listFor formats a ListForExpr (list comprehension).
  566. // The single-line form is:
  567. // [x for y in z if c]
  568. //
  569. // and the multi-line form is:
  570. // [
  571. // x
  572. // for y in z
  573. // if c
  574. // ]
  575. //
  576. func (p *printer) listFor(v *ListForExpr) {
  577. multiLine := v.ForceMultiLine || len(v.End.Before) > 0
  578. // space breaks the line in multiline mode
  579. // or else prints a space.
  580. space := func() {
  581. if multiLine {
  582. p.breakline()
  583. } else {
  584. p.printf(" ")
  585. }
  586. }
  587. if v.Brack != "" {
  588. p.depth++
  589. p.printf("%s", v.Brack[:1])
  590. }
  591. if multiLine {
  592. if v.Brack != "" {
  593. p.margin += listIndentation
  594. }
  595. p.newline()
  596. }
  597. p.expr(v.X, precLow)
  598. for _, c := range v.For {
  599. space()
  600. p.printf("for ")
  601. for i, name := range c.For.Var {
  602. if i > 0 {
  603. p.printf(", ")
  604. }
  605. p.expr(name, precLow)
  606. }
  607. p.printf(" in ")
  608. p.expr(c.For.Expr, precLow)
  609. p.comment = append(p.comment, c.For.Comment().Suffix...)
  610. for _, i := range c.Ifs {
  611. space()
  612. p.printf("if ")
  613. p.expr(i.Cond, precLow)
  614. p.comment = append(p.comment, i.Comment().Suffix...)
  615. }
  616. p.comment = append(p.comment, c.Comment().Suffix...)
  617. }
  618. if multiLine {
  619. for _, com := range v.End.Before {
  620. p.newline()
  621. p.printf("%s", strings.TrimSpace(com.Token))
  622. }
  623. if v.Brack != "" {
  624. p.margin -= listIndentation
  625. }
  626. p.newline()
  627. }
  628. if v.Brack != "" {
  629. p.printf("%s", v.Brack[1:])
  630. p.depth--
  631. }
  632. }
  633. func (p *printer) isTopLevel() bool {
  634. return p.margin == 0
  635. }