syntax.go 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495
  1. /*
  2. Copyright 2016 Google Inc. All Rights Reserved.
  3. Licensed under the Apache License, Version 2.0 (the "License");
  4. you may not use this file except in compliance with the License.
  5. You may obtain a copy of the License at
  6. http://www.apache.org/licenses/LICENSE-2.0
  7. Unless required by applicable law or agreed to in writing, software
  8. distributed under the License is distributed on an "AS IS" BASIS,
  9. WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  10. See the License for the specific language governing permissions and
  11. limitations under the License.
  12. */
  13. // Package build implements parsing and printing of BUILD files.
  14. package build
  15. // Syntax data structure definitions.
  16. import (
  17. "strings"
  18. "unicode/utf8"
  19. )
  20. // A Position describes the position between two bytes of input.
  21. type Position struct {
  22. Line int // line in input (starting at 1)
  23. LineRune int // rune in line (starting at 1)
  24. Byte int // byte in input (starting at 0)
  25. }
  26. // add returns the position at the end of s, assuming it starts at p.
  27. func (p Position) add(s string) Position {
  28. p.Byte += len(s)
  29. if n := strings.Count(s, "\n"); n > 0 {
  30. p.Line += n
  31. s = s[strings.LastIndex(s, "\n")+1:]
  32. p.LineRune = 1
  33. }
  34. p.LineRune += utf8.RuneCountInString(s)
  35. return p
  36. }
  37. // An Expr represents an input element.
  38. type Expr interface {
  39. // Span returns the start and end position of the expression,
  40. // excluding leading or trailing comments.
  41. Span() (start, end Position)
  42. // Comment returns the comments attached to the expression.
  43. // This method would normally be named 'Comments' but that
  44. // would interfere with embedding a type of the same name.
  45. Comment() *Comments
  46. }
  47. // A Comment represents a single # comment.
  48. type Comment struct {
  49. Start Position
  50. Token string // without trailing newline
  51. }
  52. // Comments collects the comments associated with an expression.
  53. type Comments struct {
  54. Before []Comment // whole-line comments before this expression
  55. Suffix []Comment // end-of-line comments after this expression
  56. // For top-level expressions only, After lists whole-line
  57. // comments following the expression.
  58. After []Comment
  59. }
  60. // Comment returns the receiver. This isn't useful by itself, but
  61. // a Comments struct is embedded into all the expression
  62. // implementation types, and this gives each of those a Comment
  63. // method to satisfy the Expr interface.
  64. func (c *Comments) Comment() *Comments {
  65. return c
  66. }
  67. // A File represents an entire BUILD file.
  68. type File struct {
  69. Path string // file path, relative to workspace directory
  70. Comments
  71. Stmt []Expr
  72. }
  73. func (f *File) Span() (start, end Position) {
  74. if len(f.Stmt) == 0 {
  75. return
  76. }
  77. start, _ = f.Stmt[0].Span()
  78. _, end = f.Stmt[len(f.Stmt)-1].Span()
  79. return start, end
  80. }
  81. // A CommentBlock represents a top-level block of comments separate
  82. // from any rule.
  83. type CommentBlock struct {
  84. Comments
  85. Start Position
  86. }
  87. func (x *CommentBlock) Span() (start, end Position) {
  88. return x.Start, x.Start
  89. }
  90. // A PythonBlock represents a blob of Python code, typically a def or for loop.
  91. type PythonBlock struct {
  92. Comments
  93. Start Position
  94. Token string // raw Python code, including final newline
  95. }
  96. func (x *PythonBlock) Span() (start, end Position) {
  97. return x.Start, x.Start.add(x.Token)
  98. }
  99. // A LiteralExpr represents a literal identifier or number.
  100. type LiteralExpr struct {
  101. Comments
  102. Start Position
  103. Token string // identifier token
  104. }
  105. func (x *LiteralExpr) Span() (start, end Position) {
  106. return x.Start, x.Start.add(x.Token)
  107. }
  108. // A StringExpr represents a single literal string.
  109. type StringExpr struct {
  110. Comments
  111. Start Position
  112. Value string // string value (decoded)
  113. TripleQuote bool // triple quote output
  114. End Position
  115. // To allow specific formatting of string literals,
  116. // at least within our requirements, record the
  117. // preferred form of Value. This field is a hint:
  118. // it is only used if it is a valid quoted form for Value.
  119. Token string
  120. }
  121. func (x *StringExpr) Span() (start, end Position) {
  122. return x.Start, x.End
  123. }
  124. // An End represents the end of a parenthesized or bracketed expression.
  125. // It is a place to hang comments.
  126. type End struct {
  127. Comments
  128. Pos Position
  129. }
  130. func (x *End) Span() (start, end Position) {
  131. return x.Pos, x.Pos.add(")")
  132. }
  133. // A CallExpr represents a function call expression: X(List).
  134. type CallExpr struct {
  135. Comments
  136. X Expr
  137. ListStart Position // position of (
  138. List []Expr
  139. End // position of )
  140. ForceCompact bool // force compact (non-multiline) form when printing
  141. ForceMultiLine bool // force multiline form when printing
  142. }
  143. func (x *CallExpr) Span() (start, end Position) {
  144. start, _ = x.X.Span()
  145. return start, x.End.Pos.add(")")
  146. }
  147. // A DotExpr represents a field selector: X.Name.
  148. type DotExpr struct {
  149. Comments
  150. X Expr
  151. Dot Position
  152. NamePos Position
  153. Name string
  154. }
  155. func (x *DotExpr) Span() (start, end Position) {
  156. start, _ = x.X.Span()
  157. return start, x.NamePos.add(x.Name)
  158. }
  159. // A ListForExpr represents a list comprehension expression: [X for ... if ...].
  160. type ListForExpr struct {
  161. Comments
  162. ForceMultiLine bool // split expression across multiple lines
  163. Brack string // "", "()", or "[]"
  164. Start Position
  165. X Expr
  166. For []*ForClauseWithIfClausesOpt
  167. End
  168. }
  169. func (x *ListForExpr) Span() (start, end Position) {
  170. return x.Start, x.End.Pos.add("]")
  171. }
  172. // A ForClause represents a for clause in a list comprehension: for Var in Expr.
  173. type ForClause struct {
  174. Comments
  175. For Position
  176. Var []Expr
  177. In Position
  178. Expr Expr
  179. }
  180. func (x *ForClause) Span() (start, end Position) {
  181. _, end = x.Expr.Span()
  182. return x.For, end
  183. }
  184. // An IfClause represents an if clause in a list comprehension: if Cond.
  185. type IfClause struct {
  186. Comments
  187. If Position
  188. Cond Expr
  189. }
  190. func (x *IfClause) Span() (start, end Position) {
  191. _, end = x.Cond.Span()
  192. return x.If, end
  193. }
  194. // A ForClauseWithIfClausesOpt represents a for clause in a list comprehension followed by optional
  195. // if expressions: for ... in ... [if ... if ...]
  196. type ForClauseWithIfClausesOpt struct {
  197. Comments
  198. For *ForClause
  199. Ifs []*IfClause
  200. }
  201. func (x *ForClauseWithIfClausesOpt) Span() (start, end Position) {
  202. start, end = x.For.Span()
  203. if len(x.Ifs) > 0 {
  204. _, end = x.Ifs[len(x.Ifs)-1].Span()
  205. }
  206. return start, end
  207. }
  208. // A KeyValueExpr represents a dictionary entry: Key: Value.
  209. type KeyValueExpr struct {
  210. Comments
  211. Key Expr
  212. Colon Position
  213. Value Expr
  214. }
  215. func (x *KeyValueExpr) Span() (start, end Position) {
  216. start, _ = x.Key.Span()
  217. _, end = x.Value.Span()
  218. return start, end
  219. }
  220. // A DictExpr represents a dictionary literal: { List }.
  221. type DictExpr struct {
  222. Comments
  223. Start Position
  224. List []Expr // all *KeyValueExprs
  225. Comma Position // position of trailing comma, if any
  226. End
  227. ForceMultiLine bool // force multiline form when printing
  228. }
  229. func (x *DictExpr) Span() (start, end Position) {
  230. return x.Start, x.End.Pos.add("}")
  231. }
  232. // A ListExpr represents a list literal: [ List ].
  233. type ListExpr struct {
  234. Comments
  235. Start Position
  236. List []Expr
  237. Comma Position // position of trailing comma, if any
  238. End
  239. ForceMultiLine bool // force multiline form when printing
  240. }
  241. func (x *ListExpr) Span() (start, end Position) {
  242. return x.Start, x.End.Pos.add("]")
  243. }
  244. // A SetExpr represents a set literal: { List }.
  245. type SetExpr struct {
  246. Comments
  247. Start Position
  248. List []Expr
  249. Comma Position // position of trailing comma, if any
  250. End
  251. ForceMultiLine bool // force multiline form when printing
  252. }
  253. func (x *SetExpr) Span() (start, end Position) {
  254. return x.Start, x.End.Pos.add("}")
  255. }
  256. // A TupleExpr represents a tuple literal: (List)
  257. type TupleExpr struct {
  258. Comments
  259. Start Position
  260. List []Expr
  261. Comma Position // position of trailing comma, if any
  262. End
  263. ForceCompact bool // force compact (non-multiline) form when printing
  264. ForceMultiLine bool // force multiline form when printing
  265. }
  266. func (x *TupleExpr) Span() (start, end Position) {
  267. return x.Start, x.End.Pos.add(")")
  268. }
  269. // A UnaryExpr represents a unary expression: Op X.
  270. type UnaryExpr struct {
  271. Comments
  272. OpStart Position
  273. Op string
  274. X Expr
  275. }
  276. func (x *UnaryExpr) Span() (start, end Position) {
  277. _, end = x.X.Span()
  278. return x.OpStart, end
  279. }
  280. // A BinaryExpr represents a binary expression: X Op Y.
  281. type BinaryExpr struct {
  282. Comments
  283. X Expr
  284. OpStart Position
  285. Op string
  286. LineBreak bool // insert line break between Op and Y
  287. Y Expr
  288. }
  289. func (x *BinaryExpr) Span() (start, end Position) {
  290. start, _ = x.X.Span()
  291. _, end = x.Y.Span()
  292. return start, end
  293. }
  294. // A ParenExpr represents a parenthesized expression: (X).
  295. type ParenExpr struct {
  296. Comments
  297. Start Position
  298. X Expr
  299. End
  300. ForceMultiLine bool // insert line break after opening ( and before closing )
  301. }
  302. func (x *ParenExpr) Span() (start, end Position) {
  303. return x.Start, x.End.Pos.add(")")
  304. }
  305. // A SliceExpr represents a slice expression: expr[from:to] or expr[from:to:step] .
  306. type SliceExpr struct {
  307. Comments
  308. X Expr
  309. SliceStart Position
  310. From Expr
  311. FirstColon Position
  312. To Expr
  313. SecondColon Position
  314. Step Expr
  315. End Position
  316. }
  317. func (x *SliceExpr) Span() (start, end Position) {
  318. start, _ = x.X.Span()
  319. return start, x.End
  320. }
  321. // An IndexExpr represents an index expression: X[Y].
  322. type IndexExpr struct {
  323. Comments
  324. X Expr
  325. IndexStart Position
  326. Y Expr
  327. End Position
  328. }
  329. func (x *IndexExpr) Span() (start, end Position) {
  330. start, _ = x.X.Span()
  331. return start, x.End
  332. }
  333. // A LambdaExpr represents a lambda expression: lambda Var: Expr.
  334. type LambdaExpr struct {
  335. Comments
  336. Lambda Position
  337. Var []Expr
  338. Colon Position
  339. Expr Expr
  340. }
  341. func (x *LambdaExpr) Span() (start, end Position) {
  342. _, end = x.Expr.Span()
  343. return x.Lambda, end
  344. }
  345. // ConditionalExpr represents the conditional: X if TEST else ELSE.
  346. type ConditionalExpr struct {
  347. Comments
  348. Then Expr
  349. IfStart Position
  350. Test Expr
  351. ElseStart Position
  352. Else Expr
  353. }
  354. // Span returns the start and end position of the expression,
  355. // excluding leading or trailing comments.
  356. func (x *ConditionalExpr) Span() (start, end Position) {
  357. start, _ = x.Then.Span()
  358. _, end = x.Else.Span()
  359. return start, end
  360. }
  361. // A CodeBlock represents an indented code block.
  362. type CodeBlock struct {
  363. Statements []Expr
  364. Start Position
  365. End
  366. }
  367. func (x *CodeBlock) Span() (start, end Position) {
  368. return x.Start, x.End.Pos
  369. }
  370. // A FuncDef represents a function definition expression: def foo(List):.
  371. type FuncDef struct {
  372. Comments
  373. Start Position // position of def
  374. Name string
  375. ListStart Position // position of (
  376. Args []Expr
  377. Body CodeBlock
  378. End // position of the end
  379. ForceCompact bool // force compact (non-multiline) form when printing
  380. ForceMultiLine bool // force multiline form when printing
  381. }
  382. func (x *FuncDef) Span() (start, end Position) {
  383. return x.Start, x.End.Pos
  384. }
  385. // A ReturnExpr represents a return statement: return f(x).
  386. type ReturnExpr struct {
  387. Comments
  388. Start Position
  389. X Expr
  390. End Position
  391. }
  392. func (x *ReturnExpr) Span() (start, end Position) {
  393. return x.Start, x.End
  394. }
  395. // A ForLoop represents a for loop block: for x in range(10):.
  396. type ForLoop struct {
  397. Comments
  398. Start Position // position of for
  399. LoopVars []Expr
  400. Iterable Expr
  401. Body CodeBlock
  402. End // position of the end
  403. }
  404. func (x *ForLoop) Span() (start, end Position) {
  405. return x.Start, x.End.Pos
  406. }
  407. // An IfElse represents an if-else blocks sequence: if x: ... elif y: ... else: ... .
  408. type IfElse struct {
  409. Comments
  410. Start Position // position of if
  411. Conditions []Condition
  412. End // position of the end
  413. }
  414. type Condition struct {
  415. If Expr
  416. Then CodeBlock
  417. }
  418. func (x *IfElse) Span() (start, end Position) {
  419. return x.Start, x.End.Pos
  420. }