cue/ast: add package

Change-Id: I587028ef8ce9e2e57eb75b8db5667b786dce9213
diff --git a/cue/ast/ast.go b/cue/ast/ast.go
new file mode 100644
index 0000000..cea67d9
--- /dev/null
+++ b/cue/ast/ast.go
@@ -0,0 +1,707 @@
+// Copyright 2018 The CUE Authors
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+// Package ast declares the types used to represent syntax trees for CUE
+// packages.
+package ast // import "cuelang.org/go/cue/ast"
+
+import (
+	"strconv"
+	"strings"
+
+	"cuelang.org/go/cue/token"
+)
+
+// ----------------------------------------------------------------------------
+// Interfaces
+//
+// There are two main classes of nodes: expressions, clauses, and declaration
+// nodes. The node names usually match the corresponding CUE spec production
+// names to which they correspond. The node fields correspond to the individual
+// parts of the respective productions.
+//
+// All nodes contain position information marking the beginning of the
+// corresponding source text segment; it is accessible via the Pos accessor
+// method. Nodes may contain additional position info for language constructs
+// where comments may be found between parts of the construct (typically any
+// larger, parenthesized subpart). That position information is needed to
+// properly position comments when printing the construct.
+
+// A Node represents any node in the abstract syntax tree.
+type Node interface {
+	Pos() token.Pos // position of first character belonging to the node
+	End() token.Pos // position of first character immediately after the node
+
+	// TODO: SetPos(p token.RelPos)
+
+	Comments() []*CommentGroup
+	AddComment(*CommentGroup)
+}
+
+// An Expr is implemented by all expression nodes.
+type Expr interface {
+	Node
+	exprNode()
+}
+
+func (*BadExpr) exprNode()       {}
+func (*Ident) exprNode()         {}
+func (*Ellipsis) exprNode()      {}
+func (*BasicLit) exprNode()      {}
+func (*Interpolation) exprNode() {}
+func (*StructLit) exprNode()     {}
+func (*ListLit) exprNode()       {}
+func (*LambdaExpr) exprNode()    {}
+
+// func (*StructComprehension) exprNode() {}
+func (*ListComprehension) exprNode() {}
+func (*ParenExpr) exprNode()         {}
+func (*SelectorExpr) exprNode()      {}
+func (*IndexExpr) exprNode()         {}
+func (*SliceExpr) exprNode()         {}
+func (*CallExpr) exprNode()          {}
+func (*UnaryExpr) exprNode()         {}
+func (*BinaryExpr) exprNode()        {}
+func (*BottomLit) exprNode()         {}
+
+// A Decl node is implemented by all declarations.
+type Decl interface {
+	Node
+	declNode()
+}
+
+func (*Field) declNode()             {}
+func (*ComprehensionDecl) declNode() {}
+func (*ImportDecl) declNode()        {}
+func (*BadDecl) declNode()           {}
+func (*EmitDecl) declNode()          {}
+func (*Alias) declNode()             {}
+
+// A Label is any prduction that can be used as a LHS label.
+type Label interface {
+	Node
+	labelName() (name string, isIdent bool)
+}
+
+func (n *Ident) labelName() (string, bool) {
+	return n.Name, true
+}
+
+func (n *BasicLit) labelName() (string, bool) {
+	switch n.Kind {
+	case token.STRING:
+		// Use strconv to only allow double-quoted, single-line strings.
+		if str, err := strconv.Unquote(n.Value); err == nil {
+			return str, true
+		}
+	case token.NULL, token.TRUE, token.FALSE:
+		return n.Value, true
+
+		// TODO: allow numbers to be fields?
+	}
+	return "", false
+}
+
+func (n *TemplateLabel) labelName() (string, bool) {
+	return n.Ident.Name, false
+}
+
+func (n *Interpolation) labelName() (string, bool) {
+	return "", false
+}
+func (n *ExprLabel) labelName() (string, bool) {
+	return "", false
+}
+
+// LabelName reports the name of a label, if known, and whether it is valid.
+func LabelName(x Label) (name string, ok bool) {
+	return x.labelName()
+}
+
+// As for now, a ExprLabel is not a label, as it can only use used in
+// struct comprehensions.
+
+// Clause nodes are part of comprehensions.
+type Clause interface {
+	Node
+	clauseNode()
+}
+
+func (x *ForClause) clauseNode() {}
+func (x *IfClause) clauseNode()  {}
+func (x *Alias) clauseNode()     {}
+
+// Comments
+
+type comments struct {
+	groups *[]*CommentGroup
+}
+
+func (c *comments) Comments() []*CommentGroup {
+	if c.groups == nil {
+		return []*CommentGroup{}
+	}
+	return *c.groups
+}
+
+// // AddComment adds the given comments to the fields.
+// // If line is true the comment is inserted at the preceding token.
+
+func (c *comments) AddComment(cg *CommentGroup) {
+	if cg == nil {
+		return
+	}
+	if c.groups == nil {
+		a := []*CommentGroup{cg}
+		c.groups = &a
+		return
+	}
+	*c.groups = append(*c.groups, cg)
+}
+
+// A Comment node represents a single //-style or /*-style comment.
+type Comment struct {
+	Slash token.Pos // position of "/" starting the comment
+	Text  string    // comment text (excluding '\n' for //-style comments)
+}
+
+func (g *Comment) Comments() []*CommentGroup { return nil }
+func (g *Comment) AddComment(*CommentGroup)  {}
+
+func (c *Comment) Pos() token.Pos { return c.Slash }
+func (c *Comment) End() token.Pos { return c.Slash.Add(len(c.Text)) }
+
+// A CommentGroup represents a sequence of comments
+// with no other tokens and no empty lines between.
+type CommentGroup struct {
+	// TODO: remove and use the token position of the first commment.
+	Doc  bool
+	Line bool // true if it is on the same line as the node's end pos.
+
+	// Position indicates where a comment should be attached if a node has
+	// multiple tokens. 0 means before the first token, 1 means before the
+	// second, etc. For instance, for a field, the positions are:
+	//    <0> Label <1> ":" <2> Expr <3> "," <4>
+	Position int8
+	List     []*Comment // len(List) > 0
+}
+
+func (g *CommentGroup) Pos() token.Pos { return g.List[0].Pos() }
+func (g *CommentGroup) End() token.Pos { return g.List[len(g.List)-1].End() }
+
+func (g *CommentGroup) Comments() []*CommentGroup { return nil }
+func (g *CommentGroup) AddComment(*CommentGroup)  {}
+
+func isWhitespace(ch byte) bool { return ch == ' ' || ch == '\t' || ch == '\n' || ch == '\r' }
+
+func stripTrailingWhitespace(s string) string {
+	i := len(s)
+	for i > 0 && isWhitespace(s[i-1]) {
+		i--
+	}
+	return s[0:i]
+}
+
+// Text returns the text of the comment.
+// Comment markers (//, /*, and */), the first space of a line comment, and
+// leading and trailing empty lines are removed. Multiple empty lines are
+// reduced to one, and trailing space on lines is trimmed. Unless the result
+// is empty, it is newline-terminated.
+func (g *CommentGroup) Text() string {
+	if g == nil {
+		return ""
+	}
+	comments := make([]string, len(g.List))
+	for i, c := range g.List {
+		comments[i] = c.Text
+	}
+
+	lines := make([]string, 0, 10) // most comments are less than 10 lines
+	for _, c := range comments {
+		// Remove comment markers.
+		// The parser has given us exactly the comment text.
+		switch c[1] {
+		case '/':
+			//-style comment (no newline at the end)
+			c = c[2:]
+			// strip first space - required for Example tests
+			if len(c) > 0 && c[0] == ' ' {
+				c = c[1:]
+			}
+		case '*':
+			/*-style comment */
+			c = c[2 : len(c)-2]
+		}
+
+		// Split on newlines.
+		cl := strings.Split(c, "\n")
+
+		// Walk lines, stripping trailing white space and adding to list.
+		for _, l := range cl {
+			lines = append(lines, stripTrailingWhitespace(l))
+		}
+	}
+
+	// Remove leading blank lines; convert runs of
+	// interior blank lines to a single blank line.
+	n := 0
+	for _, line := range lines {
+		if line != "" || n > 0 && lines[n-1] != "" {
+			lines[n] = line
+			n++
+		}
+	}
+	lines = lines[0:n]
+
+	// Add final "" entry to get trailing newline from Join.
+	if n > 0 && lines[n-1] != "" {
+		lines = append(lines, "")
+	}
+
+	return strings.Join(lines, "\n")
+}
+
+// A Field represents a field declaration in a struct.
+type Field struct {
+	comments
+	Label Label // must have at least one element.
+
+	// No colon: Value must be an StructLit with one field or a
+	// LambdaExpr.
+	Colon token.Pos
+	Value Expr // the value associated with this field.
+}
+
+func (d *Field) Pos() token.Pos { return d.Label.Pos() }
+func (d *Field) End() token.Pos { return d.Value.End() }
+
+// An Alias binds another field to the alias name in the current struct.
+type Alias struct {
+	comments
+	Ident *Ident    // field name, always an Ident
+	Equal token.Pos // position of "="
+	Expr  Expr      // An Ident or SelectorExpr
+}
+
+func (a *Alias) Pos() token.Pos { return a.Ident.Pos() }
+func (a *Alias) End() token.Pos { return a.Expr.End() }
+
+// A ComprehensionDecl node represents a field comprehension.
+type ComprehensionDecl struct {
+	comments
+	Field   *Field
+	Select  token.Pos
+	Clauses []Clause
+}
+
+func (x *ComprehensionDecl) Pos() token.Pos { return x.Field.Pos() }
+func (x *ComprehensionDecl) End() token.Pos {
+	if len(x.Clauses) > 0 {
+		return x.Clauses[len(x.Clauses)-1].End()
+	}
+	return x.Select
+}
+
+// ----------------------------------------------------------------------------
+// Expressions and types
+//
+// An expression is represented by a tree consisting of one
+// or more of the following concrete expression nodes.
+
+// A LambdaExpr defines a function expression.
+//
+// Lambdas are only used internally under controlled conditions. Although
+// the implementation of lambdas is fully functional, enabling them will
+// cause the language to be Turing-complete (if not otherwise limited).
+// Also, lambdas would provide yet another way to create structure, and one
+// that is known to not work well for declarative configuration languages.
+type LambdaExpr struct {
+	comments
+	Lparen token.Pos // position of "("
+	Params []*Field  // parameters with possible initializers
+	Rparen token.Pos // position of ")"
+	Expr   Expr
+}
+
+func (t *LambdaExpr) Pos() token.Pos { return t.Lparen }
+func (t *LambdaExpr) End() token.Pos { return t.Rparen }
+
+// A BadExpr node is a placeholder for expressions containing
+// syntax errors for which no correct expression nodes can be
+// created. This is different from an ErrorExpr which represents
+// an explicitly marked error in the source.
+type BadExpr struct {
+	comments
+	From, To token.Pos // position range of bad expression
+}
+
+// A BottomLit indicates an error.
+type BottomLit struct {
+	comments
+	Bottom token.Pos
+}
+
+// An Ident node represents an left-hand side identifier.
+type Ident struct {
+	comments
+	NamePos token.Pos // identifier position
+
+	// This LHS path element may be an identifier. Possible forms:
+	//  foo:    a normal identifier
+	//  "foo":  JSON compatible
+	//  <foo>:  a template shorthand
+	Name string
+
+	Scope Node // scope in which node was found or nil if referring directly
+	Node  Node
+}
+
+// A TemplateLabel represents a field template declaration in a struct.
+type TemplateLabel struct {
+	comments
+	Langle token.Pos
+	Ident  *Ident
+	Rangle token.Pos
+}
+
+// An ExprLabel is an expression to create a label in struct comprehensions.
+type ExprLabel struct {
+	comments
+	Lbrack token.Pos
+	Label  Expr
+	Rbrack token.Pos
+}
+
+// An Ellipsis node stands for the "..." type in a
+// parameter list or the "..." length in an array type.
+type Ellipsis struct {
+	comments
+	Ellipsis token.Pos // position of "..."
+	Elt      Expr      // ellipsis element type (parameter lists only); or nil
+}
+
+// A BasicLit node represents a literal of basic type.
+type BasicLit struct {
+	comments
+	ValuePos token.Pos   // literal position
+	Kind     token.Token // INT, FLOAT, DURATION, or STRING
+	Value    string      // literal string; e.g. 42, 0x7f, 3.14, 1_234_567, 1e-9, 2.4i, 'a', '\x7f', "foo", or '\m\n\o'
+}
+
+// A Interpolation node represents a string or bytes interpolation.
+type Interpolation struct { // TODO: rename to TemplateLit
+	comments
+	Elts []Expr // interleaving of strings and expressions.
+}
+
+// A StructLit node represents a literal struct.
+type StructLit struct {
+	comments
+	Lbrace token.Pos // position of "{"
+	Elts   []Decl    // list of elements; or nil
+	Rbrace token.Pos // position of "}"
+}
+
+// A ListLit node represents a literal list.
+type ListLit struct {
+	comments
+	Lbrack   token.Pos // position of "["
+	Elts     []Expr    // list of composite elements; or nil
+	Ellipsis token.Pos // open list if set
+	Type     Expr      // type for the remaining elements
+	Rbrack   token.Pos // position of "]"
+}
+
+// A ListComprehension node represents as list comprehension.
+type ListComprehension struct {
+	comments
+	Lbrack  token.Pos // position of "["
+	Expr    Expr
+	Clauses []Clause  // Feed or Guard (TODO let)
+	Rbrack  token.Pos // position of "]"
+}
+
+// A ForClause node represents a for clause in a comprehension.
+type ForClause struct {
+	comments
+	For    token.Pos
+	Key    *Ident // allow pattern matching?
+	Colon  token.Pos
+	Value  *Ident // allow pattern matching?
+	In     token.Pos
+	Source Expr
+}
+
+// A IfClause node represents an if guard clause in a comprehension.
+type IfClause struct {
+	comments
+	If        token.Pos
+	Condition Expr
+}
+
+// A ParenExpr node represents a parenthesized expression.
+type ParenExpr struct {
+	comments
+	Lparen token.Pos // position of "("
+	X      Expr      // parenthesized expression
+	Rparen token.Pos // position of ")"
+}
+
+// A SelectorExpr node represents an expression followed by a selector.
+type SelectorExpr struct {
+	comments
+	X   Expr   // expression
+	Sel *Ident // field selector
+}
+
+// An IndexExpr node represents an expression followed by an index.
+type IndexExpr struct {
+	comments
+	X      Expr      // expression
+	Lbrack token.Pos // position of "["
+	Index  Expr      // index expression
+	Rbrack token.Pos // position of "]"
+}
+
+// An SliceExpr node represents an expression followed by slice indices.
+type SliceExpr struct {
+	comments
+	X      Expr      // expression
+	Lbrack token.Pos // position of "["
+	Low    Expr      // begin of slice range; or nil
+	High   Expr      // end of slice range; or nil
+	Rbrack token.Pos // position of "]"
+}
+
+// A CallExpr node represents an expression followed by an argument list.
+type CallExpr struct {
+	comments
+	Fun    Expr      // function expression
+	Lparen token.Pos // position of "("
+	Args   []Expr    // function arguments; or nil
+	Rparen token.Pos // position of ")"
+}
+
+// A UnaryExpr node represents a unary expression.
+type UnaryExpr struct {
+	comments
+	OpPos token.Pos   // position of Op
+	Op    token.Token // operator
+	X     Expr        // operand
+}
+
+// A BinaryExpr node represents a binary expression.
+type BinaryExpr struct {
+	comments
+	X     Expr        // left operand
+	OpPos token.Pos   // position of Op
+	Op    token.Token // operator
+	Y     Expr        // right operand
+}
+
+// token.Pos and End implementations for expression/type nodes.
+
+func (x *BadExpr) Pos() token.Pos       { return x.From }
+func (x *Ident) Pos() token.Pos         { return x.NamePos }
+func (x *TemplateLabel) Pos() token.Pos { return x.Langle }
+func (x *ExprLabel) Pos() token.Pos     { return x.Lbrack }
+func (x *Ellipsis) Pos() token.Pos      { return x.Ellipsis }
+func (x *BasicLit) Pos() token.Pos      { return x.ValuePos }
+func (x *Interpolation) Pos() token.Pos { return x.Elts[0].Pos() }
+func (x *StructLit) Pos() token.Pos {
+	if x.Lbrace == token.NoPos && len(x.Elts) > 0 {
+		return x.Elts[0].Pos()
+	}
+	return x.Lbrace
+}
+
+func (x *ListLit) Pos() token.Pos           { return x.Lbrack }
+func (x *ListComprehension) Pos() token.Pos { return x.Lbrack }
+func (x *ForClause) Pos() token.Pos         { return x.For }
+func (x *IfClause) Pos() token.Pos          { return x.If }
+func (x *ParenExpr) Pos() token.Pos         { return x.Lparen }
+func (x *SelectorExpr) Pos() token.Pos      { return x.X.Pos() }
+func (x *IndexExpr) Pos() token.Pos         { return x.X.Pos() }
+func (x *SliceExpr) Pos() token.Pos         { return x.X.Pos() }
+func (x *CallExpr) Pos() token.Pos          { return x.Fun.Pos() }
+func (x *UnaryExpr) Pos() token.Pos         { return x.OpPos }
+func (x *BinaryExpr) Pos() token.Pos        { return x.X.Pos() }
+func (x *BottomLit) Pos() token.Pos         { return x.Bottom }
+
+func (x *BadExpr) End() token.Pos { return x.To }
+func (x *Ident) End() token.Pos {
+	return x.NamePos.Add(len(x.Name))
+}
+func (x *TemplateLabel) End() token.Pos { return x.Rangle }
+func (x *ExprLabel) End() token.Pos     { return x.Rbrack }
+func (x *Ellipsis) End() token.Pos {
+	if x.Elt != nil {
+		return x.Elt.End()
+	}
+	return x.Ellipsis + 3 // len("...")
+}
+func (x *BasicLit) End() token.Pos      { return token.Pos(int(x.ValuePos) + len(x.Value)) }
+func (x *Interpolation) End() token.Pos { return x.Elts[len(x.Elts)-1].Pos() }
+func (x *StructLit) End() token.Pos {
+	if x.Rbrace == token.NoPos && len(x.Elts) > 0 {
+		return x.Elts[len(x.Elts)-1].Pos()
+	}
+	return x.Rbrace.Add(1)
+}
+func (x *ListLit) End() token.Pos           { return x.Rbrack.Add(1) }
+func (x *ListComprehension) End() token.Pos { return x.Rbrack }
+func (x *ForClause) End() token.Pos         { return x.Source.End() }
+func (x *IfClause) End() token.Pos          { return x.Condition.End() }
+func (x *ParenExpr) End() token.Pos         { return x.Rparen.Add(1) }
+func (x *SelectorExpr) End() token.Pos      { return x.Sel.End() }
+func (x *IndexExpr) End() token.Pos         { return x.Rbrack.Add(1) }
+func (x *SliceExpr) End() token.Pos         { return x.Rbrack.Add(1) }
+func (x *CallExpr) End() token.Pos          { return x.Rparen.Add(1) }
+func (x *UnaryExpr) End() token.Pos         { return x.X.End() }
+func (x *BinaryExpr) End() token.Pos        { return x.Y.End() }
+func (x *BottomLit) End() token.Pos         { return x.Bottom.Add(1) }
+
+// ----------------------------------------------------------------------------
+// Convenience functions for Idents
+
+// NewIdent creates a new Ident without position.
+// Useful for ASTs generated by code other than the Go
+func NewIdent(name string) *Ident {
+	return &Ident{comments{}, token.NoPos, name, nil, nil}
+}
+
+func (id *Ident) String() string {
+	if id != nil {
+		return id.Name
+	}
+	return "<nil>"
+}
+
+// ----------------------------------------------------------------------------
+// Declarations
+
+// An ImportSpec node represents a single package import.
+type ImportSpec struct {
+	comments
+	Name   *Ident    // local package name (including "."); or nil
+	Path   *BasicLit // import path
+	EndPos token.Pos // end of spec (overrides Path.Pos if nonzero)
+}
+
+// Pos and End implementations for spec nodes.
+
+func (s *ImportSpec) Pos() token.Pos {
+	if s.Name != nil {
+		return s.Name.Pos()
+	}
+	return s.Path.Pos()
+}
+
+// func (s *AliasSpec) Pos() token.Pos { return s.Name.Pos() }
+// func (s *ValueSpec) Pos() token.Pos { return s.Names[0].Pos() }
+// func (s *TypeSpec) Pos() token.Pos  { return s.Name.Pos() }
+
+func (s *ImportSpec) End() token.Pos {
+	if s.EndPos != 0 {
+		return s.EndPos
+	}
+	return s.Path.End()
+}
+
+// specNode() ensures that only spec nodes can be assigned to a Spec.
+func (*ImportSpec) specNode() {}
+
+// A declaration is represented by one of the following declaration nodes.
+type (
+	// A BadDecl node is a placeholder for declarations containing
+	// syntax errors for which no correct declaration nodes can be
+	// created.
+	BadDecl struct {
+		comments
+		From, To token.Pos // position range of bad declaration
+	}
+
+	// A ImportDecl node represents a series of import declarations. A valid
+	// Lparen position (Lparen.Line > 0) indicates a parenthesized declaration.
+	ImportDecl struct {
+		comments
+		Import token.Pos
+		Lparen token.Pos // position of '(', if any
+		Specs  []*ImportSpec
+		Rparen token.Pos // position of ')', if any
+	}
+
+	// An EmitDecl node represents a single expression used as a declaration.
+	// The expressions in this declaration is what will be emitted as
+	// configuration output.
+	//
+	// An EmitDecl may only appear at the top level.
+	EmitDecl struct {
+		comments
+		Expr Expr
+	}
+)
+
+// Pos and End implementations for declaration nodes.
+
+func (d *BadDecl) Pos() token.Pos    { return d.From }
+func (d *ImportDecl) Pos() token.Pos { return d.Import }
+func (d *EmitDecl) Pos() token.Pos   { return d.Expr.Pos() }
+
+func (d *BadDecl) End() token.Pos { return d.To }
+func (d *ImportDecl) End() token.Pos {
+	if d.Rparen.IsValid() {
+		return d.Rparen.Add(1)
+	}
+	return d.Specs[0].End()
+}
+func (d *EmitDecl) End() token.Pos { return d.Expr.End() }
+
+// ----------------------------------------------------------------------------
+// Files and packages
+
+// A File node represents a Go source file.
+//
+// The Comments list contains all comments in the source file in order of
+// appearance, including the comments that are pointed to from other nodes
+// via Doc and Comment fields.
+type File struct {
+	Filename string
+	comments
+	Package token.Pos // position of "package" pseudo-keyword
+	Name    *Ident    // package names
+	// TODO: Change Expr to Decl?
+	Imports    []*ImportSpec // imports in this file
+	Decls      []Decl        // top-level declarations; or nil
+	Unresolved []*Ident      // unresolved identifiers in this file
+}
+
+func (f *File) Pos() token.Pos {
+	if f.Package != token.NoPos {
+		return f.Package
+	}
+	if len(f.Decls) > 0 {
+		return f.Decls[0].Pos()
+	}
+	return token.NoPos
+}
+func (f *File) End() token.Pos {
+	if n := len(f.Decls); n > 0 {
+		return f.Decls[n-1].End()
+	}
+	if f.Name != nil {
+		return f.Name.End()
+	}
+	return token.NoPos
+}
diff --git a/cue/ast/ast_test.go b/cue/ast/ast_test.go
new file mode 100644
index 0000000..4272ffe
--- /dev/null
+++ b/cue/ast/ast_test.go
@@ -0,0 +1,60 @@
+// Copyright 2018 The CUE Authors
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+package ast
+
+import (
+	"testing"
+)
+
+func TestCommentText(t *testing.T) {
+	testCases := []struct {
+		list []string
+		text string
+	}{
+		{[]string{"//"}, ""},
+		{[]string{"//   "}, ""},
+		{[]string{"//", "//", "//   "}, ""},
+		{[]string{"// foo   "}, "foo\n"},
+		{[]string{"//", "//", "// foo"}, "foo\n"},
+		{[]string{"// foo  bar  "}, "foo  bar\n"},
+		{[]string{"// foo", "// bar"}, "foo\nbar\n"},
+		{[]string{"// foo", "//", "//", "//", "// bar"}, "foo\n\nbar\n"},
+		{[]string{"// foo", "/* bar */"}, "foo\n bar\n"},
+		{[]string{"//", "//", "//", "// foo", "//", "//", "//"}, "foo\n"},
+
+		{[]string{"/**/"}, ""},
+		{[]string{"/*   */"}, ""},
+		{[]string{"/**/", "/**/", "/*   */"}, ""},
+		{[]string{"/* Foo   */"}, " Foo\n"},
+		{[]string{"/* Foo  Bar  */"}, " Foo  Bar\n"},
+		{[]string{"/* Foo*/", "/* Bar*/"}, " Foo\n Bar\n"},
+		{[]string{"/* Foo*/", "/**/", "/**/", "/**/", "// Bar"}, " Foo\n\nBar\n"},
+		{[]string{"/* Foo*/", "/*\n*/", "//", "/*\n*/", "// Bar"}, " Foo\n\nBar\n"},
+		{[]string{"/* Foo*/", "// Bar"}, " Foo\nBar\n"},
+		{[]string{"/* Foo\n Bar*/"}, " Foo\n Bar\n"},
+	}
+
+	for i, c := range testCases {
+		list := make([]*Comment, len(c.list))
+		for i, s := range c.list {
+			list[i] = &Comment{Text: s}
+		}
+
+		text := (&CommentGroup{List: list}).Text()
+		if text != c.text {
+			t.Errorf("case %d: got %q; expected %q", i, text, c.text)
+		}
+	}
+}
diff --git a/cue/ast/walk.go b/cue/ast/walk.go
new file mode 100644
index 0000000..be492e3
--- /dev/null
+++ b/cue/ast/walk.go
@@ -0,0 +1,287 @@
+// Copyright 2018 The CUE Authors
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+package ast
+
+import (
+	"fmt"
+
+	"cuelang.org/go/cue/token"
+)
+
+// Walk traverses an AST in depth-first order: It starts by calling f(node);
+// node must not be nil. If before returns true, Walk invokes f recursively for
+// each of the non-nil children of node, followed by a call of after. Both
+// functions may be nil. If before is nil, it is assumed to always return true.
+//
+func Walk(node Node, before func(Node) bool, after func(Node)) {
+	walk(&inspector{before: before, after: after}, node)
+}
+
+// A visitor's before method is invoked for each node encountered by Walk.
+// If the result visitor w is not nil, Walk visits each of the children
+// of node with the visitor w, followed by a call of w.After.
+type visitor interface {
+	Before(node Node) (w visitor)
+	After(node Node)
+}
+
+// Helper functions for common node lists. They may be empty.
+
+func walkIdentList(v visitor, list []*Ident) {
+	for _, x := range list {
+		walk(v, x)
+	}
+}
+
+func walkExprList(v visitor, list []Expr) {
+	for _, x := range list {
+		walk(v, x)
+	}
+}
+
+func walkDeclList(v visitor, list []Decl) {
+	for _, x := range list {
+		walk(v, x)
+	}
+}
+
+// walk traverses an AST in depth-first order: It starts by calling
+// v.Visit(node); node must not be nil. If the visitor w returned by
+// v.Visit(node) is not nil, walk is invoked recursively with visitor
+// w for each of the non-nil children of node, followed by a call of
+// w.Visit(nil).
+//
+func walk(v visitor, node Node) {
+	if v = v.Before(node); v == nil {
+		return
+	}
+
+	// TODO: record the comment groups and interleave with the values like for
+	// parsing and printing?
+	for _, c := range node.Comments() {
+		walk(v, c)
+	}
+
+	// walk children
+	// (the order of the cases matches the order
+	// of the corresponding node types in go)
+	switch n := node.(type) {
+	// Comments and fields
+	case *Comment:
+		// nothing to do
+
+	case *CommentGroup:
+		for _, c := range n.List {
+			walk(v, c)
+		}
+
+	case *Field:
+		walk(v, n.Label)
+		if n.Value != nil {
+			walk(v, n.Value)
+		}
+
+	case *LambdaExpr:
+		for _, p := range n.Params {
+			walk(v, p)
+		}
+		walk(v, n.Expr)
+
+	case *StructLit:
+		for _, f := range n.Elts {
+			walk(v, f)
+		}
+
+	// Expressions
+	case *BottomLit, *BadExpr, *Ident, *BasicLit:
+		// nothing to do
+
+	case *ExprLabel:
+		walk(v, n.Label)
+
+	case *TemplateLabel:
+		walk(v, n.Ident)
+
+	case *Interpolation:
+		for _, e := range n.Elts {
+			walk(v, e)
+		}
+
+	case *Ellipsis:
+		if n.Elt != nil {
+			walk(v, n.Elt)
+		}
+
+	case *ListLit:
+		walkExprList(v, n.Elts)
+		if n.Type != nil {
+			walk(v, n.Type)
+		}
+
+	case *ParenExpr:
+		walk(v, n.X)
+
+	case *SelectorExpr:
+		walk(v, n.X)
+		walk(v, n.Sel)
+
+	case *IndexExpr:
+		walk(v, n.X)
+		walk(v, n.Index)
+
+	case *SliceExpr:
+		walk(v, n.X)
+		if n.Low != nil {
+			walk(v, n.Low)
+		}
+		if n.High != nil {
+			walk(v, n.High)
+		}
+
+	case *CallExpr:
+		walk(v, n.Fun)
+		walkExprList(v, n.Args)
+
+	case *UnaryExpr:
+		walk(v, n.X)
+
+	case *BinaryExpr:
+		walk(v, n.X)
+		walk(v, n.Y)
+
+	// Declarations
+	case *ImportSpec:
+		if n.Name != nil {
+			walk(v, n.Name)
+		}
+		walk(v, n.Path)
+
+	case *BadDecl:
+		// nothing to do
+
+	case *ImportDecl:
+		for _, s := range n.Specs {
+			walk(v, s)
+		}
+
+	case *EmitDecl:
+		walk(v, n.Expr)
+
+	case *Alias:
+		walk(v, n.Ident)
+		walk(v, n.Expr)
+
+	case *ComprehensionDecl:
+		walk(v, n.Field)
+		for _, c := range n.Clauses {
+			walk(v, c)
+		}
+
+	// Files and packages
+	case *File:
+		if n.Name != nil {
+			walk(v, n.Name)
+		}
+		walkDeclList(v, n.Decls)
+		// don't walk n.Comments - they have been
+		// visited already through the individual
+		// nodes
+
+	case *ListComprehension:
+		walk(v, n.Expr)
+		for _, c := range n.Clauses {
+			walk(v, c)
+		}
+
+	case *ForClause:
+		if n.Key != nil {
+			walk(v, n.Key)
+		}
+		walk(v, n.Value)
+		walk(v, n.Source)
+
+	case *IfClause:
+		walk(v, n.Condition)
+
+	default:
+		panic(fmt.Sprintf("Walk: unexpected node type %T", n))
+	}
+
+	v.After(node)
+}
+
+type inspector struct {
+	before func(Node) bool
+	after  func(Node)
+
+	commentStack []commentFrame
+	current      commentFrame
+}
+
+type commentFrame struct {
+	cg  []*CommentGroup
+	pos int8
+}
+
+func (f *inspector) Before(node Node) visitor {
+	if f.before == nil || f.before(node) {
+		f.commentStack = append(f.commentStack, f.current)
+		f.current = commentFrame{cg: node.Comments()}
+		f.visitComments(f.current.pos)
+		return f
+	}
+	return nil
+}
+
+func (f *inspector) After(node Node) {
+	f.visitComments(127)
+	p := len(f.commentStack) - 1
+	f.current = f.commentStack[p]
+	f.commentStack = f.commentStack[:p]
+	f.current.pos++
+	if f.after != nil {
+		f.after(node)
+	}
+}
+
+func (f *inspector) Token(t token.Token) {
+	f.current.pos++
+}
+
+func (f *inspector) setPos(i int8) {
+	f.current.pos = i
+}
+
+func (f *inspector) visitComments(pos int8) {
+	c := &f.current
+	for ; len(c.cg) > 0; c.cg = c.cg[1:] {
+		cg := c.cg[0]
+		if cg.Position == pos {
+			continue
+		}
+		if f.before == nil || f.before(cg) {
+			for _, c := range cg.List {
+				if f.before == nil || f.before(c) {
+					if f.after != nil {
+						f.after(c)
+					}
+				}
+			}
+			if f.after != nil {
+				f.after(cg)
+			}
+		}
+	}
+}