/* Copyright 2016 Google Inc. All rights reserved. Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the License. You may obtain a copy of the License at http://www.apache.org/licenses/LICENSE-2.0 Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License. */ // Package ast provides AST nodes and ancillary structures and algorithms. package ast import ( "fmt" ) // Identifier represents a variable / parameter / field name. //+gen set type Identifier string // Identifiers represents an Identifier slice. type Identifiers []Identifier // TODO(jbeda) implement interning of identifiers if necessary. The C++ // version does so. // --------------------------------------------------------------------------- // Context represents the surrounding context of a node (e.g. a function it's in) type Context *string // Node represents a node in the AST. type Node interface { Context() Context Loc() *LocationRange FreeVariables() Identifiers SetFreeVariables(Identifiers) SetContext(Context) } // Nodes represents a Node slice. type Nodes []Node // --------------------------------------------------------------------------- // NodeBase holds fields common to all node types. type NodeBase struct { loc LocationRange context Context freeVariables Identifiers } // NewNodeBase creates a new NodeBase from initial LocationRange and // Identifiers. func NewNodeBase(loc LocationRange, freeVariables Identifiers) NodeBase { return NodeBase{ loc: loc, freeVariables: freeVariables, } } // NewNodeBaseLoc creates a new NodeBase from an initial LocationRange. func NewNodeBaseLoc(loc LocationRange) NodeBase { return NodeBase{ loc: loc, freeVariables: []Identifier{}, } } // Loc returns a NodeBase's loc. func (n *NodeBase) Loc() *LocationRange { return &n.loc } // FreeVariables returns a NodeBase's freeVariables. func (n *NodeBase) FreeVariables() Identifiers { return n.freeVariables } // SetFreeVariables sets a NodeBase's freeVariables. func (n *NodeBase) SetFreeVariables(idents Identifiers) { n.freeVariables = idents } // Context returns a NodeBase's context. func (n *NodeBase) Context() Context { return n.context } // SetContext sets a NodeBase's context. func (n *NodeBase) SetContext(context Context) { n.context = context } // --------------------------------------------------------------------------- // IfSpec represents an if-specification in a comprehension. type IfSpec struct { Expr Node } // ForSpec represents a for-specification in a comprehension. // Example: // expr for x in arr1 for y in arr2 for z in arr3 // The order is the same as in python, i.e. the leftmost is the outermost. // // Our internal representation reflects how they are semantically nested: // ForSpec(z, outer=ForSpec(y, outer=ForSpec(x, outer=nil))) // Any ifspecs are attached to the relevant ForSpec. // // Ifs are attached to the one on the left, for example: // expr for x in arr1 for y in arr2 if x % 2 == 0 for z in arr3 // The if is attached to the y forspec. // // It desugares to: // flatMap(\x -> // flatMap(\y -> // flatMap(\z -> [expr], arr3) // arr2) // arr3) type ForSpec struct { VarName Identifier Expr Node Conditions []IfSpec Outer *ForSpec } // --------------------------------------------------------------------------- // Apply represents a function call type Apply struct { NodeBase Target Node Arguments Arguments TrailingComma bool TailStrict bool } // NamedArgument represents a named argument to function call x=1. type NamedArgument struct { Name Identifier Arg Node } // Arguments represents positional and named arguments to a function call // f(x, y, z=1). type Arguments struct { Positional Nodes Named []NamedArgument } // --------------------------------------------------------------------------- // ApplyBrace represents e { }. Desugared to e + { }. type ApplyBrace struct { NodeBase Left Node Right Node } // --------------------------------------------------------------------------- // Array represents array constructors [1, 2, 3]. type Array struct { NodeBase Elements Nodes TrailingComma bool } // --------------------------------------------------------------------------- // ArrayComp represents array comprehensions (which are like Python list // comprehensions) type ArrayComp struct { NodeBase Body Node TrailingComma bool Spec ForSpec } // --------------------------------------------------------------------------- // Assert represents an assert expression (not an object-level assert). // // After parsing, message can be nil indicating that no message was // specified. This AST is elimiated by desugaring. type Assert struct { NodeBase Cond Node Message Node Rest Node } // --------------------------------------------------------------------------- // BinaryOp represents a binary operator. type BinaryOp int // Binary operators const ( BopMult BinaryOp = iota BopDiv BopPercent BopPlus BopMinus BopShiftL BopShiftR BopGreater BopGreaterEq BopLess BopLessEq BopIn BopManifestEqual BopManifestUnequal BopBitwiseAnd BopBitwiseXor BopBitwiseOr BopAnd BopOr ) var bopStrings = []string{ BopMult: "*", BopDiv: "/", BopPercent: "%", BopPlus: "+", BopMinus: "-", BopShiftL: "<<", BopShiftR: ">>", BopGreater: ">", BopGreaterEq: ">=", BopLess: "<", BopLessEq: "<=", BopIn: "in", BopManifestEqual: "==", BopManifestUnequal: "!=", BopBitwiseAnd: "&", BopBitwiseXor: "^", BopBitwiseOr: "|", BopAnd: "&&", BopOr: "||", } // BopMap is a map from binary operator token strings to BinaryOp values. var BopMap = map[string]BinaryOp{ "*": BopMult, "/": BopDiv, "%": BopPercent, "+": BopPlus, "-": BopMinus, "<<": BopShiftL, ">>": BopShiftR, ">": BopGreater, ">=": BopGreaterEq, "<": BopLess, "<=": BopLessEq, "in": BopIn, "==": BopManifestEqual, "!=": BopManifestUnequal, "&": BopBitwiseAnd, "^": BopBitwiseXor, "|": BopBitwiseOr, "&&": BopAnd, "||": BopOr, } func (b BinaryOp) String() string { if b < 0 || int(b) >= len(bopStrings) { panic(fmt.Sprintf("INTERNAL ERROR: Unrecognised binary operator: %d", b)) } return bopStrings[b] } // Binary represents binary operators. type Binary struct { NodeBase Left Node Op BinaryOp Right Node } // --------------------------------------------------------------------------- // Conditional represents if/then/else. // // After parsing, branchFalse can be nil indicating that no else branch // was specified. The desugarer fills this in with a LiteralNull type Conditional struct { NodeBase Cond Node BranchTrue Node BranchFalse Node } // --------------------------------------------------------------------------- // Dollar represents the $ keyword type Dollar struct{ NodeBase } // --------------------------------------------------------------------------- // Error represents the error e. type Error struct { NodeBase Expr Node } // --------------------------------------------------------------------------- // Function represents a function definition type Function struct { NodeBase Parameters Parameters TrailingComma bool Body Node } // NamedParameter represents an optional named parameter of a function. type NamedParameter struct { Name Identifier DefaultArg Node } // Parameters represents the required positional parameters and optional named // parameters to a function definition. type Parameters struct { Required Identifiers Optional []NamedParameter } // --------------------------------------------------------------------------- // Import represents import "file". type Import struct { NodeBase File *LiteralString } // --------------------------------------------------------------------------- // ImportStr represents importstr "file". type ImportStr struct { NodeBase File *LiteralString } // --------------------------------------------------------------------------- // Index represents both e[e] and the syntax sugar e.f. // // One of index and id will be nil before desugaring. After desugaring id // will be nil. type Index struct { NodeBase Target Node Index Node Id *Identifier } // Slice represents an array slice a[begin:end:step]. type Slice struct { NodeBase Target Node // Each of these can be nil BeginIndex Node EndIndex Node Step Node } // --------------------------------------------------------------------------- // LocalBind is a helper struct for astLocal type LocalBind struct { Variable Identifier Body Node Fun *Function } // LocalBinds represents a LocalBind slice. type LocalBinds []LocalBind // Local represents local x = e; e. After desugaring, functionSugar is false. type Local struct { NodeBase Binds LocalBinds Body Node } // --------------------------------------------------------------------------- // LiteralBoolean represents true and false type LiteralBoolean struct { NodeBase Value bool } // --------------------------------------------------------------------------- // LiteralNull represents the null keyword type LiteralNull struct{ NodeBase } // --------------------------------------------------------------------------- // LiteralNumber represents a JSON number type LiteralNumber struct { NodeBase Value float64 OriginalString string } // --------------------------------------------------------------------------- // LiteralStringKind represents the kind of a literal string. type LiteralStringKind int // Literal string kinds const ( StringSingle LiteralStringKind = iota StringDouble StringBlock VerbatimStringDouble VerbatimStringSingle ) // FullyEscaped returns true iff the literal string kind may contain escape // sequences that require unescaping. func (k LiteralStringKind) FullyEscaped() bool { switch k { case StringSingle, StringDouble: return true case StringBlock, VerbatimStringDouble, VerbatimStringSingle: return false } panic(fmt.Sprintf("Unknown string kind: %v", k)) } // LiteralString represents a JSON string type LiteralString struct { NodeBase Value string Kind LiteralStringKind BlockIndent string } // --------------------------------------------------------------------------- // ObjectFieldKind represents the kind of an object field. type ObjectFieldKind int // Kinds of object fields const ( ObjectAssert ObjectFieldKind = iota // assert expr2 [: expr3] where expr3 can be nil ObjectFieldID // id:[:[:]] expr2 ObjectFieldExpr // '['expr1']':[:[:]] expr2 ObjectFieldStr // expr1:[:[:]] expr2 ObjectLocal // local id = expr2 ObjectNullID // null id ObjectNullExpr // null '['expr1']' ObjectNullStr // null expr1 ) // ObjectFieldHide represents the visibility of an object field. type ObjectFieldHide int // Object field visibilities const ( ObjectFieldHidden ObjectFieldHide = iota // f:: e ObjectFieldInherit // f: e ObjectFieldVisible // f::: e ) // ObjectField represents a field of an object or object comprehension. // TODO(sbarzowski) consider having separate types for various kinds type ObjectField struct { Kind ObjectFieldKind Hide ObjectFieldHide // (ignore if kind != astObjectField*) SuperSugar bool // +: (ignore if kind != astObjectField*) MethodSugar bool // f(x, y, z): ... (ignore if kind == astObjectAssert) Method *Function Expr1 Node // Not in scope of the object Id *Identifier Params *Parameters // If methodSugar == true then holds the params. TrailingComma bool // If methodSugar == true then remembers the trailing comma Expr2, Expr3 Node // In scope of the object (can see self). } // ObjectFieldLocalNoMethod creates a non-method local object field. func ObjectFieldLocalNoMethod(id *Identifier, body Node) ObjectField { return ObjectField{ObjectLocal, ObjectFieldVisible, false, false, nil, nil, id, nil, false, body, nil} } // ObjectFields represents an ObjectField slice. type ObjectFields []ObjectField // Object represents object constructors { f: e ... }. // // The trailing comma is only allowed if len(fields) > 0. Converted to // DesugaredObject during desugaring. type Object struct { NodeBase Fields ObjectFields TrailingComma bool } // --------------------------------------------------------------------------- // DesugaredObjectField represents a desugared object field. type DesugaredObjectField struct { Hide ObjectFieldHide Name Node Body Node PlusSuper bool } // DesugaredObjectFields represents a DesugaredObjectField slice. type DesugaredObjectFields []DesugaredObjectField // DesugaredObject represents object constructors { f: e ... } after // desugaring. // // The assertions either return true or raise an error. type DesugaredObject struct { NodeBase Asserts Nodes Fields DesugaredObjectFields } // --------------------------------------------------------------------------- // ObjectComp represents object comprehension // { [e]: e for x in e for.. if... }. type ObjectComp struct { NodeBase Fields ObjectFields TrailingComma bool Spec ForSpec } // --------------------------------------------------------------------------- // Parens represents parentheses // ( e ) type Parens struct { NodeBase Inner Node } // --------------------------------------------------------------------------- // Self represents the self keyword. type Self struct{ NodeBase } // --------------------------------------------------------------------------- // SuperIndex represents the super[e] and super.f constructs. // // Either index or identifier will be set before desugaring. After desugaring, id will be // nil. type SuperIndex struct { NodeBase Index Node Id *Identifier } // InSuper represents the e in super construct. type InSuper struct { NodeBase Index Node } // --------------------------------------------------------------------------- // UnaryOp represents a unary operator. type UnaryOp int // Unary operators const ( UopNot UnaryOp = iota UopBitwiseNot UopPlus UopMinus ) var uopStrings = []string{ UopNot: "!", UopBitwiseNot: "~", UopPlus: "+", UopMinus: "-", } // UopMap is a map from unary operator token strings to UnaryOp values. var UopMap = map[string]UnaryOp{ "!": UopNot, "~": UopBitwiseNot, "+": UopPlus, "-": UopMinus, } func (u UnaryOp) String() string { if u < 0 || int(u) >= len(uopStrings) { panic(fmt.Sprintf("INTERNAL ERROR: Unrecognised unary operator: %d", u)) } return uopStrings[u] } // Unary represents unary operators. type Unary struct { NodeBase Op UnaryOp Expr Node } // --------------------------------------------------------------------------- // Var represents variables. type Var struct { NodeBase Id Identifier } // ---------------------------------------------------------------------------