hcl/parser/parser.go

314 lines
6.8 KiB
Go
Raw Normal View History

2015-10-25 15:14:16 +00:00
// Package parser implements a parser for HCL (HashiCorp Configuration
// Language)
package parser
2015-10-07 22:38:39 +00:00
2015-10-11 23:27:43 +00:00
import (
2015-10-12 19:53:40 +00:00
"errors"
2015-10-11 23:27:43 +00:00
"fmt"
2015-10-16 20:12:26 +00:00
"github.com/fatih/hcl/ast"
2015-10-11 23:27:43 +00:00
"github.com/fatih/hcl/scanner"
2015-10-16 20:12:26 +00:00
"github.com/fatih/hcl/token"
2015-10-11 23:27:43 +00:00
)
2015-10-07 22:38:39 +00:00
type Parser struct {
sc *scanner.Scanner
2015-10-24 20:11:03 +00:00
tok token.Token // last read token
comments []*ast.Comment
2015-10-11 23:27:43 +00:00
enableTrace bool
indent int
n int // buffer size (max = 1)
2015-10-07 22:38:39 +00:00
}
func newParser(src []byte) *Parser {
2015-10-07 22:38:39 +00:00
return &Parser{
sc: scanner.New(src),
}
}
// Parse returns the fully parsed source and returns the abstract syntax tree.
func Parse(src []byte) (ast.Node, error) {
p := newParser(src)
return p.Parse()
}
var errEofToken = errors.New("EOF token found")
// Parse returns the fully parsed source and returns the abstract syntax tree.
2015-10-16 20:12:26 +00:00
func (p *Parser) Parse() (ast.Node, error) {
return p.parseObjectList()
2015-10-18 22:30:14 +00:00
}
func (p *Parser) parseObjectList() (*ast.ObjectList, error) {
2015-10-18 22:30:14 +00:00
defer un(trace(p, "ParseObjectList"))
node := &ast.ObjectList{}
2015-10-18 22:30:14 +00:00
for {
n, err := p.next()
if err == errEofToken {
break // we are finished
}
// we don't return a nil, because might want to use already collected
// items.
if err != nil {
return node, err
}
2015-10-24 20:11:03 +00:00
switch t := n.(type) {
case *ast.ObjectItem:
node.Add(t)
case *ast.Comment:
p.comments = append(p.comments, t)
}
2015-10-07 22:38:39 +00:00
}
2015-10-12 07:37:37 +00:00
return node, nil
}
2015-10-18 22:30:14 +00:00
// next returns the next node
func (p *Parser) next() (ast.Node, error) {
defer un(trace(p, "ParseNode"))
tok := p.scan()
switch tok.Type {
case token.EOF:
return nil, errEofToken
2015-10-18 22:30:14 +00:00
case token.IDENT, token.STRING:
p.unscan()
2015-10-18 22:30:14 +00:00
return p.parseObjectItem()
case token.COMMENT:
return &ast.Comment{
Start: tok.Pos,
Text: tok.Text,
}, nil
default:
return nil, fmt.Errorf("expected: IDENT | STRING | COMMENT got: %+v", tok.Type)
2015-10-18 22:30:14 +00:00
}
}
// parseObjectItem parses a single object item
2015-10-16 20:12:26 +00:00
func (p *Parser) parseObjectItem() (*ast.ObjectItem, error) {
defer un(trace(p, "ParseObjectItem"))
2015-10-11 23:27:43 +00:00
keys, err := p.parseObjectKey()
if err != nil {
return nil, err
}
2015-10-16 11:16:12 +00:00
switch p.tok.Type {
2015-10-16 20:12:26 +00:00
case token.ASSIGN:
// assignments
2015-10-16 20:12:26 +00:00
o := &ast.ObjectItem{
Keys: keys,
Assign: p.tok.Pos,
2015-10-16 11:44:11 +00:00
}
2015-10-16 20:12:26 +00:00
o.Val, err = p.parseType()
2015-10-16 11:44:11 +00:00
if err != nil {
return nil, err
}
return o, nil
2015-10-16 20:12:26 +00:00
case token.LBRACE:
// object or nested objects
o := &ast.ObjectItem{
Keys: keys,
2015-10-16 11:16:12 +00:00
}
o.Val, err = p.parseObjectType()
if err != nil {
return nil, err
}
return o, nil
2015-10-16 11:16:12 +00:00
}
2015-10-16 19:57:56 +00:00
return nil, fmt.Errorf("not yet implemented: %s", p.tok.Type)
}
// parseObjectKey parses an object key and returns a ObjectKey AST
2015-10-16 20:12:26 +00:00
func (p *Parser) parseObjectKey() ([]*ast.ObjectKey, error) {
keyCount := 0
2015-10-18 22:30:14 +00:00
keys := make([]*ast.ObjectKey, 0)
2015-10-16 11:16:12 +00:00
for {
tok := p.scan()
switch tok.Type {
2015-10-18 22:30:14 +00:00
case token.EOF:
return nil, errEofToken
2015-10-16 20:12:26 +00:00
case token.ASSIGN:
2015-10-16 11:44:11 +00:00
// assignment or object only, but not nested objects. this is not
// allowed: `foo bar = {}`
if keyCount > 1 {
2015-10-18 22:30:14 +00:00
return nil, fmt.Errorf("nested object expected: LBRACE got: %s", p.tok.Type)
2015-10-16 11:16:12 +00:00
}
if keyCount == 0 {
return nil, errors.New("no keys found!!!")
}
2015-10-16 11:16:12 +00:00
return keys, nil
2015-10-16 20:12:26 +00:00
case token.LBRACE:
2015-10-16 11:16:12 +00:00
// object
return keys, nil
2015-10-16 20:12:26 +00:00
case token.IDENT, token.STRING:
keyCount++
2015-10-18 22:30:14 +00:00
keys = append(keys, &ast.ObjectKey{Token: p.tok})
case token.ILLEGAL:
fmt.Println("illegal")
2015-10-16 11:16:12 +00:00
default:
2015-10-18 22:30:14 +00:00
return nil, fmt.Errorf("expected: IDENT | STRING | ASSIGN | LBRACE got: %s", p.tok.Type)
2015-10-16 11:16:12 +00:00
}
}
}
2015-10-18 22:30:14 +00:00
// parseType parses any type of Type, such as number, bool, string, object or
// list.
func (p *Parser) parseType() (ast.Node, error) {
defer un(trace(p, "ParseType"))
tok := p.scan()
switch tok.Type {
case token.NUMBER, token.FLOAT, token.BOOL, token.STRING:
return p.parseLiteralType()
case token.LBRACE:
return p.parseObjectType()
case token.LBRACK:
return p.parseListType()
case token.COMMENT:
// implement comment
case token.EOF:
return nil, errEofToken
}
return nil, fmt.Errorf("Unknown token: %+v", tok)
}
2015-10-16 22:14:40 +00:00
// parseObjectType parses an object type and returns a ObjectType AST
func (p *Parser) parseObjectType() (*ast.ObjectType, error) {
defer un(trace(p, "ParseObjectType"))
// we assume that the currently scanned token is a LBRACE
o := &ast.ObjectType{
Lbrace: p.tok.Pos,
}
l, err := p.parseObjectList()
// if we hit RBRACE, we are good to go (means we parsed all Items), if it's
// not a RBRACE, it's an syntax error and we just return it.
if err != nil && p.tok.Type != token.RBRACE {
return nil, err
}
o.List = l
o.Rbrace = p.tok.Pos // advanced via parseObjectList
return o, nil
}
2015-10-16 21:00:05 +00:00
// parseListType parses a list type and returns a ListType AST
func (p *Parser) parseListType() (*ast.ListType, error) {
defer un(trace(p, "ParseListType"))
2015-10-16 22:14:40 +00:00
// we assume that the currently scanned token is a LBRACK
2015-10-16 21:00:05 +00:00
l := &ast.ListType{
Lbrack: p.tok.Pos,
}
for {
tok := p.scan()
switch tok.Type {
case token.NUMBER, token.FLOAT, token.STRING:
node, err := p.parseLiteralType()
if err != nil {
return nil, err
}
l.Add(node)
case token.COMMA:
// get next list item or we are at the end
continue
case token.COMMENT:
// TODO(arslan): parse comment
continue
2015-10-16 21:00:05 +00:00
case token.BOOL:
// TODO(arslan) should we support? not supported by HCL yet
case token.LBRACK:
2015-10-16 22:14:40 +00:00
// TODO(arslan) should we support nested lists? Even though it's
2015-10-18 20:19:56 +00:00
// written in README of HCL, it's not a part of the grammar
// (not defined in parse.y)
2015-10-16 21:00:05 +00:00
case token.RBRACK:
// finished
l.Rbrack = p.tok.Pos
return l, nil
default:
return nil, fmt.Errorf("unexpected token while parsing list: %s", tok.Type)
}
}
}
2015-10-12 20:44:53 +00:00
// parseLiteralType parses a literal type and returns a LiteralType AST
2015-10-16 20:12:26 +00:00
func (p *Parser) parseLiteralType() (*ast.LiteralType, error) {
defer un(trace(p, "ParseLiteral"))
2015-10-12 20:44:53 +00:00
2015-10-16 20:12:26 +00:00
return &ast.LiteralType{
Token: p.tok,
}, nil
2015-10-12 20:44:53 +00:00
}
// scan returns the next token from the underlying scanner.
// If a token has been unscanned then read that instead.
2015-10-16 20:12:26 +00:00
func (p *Parser) scan() token.Token {
// If we have a token on the buffer, then return it.
if p.n != 0 {
p.n = 0
return p.tok
}
// Otherwise read the next token from the scanner and Save it to the buffer
// in case we unscan later.
p.tok = p.sc.Scan()
return p.tok
2015-10-07 22:38:39 +00:00
}
// unscan pushes the previously read token back onto the buffer.
func (p *Parser) unscan() {
p.n = 1
}
2015-10-11 23:27:43 +00:00
// ----------------------------------------------------------------------------
// Parsing support
func (p *Parser) printTrace(a ...interface{}) {
if !p.enableTrace {
return
}
const dots = ". . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . "
const n = len(dots)
fmt.Printf("%5d:%3d: ", p.tok.Pos.Line, p.tok.Pos.Column)
i := 2 * p.indent
for i > n {
fmt.Print(dots)
i -= n
}
// i <= n
fmt.Print(dots[0:i])
fmt.Println(a...)
}
func trace(p *Parser, msg string) *Parser {
p.printTrace(msg, "(")
p.indent++
return p
}
// Usage pattern: defer un(trace(p, "..."))
func un(p *Parser) {
p.indent--
p.printTrace(")")
}