zclwrite: consume trailing line comments and newlines in body items

We consume both of these things primarily so that when we manipulate
the AST they will all stay together. For example, removing an attribute
from a body should take its comments and newline too.
This commit is contained in:
Martin Atkins 2017-06-09 08:00:38 -07:00
parent 755fe38505
commit 1de72e146e
2 changed files with 185 additions and 15 deletions

View File

@ -81,9 +81,8 @@ func (it inputTokens) Partition(rng zcl.Range) (before, within, after inputToken
func (it inputTokens) PartitionIncludingComments(rng zcl.Range) (before, within, after inputTokens) { func (it inputTokens) PartitionIncludingComments(rng zcl.Range) (before, within, after inputTokens) {
start, end := partitionTokens(it.nativeTokens, rng) start, end := partitionTokens(it.nativeTokens, rng)
start = partitionLeadCommentTokens(it.nativeTokens[:start]) start = partitionLeadCommentTokens(it.nativeTokens[:start])
_, afterNewline := partitionLineEndTokens(it.nativeTokens[end:])
// TODO: Also adjust "end" to include any trailing line comments and the end += afterNewline
// associated newline.
before = it.Slice(0, start) before = it.Slice(0, start)
within = it.Slice(start, end) within = it.Slice(start, end)
@ -92,13 +91,14 @@ func (it inputTokens) PartitionIncludingComments(rng zcl.Range) (before, within,
} }
// PartitionWithComments is similar to PartitionIncludeComments but it returns // PartitionBlockItem is similar to PartitionIncludeComments but it returns
// the comments as separate token sequences so that they can be captured into // the comments as separate token sequences so that they can be captured into
// AST attributes. // AST attributes. It makes assumptions that apply only to block items, so
func (it inputTokens) PartitionWithComments(rng zcl.Range) (before, leadComments, within, lineComments, after inputTokens) { // should not be used for other constructs.
func (it inputTokens) PartitionBlockItem(rng zcl.Range) (before, leadComments, within, lineComments, newline, after inputTokens) {
before, within, after = it.Partition(rng) before, within, after = it.Partition(rng)
before, leadComments = before.PartitionLeadComments() before, leadComments = before.PartitionLeadComments()
lineComments = after.Slice(0, 0) // FIXME: implement this lineComments, newline, after = after.PartitionLineEndTokens()
return return
} }
@ -109,6 +109,14 @@ func (it inputTokens) PartitionLeadComments() (before, within inputTokens) {
return return
} }
func (it inputTokens) PartitionLineEndTokens() (comments, newline, after inputTokens) {
afterComments, afterNewline := partitionLineEndTokens(it.nativeTokens)
comments = it.Slice(0, afterComments)
newline = it.Slice(afterComments, afterNewline)
after = it.Slice(afterNewline, len(it.nativeTokens))
return
}
func (it inputTokens) Slice(start, end int) inputTokens { func (it inputTokens) Slice(start, end int) inputTokens {
// When we slice, we create a new slice with no additional capacity because // When we slice, we create a new slice with no additional capacity because
// we expect that these slices will be mutated in order to insert // we expect that these slices will be mutated in order to insert
@ -179,13 +187,13 @@ func parseBody(nativeBody *zclsyntax.Body, from inputTokens) (inputTokens, *Body
} }
func parseBodyItem(nativeItem zclsyntax.Node, from inputTokens) (inputTokens, Node, inputTokens) { func parseBodyItem(nativeItem zclsyntax.Node, from inputTokens) (inputTokens, Node, inputTokens) {
before, leadComments, within, lineComments, after := from.PartitionWithComments(nativeItem.Range()) before, leadComments, within, lineComments, newline, after := from.PartitionBlockItem(nativeItem.Range())
var item Node var item Node
switch tItem := nativeItem.(type) { switch tItem := nativeItem.(type) {
case *zclsyntax.Attribute: case *zclsyntax.Attribute:
item = parseAttribute(tItem, within, leadComments, lineComments) item = parseAttribute(tItem, within, leadComments, lineComments, newline)
// TODO: Grab the newline and any line comment from "after" and // TODO: Grab the newline and any line comment from "after" and
// write them into the attribute object. // write them into the attribute object.
case *zclsyntax.Block: case *zclsyntax.Block:
@ -199,7 +207,7 @@ func parseBodyItem(nativeItem zclsyntax.Node, from inputTokens) (inputTokens, No
return before, item, after return before, item, after
} }
func parseAttribute(nativeAttr *zclsyntax.Attribute, from, leadComments, lineComments inputTokens) *Attribute { func parseAttribute(nativeAttr *zclsyntax.Attribute, from, leadComments, lineComments, newline inputTokens) *Attribute {
var allTokens TokenSeq var allTokens TokenSeq
attr := &Attribute{} attr := &Attribute{}
@ -229,16 +237,20 @@ func parseAttribute(nativeAttr *zclsyntax.Attribute, from, leadComments, lineCom
attr.Expr = parseExpression(nativeAttr.Expr, exprTokens) attr.Expr = parseExpression(nativeAttr.Expr, exprTokens)
allTokens = append(allTokens, attr.Expr.AllTokens) allTokens = append(allTokens, attr.Expr.AllTokens)
// Collect any stragglers, such as a trailing newline
if from.Len() > 0 {
allTokens = append(allTokens, from.Seq())
}
if lineComments.Len() > 0 { if lineComments.Len() > 0 {
attr.LineCommentTokens = lineComments.Seq() attr.LineCommentTokens = lineComments.Seq()
allTokens = append(allTokens, attr.LineCommentTokens) allTokens = append(allTokens, attr.LineCommentTokens)
} }
if newline.Len() > 0 {
allTokens = append(allTokens, newline.Seq())
}
// Collect any stragglers, though there shouldn't be any
if from.Len() > 0 {
allTokens = append(allTokens, from.Seq())
}
attr.AllTokens = &allTokens attr.AllTokens = &allTokens
return attr return attr
@ -365,6 +377,47 @@ func partitionLeadCommentTokens(toks zclsyntax.Tokens) int {
return 0 return 0
} }
// partitionLineEndTokens takes a sequence of tokens that is assumed
// to immediately follow a construct that can have a line comment, and
// returns first the index where any line comments end and then second
// the index immediately after the trailing newline.
//
// Line comments are defined as comments that appear immediately after
// a construct on the same line where its significant tokens ended.
//
// Since single-line comment tokens (# and //) include the newline that
// terminates them, in the presence of these the two returned indices
// will be the same since the comment itself serves as the line end.
func partitionLineEndTokens(toks zclsyntax.Tokens) (afterComment, afterNewline int) {
for i := 0; i < len(toks); i++ {
tok := toks[i]
if tok.Type != zclsyntax.TokenComment {
switch tok.Type {
case zclsyntax.TokenNewline:
return i, i + 1
case zclsyntax.TokenEOF:
// Although this is valid, we mustn't include the EOF
// itself as our "newline" or else strange things will
// happen when we try to append new items.
return i, i
default:
// If we have well-formed input here then nothing else should be
// possible. This path should never happen, because we only try
// to extract tokens from the sequence if the parser succeeded,
// and it should catch this problem itself.
panic("malformed line trailers: expected only comments and newlines")
}
}
if len(tok.Bytes) > 0 && tok.Bytes[len(tok.Bytes)-1] == '\n' {
// Newline at the end of a single-line comment serves both as
// the end of comments *and* the end of the line.
return i + 1, i + 1
}
}
return len(toks), len(toks)
}
// lexConfig uses the zclsyntax scanner to get a token stream and then // lexConfig uses the zclsyntax scanner to get a token stream and then
// rewrites it into this package's token model. // rewrites it into this package's token model.
// //

View File

@ -232,6 +232,123 @@ func TestParse(t *testing.T) {
}, },
}, },
}, },
{
"a = 1 # because it is\n",
&Body{
Items: []Node{
&Attribute{
AllTokens: &TokenSeq{
&TokenSeq{
Tokens{
{
Type: zclsyntax.TokenIdent,
Bytes: []byte(`a`),
SpacesBefore: 0,
},
},
},
&TokenSeq{
Tokens{
{
Type: zclsyntax.TokenEqual,
Bytes: []byte(`=`),
SpacesBefore: 1,
},
},
},
&TokenSeq{
Tokens{
{
Type: zclsyntax.TokenNumberLit,
Bytes: []byte(`1`),
SpacesBefore: 1,
},
},
},
&TokenSeq{
Tokens{
{
Type: zclsyntax.TokenComment,
Bytes: []byte("# because it is\n"),
SpacesBefore: 1,
},
},
},
},
NameTokens: &TokenSeq{Tokens{
{
Type: zclsyntax.TokenIdent,
Bytes: []byte(`a`),
SpacesBefore: 0,
},
}},
EqualsTokens: &TokenSeq{Tokens{
{
Type: zclsyntax.TokenEqual,
Bytes: []byte(`=`),
SpacesBefore: 1,
},
}},
Expr: &Expression{
AllTokens: &TokenSeq{Tokens{
{
Type: zclsyntax.TokenNumberLit,
Bytes: []byte(`1`),
SpacesBefore: 1,
},
}},
},
LineCommentTokens: &TokenSeq{Tokens{
{
Type: zclsyntax.TokenComment,
Bytes: []byte("# because it is\n"),
SpacesBefore: 1,
},
}},
},
},
AllTokens: &TokenSeq{
&TokenSeq{
&TokenSeq{
Tokens{
{
Type: zclsyntax.TokenIdent,
Bytes: []byte(`a`),
SpacesBefore: 0,
},
},
},
&TokenSeq{
Tokens{
{
Type: zclsyntax.TokenEqual,
Bytes: []byte(`=`),
SpacesBefore: 1,
},
},
},
&TokenSeq{
Tokens{
{
Type: zclsyntax.TokenNumberLit,
Bytes: []byte(`1`),
SpacesBefore: 1,
},
},
},
&TokenSeq{
Tokens{
{
Type: zclsyntax.TokenComment,
Bytes: []byte("# because it is\n"),
SpacesBefore: 1,
},
},
},
},
},
},
},
{ {
"# bee bee bee\n\nb = 1", // two newlines separate the comment from the attribute "# bee bee bee\n\nb = 1", // two newlines separate the comment from the attribute
&Body{ &Body{