Browse Source

parser.Parser: refactor using TextParser

Signed-off-by: Alejandro Mery <amery@jpi.io>
pull/7/head
Alejandro Mery 1 year ago
parent
commit
01cd4139bd
  1. 63
      parser/lexer.go
  2. 43
      parser/parser.go

63
parser/lexer.go

@ -5,71 +5,42 @@ import "asciigoat.org/core/lexer"
// Run parses the source // Run parses the source
func (p *Parser) Run() error { func (p *Parser) Run() error {
p.setDefaults() p.setDefaults()
p.pos.Reset()
return lexer.Run(p.lexStart) return lexer.Run(p.lexStart)
} }
func (p *Parser) lexStart() (lexer.StateFn, error) { func (p *Parser) lexStart() (lexer.StateFn, error) {
for { for {
r, _, err := p.src.ReadRune() r, _, err := p.p.ReadRune()
switch { switch {
case err != nil: case err != nil:
return p.emitError("", err) return p.emitError("", err)
case IsNewLine(r): case IsNewLine(r):
// new line // new line
p.lexMoreNewLine(r) p.p.UnreadRune()
p.p.AcceptNewLine()
p.stepLine() p.stepLine()
case IsSpace(r): case IsSpace(r):
// whitespace // whitespace
p.stepRune() p.stepString()
case IsCommentStart(r): case IsCommentStart(r):
// switch to comment lexer // switch to comment lexer
p.src.UnreadRune() p.p.UnreadRune()
return p.lexComment, nil return p.lexComment, nil
case IsSectionStart(r): case IsSectionStart(r):
// section // section
return p.lexSectionStart, nil return p.lexSectionStart, nil
default: default:
// entry // entry
p.src.UnreadRune() p.p.UnreadRune()
return p.lexEntryStart, nil return p.lexEntryStart, nil
} }
} }
} }
func (p *Parser) lexMoreNewLine(r1 rune) {
// r1 is guaranteed to be either '\r' or '\n'
r2, _, err := p.src.ReadRune()
switch r1 {
case '\n':
switch {
case r2 == '\r':
// LN CR
case err == nil:
// LN
p.src.UnreadRune()
default:
// LN EOF
}
case '\r':
switch {
case r2 == '\n':
// CR LN
case err == nil:
// CR
p.src.UnreadRune()
default:
// CR EOF
}
default:
panic("unreachable")
}
}
func (p *Parser) lexComment() (lexer.StateFn, error) { func (p *Parser) lexComment() (lexer.StateFn, error) {
// until the end of the line // until the end of the line
p.src.AcceptAll(IsNotNewLine) p.p.AcceptAll(IsNotNewLine)
err := p.emitString(TokenComment) err := p.emitString(TokenComment)
return p.lexStart, err return p.lexStart, err
@ -81,11 +52,11 @@ func (p *Parser) lexSectionStart() (lexer.StateFn, error) {
} }
// remove whitespace between `[` and the name // remove whitespace between `[` and the name
if p.src.AcceptAll(IsSpaceNotNewLine) { if p.p.AcceptAll(IsSpaceNotNewLine) {
p.stepString() p.stepString()
} }
if !p.src.AcceptAll(IsName) { if !p.p.AcceptAll(IsName) {
// no name // no name
return p.emitError("section name missing", lexer.ErrUnacceptableRune) return p.emitError("section name missing", lexer.ErrUnacceptableRune)
} }
@ -94,12 +65,12 @@ func (p *Parser) lexSectionStart() (lexer.StateFn, error) {
return nil, err return nil, err
} }
// remove whitespace between the name andthe closing `]` // remove whitespace between the name and the closing `]`
if p.src.AcceptAll(IsSpaceNotNewLine) { if p.p.AcceptAll(IsSpaceNotNewLine) {
p.stepString() p.stepString()
} }
r, _, err := p.src.ReadRune() r, _, err := p.p.ReadRune()
switch { switch {
case err != nil: case err != nil:
return p.emitError("", err) return p.emitError("", err)
@ -112,17 +83,17 @@ func (p *Parser) lexSectionStart() (lexer.StateFn, error) {
} }
func (p *Parser) lexEntryStart() (lexer.StateFn, error) { func (p *Parser) lexEntryStart() (lexer.StateFn, error) {
p.src.AcceptAll(IsName) p.p.AcceptAll(IsName)
if err := p.emitString(TokenFieldKey); err != nil { if err := p.emitString(TokenFieldKey); err != nil {
return nil, err return nil, err
} }
// ignore whitespace between key and the '=' sign // ignore whitespace between key and the '=' sign
if p.src.AcceptAll(IsSpaceNotNewLine) { if p.p.AcceptAll(IsSpaceNotNewLine) {
p.stepString() p.stepString()
} }
r, _, err := p.src.ReadRune() r, _, err := p.p.ReadRune()
switch { switch {
case err != nil: case err != nil:
return p.emitError("", err) return p.emitError("", err)
@ -131,11 +102,11 @@ func (p *Parser) lexEntryStart() (lexer.StateFn, error) {
} }
// ignore whitespace between the '=' and the value // ignore whitespace between the '=' and the value
if p.src.AcceptAll(IsSpaceNotNewLine) { if p.p.AcceptAll(IsSpaceNotNewLine) {
p.stepString() p.stepString()
} }
p.src.AcceptAll(IsNotNewLine) p.p.AcceptAll(IsNotNewLine)
if err := p.emitString(TokenFieldValue); err != nil { if err := p.emitString(TokenFieldValue); err != nil {
return nil, err return nil, err
} }

43
parser/parser.go

@ -1,4 +1,4 @@
// Package parser parses dosini-style files // Package parser parses ini-style files
package parser package parser
import ( import (
@ -8,10 +8,9 @@ import (
"asciigoat.org/core/lexer" "asciigoat.org/core/lexer"
) )
// Parser parses a dosini-style document // Parser parses an ini-style document
type Parser struct { type Parser struct {
src *lexer.Reader p TextParser
pos lexer.Position
// OnToken is called for each identified token. if it returns an error // OnToken is called for each identified token. if it returns an error
// parsing is interrupted. // parsing is interrupted.
@ -51,15 +50,13 @@ func (p *Parser) setDefaults() {
} }
func (p *Parser) emitString(typ TokenType) error { func (p *Parser) emitString(typ TokenType) error {
s := p.src.Emit() pos, s := p.p.Emit()
err := p.OnToken(p.pos, typ, s) return p.OnToken(pos, typ, s)
p.pos.StepN(len(s))
return err
} }
func (p *Parser) emitError(content string, err error) (lexer.StateFn, error) { func (p *Parser) emitError(content string, err error) (lexer.StateFn, error) {
err2 := p.OnError(p.pos, content, err) pos := p.p.Position()
err2 := p.OnError(pos, content, err)
switch { switch {
case err2 != nil: case err2 != nil:
// return wrapped error // return wrapped error
@ -77,33 +74,25 @@ func (p *Parser) emitInvalidRune(r rune) (lexer.StateFn, error) {
// stepLine discards the data and moves the position // stepLine discards the data and moves the position
// to the next line. // to the next line.
func (p *Parser) stepLine() { func (p *Parser) stepLine() {
p.src.Discard() p.p.StepLine()
p.pos.StepLine()
}
// stepRune discards the data and moves the position
// one rune forward on the same line.
func (p *Parser) stepRune() {
p.src.Discard()
p.pos.Step()
} }
// stepString discards the data and moves the position // stepString discards the data and moves the position
// forward on the same line the length of the discarded // forward on the same line the length of the discarded
// content. // content.
func (p *Parser) stepString() { func (p *Parser) stepString() {
s := p.src.Emit() p.p.Step()
p.pos.StepN(len(s))
} }
// NewParser creates a dosini-style parser using // NewParser creates an ini-style parser using
// an [io.Reader] as source // an [io.Reader] as source
func NewParser(r io.Reader) *Parser { func NewParser(r io.Reader) *Parser {
if r == nil { var p *Parser
return nil
}
return &Parser{ if r != nil {
src: lexer.NewReader(r), p = new(Parser)
p.p.Init(r)
} }
return p
} }

Loading…
Cancel
Save