decoder [WIP]

Signed-off-by: Alejandro Mery <amery@jpi.io>
build-sys: use local darvaza.org/core [DO-NOT-MERGE]
2023-09-03 17:04:37 +00:00 · 2023-09-03 17:03:48 +00:00 · 2023-09-03 17:03:48 +00:00 · 2023-09-03 17:02:51 +00:00 · 2023-09-03 17:01:26 +00:00 · 2023-09-03 17:01:26 +00:00
14 changed files with 840 additions and 81 deletions
@@ -0,0 +1,57 @@
 # asciigoat's INI parser
 [![Go Reference][godoc-badge]][godoc]
 [![Go Report Card][goreport-badge]][goreport]
 `asciigoat.org/ini` is a simple Go library that very loosly parses
 [`INI`-style][wikipedia-dosini] documents allowing the implementation
 of stricter parsers of similar form.
 **asciigoat** is [MIT](https://opensource.org/license/mit/) licensed.
 [godoc]: https://pkg.go.dev/asciigoat.org/ini
 [godoc-badge]: https://pkg.go.dev/badge/asciigoat.org/ini.svg
 [goreport]: https://goreportcard.com/report/asciigoat.org/ini
 [goreport-badge]: https://goreportcard.com/badge/asciigoat.org/ini
 [godoc-lexer]: https://pkg.go.dev/asciigoat.org/core/lexer
 [godoc-parser-parser]: https://pkg.go.dev/asciigoat.org/ini/parser#Parser
 [godoc-basic-parser]: https://pkg.go.dev/asciigoat.org/ini/basic#Decode
 [wikipedia-dosini]: https://en.wikipedia.org/wiki/INI_file
 ## Parser
 [`parser.Parser`][godoc-parser-parser] uses
 [`asciigoat`'s lexer][godoc-lexer] to process an `INI`-style document
 emiting tokens and errors via callbacks.
 ## Basic Parser
 [`basic.Decode()`][godoc-basic-parser] provies a one-shot decoder
 that returns a structured document for you to post-process.
 To allow for correct handling of repetition of section and field names downstream,
 it uses arrays instead of maps, and makes almost no judgment
 about what section or field names are acceptable.
 ## Other Implementations
 Other implementations exist, and they are mature and feature-rich, but they
 are highly opinionated about what's a valid file. Built around maps they don't
 allow repeating names and constraint what characters can be used.
 These are great when you can adapt, or already agree, to their conditions but
 that's not always the case when you are parsing configuration files from
 other applications and that's what [asciigoat.org/ini][godoc] attempts to solve.
 * [gcfg](https://pkg.go.dev/gopkg.in/gcfg.v1)
 * [unknwon's go-ini](https://github.com/go-ini/ini)
 * [wlevene's GoINI](https://github.com/wlevene/ini)
 ## See also
 * [asciigoat.org/core](https://asciigoat.org/core)
 * [oss.jpi.io](https://oss.jpi.io)
 * [INI file][wikipedia-dosini] (_wikipedia_)
 * [TOML](https://www.kelche.co/blog/go/toml/)
@@ -0,0 +1,24 @@
 // Package basic provides a basic representation of dosini-style documents
 package basic
 // Document represents an INI-style document
 type Document struct {
 	Global []Field
 	Sections []Section
 }
 // Section represents an INI-style section with optional GIT-style IDs
 type Section struct {
 	Key     string
 	ID      string
 	EmptyID bool
 	Fields []Field
 }
 // Field represents a key = value entry in an INI-style document
 type Field struct {
 	Key   string
 	Value string
 }
@@ -0,0 +1,49 @@
 package basic
 import (
 	"bytes"
 	"io"
 	"io/fs"
 	"strings"
 	"asciigoat.org/ini/parser"
 )
 type decoder struct {
 	p   *parser.Parser
 	out *Document
 	queue   []*token
 	current *Section
 }
 // Decode attempts to decode an INI-style from an [io.Reader] array into a [Document]
 func Decode(r io.Reader) (*Document, error) {
 	var out Document
 	if r == nil {
 		return nil, fs.ErrNotExist
 	}
 	// parser
 	p := parser.NewParser(r)
 	// decoder
 	dec := decoder{p: p, out: &out}
 	// glue
 	p.OnToken = dec.OnToken
 	p.OnError = dec.OnError
 	// Go!
 	err := p.Run()
 	return &out, err
 }
 // DecodeBytes attempts to decode an INI-style bytes array into a [Document]
 func DecodeBytes(b []byte) (*Document, error) {
 	return Decode(bytes.NewReader(b))
 }
 // DecodeString attempts to decode an INI-style string into a [Document]
 func DecodeString(s string) (*Document, error) {
 	return Decode(strings.NewReader(s))
 }
@@ -0,0 +1,31 @@
 package basic
 import (
 	"errors"
 	"asciigoat.org/core/lexer"
 )
 var (
 	errInvalidToken = errors.New("invalid token")
 )
 func newError(pos lexer.Position, content, hint string, err error) *lexer.Error {
 	return &lexer.Error{
 		Line:    pos.Line,
 		Column:  pos.Column,
 		Content: content,
 		Hint:    hint,
 		Err:     err,
 	}
 }
 func newErrInvalidToken(t *token) *lexer.Error {
 	return newError(t.pos, t.value, "", errInvalidToken)
 }
 func (dec *decoder) OnError(pos lexer.Position, content string, err error) error {
 	err = newError(pos, content, "", err)
 	dec.executeFinal()
 	return err
 }
@@ -0,0 +1,165 @@
 package basic
 import (
 	"fmt"
 	"asciigoat.org/core/lexer"
 	"asciigoat.org/ini/parser"
 )
 type token struct {
 	pos   lexer.Position
 	typ   parser.TokenType
 	value string
 }
 func (t token) String() string {
 	return fmt.Sprintf("%s %s: %q", t.pos, t.typ, t.value)
 }
 func (dec *decoder) executeFinal() {
 	if len(dec.queue) > 0 {
 		// we have unfinished businesses
 		switch dec.queue[0].typ {
 		case parser.TokenSectionStart:
 			dec.execute(parser.TokenSectionEnd)
 		case parser.TokenFieldKey:
 			dec.execute(parser.TokenFieldValue)
 		}
 	}
 }
 func (dec *decoder) execute(typ parser.TokenType) {
 	switch typ {
 	case parser.TokenSectionEnd:
 		name1, ok1 := dec.queueValue(1, parser.TokenSectionName)
 		if ok1 {
 			name2, ok2 := dec.queueValue(2, parser.TokenSectionSubname)
 			dec.addSection(name1, name2, ok2)
 		}
 		dec.queueReset()
 	case parser.TokenFieldValue:
 		key, _ := dec.queueValue(0, parser.TokenFieldKey)
 		value, _ := dec.queueValue(1, parser.TokenFieldValue)
 		dec.addField(key, value)
 		dec.queueReset()
 	}
 }
 func (dec *decoder) addSection(key, id string, allowEmptyID bool) {
 	emptyID := allowEmptyID && id == ""
 	// index for dec.current
 	n := len(dec.out.Sections)
 	// new section
 	dec.out.Sections = append(dec.out.Sections, Section{
 		Key:     key,
 		ID:      id,
 		EmptyID: emptyID,
 	})
 	// pointer to the latest section
 	dec.current = &dec.out.Sections[n]
 }
 func (dec *decoder) addField(key, value string) {
 	field := Field{
 		Key:   key,
 		Value: value,
 	}
 	if p := dec.current; p != nil {
 		// in section
 		p.Fields = append(p.Fields, field)
 	} else {
 		// global
 		dec.out.Global = append(dec.out.Global, field)
 	}
 }
 // queueValue extracts the value of element on the queue if the type matches.
 func (dec *decoder) queueValue(idx int, typ parser.TokenType) (string, bool) {
 	switch {
 	case idx < 0 || idx >= len(dec.queue):
 		// out of range
 		return "", false
 	case dec.queue[idx].typ != typ:
 		// wrong type
 		return "", false
 	default:
 		return dec.queue[idx].value, true
 	}
 }
 // queueReset removes all tokens from the queue
 func (dec *decoder) queueReset() {
 	dec.queue = dec.queue[:0]
 }
 // queueDepth confirms the current depth of the queue
 func (dec *decoder) queueDepth(depth int) bool {
 	return len(dec.queue) == depth
 }
 // queueDepthType confirms the current depth of the queue and the type of the last
 // element.
 func (dec *decoder) queueDepthType(depth int, typ parser.TokenType) bool {
 	if dec.queueDepth(depth) {
 		return dec.queueType(depth-1, typ)
 	}
 	return false
 }
 // queueType tells if the specified element on the queue is of the required type.
 func (dec *decoder) queueType(idx int, typ parser.TokenType) bool {
 	_, ok := dec.queueValue(idx, typ)
 	return ok
 }
 func (dec *decoder) typeOK(typ parser.TokenType) bool {
 	switch typ {
 	case parser.TokenSectionStart, parser.TokenFieldKey:
 		// first token only
 		return dec.queueDepth(0)
 	case parser.TokenSectionName:
 		// right after TokenSectionStart
 		return dec.queueDepthType(1, parser.TokenSectionStart)
 	case parser.TokenSectionSubname:
 		// right after TokenSectionName
 		return dec.queueDepthType(2, parser.TokenSectionName)
 	case parser.TokenSectionEnd:
 		// only on a section with name
 		return dec.queueType(1, parser.TokenSectionName)
 	case parser.TokenFieldValue:
 		// right after a TokenFieldKey
 		return dec.queueDepthType(1, parser.TokenFieldKey)
 	default:
 		// never
 		return false
 	}
 }
 func (dec *decoder) OnToken(pos lexer.Position, typ parser.TokenType, value string) error {
 	t := &token{pos, typ, value}
 	switch {
 	case typ == parser.TokenComment:
 		// ignore comments
 		return nil
 	case dec.typeOK(typ):
 		// acceptable token
 		dec.queue = append(dec.queue, t)
 		dec.execute(typ)
 		return nil
 	default:
 		// unacceptable
 		err := newErrInvalidToken(t)
 		dec.executeFinal()
 		return err
 	}
 }
@@ -0,0 +1,104 @@
 package basic
 import (
 	"bytes"
 	"fmt"
 	"io"
 	"asciigoat.org/ini/parser"
 )
 // WriteNewLine is the new line representation used by [doc.WriteTo]
 const WriteNewLine = "\n"
 // AsBuffer returns a INI representation of the document on
 // a memory buffer
 func (doc *Document) AsBuffer(nl string) *bytes.Buffer {
 	var buf bytes.Buffer
 	if len(doc.Global) > 0 {
 		_, _ = writeFieldsTo(&buf, doc.Global, nl)
 	}
 	for _, sec := range doc.Sections {
 		if buf.Len() > 0 {
 			_, _ = buf.WriteString(nl)
 		}
 		_ = writeSectionToBuffer(&buf, &sec, nl)
 	}
 	return &buf
 }
 func writeFieldsTo(w io.Writer, fields []Field, nl string) (int64, error) {
 	var written int
 	for _, field := range fields {
 		n, err := fmt.Fprintf(w, "%s = %q%s", field.Key, field.Value, nl)
 		switch {
 		case err != nil:
 			return int64(written), err
 		case n > 0:
 			written += n
 		}
 	}
 	return int64(written), nil
 }
 // String generates a string output for "%s"
 func (field Field) String() string {
 	var buf bytes.Buffer
 	_, _ = writeFieldsTo(&buf, []Field{field}, WriteNewLine)
 	return buf.String()
 }
 func writeSectionToBuffer(w *bytes.Buffer, sec *Section, nl string) int {
 	var written, n int
 	_, _ = w.WriteRune(parser.RuneSectionStart)
 	written++
 	n, _ = w.WriteString(sec.Key)
 	written += n
 	switch {
 	case sec.EmptyID:
 		n, _ = w.WriteString(" \"\"")
 		written += n
 	case sec.ID != "":
 		_, _ = w.WriteRune(' ')
 		n, _ = fmt.Fprintf(w, "%q", sec.ID)
 		written += n + 1
 	}
 	_, _ = w.WriteRune(parser.RuneSectionEnd)
 	written++
 	n, _ = w.WriteString(nl)
 	written += n
 	n64, _ := writeFieldsTo(w, sec.Fields, nl)
 	return written + int(n64)
 }
 // String generates a string output for "%s"
 func (sec *Section) String() string {
 	var buf bytes.Buffer
 	_ = writeSectionToBuffer(&buf, sec, WriteNewLine)
 	return buf.String()
 }
 // WriteTo writes a INI representation of the document
 // onto the provided writer.
 func (doc *Document) WriteTo(w io.Writer) (int64, error) {
 	buf := doc.AsBuffer(WriteNewLine)
 	return buf.WriteTo(w)
 }
 // String generates a string output for "%s"
 func (doc *Document) String() string {
 	buf := doc.AsBuffer(WriteNewLine)
 	return buf.String()
 }
@@ -0,0 +1,83 @@
 package ini
 import (
 	"bytes"
 	"io"
 	"strings"
 	"asciigoat.org/core"
 	"asciigoat.org/core/reflective"
 	"asciigoat.org/ini/parser"
 )
 const (
 	decPrefixLiteral = "ini: Decode"
 )
 var (
 	decINIPrefix = decPrefixLiteral[0:3]
 	decDecPrefix = decPrefixLiteral[5:]
 )
 // Decoder ...
 type Decoder struct {
 	io.Closer
 	out   *reflective.Reflection
 	p     *parser.Parser
 	queue []*token
 }
 // Decode ...
 func (dec *Decoder) Decode(v any) error {
 	defer dec.Close()
 	r, err := reflective.New(v)
 	switch e := err.(type) {
 	case *reflective.InvalidUnmarshalError:
 		// customize error
 		e.Prefix = decINIPrefix
 		e.Method = decDecPrefix
 	case *reflective.UnmarshalTypeError:
 		// customize error
 		e.Prefix = decPrefixLiteral
 	case nil:
 		// good reflection. Go!
 		dec.out = r
 		err = dec.p.Run()
 	}
 	return err
 }
 // NewDecoder creates a Decoder using the provided [io.Reader]
 // as source
 func NewDecoder(r io.Reader) *Decoder {
 	rc := core.NewReadCloser(r)
 	switch {
 	case rc == nil:
 		return nil
 	default:
 		dec := &Decoder{
 			p:      parser.NewParser(rc),
 			Closer: rc,
 		}
 		// callbacks
 		dec.p.OnToken = dec.parserOnToken
 		dec.p.OnError = dec.parserOnError
 		return dec
 	}
 }
 // NewDecoderBytes creates a Decoder using the provided bytes array
 // as source
 func NewDecoderBytes(b []byte) *Decoder {
 	return NewDecoder(bytes.NewReader(b))
 }
 // NewDecoderString creates a Decoder over a provided string of data
 func NewDecoderString(s string) *Decoder {
 	return NewDecoder(strings.NewReader(s))
 }
@@ -0,0 +1,32 @@
 package ini
 import (
 	"errors"
 	"log"
 	"asciigoat.org/core/lexer"
 )
 var (
 	errInvalidToken = errors.New("invalid token")
 )
 func newError(pos lexer.Position, content, hint string, err error) *lexer.Error {
 	return &lexer.Error{
 		Line:    pos.Line,
 		Column:  pos.Column,
 		Content: content,
 		Hint:    hint,
 		Err:     err,
 	}
 }
 func (*Decoder) newErrInvalidToken(t *token) *lexer.Error {
 	return newError(t.pos, t.value, "", errInvalidToken)
 }
 // parserOnError is the callback for lexer errors
 func (*Decoder) parserOnError(pos lexer.Position, content string, err error) error {
 	log.Printf("%s: %s %s: %q: %v", "ini", pos, "error", content, err)
 	return newError(pos, content, "", err)
 }
@@ -0,0 +1,144 @@
 package ini
 import (
 	"fmt"
 	"log"
 	"asciigoat.org/core/lexer"
 	"asciigoat.org/ini/parser"
 )
 type token struct {
 	pos   lexer.Position
 	typ   parser.TokenType
 	value string
 }
 func (t token) String() string {
 	return fmt.Sprintf("%s %s: %q", t.pos, t.typ, t.value)
 }
 // queueValue extracts the value of element on the queue if the type matches.
 func (dec *Decoder) queueValue(idx int, typ parser.TokenType) (string, bool) {
 	switch {
 	case idx < 0 || idx >= len(dec.queue):
 		// out of range
 		return "", false
 	case dec.queue[idx].typ != typ:
 		// wrong type
 		return "", false
 	default:
 		// match
 		return dec.queue[idx].value, true
 	}
 }
 // queueReset removes all tokens from the queue
 func (dec *Decoder) queueReset() {
 	dec.queue = dec.queue[:0]
 }
 // queueType tells if the specified element on the queue is of the required type.
 func (dec *Decoder) queueType(idx int, typ parser.TokenType) bool {
 	_, ok := dec.queueValue(idx, typ)
 	return ok
 }
 // queueDepth confirms the current depth of the queue
 func (dec *Decoder) queueDepth(depth int) bool {
 	return len(dec.queue) == depth
 }
 // queueDepthType confirms the current depth of the queue and the type of the last
 // element.
 func (dec *Decoder) queueDepthType(depth int, typ parser.TokenType) bool {
 	if dec.queueDepth(depth) {
 		return dec.queueType(depth-1, typ)
 	}
 	return false
 }
 // typeOK tells if a token of the specified type is acceptable
 // at this time.
 func (dec *Decoder) typeOK(typ parser.TokenType) bool {
 	switch typ {
 	case parser.TokenSectionStart:
 		return dec.queueDepth(0)
 	case parser.TokenSectionName:
 		return dec.queueDepthType(1, parser.TokenSectionStart)
 	case parser.TokenSectionSubname:
 		return dec.queueDepthType(2, parser.TokenSectionName)
 	case parser.TokenSectionEnd:
 		return dec.queueType(1, parser.TokenSectionName)
 	case parser.TokenFieldKey:
 		return dec.queueDepth(0)
 	case parser.TokenFieldValue:
 		return dec.queueDepthType(1, parser.TokenFieldKey)
 	case parser.TokenComment:
 		panic("unreachable")
 	default:
 		return false
 	}
 }
 // execute is called after each acceptable token is appended to the queue
 func (dec *Decoder) execute() error {
 	if l := len(dec.queue); l > 0 {
 		// based on the type of the last element
 		switch dec.queue[l-1].typ {
 		case parser.TokenSectionEnd:
 			name1, _ := dec.queueValue(1, parser.TokenSectionName)
 			name2, ok2 := dec.queueValue(2, parser.TokenSectionSubname)
 			defer dec.queueReset()
 			return dec.executeSection(name1, name2, ok2)
 		case parser.TokenFieldValue:
 			key, _ := dec.queueValue(0, parser.TokenFieldKey)
 			value, _ := dec.queueValue(1, parser.TokenFieldValue)
 			defer dec.queueReset()
 			return dec.executeField(key, value)
 		}
 	}
 	return nil
 }
 // revive:disable:flag-parameter
 func (*Decoder) executeSection(key, id string, hasID bool) error {
 	// revive:enable:flag-parameter
 	if hasID {
 		log.Printf("%s: %s%s[%q]: %q", "ini", "", "section", key, id)
 	} else {
 		log.Printf("%s: %s%s[%q]", "ini", "", "section", key)
 	}
 	return nil
 }
 func (*Decoder) executeField(key, value string) error {
 	log.Printf("%s: %s%s[%q]: %q", "ini", "  ", "field", key, value)
 	return nil
 }
 // parserOnToken is the callback from the parser
 func (dec *Decoder) parserOnToken(pos lexer.Position, typ parser.TokenType, value string) error {
 	var err error
 	t := &token{pos, typ, value}
 	switch {
 	case typ == parser.TokenComment:
 		// ignore comments
 	case dec.typeOK(typ):
 		// acceptable token
 		dec.queue = append(dec.queue, t)
 		err = dec.execute()
 	default:
 		// unacceptable
 		err = dec.newErrInvalidToken(t)
 	}
 	return err
 }
@@ -2,24 +2,30 @@ module asciigoat.org/ini
 go 1.19
 replace (
 	asciigoat.org/core => ../core
 	darvaza.org/core => ../../darvaza.org/core
 )
 require (
-	asciigoat.org/core v0.3.6
+	asciigoat.org/core v0.3.7
 	github.com/mgechev/revive v1.3.3
 	golang.org/x/tools v0.12.0
 )
 require (
 	github.com/BurntSushi/toml v1.3.2 // indirect
-	github.com/chavacava/garif v0.0.0-20230608123814-4bd63c2919ab // indirect
+	github.com/chavacava/garif v0.1.0 // indirect
 	github.com/fatih/color v1.15.0 // indirect
 	github.com/fatih/structtag v1.2.0 // indirect
 	github.com/mattn/go-colorable v0.1.13 // indirect
 	github.com/mattn/go-isatty v0.0.19 // indirect
-	github.com/mattn/go-runewidth v0.0.9 // indirect
+	github.com/mattn/go-runewidth v0.0.15 // indirect
 	github.com/mgechev/dots v0.0.0-20210922191527-e955255bf517 // indirect
 	github.com/mitchellh/go-homedir v1.1.0 // indirect
 	github.com/olekukonko/tablewriter v0.0.5 // indirect
 	github.com/pkg/errors v0.9.1 // indirect
 	github.com/rivo/uniseg v0.4.4 // indirect
 	golang.org/x/mod v0.12.0 // indirect
 	golang.org/x/sys v0.11.0 // indirect
 )
@@ -1,9 +1,7 @@
 asciigoat.org/core v0.3.6 h1:b1vL090OxylmSOwLQryjrmC8FhhCtktMyeJSy1e6LwI=
 asciigoat.org/core v0.3.6/go.mod h1:tXj+JUutxRbcO40ZQRuUVaZ4rnYz1kAZ0nblisV8u74=
 github.com/BurntSushi/toml v1.3.2 h1:o7IhLm0Msx3BaB+n3Ag7L8EVlByGnpq14C4YWiu/gL8=
 github.com/BurntSushi/toml v1.3.2/go.mod h1:CxXYINrC8qIiEnFrOxCa7Jy5BFHlXnUU2pbicEuybxQ=
-github.com/chavacava/garif v0.0.0-20230608123814-4bd63c2919ab h1:5JxePczlyGAtj6R1MUEFZ/UFud6FfsOejq7xLC2ZIb0=
+github.com/chavacava/garif v0.1.0 h1:2JHa3hbYf5D9dsgseMKAmc/MZ109otzgNFk5s87H9Pc=
-github.com/chavacava/garif v0.0.0-20230608123814-4bd63c2919ab/go.mod h1:XMyYCkEL58DF0oyW4qDjjnPWONs2HBqYKI+UIPD+Gww=
+github.com/chavacava/garif v0.1.0/go.mod h1:XMyYCkEL58DF0oyW4qDjjnPWONs2HBqYKI+UIPD+Gww=
 github.com/davecgh/go-spew v1.1.0/go.mod h1:J7Y8YcW2NihsgmVo/mv3lAwl/skON4iLHjSsI+c5H38=
 github.com/davecgh/go-spew v1.1.1 h1:vj9j/u1bqnvCEfJOwUhtlOARqs3+rkHYY13jYWTU97c=
 github.com/davecgh/go-spew v1.1.1/go.mod h1:J7Y8YcW2NihsgmVo/mv3lAwl/skON4iLHjSsI+c5H38=
@@ -16,8 +14,9 @@ github.com/mattn/go-colorable v0.1.13/go.mod h1:7S9/ev0klgBDR4GtXTXX8a3vIGJpMovk
 github.com/mattn/go-isatty v0.0.16/go.mod h1:kYGgaQfpe5nmfYZH+SKPsOc2e4SrIfOl2e/yFXSvRLM=
 github.com/mattn/go-isatty v0.0.19 h1:JITubQf0MOLdlGRuRq+jtsDlekdYPia9ZFsB8h/APPA=
 github.com/mattn/go-isatty v0.0.19/go.mod h1:W+V8PltTTMOvKvAeJH7IuucS94S2C6jfK/D7dTCTo3Y=
 github.com/mattn/go-runewidth v0.0.9 h1:Lm995f3rfxdpd6TSmuVCHVb/QhupuXlYr8sCI/QdE+0=
 github.com/mattn/go-runewidth v0.0.9/go.mod h1:H031xJmbD/WCDINGzjvQ9THkh0rPKHF+m2gUSrubnMI=
 github.com/mattn/go-runewidth v0.0.15 h1:UNAjwbU9l54TA3KzvqLGxwWjHmMgBUVhBiTjelZgg3U=
 github.com/mattn/go-runewidth v0.0.15/go.mod h1:Jdepj2loyihRzMpdS35Xk/zdY8IAYHsh153qUoGf23w=
 github.com/mgechev/dots v0.0.0-20210922191527-e955255bf517 h1:zpIH83+oKzcpryru8ceC6BxnoG8TBrhgAvRg8obzup0=
 github.com/mgechev/dots v0.0.0-20210922191527-e955255bf517/go.mod h1:KQ7+USdGKfpPjXk4Ga+5XxQM4Lm4e3gAogrreFAYpOg=
 github.com/mgechev/revive v1.3.3 h1:GUWzV3g185agbHN4ZdaQvR6zrLVYTUSA2ktvIinivK0=
@@ -30,6 +29,9 @@ github.com/pkg/errors v0.9.1 h1:FEBLx1zS214owpjy7qsBeixbURkuhQAwrK5UwLGTwt4=
 github.com/pkg/errors v0.9.1/go.mod h1:bwawxfHBFNV+L2hUp1rHADufV3IMtnDRdf1r5NINEl0=
 github.com/pmezard/go-difflib v1.0.0 h1:4DBwDE0NGyQoBHbLQYPwSUPoCMWR5BEzIk/f1lZbAQM=
 github.com/pmezard/go-difflib v1.0.0/go.mod h1:iKH77koFhYxTK1pcRnkKkqfTogsbg7gZNVY4sRDYZ/4=
 github.com/rivo/uniseg v0.2.0/go.mod h1:J6wj4VEh+S6ZtnVlnTBMWIodfgj8LQOQFoIToxlJtxc=
 github.com/rivo/uniseg v0.4.4 h1:8TfxU8dW6PdqD27gjM8MVNuicgxIjxpm4K7x4jp8sis=
 github.com/rivo/uniseg v0.4.4/go.mod h1:FN3SvrM+Zdj16jyLfmOkMNblXMcoc8DfTHruCPUcx88=
 github.com/stretchr/objx v0.1.0/go.mod h1:HFkY916IF+rwdDfMAkV7OtwuqBVzrE8GR6GFx+wExME=
 github.com/stretchr/objx v0.4.0/go.mod h1:YvHI0jy2hoMjB+UWwv71VJQ9isScKT/TqJzVSSt89Yw=
 github.com/stretchr/objx v0.5.0/go.mod h1:Yh+to48EsGEfYuaHDzXPcE3xhTkx73EhmCGUpEOglKo=
@@ -5,71 +5,42 @@ import "asciigoat.org/core/lexer"
 // Run parses the source
 func (p *Parser) Run() error {
 	p.setDefaults()
 	p.pos.Reset()
 	return lexer.Run(p.lexStart)
 }
 func (p *Parser) lexStart() (lexer.StateFn, error) {
 	for {
-		r, _, err := p.src.ReadRune()
+		r, _, err := p.p.ReadRune()
 		switch {
 		case err != nil:
 			return p.emitError("", err)
 		case IsNewLine(r):
 			// new line
-			p.lexMoreNewLine(r)
+			p.p.UnreadRune()
 			p.p.AcceptNewLine()
 			p.stepLine()
 		case IsSpace(r):
 			// whitespace
-			p.stepRune()
+			p.stepString()
 		case IsCommentStart(r):
 			// switch to comment lexer
-			p.src.UnreadRune()
+			p.p.UnreadRune()
 			return p.lexComment, nil
 		case IsSectionStart(r):
 			// section
 			return p.lexSectionStart, nil
 		default:
 			// entry
-			p.src.UnreadRune()
+			p.p.UnreadRune()
 			return p.lexEntryStart, nil
 		}
 	}
 }
 func (p *Parser) lexMoreNewLine(r1 rune) {
 	// r1 is warrantied to be either '\r' or '\n'
 	r2, _, err := p.src.ReadRune()
 	switch r1 {
 	case '\n':
 		switch {
 		case r2 == '\r':
 			// LN CR
 		case err == nil:
 			// LN
 			p.src.UnreadRune()
 		default:
 			// LN EOF
 		}
 	case '\r':
 		switch {
 		case r2 == '\n':
 			// CR LN
 		case err == nil:
 			// CR
 			p.src.UnreadRune()
 		default:
 			// CR EOF
 		}
 	default:
 		panic("unreachable")
 	}
 }
 func (p *Parser) lexComment() (lexer.StateFn, error) {
 	// until the end of the line
-	p.src.AcceptAll(IsNotNewLine)
+	p.p.AcceptAll(IsNotNewLine)
 	err := p.emitString(TokenComment)
 	return p.lexStart, err
@@ -81,11 +52,11 @@ func (p *Parser) lexSectionStart() (lexer.StateFn, error) {
 	}
 	// remove whitespace between `[` and the name
-	if p.src.AcceptAll(IsSpaceNotNewLine) {
+	if p.p.AcceptAll(IsSpaceNotNewLine) {
 		p.stepString()
 	}
-	if !p.src.AcceptAll(IsName) {
+	if !p.p.AcceptAll(IsName) {
 		// no name
 		return p.emitError("section name missing", lexer.ErrUnacceptableRune)
 	}
@@ -94,12 +65,12 @@ func (p *Parser) lexSectionStart() (lexer.StateFn, error) {
 		return nil, err
 	}
-	// remove whitespace between the name andthe closing `]`
+	// remove whitespace between the name and the closing `]`
-	if p.src.AcceptAll(IsSpaceNotNewLine) {
+	if p.p.AcceptAll(IsSpaceNotNewLine) {
 		p.stepString()
 	}
-	r, _, err := p.src.ReadRune()
+	r, _, err := p.p.ReadRune()
 	switch {
 	case err != nil:
 		return p.emitError("", err)
@@ -112,17 +83,17 @@ func (p *Parser) lexSectionStart() (lexer.StateFn, error) {
 }
 func (p *Parser) lexEntryStart() (lexer.StateFn, error) {
-	p.src.AcceptAll(IsName)
+	p.p.AcceptAll(IsName)
 	if err := p.emitString(TokenFieldKey); err != nil {
 		return nil, err
 	}
 	// ignore whitespace between key and the '=' sign
-	if p.src.AcceptAll(IsSpaceNotNewLine) {
+	if p.p.AcceptAll(IsSpaceNotNewLine) {
 		p.stepString()
 	}
-	r, _, err := p.src.ReadRune()
+	r, _, err := p.p.ReadRune()
 	switch {
 	case err != nil:
 		return p.emitError("", err)
@@ -131,11 +102,11 @@ func (p *Parser) lexEntryStart() (lexer.StateFn, error) {
 	}
 	// ignore whitespace between the '=' and the value
-	if p.src.AcceptAll(IsSpaceNotNewLine) {
+	if p.p.AcceptAll(IsSpaceNotNewLine) {
 		p.stepString()
 	}
-	p.src.AcceptAll(IsNotNewLine)
+	p.p.AcceptAll(IsNotNewLine)
 	if err := p.emitString(TokenFieldValue); err != nil {
 		return nil, err
 	}
@@ -1,4 +1,4 @@
-// Package parser parses dosini-style files
+// Package parser parses ini-style files
 package parser
 import (
@@ -8,10 +8,9 @@ import (
 	"asciigoat.org/core/lexer"
 )
-// Parser parses a dosini-style document
+// Parser parses a ini-style document
 type Parser struct {
-	src *lexer.Reader
+	p TextParser
 	pos lexer.Position
 	// OnToken is called for each identified token. if it returns an error
 	// parsing is interrupted.
@@ -51,15 +50,13 @@ func (p *Parser) setDefaults() {
 }
 func (p *Parser) emitString(typ TokenType) error {
-	s := p.src.Emit()
+	pos, s := p.p.Emit()
-	err := p.OnToken(p.pos, typ, s)
+	return p.OnToken(pos, typ, s)
 	p.pos.StepN(len(s))
 	return err
 }
 func (p *Parser) emitError(content string, err error) (lexer.StateFn, error) {
-	err2 := p.OnError(p.pos, content, err)
+	pos := p.p.Position()
 	err2 := p.OnError(pos, content, err)
 	switch {
 	case err2 != nil:
 		// return wrapped error
@@ -77,33 +74,25 @@ func (p *Parser) emitInvalidRune(r rune) (lexer.StateFn, error) {
 // stepLine discards the data and moves the position
 // to the next line.
 func (p *Parser) stepLine() {
-	p.src.Discard()
+	p.p.StepLine()
 	p.pos.StepLine()
 }
 // stepRune discards the data and moves the position
 // one rune forward on the same line.
 func (p *Parser) stepRune() {
 	p.src.Discard()
 	p.pos.Step()
 }
 // stepString discards the data and moves the position
 // forward on the same line the length of the discarded
 // content.
 func (p *Parser) stepString() {
-	s := p.src.Emit()
+	p.p.Step()
 	p.pos.StepN(len(s))
 }
-// NewParser creates a dosini-style parser using
+// NewParser creates a ini-style parser using
 // an [io.Reader] as source
 func NewParser(r io.Reader) *Parser {
-	if r == nil {
+	var p *Parser
-		return nil
+
 	if r != nil {
 		p = new(Parser)
 		p.p.Init(r)
 	}
-	return &Parser{
+	return p
 		src: lexer.NewReader(r),
 	}
 }
@@ -0,0 +1,102 @@
 package parser
 import (
 	"bytes"
 	"io"
 	"strings"
 	"asciigoat.org/core/lexer"
 )
 // TextParser is a generic text parser.
 type TextParser struct {
 	*lexer.Reader
 	pos lexer.Position
 }
 // Init initializes the [TextParser] with a non-nil [io.Reader].
 func (p *TextParser) Init(r io.Reader) {
 	switch {
 	case p == nil || r == nil:
 		panic("invalid call")
 	case p.Reader != nil:
 		panic("parser already initialized")
 	default:
 		p.Reader = lexer.NewReader(r)
 		p.pos.Reset()
 	}
 }
 // InitBytes initializes the [TextParser] with a byte array
 func (p *TextParser) InitBytes(b []byte) {
 	p.Init(bytes.NewReader(b))
 }
 // InitString initializes the [TextParser] with a byte array
 func (p *TextParser) InitString(s string) {
 	p.Init(strings.NewReader(s))
 }
 // Discard shadows [lexer.Reader]'s, and takes in consideration
 // new lines on the discarded data when moving the position
 func (*TextParser) Discard() {
 	// TODO: consider new lines
 	panic("not implemented")
 }
 // Emit returns the accepted text, its position, and
 // moves the cursor position accordingly
 func (p *TextParser) Emit() (lexer.Position, string) {
 	pos := p.pos
 	s := p.Reader.Emit()
 	// TODO: consider new lines
 	p.pos.StepN(len(s))
 	return pos, s
 }
 // Step discards what's been accepted and increments the
 // position assuming they all increment the column counter
 func (p *TextParser) Step() {
 	s := p.Reader.Emit()
 	p.pos.StepN(len(s))
 }
 // StepLine discards what's been accepted and moves then
 // position to the beginning of the next line
 func (p *TextParser) StepLine() {
 	p.Reader.Discard()
 	p.pos.StepLine()
 }
 // Position returns the position of the first character
 // of the accepted text
 func (p *TextParser) Position() lexer.Position {
 	return p.pos
 }
 // AcceptNewLine checks if next is a new line.
 // It accepts "\n", "\n\r", "\r" and "\r\n".
 func (p *TextParser) AcceptNewLine() bool {
 	r1, _, err := p.ReadRune()
 	switch {
 	case err != nil:
 		return false
 	case r1 == '\n':
 		p.AcceptRune('\r')
 		return true
 	case r1 == '\r':
 		p.AcceptRune('\n')
 		return true
 	default:
 		p.UnreadRune()
 		return false
 	}
 }
 // AcceptRune checks if next is the specified rune
 func (p *TextParser) AcceptRune(r rune) bool {
 	return p.Accept(func(r2 rune) bool {
 		return r == r2
 	})
 }
Author	SHA1	Message	Date
amery	df0fe8b9c0	decoder [WIP] Signed-off-by: Alejandro Mery <amery@jpi.io>	2023-09-03 17:04:37 +00:00
amery	23a6bd090c	build-sys: use local darvaza.org/core [DO-NOT-MERGE] Signed-off-by: Alejandro Mery <amery@jpi.io>	2023-09-03 17:03:48 +00:00
amery	f8fa9d678a	build-sys: use local asciigoat.org/core [DO-NOT-MERGE] Signed-off-by: Alejandro Mery <amery@jpi.io>	2023-09-03 17:03:48 +00:00
amery	7e2797607d	Merge branch 'pr-amery-textparser' into next-amery	2023-09-03 17:02:51 +00:00
amery	01cd4139bd	parser.Parser: refactor using TextParser Signed-off-by: Alejandro Mery <amery@jpi.io>	2023-09-03 17:01:26 +00:00
amery	e34e8eda0a	parser.TextParser: AcceptNewLine() and AcceptRune() Signed-off-by: Alejandro Mery <amery@jpi.io>	2023-09-03 17:01:26 +00:00
amery	ecff6f6016	parser: introduce generic-ish TextParser Signed-off-by: Alejandro Mery <amery@jpi.io>	2023-09-03 17:01:26 +00:00
amery	79fc27f965	chore: update dependencies Signed-off-by: Alejandro Mery <amery@jpi.io>	2023-09-03 15:09:05 +00:00
amery	d75b2dbc78	basic: rename and document queue related methods Signed-off-by: Alejandro Mery <amery@jpi.io>	2023-09-02 16:07:04 +00:00
amery	46ba96d6b4	basic: refactor error handling Signed-off-by: Alejandro Mery <amery@jpi.io>	2023-09-02 16:06:59 +00:00
amery	11c5ce70a6	Merge pull request 'basic: implement Section.String() and Field.String()' (#5 ) Reviewed-on: #5	2023-09-02 18:00:08 +02:00
amery	16d52188f6	basic: implement Section.String() and Field.String() to ease development Signed-off-by: Alejandro Mery <amery@jpi.io>	2023-09-01 21:13:13 +00:00
amery	a4f981610e	Merge pull request 'basic: introduce basic one-shot INI-style decoder' (#4 ) Reviewed-on: #4	2023-09-01 19:29:11 +02:00
amery	a1e20fa3b6	basic: introduce Document.WriteTo() and Document.String() producing an INI-style representation of the Document Signed-off-by: Alejandro Mery <amery@jpi.io>	2023-09-01 14:22:48 +00:00
amery	174f72c4cf	basic: introduce basic one-shot INI-style decoder Signed-off-by: Alejandro Mery <amery@jpi.io>	2023-09-01 14:21:55 +00:00
amery	c92e0df47b	chore: update asciigoat.org/core Signed-off-by: Alejandro Mery <amery@jpi.io>	2023-09-01 13:04:05 +00:00
amery	cf100578c0	Merge pull request 'README: add initial description of the package' (#3 ) Reviewed-on: #3	2023-09-01 15:02:34 +02:00
amery	2eacc65215	README: add initial description of the package Signed-off-by: Alejandro Mery <amery@jpi.io>	2023-09-01 12:57:55 +00:00