Combine Cursor with State
This commit is contained in:
@ -11,19 +11,18 @@ import (
|
||||
"unicode/utf8"
|
||||
|
||||
"git.codemonkeysoftware.net/b/gigaparsec"
|
||||
"git.codemonkeysoftware.net/b/gigaparsec/cursor"
|
||||
)
|
||||
|
||||
// RuneReader is an io.RuneReader backed by a Cursor, for compatibility
|
||||
// with the regexp package.
|
||||
type RuneReader struct {
|
||||
cursor cursor.Cursor[byte]
|
||||
start uint64
|
||||
err error
|
||||
state gigaparsec.State[byte]
|
||||
start uint64
|
||||
err error
|
||||
}
|
||||
|
||||
func NewRuneReader(c cursor.Cursor[byte]) *RuneReader {
|
||||
return &RuneReader{cursor: c, start: c.Pos()}
|
||||
func NewRuneReader(state gigaparsec.State[byte]) *RuneReader {
|
||||
return &RuneReader{state: state, start: state.Pos()}
|
||||
}
|
||||
|
||||
func (rr *RuneReader) ReadRune() (r rune, size int, err error) {
|
||||
@ -32,9 +31,9 @@ func (rr *RuneReader) ReadRune() (r rune, size int, err error) {
|
||||
}()
|
||||
var b [4]byte
|
||||
s := b[:]
|
||||
n, next, err := rr.cursor.Read(s)
|
||||
n, next, err := rr.state.Read(s)
|
||||
if err != nil && !errors.Is(err, io.EOF) {
|
||||
rr.cursor = next
|
||||
rr.state = next
|
||||
return 0, 0, fmt.Errorf("ReadRune: %w", err)
|
||||
}
|
||||
if n == 0 {
|
||||
@ -42,12 +41,12 @@ func (rr *RuneReader) ReadRune() (r rune, size int, err error) {
|
||||
}
|
||||
s = s[:n]
|
||||
r, size = utf8.DecodeRune(s)
|
||||
rr.cursor = rr.cursor.At(rr.cursor.Pos() + uint64(size))
|
||||
rr.state = rr.state.At(rr.state.Pos() + uint64(size))
|
||||
return r, size, nil
|
||||
}
|
||||
|
||||
func (rr *RuneReader) Cursor() cursor.Cursor[byte] {
|
||||
return rr.cursor
|
||||
func (rr *RuneReader) State() gigaparsec.State[byte] {
|
||||
return rr.state
|
||||
}
|
||||
|
||||
func (rr *RuneReader) Error() error {
|
||||
@ -55,7 +54,7 @@ func (rr *RuneReader) Error() error {
|
||||
}
|
||||
|
||||
func (rr *RuneReader) Count() uint64 {
|
||||
return rr.cursor.Pos() - rr.start
|
||||
return rr.state.Pos() - rr.start
|
||||
}
|
||||
|
||||
func Regexp(pattern string) gigaparsec.Parser[byte, string] {
|
||||
@ -63,7 +62,7 @@ func Regexp(pattern string) gigaparsec.Parser[byte, string] {
|
||||
re := regexp.MustCompile(pattern)
|
||||
expected := fmt.Sprintf("match `%s`", pattern)
|
||||
return func(input gigaparsec.State[byte]) (gigaparsec.Result[byte, string], error) {
|
||||
r := NewRuneReader(input.Cursor())
|
||||
r := NewRuneReader(input)
|
||||
idx := re.FindReaderIndex(r)
|
||||
err := r.Error()
|
||||
if err != nil && !errors.Is(err, io.EOF) {
|
||||
@ -71,7 +70,7 @@ func Regexp(pattern string) gigaparsec.Parser[byte, string] {
|
||||
}
|
||||
if idx == nil {
|
||||
got := make([]byte, r.Count())
|
||||
_, _, err = input.Cursor().Read(got)
|
||||
_, _, err = input.Read(got)
|
||||
if err != nil {
|
||||
return gigaparsec.Result[byte, string]{}, fmt.Errorf("Regexp: unexpected error: %w", err)
|
||||
}
|
||||
@ -80,7 +79,7 @@ func Regexp(pattern string) gigaparsec.Parser[byte, string] {
|
||||
// Alas, this is a little wasteful because a Regexp can only return indices
|
||||
// when searching a RuneReader.
|
||||
dst := make([]byte, idx[1]-idx[0])
|
||||
n, _, err := input.Cursor().Read(dst)
|
||||
n, _, err := input.Read(dst)
|
||||
if err != nil {
|
||||
return gigaparsec.Result[byte, string]{}, fmt.Errorf("Regexp: unexpected error: %w", err)
|
||||
}
|
||||
|
Reference in New Issue
Block a user