Fix whitespace lexing/parsing.
Our consumeWhitespace method had a bug where it wouldn't emit the whitespace
token, meaning we weren't actually skipping the whitespace. Oops.
While in there, I removed an outdated TODO (we already supplied a default
state).
I updated the lexing of unquoted strings to take into account the rules about
spaces and unquoted strings; basically, spaces before or after are ignored as
whitespace, spaces in the middle ocunt, and empty strings are not allowed.
I removed an extra case when detecting what to do when lexing an unquoted
string; we already consumed all the whitespace, so the next character shouldn't
be whitespace, so no need to test for it.
We need to consume whitespace before we start lexing the separator character.
I updated the token debugging to be a bit more useful, by defining a String()
method on the token type itself, so it'll expose both the type and the value.
This makes unexpected errors easier to deal with, and is used in all the errors
raised by the parser now.
I added a bunch of whitespace tests for lexing and parsing.
7 func parse(l *lexer) ([]*string, error) {
9 pchan := make(chan *string)
10 errchan := make(chan error)
11 done := make(chan struct{})
12 go runParse(l, pchan, errchan, done)
15 case err := <-errchan:
18 parsed = append(parsed, item)
25 func runParse(l *lexer, parsed chan *string, err chan error, done chan struct{}) {
26 var state parseFunc = parseStart
29 state, e = state(l, parsed)
41 type parseFunc func(*lexer, chan *string) (parseFunc, error)
43 func parseEOF(l *lexer, parsed chan *string) (parseFunc, error) {
45 if tok.typ == tokenWhitespace {
48 if tok.typ != tokenEOF {
49 return nil, errors.New("expected EOF, got " + tok.String())
54 func parseStringOrNull(l *lexer, parsed chan *string) (parseFunc, error) {
56 if tok.typ == tokenWhitespace {
57 return parseStringOrNull, nil
58 } else if tok.typ == tokenString {
60 return parseSeparatorOrDelim, nil
61 } else if tok.typ == tokenNull {
63 return parseSeparatorOrDelim, nil
65 return nil, errors.New("expected string, got " + tok.String())
68 func parseStringOrNullOrEnd(l *lexer, parsed chan *string) (parseFunc, error) {
70 if tok.typ == tokenWhitespace {
71 return parseStringOrNullOrEnd, nil
72 } else if tok.typ == tokenString {
74 return parseSeparatorOrDelim, nil
75 } else if tok.typ == tokenNull {
77 return parseSeparatorOrDelim, nil
78 } else if tok.typ == tokenArrayEnd {
81 return nil, errors.New("Expected string or end, got " + tok.String())
84 func parseSeparatorOrDelim(l *lexer, parsed chan *string) (parseFunc, error) {
86 if tok.typ == tokenWhitespace {
87 return parseSeparatorOrDelim, nil
88 } else if tok.typ == tokenSeparator {
89 return parseStringOrNull, nil
90 } else if tok.typ == tokenArrayEnd {
93 return nil, errors.New("expected separator or delim, got " + tok.String())
96 func parseStart(l *lexer, parsed chan *string) (parseFunc, error) {
98 if tok.typ == tokenWhitespace {
99 return parseStart, nil
100 } else if tok.typ == tokenArrayStart {
101 return parseStringOrNullOrEnd, nil
103 return nil, errors.New("expected separator or delim, got " + tok.String())