2022-03-15 15:16:15 +01:00
|
|
|
package token_test
|
2022-03-10 06:10:36 +01:00
|
|
|
|
|
|
|
import (
|
|
|
|
"strings"
|
|
|
|
"testing"
|
|
|
|
"time"
|
|
|
|
|
2022-03-15 15:16:15 +01:00
|
|
|
"ewintr.nl/adoc/token"
|
2022-03-10 06:10:36 +01:00
|
|
|
"ewintr.nl/go-kit/test"
|
|
|
|
)
|
|
|
|
|
|
|
|
func TestLexer(t *testing.T) {
|
2022-03-15 15:16:15 +01:00
|
|
|
word := token.TYPE_WORD
|
|
|
|
ws := token.TYPE_WHITESPACE
|
|
|
|
nl := token.TYPE_NEWLINE
|
|
|
|
eq := token.TYPE_EQUALSIGN
|
|
|
|
bt := token.TYPE_BACKTICK
|
|
|
|
as := token.TYPE_ASTERISK
|
|
|
|
un := token.TYPE_UNDERSCORE
|
2022-03-10 06:10:36 +01:00
|
|
|
|
|
|
|
for _, tc := range []struct {
|
|
|
|
name string
|
|
|
|
input string
|
2022-03-15 15:16:15 +01:00
|
|
|
exp []token.Token
|
2022-03-10 06:10:36 +01:00
|
|
|
}{
|
|
|
|
{
|
|
|
|
name: "word string",
|
|
|
|
input: "one two",
|
2022-03-15 15:16:15 +01:00
|
|
|
exp: []token.Token{
|
2022-03-10 06:10:36 +01:00
|
|
|
{Type: word, Literal: "one"},
|
|
|
|
{Type: ws, Literal: " "},
|
|
|
|
{Type: word, Literal: "two"},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
{
|
|
|
|
name: "punctuation",
|
|
|
|
input: `. ,`,
|
2022-03-15 15:16:15 +01:00
|
|
|
exp: []token.Token{
|
2022-03-10 06:10:36 +01:00
|
|
|
{Type: word, Literal: "."},
|
|
|
|
{Type: ws, Literal: " "},
|
|
|
|
{Type: word, Literal: ","},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
{
|
|
|
|
name: "whitespace",
|
|
|
|
input: " \t",
|
2022-03-15 15:16:15 +01:00
|
|
|
exp: []token.Token{
|
2022-03-10 06:10:36 +01:00
|
|
|
{Type: ws, Literal: " \t"},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
{
|
|
|
|
name: "tab",
|
|
|
|
input: "\t",
|
2022-03-15 15:16:15 +01:00
|
|
|
exp: []token.Token{{Type: ws, Literal: "\t"}},
|
2022-03-10 06:10:36 +01:00
|
|
|
},
|
|
|
|
{
|
|
|
|
name: "newlines",
|
|
|
|
input: "\n\n\n",
|
2022-03-15 15:16:15 +01:00
|
|
|
exp: []token.Token{{Type: nl, Literal: "\n\n\n"}},
|
2022-03-10 06:10:36 +01:00
|
|
|
},
|
|
|
|
{
|
|
|
|
name: "special chars",
|
|
|
|
input: "=*_",
|
2022-03-15 15:16:15 +01:00
|
|
|
exp: []token.Token{
|
2022-03-10 06:10:36 +01:00
|
|
|
{Type: eq, Literal: "="},
|
|
|
|
{Type: as, Literal: "*"},
|
|
|
|
{Type: un, Literal: "_"},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
{
|
|
|
|
name: "mixed",
|
|
|
|
input: "This is a line with mixed \t `stuff`, see\t==?",
|
2022-03-15 15:16:15 +01:00
|
|
|
exp: []token.Token{
|
2022-03-10 06:10:36 +01:00
|
|
|
{Type: word, Literal: "This"},
|
|
|
|
{Type: ws, Literal: " "},
|
|
|
|
{Type: word, Literal: "is"},
|
|
|
|
{Type: ws, Literal: " "},
|
|
|
|
{Type: word, Literal: "a"},
|
|
|
|
{Type: ws, Literal: " "},
|
|
|
|
{Type: word, Literal: "line"},
|
|
|
|
{Type: ws, Literal: " "},
|
|
|
|
{Type: word, Literal: "with"},
|
|
|
|
{Type: ws, Literal: " "},
|
|
|
|
{Type: word, Literal: "mixed"},
|
|
|
|
{Type: ws, Literal: " \t "},
|
|
|
|
{Type: bt, Literal: "`"},
|
|
|
|
{Type: word, Literal: "stuff"},
|
|
|
|
{Type: bt, Literal: "`"},
|
|
|
|
{Type: word, Literal: ","},
|
|
|
|
{Type: ws, Literal: " "},
|
|
|
|
{Type: word, Literal: "see"},
|
|
|
|
{Type: ws, Literal: "\t"},
|
|
|
|
{Type: eq, Literal: "=="},
|
|
|
|
{Type: word, Literal: "?"},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
} {
|
|
|
|
t.Run(tc.name, func(t *testing.T) {
|
|
|
|
input := strings.NewReader(tc.input)
|
2022-03-15 15:16:15 +01:00
|
|
|
lex := token.NewLexer(input)
|
|
|
|
act := []token.Token{}
|
2022-03-10 06:10:36 +01:00
|
|
|
stop := time.Now().Add(3 * time.Second)
|
|
|
|
|
|
|
|
T:
|
|
|
|
for {
|
|
|
|
select {
|
|
|
|
case tok, ok := <-lex.Out():
|
|
|
|
if !ok {
|
|
|
|
break T
|
|
|
|
}
|
|
|
|
act = append(act, tok)
|
|
|
|
default:
|
|
|
|
if time.Now().After(stop) {
|
|
|
|
break T
|
|
|
|
}
|
|
|
|
time.Sleep(5 * time.Millisecond)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
test.OK(t, lex.Error())
|
2022-03-15 15:16:15 +01:00
|
|
|
exp := append(tc.exp, token.TOKEN_EOF)
|
2022-03-10 06:10:36 +01:00
|
|
|
test.Equals(t, exp, act)
|
|
|
|
})
|
|
|
|
}
|
|
|
|
}
|