-
Notifications
You must be signed in to change notification settings - Fork 42
/
nlp_test.go
78 lines (67 loc) · 1.65 KB
/
nlp_test.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
package nlp
import (
"strings"
"testing"
"github.com/BurntSushi/toml"
"github.com/stretchr/testify/require"
)
/*
var tokenizeCases = []struct { // anonymous struct
text string
tokens []string
}{
{"Who's on first?", []string{"who", "s", "on", "first"}},
{"", nil},
}
*/
// tokenizeCase is a single table-driven test case for Tokenize.
//
// The fields are exported so that the TOML decoder used by
// loadTokenizeCases can populate them.
type tokenizeCase struct {
	// Text is the input handed to Tokenize.
	Text string
	// Tokens is the token list Tokenize is expected to return for Text.
	Tokens []string
}
// loadTokenizeCases reads the table-driven test cases for Tokenize from
// testdata/tokenize_cases.toml and returns them.
//
// The file is decoded into an anonymous struct with a single Cases field.
// A decoding error, or a file that yields no cases at all, fails the calling
// test immediately.
func loadTokenizeCases(t *testing.T) []tokenizeCase {
	// Report failures at the caller's line rather than inside this helper.
	t.Helper()

	var testCases struct {
		Cases []tokenizeCase
	}

	// DecodeFile reads and parses the file in one step.
	_, err := toml.DecodeFile("testdata/tokenize_cases.toml", &testCases)
	require.NoError(t, err, "Unmarshal TOML")

	// An empty table would make the table-driven test pass without checking
	// anything, so treat it as a failure.
	require.NotEmpty(t, testCases.Cases, "no test cases found in TOML")

	return testCases.Cases
}
// TestTokenizeTable runs Tokenize over every case returned by
// loadTokenizeCases, one subtest per case, named after the input text.
//
// Exercise: read the test cases from testdata/tokenize_cases.toml, using
// github.com/BurntSushi/toml to parse the TOML.
func TestTokenizeTable(t *testing.T) {
	cases := loadTokenizeCases(t)
	for i := range cases {
		tc := cases[i]
		t.Run(tc.Text, func(t *testing.T) {
			got := Tokenize(tc.Text)
			require.Equal(t, tc.Tokens, got)
		})
	}
}
func TestTokenize(t *testing.T) {
text := "What's on second?"
expected := []string{"what", "on", "second"}
tokens := Tokenize(text)
require.Equal(t, expected, tokens)
/* Before testify
// if tokens != expected { // Can't compare slices with == in Go (only to nil)
if !reflect.DeepEqual(expected, tokens) {
t.Fatalf("expected %#v, got %#v", expected, tokens)
}
*/
}
// FuzzTokenize checks a property of Tokenize on arbitrary input: every
// returned token must occur as a substring of strings.ToLower(text).
func FuzzTokenize(f *testing.F) {
	// Seed corpus. Without seeds, a plain `go test` (no -fuzz flag) has no
	// inputs to run the fuzz target with unless testdata/fuzz entries exist.
	// The seeds reuse the inputs from the other tests in this file plus the
	// empty string.
	for _, seed := range []string{"", "Who's on first?", "What's on second?"} {
		f.Add(seed)
	}

	f.Fuzz(func(t *testing.T, text string) {
		lText := strings.ToLower(text)
		for _, tok := range Tokenize(text) {
			if !strings.Contains(lText, tok) {
				// Include the input so a failure can be understood from the log alone.
				t.Fatalf("token %q not found in lower-cased input %q", tok, lText)
			}
		}
	})
}