-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathstemmer_test.go
107 lines (88 loc) · 2.06 KB
/
stemmer_test.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
package stemmer
import (
"strings"
"testing"
"github.com/antonbaumann/german-go-stemmer/internal/util"
)
// testSet pairs one input word with the stem the stemmer is expected to
// produce for it.
type testSet struct {
	value, expected string
}
// BenchmarkStemWord measures StemWord on single words, cycling through the
// word list read from testdata/voc.txt.
func BenchmarkStemWord(b *testing.B) {
	words, err := util.ReadWordList("testdata/voc.txt")
	if err != nil {
		// Fatal stops the benchmark here; carrying on without a word list
		// would only end in a panic inside the loop below.
		b.Fatal(err)
	}
	if len(words) == 0 {
		// i%len(words) below would be a division by zero.
		b.Fatal("testdata/voc.txt contains no words")
	}

	// The timer is already running when the benchmark function is entered,
	// so reset it to keep the fixture load out of the measurement.
	b.ResetTimer()
	for i := 0; i < b.N; i++ {
		_ = StemWord(words[i%len(words)])
	}
}
// BenchmarkStemQuery measures Stem, feeding it one entry of the word list
// read from testdata/voc.txt per iteration and cycling through the list.
func BenchmarkStemQuery(b *testing.B) {
	words, err := util.ReadWordList("testdata/voc.txt")
	if err != nil {
		// Fatal stops the benchmark here; carrying on without a word list
		// would only end in a panic inside the loop below.
		b.Fatal(err)
	}
	if len(words) == 0 {
		// i%len(words) below would be a division by zero.
		b.Fatal("testdata/voc.txt contains no words")
	}

	// The timer is already running when the benchmark function is entered,
	// so reset it to keep the fixture load out of the measurement.
	b.ResetTimer()
	for i := 0; i < b.N; i++ {
		_ = Stem(words[i%len(words)])
	}
}
// TestStemQuery runs Stem on a multi-word query whose words are separated by
// spaces, a tab and a newline, and compares the result case-insensitively
// with the expected string. The expected output holds only three stemmed
// tokens (presumably the remaining words are dropped as stop words; confirm
// against Stem).
func TestStemQuery(t *testing.T) {
	const (
		input = "wie wird das wetter \t morgen in \nmünchen"
		want  = "wett morg munch"
	)

	got := Stem(input)
	if strings.EqualFold(want, got) {
		return
	}
	t.Errorf("test failed.\nexpected:\t %v\ngot:\t\t %v", want, got)
}
// TestStemWords stems the whole word list from testdata/voc.txt with
// StemWords and compares the result against testdata/stemmed.txt using
// util.SlicesEqual.
func TestStemWords(t *testing.T) {
	// Fixture problems are reported with Fatal so the test stops at the real
	// cause instead of going on to compare incomplete lists.
	words, err := util.ReadWordList("testdata/voc.txt")
	if err != nil {
		t.Fatal(err)
	}
	expected, err := util.ReadWordList("testdata/stemmed.txt")
	if err != nil {
		t.Fatal(err)
	}
	if len(words) != len(expected) {
		t.Fatal("wordlist and result list should have same size")
	}

	result := StemWords(words)
	if !util.SlicesEqual(expected, result) {
		t.Errorf("test failed.\nexpected:\t %v\ngot:\t\t %v", expected, result)
	}
}
// TestStemWord stems every word from testdata/voc.txt individually with
// StemWord and compares it, case-insensitively, with the entry at the same
// index in testdata/stemmed.txt.
func TestStemWord(t *testing.T) {
	// Fixture problems are reported with Fatal so the test stops at the real
	// cause instead of running on with incomplete lists.
	words, err := util.ReadWordList("testdata/voc.txt")
	if err != nil {
		t.Fatal(err)
	}
	expected, err := util.ReadWordList("testdata/stemmed.txt")
	if err != nil {
		t.Fatal(err)
	}
	if len(words) != len(expected) {
		// Must stop here: expected[i] below would index out of range when
		// the word list is longer than the list of expected stems.
		t.Fatal("wordlist and result list should have same size")
	}

	// Pair each word with its expected stem by position.
	tests := make([]testSet, 0, len(words))
	for i, v := range words {
		tests = append(tests, testSet{value: v, expected: expected[i]})
	}

	for _, test := range tests {
		result := StemWord(test.value)
		if !strings.EqualFold(test.expected, result) {
			t.Errorf("test failed.\nexpected:\t %v\ngot:\t\t %v", test.expected, result)
		}
	}
}