-
Notifications
You must be signed in to change notification settings - Fork 0
/
ngram_test.go
80 lines (69 loc) · 1.8 KB
/
ngram_test.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
package gotagger
import "testing"
// TestNgrams checks that ngrams splits a token sequence into every contiguous
// window of n tokens, in input order.
//
// The fixture has 12 tokens and n = 3, so 10 trigrams are expected.
func TestNgrams(t *testing.T) {
	const n = 3
	input := []string{"Go", "(", "often", "referred", "to", "as", "golang", ")", "is", "a", "programming", "language"}
	want := [][]string{
		{"Go", "(", "often"},
		{"(", "often", "referred"},
		{"often", "referred", "to"},
		{"referred", "to", "as"},
		{"to", "as", "golang"},
		{"as", "golang", ")"},
		{"golang", ")", "is"},
		{")", "is", "a"},
		{"is", "a", "programming"},
		{"a", "programming", "language"},
	}

	got := ngrams(input, n)

	// With a different number of n-grams the index-wise comparison below
	// would be meaningless (and could index out of range), so stop here.
	if len(got) != len(want) {
		t.Fatalf("ngrams(%q, %d) returned %d n-grams, want %d", input, n, len(got), len(want))
	}

	for i := range want {
		// A wrong-sized n-gram is reported once as a whole; keep checking the
		// remaining n-grams so one run surfaces every mismatch.
		if len(got[i]) != len(want[i]) {
			t.Errorf("ngrams(%q, %d)[%d] = %q (length %d), want %q (length %d)",
				input, n, i, got[i], len(got[i]), want[i], len(want[i]))
			continue
		}
		for j := range want[i] {
			if got[i][j] != want[i][j] {
				t.Errorf("ngrams(%q, %d)[%d][%d] = %q, want %q", input, n, i, j, got[i][j], want[i][j])
			}
		}
	}
}
// TestNgramsRecursive checks that ngramsRecursive returns the n-grams of size
// n followed by those of each smaller size down to 1, with every size group
// listed in input order.
//
// The fixture has 5 tokens and n = 3, so 3 trigrams, 4 bigrams and 5 unigrams
// (12 entries in total) are expected.
func TestNgramsRecursive(t *testing.T) {
	const n = 3
	input := []string{"Go", "is", "a", "programming", "language"}
	want := [][]string{
		{"Go", "is", "a"},
		{"is", "a", "programming"},
		{"a", "programming", "language"},
		{"Go", "is"},
		{"is", "a"},
		{"a", "programming"},
		{"programming", "language"},
		{"Go"},
		{"is"},
		{"a"},
		{"programming"},
		{"language"},
	}

	got := ngramsRecursive(input, n)

	// With a different number of n-grams the index-wise comparison below
	// would be meaningless (and could index out of range), so stop here.
	if len(got) != len(want) {
		t.Fatalf("ngramsRecursive(%q, %d) returned %d n-grams, want %d", input, n, len(got), len(want))
	}

	for i := range want {
		// Report a wrong-sized n-gram once as a whole, then move on to the
		// next entry instead of aborting, so one run surfaces every mismatch.
		if len(got[i]) != len(want[i]) {
			t.Errorf("ngramsRecursive(%q, %d)[%d] = %q (length %d), want %q (length %d)",
				input, n, i, got[i], len(got[i]), want[i], len(want[i]))
			continue
		}
		for j := range want[i] {
			if got[i][j] != want[i][j] {
				t.Errorf("ngramsRecursive(%q, %d)[%d][%d] = %q, want %q", input, n, i, j, got[i][j], want[i][j])
			}
		}
	}
}