-
Notifications
You must be signed in to change notification settings - Fork 8
/
ac_test.go
146 lines (133 loc) · 3.38 KB
/
ac_test.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
/*
* @Author: Daiming Liu (xingrufeng)
*/
package ahocorasick
import (
"bufio"
"fmt"
"io"
"os"
"runtime"
"strconv"
"strings"
"testing"
"time"
)
// readFile returns the contents of the file at path input as one rune slice:
// every line is stripped of surrounding whitespace, blank lines are dropped,
// and the remaining lines are concatenated without separators.
//
// It returns nil when the file cannot be opened. A read error ends the scan
// and whatever was collected up to that point is returned.
func readFile(input string) []rune {
	file, err := os.Open(input)
	if err != nil {
		return nil
	}
	defer file.Close()

	content := make([]rune, 0)
	reader := bufio.NewReader(file)
	for {
		// ReadString returns the complete line regardless of its length.
		// ReadLine hands back buffer-sized fragments of long lines, which
		// would cut multi-byte UTF-8 characters in half and trim whitespace
		// in the middle of a line.
		line, err := reader.ReadString('\n')
		// Handle the data before looking at err: the final line of a file
		// without a trailing newline arrives together with io.EOF.
		if keyword := strings.TrimSpace(line); keyword != "" {
			content = append(content, []rune(keyword)...)
		}
		if err != nil {
			break
		}
	}
	return content
}
// checkFileIsExist reports whether filename exists. Only a "does not exist"
// error from os.Stat counts as absent; any other Stat outcome, including
// other errors, is reported as present.
func checkFileIsExist(filename string) bool {
	_, statErr := os.Stat(filename)
	return !os.IsNotExist(statErr)
}
// writeFile writes one line per hit to filename in the form
// "Begin<TAB>End<TAB>Value\n". An existing file is appended to; otherwise the
// file is created. It prints whether the file already existed.
//
// It panics if the file cannot be opened or created, or if a write fails.
func writeFile(filename string, contents []Hit) {
	var f *os.File
	var err error
	if checkFileIsExist(filename) { // the file already exists
		// O_APPEND on its own opens the file read-only, so every write
		// would fail; O_WRONLY is required for the append to work.
		f, err = os.OpenFile(filename, os.O_WRONLY|os.O_APPEND, 0666)
		fmt.Println("文件存在")
	} else { // the file does not exist yet
		f, err = os.Create(filename)
		fmt.Println("文件不存在")
	}
	if err != nil {
		panic(err)
	}
	// Register the close only once the handle is known to be valid.
	defer f.Close()

	for _, v := range contents {
		str := strconv.Itoa(v.Begin) + "\t" + strconv.Itoa(v.End) + "\t" + string(v.Value) + "\n"
		if _, err := io.WriteString(f, str); err != nil {
			panic(err)
		}
	}
}
// TestBuild builds the automaton from ./dictionary.txt, loads ./text.txt with
// readFile and runs a single MultiPatternIndexes pass over the text, printing
// the elapsed time of each step in milliseconds.
//
// The test fails immediately when the dictionary cannot be loaded.
func TestBuild(t *testing.T) {
	start := time.Now()
	ac, err := BuildFromFile("./dictionary.txt")
	//ac, err := BuildFromFile("./black.txt")
	if err != nil {
		// Do not go on to search with an automaton that failed to build.
		t.Fatalf("BuildFromFile(%q): %v", "./dictionary.txt", err)
	}
	fmt.Println("字典加载时间(ms)", time.Since(start).Milliseconds())

	start = time.Now()
	content := readFile("./text.txt")
	fmt.Println("测试文件加载时间(ms)", time.Since(start).Milliseconds())

	start = time.Now()
	ac.MultiPatternIndexes(content)
	/*
		search := ac.MultiPatternSearch([]rune("一群"))
		for _, v := range search {
			fmt.Printf("%d\t%d\t%s\n", v.Begin, v.End, string(v.Value))
		}
	*/
	fmt.Println("检索时间(ms)", time.Since(start).Milliseconds())
	//writeFile("result2", result)
}
// TestAb builds an automaton from a small in-memory keyword list (which
// contains one duplicate entry) and prints the begin offset, end offset and
// value of every hit MultiPatternSearch reports for "中华人民共和国".
//
// The test fails immediately when Build returns an error.
func TestAb(t *testing.T) {
	// Alternative keyword sets used during development:
	//   "hers", "his", "she", "he"   (search text "ushers")
	//   "一", "群", "一群羊"          (search text "一群")
	kws := []string{
		"中华人民共和国", "中华人民", "人民共和国", "中华人民",
	}
	ac, err := Build(kws)
	//ac, err := BuildFromFile("./dictionary.txt")
	if err != nil {
		// Do not go on to search with an automaton that failed to build.
		t.Fatalf("Build(%q): %v", kws, err)
	}

	search := ac.MultiPatternSearch([]rune("中华人民共和国"))
	//search := ac.MultiPatternSearch([]rune("ushers"))
	//search := ac.MultiPatternSearch([]rune("一群"))
	for _, v := range search {
		fmt.Printf("%d\t%d\t%s\n", v.Begin, v.End, string(v.Value))
	}
}
// TestMulti builds the automaton from ./dictionary.txt, loads ./text.txt with
// readFile, and then runs MultiPatternIndexes over the text 100 times. It
// prints, in milliseconds, the dictionary load time, the text load time, the
// duration of one explicit garbage collection and the total search time.
//
// The test fails immediately when the dictionary cannot be loaded.
func TestMulti(t *testing.T) {
	start := time.Now()
	ac, err := BuildFromFile("./dictionary.txt")
	if err != nil {
		// Do not go on to search with an automaton that failed to build.
		t.Fatalf("BuildFromFile(%q): %v", "./dictionary.txt", err)
	}
	fmt.Println("字典加载时间(ms)", time.Since(start).Milliseconds())

	start = time.Now()
	content := readFile("./text.txt")
	fmt.Println("测试文件加载时间(ms)", time.Since(start).Milliseconds())

	// One untimed collection first, then a second one that is timed.
	runtime.GC()
	start = time.Now()
	runtime.GC()
	fmt.Println("gc时间(ms)", time.Since(start).Milliseconds())

	start = time.Now()
	for i := 0; i < 100; i++ {
		ac.MultiPatternIndexes(content)
	}
	fmt.Println("检索时间(ms)", time.Since(start).Milliseconds())
}