mirror of
https://github.com/fumiama/jieba.git
synced 2026-06-12 21:20:26 +08:00
move tokenizer.go to top directory
This commit is contained in:
@@ -1,65 +0,0 @@
|
||||
package dictionary
|
||||
|
||||
import (
|
||||
"math"
|
||||
"testing"
|
||||
)
|
||||
|
||||
var d *Dictionary
|
||||
|
||||
func init() {
|
||||
d = New()
|
||||
}
|
||||
|
||||
func TestLoadDictionary(t *testing.T) {
|
||||
if err := d.LoadDictionary("../dict.txt"); err != nil {
|
||||
t.Fatalf("Failed to load dict.txt, err = %s", err)
|
||||
}
|
||||
n := len(d.freqMap)
|
||||
|
||||
d.LoadDictionary("../foobar.txt")
|
||||
if len(d.freqMap) == n {
|
||||
t.Fatalf("Failed to load foobar.txt")
|
||||
}
|
||||
}
|
||||
|
||||
func TestLoadUserDictionary(t *testing.T) {
|
||||
err := d.LoadUserDictionary("../userdict.txt")
|
||||
if err != nil {
|
||||
t.Fatalf("Failed to load userdict.txt, err = %s", err)
|
||||
}
|
||||
if _, ok := d.Frequency("八一双鹿"); !ok {
|
||||
t.Fatalf("Failed to load userdict.txt, no frequency for word \"八一双鹿\"")
|
||||
}
|
||||
}
|
||||
|
||||
func TestFrequency(t *testing.T) {
|
||||
d.LoadUserDictionary("../userdict.txt")
|
||||
if f, _ := d.Frequency("八一双鹿"); f != 3.0 {
|
||||
t.Fatalf("Wrong frequency for word \"八一双鹿\", expect 3.0, got %f", f)
|
||||
}
|
||||
|
||||
}
|
||||
|
||||
func TestTotal(t *testing.T) {
|
||||
d.LoadDictionary("../userdict.txt")
|
||||
if d.Total() != 319.0 {
|
||||
t.Fatalf("Wrong total for userdict.txt, expect 319.0, got %f", d.Total())
|
||||
}
|
||||
}
|
||||
|
||||
func TestLogTotal(t *testing.T) {
|
||||
d.LoadDictionary("../userdict.txt")
|
||||
if d.LogTotal() != math.Log(319.0) {
|
||||
t.Fatalf("Wrong total for userdict.txt, expect %f, got %f", math.Log(319.0), d.LogTotal())
|
||||
}
|
||||
}
|
||||
|
||||
func TestAddToken(t *testing.T) {
|
||||
d.LoadDictionary("../userdict.txt")
|
||||
token := Token{text: "超敏C反应蛋白", frequency: 100.0, pos: "nz"}
|
||||
d.AddToken(token)
|
||||
if f, _ := d.Frequency("超敏C反应蛋白"); f != 100.0 {
|
||||
t.Fatalf("Failed to add Token \"超敏C反应蛋白\", except frequency 100.0, got %f", f)
|
||||
}
|
||||
}
|
||||
@@ -17,3 +17,7 @@ func (t Token) Frequency() float64 {
|
||||
func (t Token) Pos() string {
|
||||
return t.pos
|
||||
}
|
||||
|
||||
func NewToken(text string, frequency float64, pos string) Token {
|
||||
return Token{text: text, frequency: frequency, pos: pos}
|
||||
}
|
||||
|
||||
Reference in New Issue
Block a user