1
0
mirror of https://github.com/fumiama/jieba.git synced 2026-06-24 05:06:23 +08:00

fs.File -> io.Reader

This commit is contained in:
源文雨
2022-12-03 10:54:06 +08:00
parent 35ac98dc5f
commit 36c17a10b5
11 changed files with 28 additions and 28 deletions

View File

@@ -1,7 +1,7 @@
package tokenizers
import (
"io/fs"
"io"
"regexp"
"strconv"
@@ -42,7 +42,7 @@ Parameters:
"交换机" as a single word. If searchMode is true, it will further split
this word into "交换", "换机", which are valid Chinese words.
*/
func NewJiebaTokenizer(dictFile fs.File, hmm, searchMode bool) (analysis.Tokenizer, error) {
func NewJiebaTokenizer(dictFile io.Reader, hmm, searchMode bool) (analysis.Tokenizer, error) {
seg, err := jieba.LoadDictionary(dictFile)
return &JiebaTokenizer{
seg: seg,
@@ -131,7 +131,7 @@ JiebaTokenizerConstructor creates a JiebaTokenizer.
Parameter config should contain at least one parameter:
file: the path of the dictionary file or fs.File.
file: the path of the dictionary file or io.Reader.
hmm: optional, specify whether to use Hidden Markov Model, see NewJiebaTokenizer for details.
@@ -150,7 +150,7 @@ func JiebaTokenizerConstructor(config map[string]interface{}, cache *registry.Ca
if ok {
return NewJiebaTokenizerAt(dictFilePath, hmm, searchMode)
}
dictFile := config["file"].(fs.File)
dictFile := config["file"].(io.Reader)
return NewJiebaTokenizer(dictFile, hmm, searchMode)
}