Documentation
¶
Index ¶
- Constants
- Variables
- type Jieba
- func (x *Jieba) AddWord(s string)
- func (x *Jieba) Cut(s string, hmm bool) []string
- func (x *Jieba) CutAll(s string) []string
- func (x *Jieba) CutForSearch(s string, hmm bool) []string
- func (x *Jieba) Extract(s string, topk int) []string
- func (x *Jieba) ExtractWithWeight(s string, topk int) []WordWeight
- func (x *Jieba) Free()
- func (x *Jieba) Tag(s string) []string
- func (x *Jieba) Tokenize(s string, mode TokenizeMode, hmm bool) []Word
- type TokenizeMode
- type Word
- type WordWeight
Examples ¶
Constants ¶
View Source
const TOTAL_DICT_PATH_NUMBER = 5
Variables ¶
Functions ¶
This section is empty.
Types ¶
type Jieba ¶
type Jieba struct {
// contains filtered or unexported fields
}
Example ¶
var s string var words []string use_hmm := true //equals with x := NewJieba(DICT_PATH, HMM_PATH, USER_DICT_PATH) x := NewJieba() defer x.Free() s = "我来到北京清华大学" words = x.CutAll(s) fmt.Println(s) fmt.Println("全模式:", strings.Join(words, "/")) words = x.Cut(s, use_hmm) fmt.Println(s) fmt.Println("精确模式:", strings.Join(words, "/")) s = "比特币" words = x.Cut(s, use_hmm) fmt.Println(s) fmt.Println("精确模式:", strings.Join(words, "/")) x.AddWord("比特币") s = "比特币" words = x.Cut(s, use_hmm) fmt.Println(s) fmt.Println("添加词典后,精确模式:", strings.Join(words, "/")) s = "他来到了网易杭研大厦" words = x.Cut(s, use_hmm) fmt.Println(s) fmt.Println("新词识别:", strings.Join(words, "/")) s = "小明硕士毕业于中国科学院计算所,后在日本京都大学深造" words = x.CutForSearch(s, use_hmm) fmt.Println(s) fmt.Println("搜索引擎模式:", strings.Join(words, "/")) s = "长春市长春药店" words = x.Tag(s) fmt.Println(s) fmt.Println("词性标注:", strings.Join(words, ",")) s = "区块链" words = x.Tag(s) fmt.Println(s) fmt.Println("词性标注:", strings.Join(words, ",")) s = "长江大桥" words = x.CutForSearch(s, !use_hmm) fmt.Println(s) fmt.Println("搜索引擎模式:", strings.Join(words, "/")) wordinfos := x.Tokenize(s, SearchMode, !use_hmm) fmt.Println(s) fmt.Println("Tokenize:", wordinfos)
Output: 我来到北京清华大学 全模式: 我/来到/北京/清华/清华大学/华大/大学 我来到北京清华大学 精确模式: 我/来到/北京/清华大学 比特币 精确模式: 比特/币 比特币 添加词典后,精确模式: 比特币 他来到了网易杭研大厦 新词识别: 他/来到/了/网易/杭研/大厦 小明硕士毕业于中国科学院计算所,后在日本京都大学深造 搜索引擎模式: 小明/硕士/毕业/于/中国/科学/学院/科学院/中国科学院/计算/计算所/,/后/在/日本/京都/大学/日本京都大学/深造 长春市长春药店 词性标注: 长春市/ns,长春/ns,药店/n 区块链 词性标注: 区块链/nz 长江大桥 搜索引擎模式: 长江/大桥/长江大桥 长江大桥 Tokenize: [{长江 0 6} {大桥 6 12} {长江大桥 0 12}]
func (*Jieba) ExtractWithWeight ¶
func (x *Jieba) ExtractWithWeight(s string, topk int) []WordWeight
type WordWeight ¶
Click to show internal directories.
Click to hide internal directories.