Documentation
¶
Index ¶
Constants ¶
This section is empty.
Variables ¶
View Source
var (
SpanishStopWords = []string{ /* 443 elements not displayed */ }
)
View Source
var (
SpanishTokenizer = NewStopWordsTokenizer(SpanishStopWords)
)
Functions ¶
This section is empty.
Types ¶
type IsMarkNonSpacingChecker ¶
type IsMarkNonSpacingChecker struct{}
func (*IsMarkNonSpacingChecker) Contains ¶
func (c *IsMarkNonSpacingChecker) Contains(r rune) bool
type SimpleTokenizer ¶
type SimpleTokenizer struct {
Tf Transformer
}
func NewSimpleTokenizer ¶
func NewSimpleTokenizer() *SimpleTokenizer
func (*SimpleTokenizer) Tokenize ¶
func (s *SimpleTokenizer) Tokenize(payload []byte) [][]byte
func (*SimpleTokenizer) TokenizeSingle ¶
func (s *SimpleTokenizer) TokenizeSingle(payload []byte) ([]byte, bool)
type StopWordsTokenizer ¶
type StopWordsTokenizer struct {
T *SimpleTokenizer
// contains filtered or unexported fields
}
func NewStopWordsTokenizer ¶
func NewStopWordsTokenizer(stopWords []string) *StopWordsTokenizer
func (*StopWordsTokenizer) Tokenize ¶
func (st *StopWordsTokenizer) Tokenize(payload []byte) [][]byte
func (*StopWordsTokenizer) TokenizeSingle ¶
func (st *StopWordsTokenizer) TokenizeSingle(payload []byte) ([]byte, bool)
type Transformer ¶
Click to show internal directories.
Click to hide internal directories.