Documentation ¶
Index ¶
- func IsTimeoutError(err error) bool
- func SuggestRespToSuggestions(data []byte) ([]string, error)
- type DOMPaths
- type DOMPathsImages
- type EngineBase
- func (e EngineBase) Get(ctx *colly.Context, urll string, anonUrll string) error
- func (e EngineBase) GetName() engines.Name
- func (e EngineBase) GetOrigins() []engines.Name
- func (e *EngineBase) Init(ctx context.Context)
- func (e *EngineBase) InitSearcher(ctx context.Context)
- func (e *EngineBase) InitSuggester(ctx context.Context)
- func (e *EngineBase) OnHTML(goquerySelector string, f colly.HTMLCallback)
- func (e *EngineBase) OnRequest(f colly.RequestCallback)
- func (e *EngineBase) OnResponse(f colly.ResponseCallback)
- func (e EngineBase) PageFromContext(ctx *colly.Context) int
- func (e EngineBase) Post(ctx *colly.Context, urll string, body io.Reader, anonBody string) error
- func (e EngineBase) Wait()
- type Enginer
- type ImageSearcher
- type PageRankCounter
- type Suggester
- type WebSearcher
Constants ¶
This section is empty.
Variables ¶
This section is empty.
Functions ¶
func IsTimeoutError ¶
func SuggestRespToSuggestions ¶ added in v0.22.0
Converts an opensearch.xml-compatible suggestions API JSON response to a slice of suggestions.
Types ¶
type DOMPathsImages ¶
type EngineBase ¶
type EngineBase struct {
	Name    engines.Name
	Origins []engines.Name
	// contains filtered or unexported fields
}
Base struct for every search engine.
func (EngineBase) Get ¶
func (e EngineBase) Get(ctx *colly.Context, urll string, anonUrll string) error
func (EngineBase) GetName ¶
func (e EngineBase) GetName() engines.Name
Used to get the name of the search engine.
func (EngineBase) GetOrigins ¶
func (e EngineBase) GetOrigins() []engines.Name
Used to get the origins of the search engine.
func (*EngineBase) Init ¶
func (e *EngineBase) Init(ctx context.Context)
Used to initialize the EngineBase collector.
func (*EngineBase) InitSearcher ¶ added in v0.26.0
func (e *EngineBase) InitSearcher(ctx context.Context)
Used to initialize the EngineBase collector for searching web/images.
func (*EngineBase) InitSuggester ¶ added in v0.26.0
func (e *EngineBase) InitSuggester(ctx context.Context)
Used to initialize the EngineBase collector for fetching search suggestions.
func (*EngineBase) OnHTML ¶
func (e *EngineBase) OnHTML(goquerySelector string, f colly.HTMLCallback)
OnHTML registers a function. The function will be executed on every HTML element matched by the goquerySelector parameter. A GoQuery selector is a selector used by https://github.com/PuerkitoBio/goquery.
func (*EngineBase) OnRequest ¶
func (e *EngineBase) OnRequest(f colly.RequestCallback)
OnRequest registers a function. Function will be executed on every request made by the Collector.
func (*EngineBase) OnResponse ¶
func (e *EngineBase) OnResponse(f colly.ResponseCallback)
OnResponse registers a function. Function will be executed on every response.
func (EngineBase) PageFromContext ¶
func (e EngineBase) PageFromContext(ctx *colly.Context) int
func (EngineBase) Wait ¶
func (e EngineBase) Wait()
Wait returns when the collector jobs are finished.
type ImageSearcher ¶ added in v0.28.5
type ImageSearcher interface {
	Enginer
	InitSearcher(context.Context)
	ImageSearch(string, options.Options, chan result.ResultScraped) ([]error, bool)
}
Interface that each search engine must implement to support searching image results.
type PageRankCounter ¶
type PageRankCounter struct {
// contains filtered or unexported fields
}
A goroutine-safe counter for PageRank.
func NewPageRankCounter ¶
func NewPageRankCounter(pages int) PageRankCounter
Create a new PageRankCounter.
func (*PageRankCounter) GetPlusOne ¶
func (prc *PageRankCounter) GetPlusOne(page int) int
Get the current count for the given page, plus one.
func (*PageRankCounter) Increment ¶
func (prc *PageRankCounter) Increment(page int)
Increment the count for a page.