Versions in this module

Expand all Collapse all

v0
    v0.1.1 Dec 12, 2022
    v0.1.0 Dec 12, 2022

Changes in this version

+ var DefaultExtrator = &Extractor
+ var LINEREAK = fmt.Sprintln()
+ func CleanDoc(doc *goquery.Document)
+ func GetHTMLContent(articleContent *goquery.Selection) string
+ func GetTextContent(articleContent *goquery.Selection, customRender *TextRenderers) string
+ type Article struct
    + HTML string
    + Images []string
    + Meta Metadata
    + Text string
    + URL string
    + func FromReader(reader io.Reader, url *nurl.URL) (Article, error)
    + func FromURL(url *nurl.URL, timeout time.Duration) (Article, error)
+ type Extractor struct
    + CustomTextRenderers *TextRenderers
    + TextLineBreak string
    + func (extractor *Extractor) FromReader(reader io.Reader, url *nurl.URL) (Article, error)
    + func (extractor *Extractor) FromReaderWithSelector(reader io.Reader, selector string, url *nurl.URL) (Article, error)
    + func (extractor *Extractor) FromURL(url *nurl.URL, timeout time.Duration) (Article, error)
+ type Metadata struct
    + Author string
    + Excerpt string
    + Image string
    + MaxReadTime int
    + MinReadTime int
    + Title string
+ type RenderFunc func(node *html.Node, buf *bytes.Buffer)
+ type TextRenderers struct
    + LineBreak string
    + func NewNoobTextRenderers(lineBreak string) *TextRenderers
    + func NewTextRenderers(lineBreak string) *TextRenderers
    + func (r *TextRenderers) Register(tag string, before, after RenderFunc) error
    + func (r *TextRenderers) WriteLineBreak(buf *bytes.Buffer)