Documentation ¶
Overview ¶
Package htmlquery provides extract data from HTML documents using XPath expression.
Index ¶
- Variables
- func ExistsAttr(n *html.Node, name string) bool
- func Find(top *html.Node, expr string) []*html.Node
- func FindOne(top *html.Node, expr string) *html.Node
- func InnerText(n *html.Node) string
- func LoadDoc(path string) (*html.Node, error)
- func LoadURL(url string) (*html.Node, error)
- func OutputHTML(n *html.Node, self bool) string
- func Parse(r io.Reader) (*html.Node, error)
- func Query(top *html.Node, expr string) (*html.Node, error)
- func QueryAll(top *html.Node, expr string) ([]*html.Node, error)
- func QuerySelector(top *html.Node, selector *xpath.Expr) *html.Node
- func QuerySelectorAll(top *html.Node, selector *xpath.Expr) []*html.Node
- func SelectAttr(n *html.Node, name string) (val string)
- type NodeNavigator
- func (h *NodeNavigator) Copy() xpath.NodeNavigator
- func (h *NodeNavigator) Current() *html.Node
- func (h *NodeNavigator) LocalName() string
- func (h *NodeNavigator) MoveTo(other xpath.NodeNavigator) bool
- func (h *NodeNavigator) MoveToChild() bool
- func (h *NodeNavigator) MoveToFirst() bool
- func (h *NodeNavigator) MoveToNext() bool
- func (h *NodeNavigator) MoveToNextAttribute() bool
- func (h *NodeNavigator) MoveToParent() bool
- func (h *NodeNavigator) MoveToPrevious() bool
- func (h *NodeNavigator) MoveToRoot()
- func (h *NodeNavigator) NodeType() xpath.NodeType
- func (*NodeNavigator) Prefix() string
- func (h *NodeNavigator) String() string
- func (h *NodeNavigator) Value() string
Constants ¶
This section is empty.
Variables ¶
var DisableSelectorCache = false
DisableSelectorCache will disable caching for the query selector if value is true.
var Exports = map[string]interface{}{ "LoadHTMLDocument": func(htmlText interface{}) (*html.Node, error) { return Parse(strings.NewReader(utils.InterfaceToString(htmlText))) }, "Find": Find, "FindOne": FindOne, "QueryAll": QueryAll, "Query": Query, "InnerText": InnerText, "SelectAttr": SelectAttr, "ExistedAttr": ExistsAttr, "CreateXPathNavigator": CreateXPathNavigator, "OutputHTML": func(doc *html.Node) string { return OutputHTML(doc, false) }, "OutputHTMLSelf": func(doc *html.Node) string { return OutputHTML(doc, true) }, }
var SelectorCacheMaxEntries = 50
SelectorCacheMaxEntries allows how many selector object can be caching. Default is 50. Will disable caching if SelectorCacheMaxEntries <= 0.
Functions ¶
func ExistsAttr ¶
ExistsAttr returns whether attribute with specified name exists.
func Find ¶
Find is like QueryAll but Will panics if the expression `expr` cannot be parsed.
See `QueryAll()` function.
func FindOne ¶
FindOne is like Query but will panics if the expression `expr` cannot be parsed. See `Query()` function.
func OutputHTML ¶
OutputHTML returns the text including tags name.
func Query ¶
Query runs the given XPath expression against the given html.Node and returns the first matching html.Node, or nil if no matches are found.
Returns an error if the expression `expr` cannot be parsed.
func QueryAll ¶
QueryAll searches the html.Node that matches by the specified XPath expr. Return an error if the expression `expr` cannot be parsed.
func QuerySelector ¶
QuerySelector returns the first matched html.Node by the specified XPath selector.
func QuerySelectorAll ¶
QuerySelectorAll searches all of the html.Node that matches the specified XPath selectors.
Types ¶
type NodeNavigator ¶
type NodeNavigator struct {
// contains filtered or unexported fields
}
func CreateXPathNavigator ¶
func CreateXPathNavigator(top *html.Node) *NodeNavigator
CreateXPathNavigator creates a new xpath.NodeNavigator for the specified html.Node.
func (*NodeNavigator) Copy ¶
func (h *NodeNavigator) Copy() xpath.NodeNavigator
func (*NodeNavigator) Current ¶
func (h *NodeNavigator) Current() *html.Node
func (*NodeNavigator) LocalName ¶
func (h *NodeNavigator) LocalName() string
func (*NodeNavigator) MoveTo ¶
func (h *NodeNavigator) MoveTo(other xpath.NodeNavigator) bool
func (*NodeNavigator) MoveToChild ¶
func (h *NodeNavigator) MoveToChild() bool
func (*NodeNavigator) MoveToFirst ¶
func (h *NodeNavigator) MoveToFirst() bool
func (*NodeNavigator) MoveToNext ¶
func (h *NodeNavigator) MoveToNext() bool
func (*NodeNavigator) MoveToNextAttribute ¶
func (h *NodeNavigator) MoveToNextAttribute() bool
func (*NodeNavigator) MoveToParent ¶
func (h *NodeNavigator) MoveToParent() bool
func (*NodeNavigator) MoveToPrevious ¶
func (h *NodeNavigator) MoveToPrevious() bool
func (*NodeNavigator) MoveToRoot ¶
func (h *NodeNavigator) MoveToRoot()
func (*NodeNavigator) NodeType ¶
func (h *NodeNavigator) NodeType() xpath.NodeType
func (*NodeNavigator) Prefix ¶
func (*NodeNavigator) Prefix() string
func (*NodeNavigator) String ¶
func (h *NodeNavigator) String() string
func (*NodeNavigator) Value ¶
func (h *NodeNavigator) Value() string