Documentation ¶
Overview ¶
Package htmlquery provides extract data from HTML documents using XPath expression.
Index ¶
- Variables
- func ExistsAttr(n *html.Node, name string) bool
- func Find(top *html.Node, expr string) []*html.Node
- func FindOne(top *html.Node, expr string) *html.Node
- func InnerText(n *html.Node) string
- func LoadDoc(path string) (*html.Node, error)
- func LoadURL(url string) (*html.Node, error)
- func OutputHTML(n *html.Node, self bool) string
- func Parse(r io.Reader) (*html.Node, error)
- func Query(top *html.Node, expr string) (*html.Node, error)
- func QueryAll(top *html.Node, expr string) ([]*html.Node, error)
- func QuerySelector(top *html.Node, selector *xpath.Expr) *html.Node
- func QuerySelectorAll(top *html.Node, selector *xpath.Expr) []*html.Node
- func SelectAttr(n *html.Node, name string) (val string)
- type NodeNavigator
- func (h *NodeNavigator) Copy() xpath.NodeNavigator
- func (h *NodeNavigator) Current() *html.Node
- func (h *NodeNavigator) LocalName() string
- func (h *NodeNavigator) MoveTo(other xpath.NodeNavigator) bool
- func (h *NodeNavigator) MoveToChild() bool
- func (h *NodeNavigator) MoveToFirst() bool
- func (h *NodeNavigator) MoveToNext() bool
- func (h *NodeNavigator) MoveToNextAttribute() bool
- func (h *NodeNavigator) MoveToParent() bool
- func (h *NodeNavigator) MoveToPrevious() bool
- func (h *NodeNavigator) MoveToRoot()
- func (h *NodeNavigator) NodeType() xpath.NodeType
- func (*NodeNavigator) Prefix() string
- func (h *NodeNavigator) String() string
- func (h *NodeNavigator) Value() string
Constants ¶
This section is empty.
Variables ¶
var DisableSelectorCache = false
DisableSelectorCache will disable caching for the query selector if value is true.
var SelectorCacheMaxEntries = 50
SelectorCacheMaxEntries allows how many selector object can be caching. Default is 50. Will disable caching if SelectorCacheMaxEntries <= 0.
Functions ¶
func ExistsAttr ¶ added in v1.2.4
ExistsAttr returns whether attribute with specified name exists.
func Find ¶
Find is like QueryAll but Will panics if the expression `expr` cannot be parsed.
See `QueryAll()` function.
func FindOne ¶
FindOne is like Query but will panics if the expression `expr` cannot be parsed. See `Query()` function.
func LoadURL ¶
LoadURL loads the HTML document from the specified URL. Default enabling gzip on a HTTP request.
func OutputHTML ¶
OutputHTML returns the text including tags name.
func Query ¶ added in v1.1.0
Query runs the given XPath expression against the given html.Node and returns the first matching html.Node, or nil if no matches are found.
Returns an error if the expression `expr` cannot be parsed.
func QueryAll ¶ added in v1.1.0
QueryAll searches the html.Node that matches by the specified XPath expr. Return an error if the expression `expr` cannot be parsed.
func QuerySelector ¶ added in v1.1.0
QuerySelector returns the first matched html.Node by the specified XPath selector.
func QuerySelectorAll ¶ added in v1.1.0
QuerySelectorAll searches all of the html.Node that matches the specified XPath selectors.
Types ¶
type NodeNavigator ¶
type NodeNavigator struct {
// contains filtered or unexported fields
}
func CreateXPathNavigator ¶
func CreateXPathNavigator(top *html.Node) *NodeNavigator
CreateXPathNavigator creates a new xpath.NodeNavigator for the specified html.Node.
func (*NodeNavigator) Copy ¶
func (h *NodeNavigator) Copy() xpath.NodeNavigator
func (*NodeNavigator) Current ¶
func (h *NodeNavigator) Current() *html.Node
func (*NodeNavigator) LocalName ¶
func (h *NodeNavigator) LocalName() string
func (*NodeNavigator) MoveTo ¶
func (h *NodeNavigator) MoveTo(other xpath.NodeNavigator) bool
func (*NodeNavigator) MoveToChild ¶
func (h *NodeNavigator) MoveToChild() bool
func (*NodeNavigator) MoveToFirst ¶
func (h *NodeNavigator) MoveToFirst() bool
func (*NodeNavigator) MoveToNext ¶
func (h *NodeNavigator) MoveToNext() bool
func (*NodeNavigator) MoveToNextAttribute ¶
func (h *NodeNavigator) MoveToNextAttribute() bool
func (*NodeNavigator) MoveToParent ¶
func (h *NodeNavigator) MoveToParent() bool
func (*NodeNavigator) MoveToPrevious ¶
func (h *NodeNavigator) MoveToPrevious() bool
func (*NodeNavigator) MoveToRoot ¶
func (h *NodeNavigator) MoveToRoot()
func (*NodeNavigator) NodeType ¶
func (h *NodeNavigator) NodeType() xpath.NodeType
func (*NodeNavigator) Prefix ¶
func (*NodeNavigator) Prefix() string
func (*NodeNavigator) String ¶
func (h *NodeNavigator) String() string
func (*NodeNavigator) Value ¶
func (h *NodeNavigator) Value() string