Платформа ЦРНП "Мирокод" для разработки проектов
https://git.mirocod.ru
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
171 lines
4.8 KiB
171 lines
4.8 KiB
package goquery |
|
|
|
import ( |
|
"bytes" |
|
|
|
"golang.org/x/net/html" |
|
) |
|
|
|
// used to determine if a set (map[*html.Node]bool) should be used |
|
// instead of iterating over a slice. The set uses more memory and |
|
// is slower than slice iteration for small N. |
|
const minNodesForSet = 1000 |
|
|
|
var nodeNames = []string{ |
|
html.ErrorNode: "#error", |
|
html.TextNode: "#text", |
|
html.DocumentNode: "#document", |
|
html.CommentNode: "#comment", |
|
} |
|
|
|
// NodeName returns the node name of the first element in the selection. |
|
// It tries to behave in a similar way as the DOM's nodeName property |
|
// (https://developer.mozilla.org/en-US/docs/Web/API/Node/nodeName). |
|
// |
|
// Go's net/html package defines the following node types, listed with |
|
// the corresponding returned value from this function: |
|
// |
|
// ErrorNode : #error |
|
// TextNode : #text |
|
// DocumentNode : #document |
|
// ElementNode : the element's tag name |
|
// CommentNode : #comment |
|
// DoctypeNode : the name of the document type |
|
// |
|
func NodeName(s *Selection) string { |
|
if s.Length() == 0 { |
|
return "" |
|
} |
|
return nodeName(s.Get(0)) |
|
} |
|
|
|
// nodeName returns the node name of the given html node. |
|
// See NodeName for additional details on behaviour. |
|
func nodeName(node *html.Node) string { |
|
if node == nil { |
|
return "" |
|
} |
|
|
|
switch node.Type { |
|
case html.ElementNode, html.DoctypeNode: |
|
return node.Data |
|
default: |
|
if node.Type >= 0 && int(node.Type) < len(nodeNames) { |
|
return nodeNames[node.Type] |
|
} |
|
return "" |
|
} |
|
} |
|
|
|
// OuterHtml returns the outer HTML rendering of the first item in |
|
// the selection - that is, the HTML including the first element's |
|
// tag and attributes. |
|
// |
|
// Unlike InnerHtml, this is a function and not a method on the Selection, |
|
// because this is not a jQuery method (in javascript-land, this is |
|
// a property provided by the DOM). |
|
func OuterHtml(s *Selection) (string, error) { |
|
var buf bytes.Buffer |
|
|
|
if s.Length() == 0 { |
|
return "", nil |
|
} |
|
n := s.Get(0) |
|
if err := html.Render(&buf, n); err != nil { |
|
return "", err |
|
} |
|
return buf.String(), nil |
|
} |
|
|
|
// Loop through all container nodes to search for the target node. |
|
func sliceContains(container []*html.Node, contained *html.Node) bool { |
|
for _, n := range container { |
|
if nodeContains(n, contained) { |
|
return true |
|
} |
|
} |
|
|
|
return false |
|
} |
|
|
|
// Checks if the contained node is within the container node. |
|
func nodeContains(container *html.Node, contained *html.Node) bool { |
|
// Check if the parent of the contained node is the container node, traversing |
|
// upward until the top is reached, or the container is found. |
|
for contained = contained.Parent; contained != nil; contained = contained.Parent { |
|
if container == contained { |
|
return true |
|
} |
|
} |
|
return false |
|
} |
|
|
|
// Checks if the target node is in the slice of nodes. |
|
func isInSlice(slice []*html.Node, node *html.Node) bool { |
|
return indexInSlice(slice, node) > -1 |
|
} |
|
|
|
// Returns the index of the target node in the slice, or -1. |
|
func indexInSlice(slice []*html.Node, node *html.Node) int { |
|
if node != nil { |
|
for i, n := range slice { |
|
if n == node { |
|
return i |
|
} |
|
} |
|
} |
|
return -1 |
|
} |
|
|
|
// Appends the new nodes to the target slice, making sure no duplicate is added. |
|
// There is no check to the original state of the target slice, so it may still |
|
// contain duplicates. The target slice is returned because append() may create |
|
// a new underlying array. If targetSet is nil, a local set is created with the |
|
// target if len(target) + len(nodes) is greater than minNodesForSet. |
|
func appendWithoutDuplicates(target []*html.Node, nodes []*html.Node, targetSet map[*html.Node]bool) []*html.Node { |
|
// if there are not that many nodes, don't use the map, faster to just use nested loops |
|
// (unless a non-nil targetSet is passed, in which case the caller knows better). |
|
if targetSet == nil && len(target)+len(nodes) < minNodesForSet { |
|
for _, n := range nodes { |
|
if !isInSlice(target, n) { |
|
target = append(target, n) |
|
} |
|
} |
|
return target |
|
} |
|
|
|
// if a targetSet is passed, then assume it is reliable, otherwise create one |
|
// and initialize it with the current target contents. |
|
if targetSet == nil { |
|
targetSet = make(map[*html.Node]bool, len(target)) |
|
for _, n := range target { |
|
targetSet[n] = true |
|
} |
|
} |
|
for _, n := range nodes { |
|
if !targetSet[n] { |
|
target = append(target, n) |
|
targetSet[n] = true |
|
} |
|
} |
|
|
|
return target |
|
} |
|
|
|
// Loop through a selection, returning only those nodes that pass the predicate |
|
// function. |
|
func grep(sel *Selection, predicate func(i int, s *Selection) bool) (result []*html.Node) { |
|
for i, n := range sel.Nodes { |
|
if predicate(i, newSingleSelection(n, sel.document)) { |
|
result = append(result, n) |
|
} |
|
} |
|
return result |
|
} |
|
|
|
// Creates a new Selection object based on the specified nodes, and keeps the |
|
// source Selection object on the stack (linked list). |
|
func pushStack(fromSel *Selection, nodes []*html.Node) *Selection { |
|
result := &Selection{nodes, fromSel.document, fromSel} |
|
return result |
|
}
|
|
|