-
Notifications
You must be signed in to change notification settings - Fork 36
/
util.go
66 lines (61 loc) · 1.9 KB
/
util.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
package iok
import (
"golang.org/x/net/html"
"net/url"
"strings"
)
func extractHTML(node *html.Node, input *Input, funcs ...func(node *html.Node, input *Input)) {
for _, f := range funcs {
f(node, input)
}
for c := node.FirstChild; c != nil; c = c.NextSibling {
extractHTML(c, input, funcs...)
}
}
func extractEmbeddedAssets(node *html.Node, input *Input) {
if node.Type == html.ElementNode && node.Data == "style" && node.FirstChild != nil {
input.CSS = append(input.CSS, node.FirstChild.Data)
}
if node.Type == html.ElementNode && node.Data == "script" && node.FirstChild != nil {
input.JS = append(input.JS, node.FirstChild.Data)
}
}
func extractTitle(node *html.Node, input *Input) {
if node.Type == html.ElementNode &&
node.Data == "title" && // this is a <title> tag
node.Namespace == "" && // we're not within an <svg> element
node.FirstChild != nil {
input.Title = append(input.Title, strings.TrimSpace(node.FirstChild.Data))
}
}
// extractRequests analyses the html to determine what requests *would*
// be made if rendered in a browser.
// This is a subset of the actual requests made because this won't include
// any requests triggered dynamically e.g. by JavaScript or by CSS styles
func extractRequests(base *url.URL) func(node *html.Node, input *Input) {
return func(node *html.Node, input *Input) {
// TODO: handle <base> tag changing the base url
if node.Type != html.ElementNode {
return
}
for _, attr := range node.Attr {
var u string
switch {
case node.Data == "link" && attr.Key == "href": // todo: filter to just rel=stylesheet
fallthrough
case node.Data == "img" && attr.Key == "src":
fallthrough
case node.Data == "script" && attr.Key == "src":
u = attr.Val
}
if u == "" {
continue
}
href, err := url.Parse(u)
if err != nil {
continue
}
input.Requests = append(input.Requests, base.ResolveReference(href).String())
}
}
}