summaryrefslogtreecommitdiffstats
path: root/integrations/html_helper.go
blob: db4e2953e6c6bf49dd78850b3a75bf2ebdeb4d81 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
// Copyright 2017 The Gitea Authors. All rights reserved.
// Use of this source code is governed by a MIT-style
// license that can be found in the LICENSE file.

package integrations

import (
	"bytes"

	"golang.org/x/net/html"
)

type HtmlDoc struct {
	doc  *html.Node
	body *html.Node
}

func NewHtmlParser(content []byte) (*HtmlDoc, error) {
	doc, err := html.Parse(bytes.NewReader(content))
	if err != nil {
		return nil, err
	}

	return &HtmlDoc{doc: doc}, nil
}

func (doc *HtmlDoc) GetBody() *html.Node {
	if doc.body == nil {
		var b *html.Node
		var f func(*html.Node)
		f = func(n *html.Node) {
			if n.Type == html.ElementNode && n.Data == "body" {
				b = n
				return
			}
			for c := n.FirstChild; c != nil; c = c.NextSibling {
				f(c)
			}
		}
		f(doc.doc)
		if b != nil {
			doc.body = b
		} else {
			doc.body = doc.doc
		}
	}
	return doc.body
}

func (doc *HtmlDoc) GetAttribute(n *html.Node, key string) (string, bool) {
	for _, attr := range n.Attr {
		if attr.Key == key {
			return attr.Val, true
		}
	}
	return "", false
}

func (doc *HtmlDoc) checkAttr(n *html.Node, attr, val string) bool {
	if n.Type == html.ElementNode {
		s, ok := doc.GetAttribute(n, attr)
		if ok && s == val {
			return true
		}
	}
	return false
}

func (doc *HtmlDoc) traverse(n *html.Node, attr, val string) *html.Node {
	if doc.checkAttr(n, attr, val) {
		return n
	}

	for c := n.FirstChild; c != nil; c = c.NextSibling {
		result := doc.traverse(c, attr, val)
		if result != nil {
			return result
		}
	}

	return nil
}

func (doc *HtmlDoc) GetElementById(id string) *html.Node {
	return doc.traverse(doc.GetBody(), "id", id)
}

func (doc *HtmlDoc) GetInputValueById(id string) string {
	inp := doc.GetElementById(id)
	if inp == nil {
		return ""
	}

	val, _ := doc.GetAttribute(inp, "value")
	return val
}

func (doc *HtmlDoc) GetElementByName(name string) *html.Node {
	return doc.traverse(doc.GetBody(), "name", name)
}

func (doc *HtmlDoc) GetInputValueByName(name string) string {
	inp := doc.GetElementByName(name)
	if inp == nil {
		return ""
	}

	val, _ := doc.GetAttribute(inp, "value")
	return val
}