lunch-go/pkg/restaurants/html.go
2022-10-29 12:48:16 +02:00

85 lines
1.9 KiB
Go

package restaurants
import (
"errors"
"golang.org/x/net/html"
"golang.org/x/text/encoding/charmap"
)
// getAttribute looks up key among the attributes of node and returns the
// value of the first attribute whose key matches. It returns an error when
// node carries no attribute with that key.
func getAttribute(node *html.Node, key string) (string, error) {
	for i := 0; i < len(node.Attr); i++ {
		if node.Attr[i].Key != key {
			continue
		}
		return node.Attr[i].Val, nil
	}
	return "", errors.New("couldn't find the provided key")
}
// hasKeyValue reports whether node is an element node that has an attribute
// named key whose value is exactly value. Non-element nodes and elements
// lacking the attribute yield false.
func hasKeyValue(node *html.Node, key string, value string) bool {
	if node.Type != html.ElementNode {
		return false
	}
	got, err := getAttribute(node, key)
	return err == nil && got == value
}
// findNodeBy searches the tree rooted at node for the first element whose
// attribute key equals value. The node itself is tested first, then each
// child subtree in sibling order, so the first match in a depth-first
// traversal wins. An error is returned when nothing in the subtree matches.
func findNodeBy(node *html.Node, key string, value string) (*html.Node, error) {
	if hasKeyValue(node, key, value) {
		return node, nil
	}

	child := node.FirstChild
	for child != nil {
		// A failed lookup in one subtree is not fatal; move on to the next sibling.
		if found, err := findNodeBy(child, key, value); err == nil {
			return found, nil
		}
		child = child.NextSibling
	}

	return nil, errors.New("couldn't find a node with provided " + key + " \"" + value + "\"")
}
// findNodeByClass returns the first node under (and including) node whose
// "class" attribute equals class. The comparison is against the whole
// attribute value, not individual space-separated class names.
func findNodeByClass(node *html.Node, class string) (*html.Node, error) {
	const attrKey = "class"
	return findNodeBy(node, attrKey, class)
}
// findNodeById returns the first node under (and including) node whose "id"
// attribute equals id, or an error when no such node exists.
func findNodeById(node *html.Node, id string) (*html.Node, error) {
	const attrKey = "id"
	return findNodeBy(node, attrKey, id)
}
// getTextInternal returns the data of node when node is a text node and an
// error for any other node type. It does not look at node's children.
func getTextInternal(node *html.Node) (string, error) {
	if node.Type != html.TextNode {
		return "", errors.New("not a text node")
	}
	return node.Data, nil
}
// getText returns the text held by node. If node is itself a text node its
// data is returned; otherwise the data of the first direct child that is a
// text node is returned. Only immediate children are inspected, not deeper
// descendants. An error is returned when neither node nor any direct child
// is a text node.
func getText(node *html.Node) (string, error) {
	if own, err := getTextInternal(node); err == nil {
		return own, nil
	}

	for child := node.FirstChild; child != nil; child = child.NextSibling {
		if child.Type != html.TextNode {
			continue
		}
		return child.Data, nil
	}

	return "", errors.New("couldn't find a text node")
}
// getTextDecodeWindows1250 extracts the text of node with getText and passes
// it through decodeWindows1250. If no text can be extracted, the getText
// result and error are returned unchanged.
func getTextDecodeWindows1250(node *html.Node) (string, error) {
	raw, err := getText(node)
	if err == nil {
		return decodeWindows1250(raw)
	}
	return raw, err
}
// decodeWindows1250 runs text through a fresh Windows-1250 charmap decoder
// and returns the decoded string together with any error the decoder reports.
func decodeWindows1250(text string) (string, error) {
	return charmap.Windows1250.NewDecoder().String(text)
}