summaryrefslogtreecommitdiff
path: root/crawler/utility.go
blob: 17ed47bc2c82c73718473f791e18a45a4dcf5289 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
package main

import (
	"log"
	"regexp"
	"strconv"
	"strings"

	"github.com/gocolly/colly"
)

/*
 * spirit_type_patterns lists the recognised spirit categories together with
 * the pattern that identifies each one in a product name. The entries are
 * tried in order and the first match wins. The patterns are compiled once at
 * package initialisation instead of on every call.
 */
var spirit_type_patterns = []struct {
	label   string
	pattern *regexp.Regexp
}{
	{"Gin", regexp.MustCompile(`(^|\s)Gin(\s|$)`)},
	{"Rum", regexp.MustCompile(`(^|\s)Rum(\s|$)`)},
	{"Wodka", regexp.MustCompile(`(^|\s)[VW]odka(\s|$)`)},
	{"Whisky", regexp.MustCompile(`(^|\s)Whiske?y(\s|$)`)},
}

/*
 * detect_spirit_type classifies a product name by looking for a spirit
 * keyword that stands alone, i.e. is preceded by the start of the string or
 * whitespace and followed by whitespace or the end of the string. Matching is
 * case-sensitive.
 *
 * Returns "Gin", "Rum", "Wodka" (for both "Vodka" and "Wodka") or "Whisky"
 * (for both "Whisky" and "Whiskey"). If no keyword is found the fallback
 * category "Verschiedenes" is returned.
 */
func detect_spirit_type(name string) string {
	for _, candidate := range spirit_type_patterns {
		if candidate.pattern.MatchString(name) {
			return candidate.label
		}
	}

	return "Verschiedenes"
}

/*
 * liter_volume_pattern matches a decimal number (comma or dot as decimal
 * separator), an optional single space and a litre unit written as "l", "L",
 * "liter" or "Liter". The number itself is captured in group 1. The pattern
 * is compiled once at package initialisation instead of on every call.
 */
var liter_volume_pattern = regexp.MustCompile(`([0-9]+(?:[,.][0-9]+)?) ?[lL](?:iter)?`)

/*
 * extract_volume finds the first "<number> l" style quantity inside volume
 * and returns the number as a float32. A decimal comma is accepted and
 * converted to a dot before parsing.
 *
 * If volume contains no such quantity, or the number cannot be parsed, 0 and
 * the error reported by strconv.ParseFloat are returned.
 */
func extract_volume(volume string) (float32, error) {
	// When nothing matches, the empty string is handed to ParseFloat on
	// purpose so that the caller receives its regular syntax error.
	var number string
	if groups := liter_volume_pattern.FindStringSubmatch(volume); groups != nil {
		number = groups[1]
	}

	number = strings.Replace(number, ",", ".", 1)
	parsed, err := strconv.ParseFloat(number, 32)
	if err != nil {
		return 0, err
	}

	return float32(parsed), nil
}

/*
 * extract_abv converts a textual alcohol-by-volume value such as "37,5 %"
 * into a float32. The first "%" is removed, the first "," is turned into a
 * ".", and surrounding whitespace is trimmed before parsing.
 *
 * Returns 0 and the strconv.ParseFloat error when the cleaned text is not a
 * valid number.
 */
func extract_abv(abv_noisy string) (float32, error) {
	// Replace leaves the string untouched when the substring is absent.
	cleaned := strings.Replace(abv_noisy, "%", "", 1)
	cleaned = strings.TrimSpace(strings.Replace(cleaned, ",", ".", 1))

	parsed, err := strconv.ParseFloat(cleaned, 32)
	if err == nil {
		return float32(parsed), nil
	}

	return 0, err
}

/*
 * get_volume reads the raw "volume" value from the request context of e and
 * returns it as a float32 (in litres).
 *
 * If the raw text contains neither "l" nor "L", it is logged and 0 is
 * returned. If extract_volume fails on the raw text, the text and the error
 * are logged and the program exits through log.Fatal.
 */
func get_volume(e *colly.HTMLElement) float32 {
	raw := e.Request.Ctx.Get("volume")

	has_unit, match_err := regexp.MatchString(`[lL](iter)?`, raw)
	if match_err != nil {
		log.Fatal(match_err)
	}

	if has_unit {
		liters, parse_err := extract_volume(raw)
		if parse_err != nil {
			log.Println("get_volume: " + raw)
			log.Fatal(parse_err)
		}
		return liters
	}

	log.Println("get_volume: not matched: " + raw)
	return 0
}

/*
 * get_abv reads the raw "abv" value from the request context of e and
 * returns it as a float32 (in percent).
 *
 * An empty value yields 0. If extract_abv fails on the raw text, the text
 * and the error are logged and the program exits through log.Fatal.
 */
func get_abv(e *colly.HTMLElement) float32 {
	raw := e.Request.Ctx.Get("abv")
	if len(raw) == 0 {
		return 0
	}

	percent, parse_err := extract_abv(raw)
	if parse_err == nil {
		return percent
	}

	log.Println("get_abv: " + raw)
	log.Fatal(parse_err)
	// Only needed to satisfy the compiler; log.Fatal does not return.
	return percent
}