summary refs log tree commit diff
path: root/bottleworld.go
diff options
context:
space:
mode:
Diffstat (limited to 'bottleworld.go')
-rw-r--r-- bottleworld.go 52
1 files changed, 52 insertions, 0 deletions
diff --git a/bottleworld.go b/bottleworld.go
new file mode 100644
index 0000000..2f5991a
--- /dev/null
+++ b/bottleworld.go
@@ -0,0 +1,52 @@
+package main
+
+import (
+ "fmt"
+ "log"
+ "regexp"
+ // "strings"
+
+ // "github.com/PuerkitoBio/goquery"
+ "github.com/gocolly/colly"
+)
+
+// ScrapeBottleWord visits the bottleworld.de listing at
+// /aktuelle-sonderpreise/show/all and logs every listed product whose name
+// contains "Whisky" or "Whiskey".
+//
+// For each matching "li.item" element it logs, in order: the product name
+// (text of "h2 > a"), the href of an "a" element inside the item, the
+// ".price" text found under ".old-price" and ".special-price" within each
+// ".price-box", and the src of an "img" element inside the item. An empty
+// line is written to standard output after every product.
+//
+// The function takes no arguments and returns nothing; if the listing cannot
+// be visited the error is logged.
+func ScrapeBottleWord() {
+	// Compile the name filter once instead of once per listed product.
+	whiskyName := regexp.MustCompile("Whiske?y")
+
+	// Each AllowedDomains option replaces the collector's domain list, so both
+	// hosts must be passed in a single call for both to be permitted.
+	c := colly.NewCollector(
+		colly.AllowedDomains("bottleworld.de", "www.bottleworld.de"),
+	)
+
+	c.OnHTML("li.item", func(item *colly.HTMLElement) {
+		name := item.ChildText("h2 > a")
+		if !whiskyName.MatchString(name) {
+			return
+		}
+
+		log.Println(name)
+		log.Println(item.ChildAttr("a", "href"))
+
+		item.ForEach(".price-box", func(_ int, box *colly.HTMLElement) {
+			box.ForEach(".old-price", func(_ int, old *colly.HTMLElement) {
+				log.Println(old.ChildText(".price"))
+			})
+			box.ForEach(".special-price", func(_ int, special *colly.HTMLElement) {
+				log.Println(special.ChildText(".price"))
+			})
+		})
+		log.Println(item.ChildAttr("img", "src"))
+
+		// Blank separator line between products.
+		fmt.Println()
+	})
+
+	// Surface fetch failures instead of silently producing no output.
+	if err := c.Visit("https://www.bottleworld.de/aktuelle-sonderpreise/show/all"); err != nil {
+		log.Printf("visiting bottleworld.de listing: %v", err)
+	}
+}
+
+// main is the program entry point; it runs ScrapeBottleWord once and then
+// returns.
+func main() {
+	ScrapeBottleWord()
+}