summaryrefslogtreecommitdiff
path: root/whiskysitenl.go
diff options
context:
space:
mode:
authorMax2018-02-01 16:13:56 +0100
committerMax2018-02-01 16:13:56 +0100
commit35882837a2821749f3a2b1dfa23f19c4168004d3 (patch)
tree5d6ac5078aebac93db47e507f564842d120bd1a3 /whiskysitenl.go
parenta5bda60647639e787a777446dce693ac330fe940 (diff)
downloadalkobote-35882837a2821749f3a2b1dfa23f19c4168004d3.tar.gz
Crawled the first seven shops.
Diffstat (limited to 'whiskysitenl.go')
-rw-r--r--whiskysitenl.go44
1 files changed, 44 insertions, 0 deletions
diff --git a/whiskysitenl.go b/whiskysitenl.go
new file mode 100644
index 0000000..30af0ef
--- /dev/null
+++ b/whiskysitenl.go
@@ -0,0 +1,44 @@
+package main
+
+import (
+ "fmt"
+ "log"
+ "regexp"
+ "strings"
+
+ "github.com/gocolly/colly"
+)
+
+// ScrapeWhiskysitenl crawls the specials listing on www.whiskysite.nl and
+// logs, for every ".product-block" element on the page, the product name,
+// link, discounted price, regular price and image source.
+//
+// Nothing is returned: results go to the standard logger, and an empty line
+// is written to stdout after each product. A failure to fetch the listing is
+// logged rather than treated as fatal.
+func ScrapeWhiskysitenl() {
+	// Compiled once instead of once per product. Matches a number with a
+	// comma decimal separator, e.g. "49,95".
+	priceRe := regexp.MustCompile("[0-9]+(,[0-9]{1,2})")
+
+	// Each colly.AllowedDomains option replaces the allow-list set by an
+	// earlier one, so both host names have to be passed in a single call.
+	c := colly.NewCollector(
+		colly.AllowedDomains("whiskysite.nl", "www.whiskysite.nl"),
+	)
+
+	c.OnHTML(".product-block", func(e *colly.HTMLElement) {
+		name := e.ChildAttr("img", "alt")
+		link := e.ChildAttr("a", "href")
+		log.Println(name)
+		log.Println(link)
+
+		regularPrice := e.ChildText(".price-old")
+		// NOTE(review): the price block text presumably starts with the old
+		// price when one is present - confirm against the page markup. That
+		// prefix is stripped so the first price-looking token left over is
+		// the discounted price.
+		noisyPrice := e.ChildText(".product-block-price")
+		discountedPrice := priceRe.FindString(strings.TrimPrefix(noisyPrice, regularPrice))
+		log.Println(discountedPrice + "€")
+		// Normalise the regular price to the same "<amount>€" form.
+		log.Println(strings.TrimPrefix(regularPrice, "€") + "€")
+
+		log.Println(e.ChildAttr("img", "src"))
+
+		// Blank line on stdout after each product.
+		fmt.Println()
+	})
+
+	if err := c.Visit("https://www.whiskysite.nl/en/specials/?limit=100"); err != nil {
+		log.Printf("visiting whiskysite.nl specials: %v", err)
+	}
+}
+
+// main is the program entry point; it runs the whiskysite.nl scraper once.
+func main() {
+	ScrapeWhiskysitenl()
+}