From 35882837a2821749f3a2b1dfa23f19c4168004d3 Mon Sep 17 00:00:00 2001 From: Max Date: Thu, 1 Feb 2018 16:13:56 +0100 Subject: Crawled the first seven shops. --- whiskyde.go | 46 ++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 46 insertions(+) create mode 100644 whiskyde.go (limited to 'whiskyde.go') diff --git a/whiskyde.go b/whiskyde.go new file mode 100644 index 0000000..aa00279 --- /dev/null +++ b/whiskyde.go @@ -0,0 +1,46 @@ +package main + +import ( + "fmt" + "log" + + "github.com/gocolly/colly" +) + +func ScrapeWhiskyde() { + c := colly.NewCollector( + colly.AllowedDomains("whisky.de"), + colly.AllowedDomains("www.whisky.de"), + ) + + c.OnHTML(".is-buyable", func(e *colly.HTMLElement) { + + whisky_name := e.ChildAttr("a", "title") + whisky_url := e.ChildAttr("a", "href") + log.Println(whisky_name) + log.Println(whisky_url) + + e.ForEach(".article-price-original", func(i int, e *colly.HTMLElement) { + log.Println(e.ChildText("del")) + }) + e.ForEach(".article-price", func(i int, e *colly.HTMLElement) { + log.Println(e.ChildText(".article-price-default")) + }) + + e.ForEach(".article-thumbnail", func(i int, e *colly.HTMLElement) { + log.Println(e.ChildAttr("img", "data-src")) + }) + + e.ForEach(".article-price-prefix", func(i int, e *colly.HTMLElement) { + log.Println(e.ChildText(".article-price-special")) + }) + + fmt.Println("") + }) + + c.Visit("https://www.whisky.de/shop/Aktuell/Sonderangebote/") +} + +func main() { + ScrapeWhiskyde() +} -- cgit v1.2.3