From 0ab75dabe3a9547b8cb716d950d5657eafb28293 Mon Sep 17 00:00:00 2001 From: horus_arch Date: Sun, 4 Feb 2018 15:37:50 +0100 Subject: Adds structured data processing. --- whiskyde.go | 17 ++++++++++++++++- 1 file changed, 16 insertions(+), 1 deletion(-) (limited to 'whiskyde.go') diff --git a/whiskyde.go b/whiskyde.go index 99df1ff..90032ba 100644 --- a/whiskyde.go +++ b/whiskyde.go @@ -7,7 +7,9 @@ import ( "github.com/gocolly/colly" ) -func ScrapeWhiskyde() { +func ScrapeWhiskyde() []Angebot { + Whiskys := []Angebot{} + c := colly.NewCollector( colly.AllowedDomains("whisky.de"), colly.AllowedDomains("www.whisky.de"), @@ -15,28 +17,41 @@ func ScrapeWhiskyde() { c.OnHTML(".is-buyable", func(e *colly.HTMLElement) { + W := Angebot{} + whisky_name := e.ChildAttr("a", "title") + W.Name = whisky_name whisky_url := e.ChildAttr("a", "href") + W.Url = whisky_url + log.Println(whisky_name) log.Println(whisky_url) e.ForEach(".article-price-original", func(i int, e *colly.HTMLElement) { + W.Original_price = e.ChildText("del") log.Println(e.ChildText("del")) }) e.ForEach(".article-price", func(i int, e *colly.HTMLElement) { + W.Discounted_price = e.ChildText(".article-price-default") log.Println(e.ChildText(".article-price-default")) }) e.ForEach(".article-thumbnail", func(i int, e *colly.HTMLElement) { + W.Image_url = e.ChildAttr("img", "data-src") log.Println(e.ChildAttr("img", "data-src")) }) e.ForEach(".article-price-prefix", func(i int, e *colly.HTMLElement) { + W.Valid_until = e.ChildText(".article-price-special") log.Println(e.ChildText(".article-price-special")) }) + Whiskys = append(Whiskys, W) + fmt.Println("") }) c.Visit("https://www.whisky.de/shop/Aktuell/Sonderangebote/") + + return Whiskys } -- cgit v1.2.3