diff options
| author | horus_arch | 2018-02-04 15:37:50 +0100 |
|---|---|---|
| committer | horus_arch | 2018-02-04 15:37:50 +0100 |
| commit | 0ab75dabe3a9547b8cb716d950d5657eafb28293 (patch) | |
| tree | 66cd62c1212a074e8e24a449a7b7ab1b808f27ae /whiskyde.go | |
| parent | b42583bf37db833649e7687655e2623cf50716db (diff) | |
| download | alkobote-0ab75dabe3a9547b8cb716d950d5657eafb28293.tar.gz | |
Adds structured data processing.
Diffstat (limited to 'whiskyde.go')
| -rw-r--r-- | whiskyde.go | 17 |
1 files changed, 16 insertions, 1 deletions
diff --git a/whiskyde.go b/whiskyde.go index 99df1ff..90032ba 100644 --- a/whiskyde.go +++ b/whiskyde.go @@ -7,7 +7,9 @@ import ( "github.com/gocolly/colly" ) -func ScrapeWhiskyde() { +func ScrapeWhiskyde() []Angebot { + Whiskys := []Angebot{} + c := colly.NewCollector( colly.AllowedDomains("whisky.de"), colly.AllowedDomains("www.whisky.de"), @@ -15,28 +17,41 @@ func ScrapeWhiskyde() { c.OnHTML(".is-buyable", func(e *colly.HTMLElement) { + W := Angebot{} + whisky_name := e.ChildAttr("a", "title") + W.Name = whisky_name whisky_url := e.ChildAttr("a", "href") + W.Url = whisky_url + log.Println(whisky_name) log.Println(whisky_url) e.ForEach(".article-price-original", func(i int, e *colly.HTMLElement) { + W.Original_price = e.ChildText("del") log.Println(e.ChildText("del")) }) e.ForEach(".article-price", func(i int, e *colly.HTMLElement) { + W.Discounted_price = e.ChildText(".article-price-default") log.Println(e.ChildText(".article-price-default")) }) e.ForEach(".article-thumbnail", func(i int, e *colly.HTMLElement) { + W.Image_url = e.ChildAttr("img", "data-src") log.Println(e.ChildAttr("img", "data-src")) }) e.ForEach(".article-price-prefix", func(i int, e *colly.HTMLElement) { + W.Valid_until = e.ChildText(".article-price-special") log.Println(e.ChildText(".article-price-special")) }) + Whiskys = append(Whiskys, W) + fmt.Println("") }) c.Visit("https://www.whisky.de/shop/Aktuell/Sonderangebote/") + + return Whiskys } |
