diff options
| author | Max | 2018-02-01 16:13:56 +0100 |
|---|---|---|
| committer | Max | 2018-02-01 16:13:56 +0100 |
| commit | 35882837a2821749f3a2b1dfa23f19c4168004d3 (patch) | |
| tree | 5d6ac5078aebac93db47e507f564842d120bd1a3 /mcwhisky.go | |
| parent | a5bda60647639e787a777446dce693ac330fe940 (diff) | |
| download | alkobote-35882837a2821749f3a2b1dfa23f19c4168004d3.tar.gz | |
Crawled the first seven shops.
Diffstat (limited to 'mcwhisky.go')
| -rw-r--r-- | mcwhisky.go | 42 |
1 files changed, 42 insertions, 0 deletions
diff --git a/mcwhisky.go b/mcwhisky.go new file mode 100644 index 0000000..a70750f --- /dev/null +++ b/mcwhisky.go @@ -0,0 +1,42 @@ +package main + +import ( + "fmt" + "log" + // "strings" + + // "github.com/PuerkitoBio/goquery" + "github.com/gocolly/colly" +) + +func ScrapeMCWhisky() { + c := colly.NewCollector( + colly.AllowedDomains("mcwhisky.com"), + colly.AllowedDomains("www.mcwhisky.com"), + ) + + c.OnHTML("li.item", func(e *colly.HTMLElement) { + whisky_name := e.ChildAttr("a", "title") + whisky_url := e.ChildAttr("a", "href") + log.Println(whisky_name) + log.Println(whisky_url) + + e.ForEach(".price-box", func(i int, e *colly.HTMLElement) { + e.ForEach(".old-price", func(i int, e *colly.HTMLElement) { + log.Println(e.ChildText(".price")) + }) + e.ForEach(".special-price", func(i int, e *colly.HTMLElement) { + log.Println(e.ChildText(".price")) + }) + }) + log.Println(e.ChildAttr("img", "src")) + + fmt.Println("") + }) + + c.Visit("https://www.mcwhisky.com/whisky/whisky-sonderangebote.html") +} + +func main() { + ScrapeMCWhisky() +} |
