1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
|
package main
import (
"fmt"
"time"
_ "database/sql"
_ "github.com/go-sql-driver/mysql"
//_ "github.com/mattn/go-sqlite3"
log "github.com/Sirupsen/logrus"
"github.com/jmoiron/sqlx"
flag "github.com/spf13/pflag"
)
// App carries the state that main hands to the individual processing steps
// (table creation, shop import, scraping, post-processing).
type App struct {
	// Offers is a list of Angebot records. It is not filled in this file;
	// presumably the scraping step populates it — TODO confirm.
	Offers []Angebot
	// Shops is a list of Shop records. It is not filled in this file;
	// presumably it mirrors the shops table — TODO confirm.
	Shops []Shop
	// Config points at main's private copy of the package-level configuration.
	Config *Config
	// DB is the database handle opened by main via sqlx.Connect.
	DB *sqlx.DB
	// Now is the Unix timestamp (seconds) taken once when main starts.
	Now int64
	// Debug is not set in this file; presumably it toggles verbose
	// behaviour elsewhere — TODO confirm.
	Debug bool
}
// main is the program entry point. It performs, in order:
//
//  1. take a private copy of the global configuration and blank the global,
//  2. connect to the configured database and ping it,
//  3. create the tables and insert the known shops,
//  4. load the shops, then either
//     - log every shop and exit when the "list-shops" flag is "true", or
//     - run the database fix-up and exit when Config.FixDatabase is set, or
//     - scrape all shops and run the post-processing step.
//
// Every failure is reported through Fatal.
func main() {
	// Work on a private copy of the global configuration so that the rest of
	// the program does not depend on the global, then overwrite the global
	// with an empty Config.
	ownConfig := _conf
	app := App{
		Config: &ownConfig,
		Now:    time.Now().Unix(),
	}
	_conf = Config{}

	var err error
	cfg := app.Config
	switch cfg.DBDriver {
	case "sqlite3":
		// sqlite only needs the path of the database file.
		app.DB, err = sqlx.Connect(cfg.DBDriver, cfg.DBPath)
	default:
		// The password is deliberately not part of the log message.
		msg := fmt.Sprintf(`Connecting to "%s" database "%s" as user "%s" on host "%s:%s" with extra options "%s".`, cfg.DBDriver, cfg.DBDBName, cfg.DBUser, cfg.DBHost, cfg.DBPort, cfg.DBOptions)
		log.Debug(msg)

		// Data source name: user:password@tcp(host:port)/dbname<options>
		credentials := cfg.DBUser + ":" + cfg.DBPassword
		address := "tcp(" + cfg.DBHost + ":" + cfg.DBPort + ")"
		dsn := credentials + "@" + address + "/" + cfg.DBDBName + cfg.DBOptions
		app.DB, err = sqlx.Connect(cfg.DBDriver, dsn)
	}
	if err != nil {
		Fatal(err, "Cannot connect to database")
	}

	// NOTE(review): sqlx.Connect is documented to ping already, so this
	// second ping looks redundant — kept to preserve behaviour.
	if err = app.DB.Ping(); err != nil {
		Fatal(err, "No connection to database")
	}
	// NOTE(review): if Fatal terminates the process, this deferred Close
	// will not run on the error paths below — confirm against Fatal.
	defer app.DB.Close()

	if err = app.createTables(); err != nil {
		Fatal(err, "Creating table failed")
	}
	if err = app.insertShops(); err != nil {
		Fatal(err, "Inserting shops failed")
	}

	shops, err := app.getShops()
	if err != nil {
		Fatal(err, "Getting shops failed")
	}

	// List mode: print all crawlable shops and stop.
	if listFlag := flag.Lookup("list-shops"); listFlag != nil && listFlag.Value.String() == "true" {
		// Raise the log level to Info so the entries below are emitted.
		log.SetLevel(log.InfoLevel)
		for _, s := range shops {
			fields := log.Fields{
				"shop_id":        s.Id,
				"shop_url":       s.Url,
				"shop_short_url": s.Short_url,
				"shop_logo_url":  s.Logo_url,
				"shipping costs": s.Shipping_costs,
				"free shipping":  s.Free_shipping,
			}
			log.WithFields(fields).Info(s.Name)
		}
		return
	}

	// Fix mode: rerun the sanitizing functions over the database and stop.
	if app.Config.FixDatabase {
		if err = app.fix_db(); err != nil {
			Fatal(err, "Fix: Fixing database failed")
		}
		return
	}

	// Normal run: scrape every shop, then post-process the result.
	app.ScrapeHTML(shops)

	// Presumably this is where short URLs are generated — TODO confirm.
	if err = app.post_process(); err != nil {
		Fatal(err, "Post processing failed")
	}
}
|