diff options
Diffstat (limited to 'crawler/sanitize.go')
| -rw-r--r-- | crawler/sanitize.go | 30 |
1 files changed, 30 insertions, 0 deletions
diff --git a/crawler/sanitize.go b/crawler/sanitize.go new file mode 100644 index 0000000..ddcd4f6 --- /dev/null +++ b/crawler/sanitize.go @@ -0,0 +1,30 @@ +package main + +import ( + "log" + "regexp" + "strings" +) + +func sanitize_offer(angebote []Angebot) []Angebot { + + for _, offer := range angebote { + offer.Name = sanitize_name(offer.Name) + } + + return angebote +} + +func sanitize_name(name string) string { + if strings.Contains(name, "y.o.") { + name = strings.Replace(name, "y.o.", "Jahre", 1) + } + r_liter, err := regexp.Compile("[0-9]+([,.][0-9](([lL])| ([Ll]iter))?") + if err != nil { + log.Fatal(err) + } + name_liter := r_liter.FindString(name) + name = strings.Replace(name, name_liter, "", 1) + + return name +} |
