-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathgovid19.go
131 lines (120 loc) · 3.3 KB
/
govid19.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
package govid19
import (
"fmt"
"github.com/gocarina/gocsv"
"github.com/gocolly/colly"
"os"
"strconv"
"strings"
"time"
)
// Country is one scraped table row. The csv struct tags give the column
// headers used when a slice of Country values is marshalled with gocsv.
//
// Scrape fills the fields from successive cells of a row, starting with Name
// from the first cell; every numeric field is produced by parseToInt, so a
// cell that could not be parsed is stored as 0.
type Country struct {
	// Name is the inner HTML of the first child element of the row's first cell.
	Name string `csv:"country_other"`

	// Case and death counters.
	TotalCases  int `csv:"total_cases"`
	NewCases    int `csv:"new_cases"`
	TotalDeaths int `csv:"total_deaths"`
	NewDeaths   int `csv:"new_deaths"`

	// Outcome and severity counters.
	TotalRecovered  int `csv:"total_recovered"`
	ActiveCases     int `csv:"active_cases"`
	SeriousCritical int `csv:"seriousor_critical"`

	// Population-relative figures (presumably per one million inhabitants,
	// judging by the tag names; confirm against the scraped table header).
	TotalCases1MPop int `csv:"total_cases_1m_pop"`
	Deaths1MPop     int `csv:"deaths_1m_pop"`

	// Testing figures.
	TotalTests int `csv:"total_tests"`
	Tests1MPop int `csv:"tests_1m_pop"`
}
// parseToInt converts a human-formatted integer such as "1,234", " +56 " or
// "\n7,890\t" into an int.
//
// Thousands separators (",") and every Unicode white-space character
// (spaces, tabs, newlines, non-breaking spaces, ...) are removed before the
// remaining text is parsed as a base-10 integer. A leading "+" or "-" sign is
// accepted. Anything that still fails to parse, including the empty string or
// a value that does not fit in an int, yields 0.
func parseToInt(str string) int {
	// strings.Fields splits on any run of Unicode white space, so joining the
	// pieces back together drops leading, trailing and embedded white space.
	digits := strings.Join(strings.Fields(strings.ReplaceAll(str, ",", "")), "")

	// Atoi parses at the platform's int width, so an out-of-range value is
	// reported as an error instead of being silently truncated.
	n, err := strconv.Atoi(digits)
	if err != nil {
		return 0
	}
	return n
}
// WriteToCSV marshals countries with gocsv into a new file in the current
// working directory named "covid-<timestamp>.csv", where <timestamp> is the
// current time formatted as RFC 3339, and prints the chosen file name to
// standard output.
//
// It returns the error from creating the file, from marshalling, or, if both
// of those succeeded, from closing the file. Errors are returned unwrapped.
//
// NOTE(review): an RFC 3339 timestamp contains ':' characters, which are not
// valid in file names on Windows; the format is kept as-is so existing
// consumers of the file name are not affected.
func WriteToCSV(countries []*Country) (err error) {
	fn := fmt.Sprintf("covid-%s.csv", time.Now().Format(time.RFC3339))

	file, err := os.Create(fn)
	if err != nil {
		return err
	}
	// A failed Close on a file that was just written can mean the data never
	// reached disk, so surface it unless an earlier error is already pending.
	defer func() {
		if cerr := file.Close(); cerr != nil && err == nil {
			err = cerr
		}
	}()

	fmt.Printf("Saving scraped data in %s...\n", fn)
	return gocsv.MarshalFile(&countries, file)
}
// Scrape visits the worldometers coronavirus page and returns one Country for
// every "tr" inside "#main_table_countries_today > tbody" whose class
// attribute is not exactly "total_row_world".
//
// Cells are read by position. Column 0 supplies Name (the inner HTML of the
// cell's first child element). Columns 1 through 11 supply the numeric fields
// of Country in declaration order, each converted with parseToInt. Column 12
// is ignored, and any column beyond that is reported on standard output.
//
// The function has no error result, so a failed request is reported on
// standard error and whatever was collected so far is returned. The returned
// slice is never nil.
func Scrape() []*Country {
	url := "https://www.worldometers.info/coronavirus/"
	countries := []*Country{}

	c := colly.NewCollector()

	c.OnRequest(func(r *colly.Request) {
		fmt.Println("Visiting", r.URL)
	})

	c.OnHTML("#main_table_countries_today > tbody", func(body *colly.HTMLElement) {
		body.ForEach("tr", func(_ int, row *colly.HTMLElement) {
			if row.Attr("class") == "total_row_world" {
				return
			}

			country := &Country{}
			// numeric[i] receives the value of table column i+1.
			numeric := []*int{
				&country.TotalCases,
				&country.NewCases,
				&country.TotalDeaths,
				&country.NewDeaths,
				&country.TotalRecovered,
				&country.ActiveCases,
				&country.SeriousCritical,
				&country.TotalCases1MPop,
				&country.Deaths1MPop,
				&country.TotalTests,
				&country.Tests1MPop,
			}

			row.ForEach("td", func(col int, cell *colly.HTMLElement) {
				switch {
				case col == 0:
					if name, err := cell.DOM.Children().Html(); err == nil {
						country.Name = name
					}
				case col >= 1 && col <= len(numeric):
					if val, err := cell.DOM.Html(); err == nil {
						*numeric[col-1] = parseToInt(val)
					}
				case col == len(numeric)+1:
					// Column 12 has no matching field in Country. It used to
					// be stored into Tests1MPop, overwriting the value just
					// read from column 11; it is now skipped without a
					// message. NOTE(review): confirm what this column holds
					// before mapping it to a new field.
				default:
					fmt.Printf("Found extranous column in position %d\n", col)
				}
			})

			countries = append(countries, country)
		})
	})

	if err := c.Visit(url); err != nil {
		fmt.Fprintf(os.Stderr, "Visiting %s failed: %v\n", url, err)
	}
	return countries
}