-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathscrap.R
40 lines (27 loc) · 1.34 KB
/
scrap.R
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
library(dplyr)
library(rvest)
# Collect the links found inside the tables of the locally saved page
# html_data/apygardos.html and store them as absolute URLs, one per line.
ap <- read_html("html_data/apygardos.html", encoding = "utf-8")

# One attribute vector per <a> element nested inside any <table>.
apl <- ap %>%
  html_nodes("table") %>%
  html_nodes("a") %>%
  html_attrs()

# Prefix prepended to every href taken from the page.
link_pref <- "http://www.vrk.lt/2016-seimo/rezultatai"

# Build the URLs from the href attribute only. Pasting the prefix onto every
# attribute of an anchor (class, title, target, ...) would emit bogus URLs,
# and an anchor without any attribute would emit the bare prefix.
apl1 <- apl %>%
  lapply(function(attrs) {
    href <- unname(attrs["href"])
    # Anchors without an href contribute nothing.
    if (is.na(href)) character(0) else paste0(link_pref, href)
  }) %>%
  unlist()

# Part of each URL that follows the last "_rpgId-"; a URL that does not
# contain that marker is kept unchanged. Not used further in this script.
fn <- apl1 %>% gsub(".*_rpgId-", "", .)

writeLines(apl1, "link_data/apygardu_linkai.txt")
# Collect the links found in the third table of the locally saved page
# html_data/dm_apygardos.html and store them as absolute URLs, one per line.
# Relies on `link_pref` being defined earlier in the script.
dap <- read_html("html_data/dm_apygardos.html", encoding = "utf-8")

# All <table> nodes of the page; the second one is used later for the
# results table, the third one holds the links extracted here.
dapl <- dap %>% html_nodes("table")

# Build the URLs from the href attribute only. Pasting the prefix onto every
# attribute of an anchor (class, title, target, ...) would emit bogus URLs,
# and an anchor without any attribute would emit the bare prefix.
dapl1 <- dapl[[3]] %>%
  html_nodes("a") %>%
  html_attrs() %>%
  lapply(function(attrs) {
    href <- unname(attrs["href"])
    # Anchors without an href contribute nothing.
    if (is.na(href)) character(0) else paste0(link_pref, href)
  }) %>%
  unlist()

writeLines(dapl1, "link_data/dm_apygardu_linkai.txt")
# Build the results table from the second <table> of the page held in `dapl`
# (presumably the multi-member constituency results, going by the file
# names -- confirm). `format_dm_main_table` and `pnames2` are not defined in
# this script and must already exist in the session.
dmr <- format_dm_main_table(html_table(dapl[[2]], fill = TRUE))
colnames(dmr) <- c(
  "partijos_no", "partija", "apylinkes", "pastas",
  "balsai", "proc_rinkejai", "mandatai"
)

# Rows with an empty party number are dropped before the integer conversion.
dmr <- filter(dmr, partijos_no != "")
dmr <- mutate(
  dmr,
  partijos_no = as.integer(partijos_no),
  mandatai = as.integer(mandatai)
)

# Attach `partija1` from `pnames2`; the scraped name is kept as
# `partija_full` and `partija1` takes over the `partija` column name.
dmr <- inner_join(
  dmr,
  select(pnames2, partijos_no, partija1),
  by = "partijos_no"
)
dmr <- rename(dmr, partija_full = partija)
dmr <- rename(dmr, partija = partija1)

write.csv2(dmr, "csv_data/daugiamandaciu_rezultatai.csv", row.names = FALSE)

# NOTE(review): the vector below is never assigned or used, so it is only
# evaluated (and auto-printed when run at top level). It looks like column
# names intended for another table -- confirm whether it can be removed.
c(
  "partijos_no", "partija", "apylinkes", "pastas",
  "balsai", "proc_rinkejai", "proc_rinkejai_lt", "apygarda"
)