| @@ -153,10 +153,10 @@ parse_speech <- function(speech_xml, date) { | |||||
| } | } | ||||
| } else if (xml_name(node) == "kommentar") { | } else if (xml_name(node) == "kommentar") { | ||||
| # comments are of the form | # comments are of the form | ||||
| # <kommentar>(blabla [Fraktion] – blabla liasdf – bla)</kommentar> | |||||
| # <kommentar>(blabla [Fraktion] \u2013 blabla liasdf \u2013 bla)</kommentar> | |||||
| xml_text(node) %>% | xml_text(node) %>% | ||||
| str_sub(2, -2) %>% | str_sub(2, -2) %>% | ||||
| str_split("–") %>% | |||||
| str_split("\u2013") %>% | |||||
| `[[`(1) %>% | `[[`(1) %>% | ||||
| lapply(parse_comment, speech_id = speech_id, on_speaker = cur_speaker) -> | lapply(parse_comment, speech_id = speech_id, on_speaker = cur_speaker) -> | ||||
| cs | cs | ||||
| @@ -64,7 +64,7 @@ repair_talks <- function(talks) { | |||||
| #' | #' | ||||
| #' returns a lookup table | #' returns a lookup table | ||||
| lookup_speaker <- function(tb, speaker, name_variable) { | lookup_speaker <- function(tb, speaker, name_variable) { | ||||
| tobereplaced <- "[-–—‑- ]" | |||||
| tobereplaced <- "[\u002D\u2013\u2014\u2011\u00AD ]" | |||||
| speaker %>% | speaker %>% | ||||
| unite(name, prename, lastname, sep=".*") %>% | unite(name, prename, lastname, sep=".*") %>% | ||||
| mutate(name = str_replace_all(name, tobereplaced, ".*")) -> | mutate(name = str_replace_all(name, tobereplaced, ".*")) -> | ||||