-
Lucas Schons authored
Code owners
Assign users and groups as approvers for specific file changes. Learn more.
ExtractFromXML.R 420 B
#!/usr/bin/env Rscript
library(xml2)
# Extract the text of every <title> and <text> element from the Wikipedia XML
# file and store the two as the columns of a data frame, which is then written
# out both as an RDS file and as a text table.
data <- read_xml("../data/Wikipedia-20181120103842.xml")

# xml_text() is vectorised over node sets and always returns a character
# vector (character(0) when nothing matches), so wrapping it in sapply() is
# unnecessary and would return an empty list for an empty node set.
title.nodes <- xml_find_all(data, ".//title")
titles <- xml_text(title.nodes)
text.nodes <- xml_find_all(data, ".//text")
texts <- xml_text(text.nodes)

# Titles and texts are paired purely by position. data.frame() silently
# recycles the shorter vector when the lengths divide evenly, which would
# attach texts to the wrong titles, so fail loudly instead.
if (length(titles) != length(texts)) {
  stop(
    "Found ", length(titles), " <title> nodes but ", length(texts),
    " <text> nodes; cannot pair them by position.",
    call. = FALSE
  )
}

# Keep both columns as character vectors regardless of the R version in use
# (data.frame() converted strings to factors by default before R 4.0).
df.out <- data.frame(Title = titles,
                     Text = texts,
                     stringsAsFactors = FALSE)

saveRDS(df.out, "../data/texte.RDS")
# NOTE(review): with its default arguments write.table() produces a
# space-separated file that includes row names, despite the .csv extension.
# Left unchanged because readers of this file may rely on the current format.
write.table(df.out, "../data/texte.csv")