网页抓取(web scraping)后保存 .txt 文件,且不含空白项
这是我的代码,用于使用R进行网页抓取(web scraping),效果很好。webscraping后保存.txt文件,不带空格,r,R,这是我的代码,用于使用R进行网页抓取(web scraping),效果很好 require(httr) require(rvest) library(KoNLP) useSejongDic() total = c() site = "http://movie.daum.net/moviedb/grade? movieId=92107&type=netizen&page=" for( i in 1:10){ url = paste0(site, i); mention = GET(
# Scrape netizen reviews for one movie from Daum, extract the nouns with
# KoNLP, and write them to a text file (one entry per line).
library(httr)
library(rvest)
library(KoNLP)
useSejongDic()

# Build the URL prefix from pieces so that no line break can end up inside
# the string literal (a newline in the query string yields an invalid URL).
site <- paste0(
  "http://movie.daum.net/moviedb/grade?",
  "movieId=92107&type=netizen&page="
)

# Fetch review pages 1-10; each list element holds the review texts found on
# one page.
pages <- lapply(1:10, function(i) {
  GET(paste0(site, i)) %>%
    read_html() %>%
    html_nodes("p.desc_review") %>%
    html_text() %>%
    repair_encoding()
})

# Flatten into a single character vector. rbind() in a loop would build a
# matrix and silently recycle values whenever two pages return a different
# number of reviews.
total <- unlist(pages)

# Strip the tabs and newlines that surround each review in the page markup.
total <- gsub("[\t\n]", "", total)

# Extract the nouns of every review and flatten them into one vector.
noun <- lapply(total, extractNoun)
undata <- unlist(noun)

# NOTE: undata can still contain blank entries at this point; they are
# written to the file as blank lines.
write(undata, "C:\\Users\\dlgof\\DATA.txt")
但是,生成的 .txt 文件中有太多空白内容,该如何删除它们?
看起来您的 undata 中有很多 “”(空白项)。请在写入文件之前加上下面这行代码:
# Drop empty and whitespace-only entries so they are not written as blank
# lines; comparing against " " alone would leave "" entries in place.
undata <- undata[nzchar(trimws(undata))]