- 분석예시
- WordCloud
김형준
Data Analyst
#' Clean a range of raw text lines for noun extraction
#'
#' Selects `data[start_line:end_line]`, removes the empty paragraph tag
#' `<P align=justify></P>`, blanks out punctuation, ASCII letters, tabs and
#' `+` characters, normalises whitespace and drops lines that end up empty.
#'
#' @param data Vector of text lines (indexed with `[`).
#' @param start_line Index of the first line to keep.
#' @param end_line Index of the last line to keep.
#' @return Character vector of cleaned, non-empty lines. Words stay separated
#'   by a single space; lines that are `NA` (for example when the requested
#'   range runs past the end of `data`) are dropped.
pre_processing <- function(data, start_line, end_line) {
  bodydata <- data[start_line:end_line]

  # The tag is a literal string, so match it without regex interpretation.
  bodydata <- gsub("<P align=justify></P>", "", bodydata, fixed = TRUE)

  # Every removed character becomes a space so neighbouring words stay apart.
  bodydata <- str_replace_all(bodydata, "[[:punct:]]|[a-zA-Z]|[\t+]", " ")

  # Collapse each whitespace run to ONE space. Replacing the run with "" (as
  # this step used to) glued the words on either side of removed text together.
  bodydata <- str_replace_all(bodydata, "[[:space:]][[:space:]]+", " ")

  # Strip the padding left at the line edges by the substitutions above.
  bodydata <- gsub("^[[:space:]]+|[[:space:]]+$", "", bodydata)

  # Keep only lines that still carry text; NA lines are discarded as well.
  bodydata[!is.na(bodydata) & nzchar(bodydata)]
}
#' Build a word-frequency table from cleaned text lines
#'
#' Applies `extractNoun` to every element of `bodydata`, tabulates all
#' returned words together and discards words that are exactly one character
#' long.
#'
#' @param bodydata Vector of text lines; each element is passed to
#'   `extractNoun` (not defined in this block -- presumably the KoNLP noun
#'   extractor; confirm against the package actually loaded).
#' @return A one-dimensional `table` of counts, named by word.
wordcloud_proc <- function(bodydata) {
  # table() receives an expression rather than a variable so that the
  # resulting dimnames stay unnamed.
  noun_freq <- table(unlist(lapply(bodydata, extractNoun)))

  is_single_char <- nchar(names(noun_freq)) == 1
  noun_freq[!is_single_char]
}
[source](http://www.hani.co.kr/arti/politics/politics_general/575390.html)
[source](http://stock.mt.co.kr/view/mtview.php?type=1&no=2008022510425323553)
[source](http://legacy.www.hani.co.kr/section-003000000/2003/02/003000000200302251026287.html)