不知为何程序乱了.....
library(tm)
library(tmcn)
library(Rwordseg)
# Word-frequency count over the review text stored in column `cont` of
# Data.csv. Steps: read the reviews, merge them into chunks, segment each
# chunk into words with segmentCN(), tabulate the words, and keep the
# frequent multi-character ones in `words` (columns: word, freq).

# Spell out `header`; `head = TRUE` relied on partial argument matching.
Data <- read.csv("Data.csv", header = TRUE, sep = ",")

# Coerce to character (the column may have been read as a factor) and drop
# missing entries so that paste() does not turn them into a literal "NA" token.
Review <- as.character(unlist(Data$cont))
Review <- Review[!is.na(Review)]

# Merge the reviews into chunks of `chunk_size` reviews each, presumably to
# bound the amount of text handed to a single segmentCN() call. The last chunk
# holds the remainder, so no review is dropped and no index runs past the end
# of `Review`.
chunk_size <- 2000L
times <- ceiling(length(Review) / chunk_size)
chunk_id <- ceiling(seq_along(Review) / chunk_size)
Rev <- vapply(
  split(Review, chunk_id),
  paste,
  character(1),
  collapse = " ",
  USE.NAMES = FALSE
)

# Segment every chunk. lapply() always yields a list with one element per
# chunk, even when there is only a single chunk.
# NOTE(review): this assumes segmentCN() returns a character vector of tokens
# for a single input string (its default return type) - confirm against the
# installed Rwordseg version. Under that assumption the tokens are used as-is;
# splitting them again on "" would break every word into single characters.
review <- lapply(Rev, segmentCN)

# Count every token and order the counts from most to least frequent.
result <- table(as.character(unlist(review)))
statistics <- sort(result, decreasing = TRUE)

# Build the frequency table from plain vectors. Passing the table object
# itself to data.frame() would expand it into two columns (freq.Var1 and
# freq.Freq) and leave no usable `freq` column.
words <- data.frame(
  word = as.character(names(statistics)),
  freq = as.vector(statistics),
  stringsAsFactors = FALSE
)

# Keep words longer than one character that occur at least 100 times.
words <- words[nchar(words$word) > 1 & words$freq >= 100, , drop = FALSE]


雷达卡




京公网安备 11010802022788号







