# R: wordcloud dari dua sumber (word cloud from two sources)
# Jump to navigation
# Jump to search
library(NLP)
library(RColorBrewer)
library(tm)
library(wordcloud)
# Lower-case `x` without letting a tolower() failure abort the caller.
#
# The whole vector is converted in one vectorised call first. Only if that
# call signals an error is each element retried on its own, so a single
# unconvertible string becomes NA instead of discarding every other element
# (previously any error collapsed the entire result to one scalar NA).
#
# Args:
#   x: a character vector, or an object tolower() can coerce to character.
#
# Returns:
#   The lower-cased character vector, same length as `x`; elements for which
#   tolower() raised an error are NA_character_.
tryTolower <- function(x) {
  # Per-element conversion used only on the fallback path.
  lower_one <- function(s) {
    tryCatch(tolower(s), error = function(e) NA_character_)
  }

  tryCatch(
    tolower(x),
    error = function(e) {
      vapply(as.character(x), lower_one, character(1), USE.NAMES = FALSE)
    }
  )
}
# Stop-word list used when cleaning text: the English list returned by
# stopwords() plus four extra terms specific to this analysis.
custom.stopwords <- c(
  stopwords("english"),
  "sorry", "amp", "delta", "amazon"
)
# Normalise a vector of raw text before it is turned into a corpus.
#
# Steps, in order: lower-case, drop stop words, drop punctuation, drop
# digits, then collapse whitespace. Whitespace is collapsed last so that the
# gaps left behind by removed words, punctuation and numbers are squeezed
# too (collapsing before removeNumbers() left runs of spaces in the result).
#
# Args:
#   text.vec:   character vector of documents to clean.
#   stop.words: character vector of words to remove; defaults to the
#               script-level `custom.stopwords`.
#
# Returns:
#   The cleaned character vector, same length as `text.vec`.
clean.vec <- function(text.vec, stop.words = custom.stopwords) {
  text.vec <- tryTolower(text.vec)
  # Stop words go before punctuation -- presumably so that list entries
  # containing apostrophes can still match; confirm before reordering.
  text.vec <- removeWords(text.vec, stop.words)
  text.vec <- removePunctuation(text.vec)
  text.vec <- removeNumbers(text.vec)
  stripWhitespace(text.vec)
}
# Build a commonality word cloud from two CSV sources.
# Both files are expected to provide a `text` column (assumed from the
# `$text` accesses below -- confirm against the data files).
amzn <- read.csv("amzn_cs.csv", stringsAsFactors = FALSE)
delta <- read.csv("oct_delta.csv", stringsAsFactors = FALSE)

amzn.vec <- clean.vec(amzn$text)
delta.vec <- clean.vec(delta$text)

# Collapse each source into a single string so the corpus holds exactly one
# document per source.
amzn.vec <- paste(amzn.vec, collapse = " ")
delta.vec <- paste(delta.vec, collapse = " ")

# One document per source, in the same order as the column labels assigned
# below. (A second assignment used to overwrite this with the Delta text
# twice, so the cloud compared Delta with itself.)
all <- c(amzn.vec, delta.vec)

corpus <- VCorpus(VectorSource(all))
tdm <- TermDocumentMatrix(corpus)
tdm.m <- as.matrix(tdm)
colnames(tdm.m) <- c("Amazon", "delta")

# Show the available palettes, then take the "Purples" palette and drop its
# first four of eight shades (presumably the lightest ones -- verify).
display.brewer.all()
pal <- brewer.pal(8, "Purples")
pal <- pal[-(1:4)]

commonality.cloud(tdm.m, max.words = 200, random.order = FALSE, colors = pal)