# niderhoff
# 8/17/2017 - 8:08 AM
#
# WhatsApp tag cloud

# https://github.com/iPALVIKAS
# Load the chat export from "pog.txt" as a data frame without a header row.
# Text columns are kept as character so they can be re-encoded below.
# NOTE(review): read.delim() splits on tabs and honours double quotes, so
# messages containing those characters may be split or merged -- confirm this
# is acceptable for the export format.
d <- read.delim("pog.txt", header = FALSE, stringsAsFactors = FALSE)

# Re-encode every column from latin1 to ASCII, dropping each byte that has no
# ASCII equivalent (sub = "").
# The previous version iterated over `data` instead of `d`; unless a variable
# of that name happens to exist, R resolves `data` to the utils::data
# function, so the text read above was never the thing being converted.
# vapply() pins the result type: a character matrix with one column per input
# column (or a plain character vector when the file has a single row), which
# is the shape sapply() produced for well-formed input.
d <- vapply(
  d,
  function(column) iconv(as.character(column), "latin1", "ASCII", sub = ""),
  character(nrow(d))
)

library(tm)

# Build a corpus from the elements of `d`, then normalise the text:
# lower-case it, strip punctuation and digits, and collapse runs of
# whitespace.
newCorpus <- Corpus(VectorSource(d))
newCorpus <- tm_map(newCorpus, content_transformer(tolower))
newCorpus <- tm_map(newCorpus, removePunctuation)
newCorpus <- tm_map(newCorpus, removeNumbers)
newCorpus <- tm_map(newCorpus, stripWhitespace)

# The input text was reduced to ASCII when it was loaded, which deletes
# umlauts and sharp s (the German word for "for" arrives here as "fr").
# The stock German stop-word list still contains the accented spellings, so
# those entries would never match. Remove both the original stop words and
# their ASCII-stripped variants, produced with the same iconv() settings that
# were applied to the input.
german_stops <- enc2utf8(stopwords("german"))
german_stops <- unique(c(
  german_stops,
  iconv(german_stops, "UTF-8", "ASCII", sub = "")
))
newCorpus <- tm_map(newCorpus, removeWords, german_stops)

# Stem last, so stop words are matched against whole words rather than stems.
newCorpus <- tm_map(newCorpus, stemDocument, language = "german")

# Tabulate the corpus (documents in rows, terms in columns) and expand the
# result to an ordinary dense matrix.
ndtm <- DocumentTermMatrix(newCorpus)
nndtm <- as.matrix(ndtm)

library(wordcloud)

# Total occurrences of each term over all documents, most frequent first.
f <- sort(colSums(nndtm), decreasing = TRUE)

# Split the named counts into two parallel vectors: the terms themselves and
# their bare (unnamed) frequencies.
words <- names(f)
freq <- unname(f)

# Draw the cloud. Terms seen fewer than four times are left out, and
# random.order = FALSE plots terms in decreasing order of frequency.
# NOTE(review): brewer.pal() is not defined in this file; presumably it is
# made available by RColorBrewer being attached along with wordcloud.
cloud_colours <- brewer.pal(8, "Dark2")
wordcloud(
  words = words,
  freq = freq,
  scale = c(2, 0.5),
  min.freq = 4,
  random.order = FALSE,
  colors = cloud_colours
)