# WhatsApp tag cloud
# https://github.com/iPALVIKAS
# Build a word cloud from the chat export in "pog.txt".
#
# Steps: read the file, reduce the text to plain ASCII, clean it with the
# tm text-mining pipeline (German stop words and stemming), count how often
# each term occurs, and draw the most frequent terms with wordcloud().
library(tm)
library(wordcloud)

# Read the raw text. Quoting is disabled so that a stray double quote inside
# a message cannot make read.delim() merge several lines into one field, and
# text is kept as character rather than factor on older R versions.
d <- read.delim("pog.txt", header = FALSE, quote = "",
                stringsAsFactors = FALSE)

# Convert every column of the data frame that was just read (not the base
# function `data`) from latin1 to ASCII; characters that cannot be
# represented are dropped (sub = ""). The result is flattened into a single
# character vector with one element per cell.
d <- unlist(
  lapply(d, function(column) iconv(column, "latin1", "ASCII", sub = "")),
  use.names = FALSE
)
# Drop missing cells so they are not passed on as documents.
d <- d[!is.na(d)]

# Each element of `d` becomes one document of the corpus.
newCorpus <- Corpus(VectorSource(d))

# Normalise the text: lower-case, strip punctuation and digits, collapse
# whitespace, remove German stop words, then stem the remaining words.
newCorpus <- tm_map(newCorpus, content_transformer(tolower))
newCorpus <- tm_map(newCorpus, removePunctuation)
newCorpus <- tm_map(newCorpus, removeNumbers)
newCorpus <- tm_map(newCorpus, stripWhitespace)
newCorpus <- tm_map(newCorpus, removeWords, stopwords("german"))
newCorpus <- tm_map(newCorpus, stemDocument, language = "german")

# Document-term matrix: rows are documents, columns are terms.
ndtm <- DocumentTermMatrix(newCorpus)
nndtm <- as.matrix(ndtm)

# Total count per term, most frequent first.
f <- sort(colSums(nndtm), decreasing = TRUE)
words <- names(f)
freq <- unname(f)

# Plot terms that occur at least four times; the most frequent terms are
# placed first (random.order = FALSE).
wordcloud(
  words = words,
  freq = freq,
  min.freq = 4,
  scale = c(2, 0.5),
  random.order = FALSE,
  colors = brewer.pal(8, "Dark2")
)