sergiolucero · November 9, 2017 19:00 · sergiolucero · Nov 9, 2017 · sergiolucero · Nov 9, 2017
diff --git a/wordcloud.R b/wordcloud.R
 library(tm);library(wordcloud);library(memoise)

 # Whitelist of books. Each value is the file stem that getTermMatrix()
 # validates against and substitutes into "./<stem>.txt.gz". The names look
 # like human-readable titles; they are not used in this section.
 # `<<-` is retained from the original so the scope of the binding is unchanged.
 books <<- as.list(c(
   "A Mid Summer Night's Dream" = "summer",
   "Glamorama" = "Glamorama1"
 ))

 # Build a term-frequency vector for one book.
 #
 # book: a single file stem that must be one of the values in `books`; the
 #       text is read from "./<book>.txt.gz" relative to the working directory.
 # Returns a named numeric vector (names are terms, values are total counts
 # across all lines), sorted by decreasing count.
 # Stops with "Unknown book" for anything that is not a single whitelisted value.
 # Wrapped in memoise() so repeated calls with the same book reuse the result.
 getTermMatrix <- memoise(function(book) {
   # The whitelist check also keeps arbitrary paths out of the sprintf() below.
   # The length guard turns NULL / multi-element input into the same clear error
   # instead of an obscure failure inside `if`.
   if (length(book) != 1L || !(book %in% books)) stop("Unknown book")
   text <- readLines(sprintf("./%s.txt.gz", book), encoding = "UTF-8")

   # Normalise the text: lower-case, then strip punctuation, digits and
   # stop words (SMART list plus a few archaic/common extras).
   corpus <- Corpus(VectorSource(text))
   corpus <- tm_map(corpus, content_transformer(tolower))
   corpus <- tm_map(corpus, removePunctuation)
   corpus <- tm_map(corpus, removeNumbers)
   corpus <- tm_map(
     corpus, removeWords,
     c(stopwords("SMART"), "thy", "thou", "thee", "the", "and", "but")
   )

   # tm (>= 0.6, which content_transformer() requires) does not recognise the
   # old `minWordLength` option, so it was silently ignored and terms shorter
   # than three characters were dropped. `wordLengths` is the supported way to
   # keep terms of length >= 1.
   tdm <- TermDocumentMatrix(corpus, control = list(wordLengths = c(1, Inf)))
   counts <- rowSums(as.matrix(tdm))
   sort(counts, decreasing = TRUE)
 })
	library(tm);library(wordcloud);library(memoise)

	# Whitelist of books. Each value is the file stem that getTermMatrix()
	# validates against and substitutes into "./<stem>.txt.gz". The names look
	# like human-readable titles; they are not used in this section.
	# `<<-` is retained from the original so the scope of the binding is unchanged.
	books <<- as.list(c(
	  "A Mid Summer Night's Dream" = "summer",
	  "Glamorama" = "Glamorama1"
	))

	# Build a term-frequency vector for one book.
	#
	# book: a single file stem that must be one of the values in `books`; the
	#       text is read from "./<book>.txt.gz" relative to the working directory.
	# Returns a named numeric vector (names are terms, values are total counts
	# across all lines), sorted by decreasing count.
	# Stops with "Unknown book" for anything that is not a single whitelisted value.
	# Wrapped in memoise() so repeated calls with the same book reuse the result.
	getTermMatrix <- memoise(function(book) {
	  # The whitelist check also keeps arbitrary paths out of the sprintf() below.
	  # The length guard turns NULL / multi-element input into the same clear error
	  # instead of an obscure failure inside `if`.
	  if (length(book) != 1L || !(book %in% books)) stop("Unknown book")
	  text <- readLines(sprintf("./%s.txt.gz", book), encoding = "UTF-8")

	  # Normalise the text: lower-case, then strip punctuation, digits and
	  # stop words (SMART list plus a few archaic/common extras).
	  corpus <- Corpus(VectorSource(text))
	  corpus <- tm_map(corpus, content_transformer(tolower))
	  corpus <- tm_map(corpus, removePunctuation)
	  corpus <- tm_map(corpus, removeNumbers)
	  corpus <- tm_map(
	    corpus, removeWords,
	    c(stopwords("SMART"), "thy", "thou", "thee", "the", "and", "but")
	  )

	  # tm (>= 0.6, which content_transformer() requires) does not recognise the
	  # old `minWordLength` option, so it was silently ignored and terms shorter
	  # than three characters were dropped. `wordLengths` is the supported way to
	  # keep terms of length >= 1.
	  tdm <- TermDocumentMatrix(corpus, control = list(wordLengths = c(1, Inf)))
	  counts <- rowSums(as.matrix(tdm))
	  sort(counts, decreasing = TRUE)
	})