0
# Load the packages used below: tm, wordcloud and RColorBrewer.

library(tm)
library(wordcloud)

library(RColorBrewer)

# Read the input text file into a character vector, one element per line.
speech="/Users/GregDuncan/Desktop/bills.txt"
modi_txt = readLines(speech)


# Build a corpus from the lines that were read.
modi<-Corpus(VectorSource(modi_txt))


# Clean-up steps, applied in this order: strip whitespace, lower-case,
# remove numbers, remove punctuation, remove English stop words.
modi_data<-tm_map(modi,stripWhitespace)

modi_data<-tm_map(modi_data,tolower)

modi_data<-tm_map(modi_data,removeNumbers)

modi_data<-tm_map(modi_data,removePunctuation)

# NOTE(review): the quotes around english on the next line are typographic
# (curly) quotes, not ASCII double quotes. This is the line Rscript rejects
# with "unexpected input".
modi_data<-tm_map(modi_data,removeWords, stopwords(“english”))


tdm_modi<-TermDocumentMatrix (modi_data) # Build a term-document matrix from the cleaned corpus

TDM1<-as.matrix(tdm_modi) # Convert the term-document matrix to a plain matrix

v = sort(rowSums(TDM1), decreasing = TRUE) # Row sums (one per term), sorted in decreasing order

# NOTE(review): R is case-sensitive; summary() with a lower-case "s" is
# presumably what was intended here.
Summary(v)


# NOTE(review): the quotes around Dark2 are also non-ASCII and trigger the
# second "unexpected input" error. max.words=1 presumably limits the plot to a
# single word -- confirm that is intended.
wordcloud (modi_data, scale=c(5,0.5), max.words=1, random.order=FALSE, rot.per=0.35, use.r.layout=FALSE, colors=brewer.pal(8, “Dark2″))

所以我试图从一个文档中制作一个词云。我正在尝试使用 Rscript 运行它,但遇到了这样的问题

  Error: unexpected input in "modi_data<-tm_map(modi_data,removeWords, stopwords(?"
  Execution halted

   unexpected input in "wordcloud (modi_data, scale=c(5,0.5), max.words=1, random.order=FALSE, rot.per=0.35, use.r.layout=FALSE, colors=brewer.pal(8, �"

我对 R 很陌生,所以我试图学习基础知识。不知道有没有经验的人能很快看到问题

4

1 回答 1

0

请注意下面的更改,修改后应该可以运行。我使用了 tm 包中的 crude 数据集。

# Build a word cloud from the `crude` example corpus that ships with tm.
library(tm)
library(wordcloud)
library(RColorBrewer)

# `crude` is already a tm corpus, so it is used directly. Wrapping it in
# Corpus(VectorSource(...)) would treat the document objects as raw strings.
data(crude)
modi_txt <- crude
modi <- modi_txt

# Text clean-up, applied in order: collapse whitespace, lower-case, drop
# numbers, drop punctuation, drop English stop words.
modi_data <- tm_map(modi, stripWhitespace)

# tolower() is a plain base function, so it is wrapped in content_transformer()
# to keep every element a tm text document. This replaces the earlier
# tm_map(modi_data, PlainTextDocument) workaround.
modi_data <- tm_map(modi_data, content_transformer(tolower))
modi_data <- tm_map(modi_data, removeNumbers)
modi_data <- tm_map(modi_data, removePunctuation)

# NB: the quote marks must be plain ASCII double quotes. Typographic quotes
# (for example after copying from Word) cause "unexpected input".
modi_data <- tm_map(modi_data, removeWords, stopwords("english"))

# Term-document matrix -> plain matrix -> per-term totals, most frequent first.
tdm_modi <- TermDocumentMatrix(modi_data)
TDM1 <- as.matrix(tdm_modi)
v <- sort(rowSums(TDM1), decreasing = TRUE)

summary(v) # NB: needs a lower-case "s"

# Pass the frequencies computed above instead of the corpus, so wordcloud()
# does not rebuild the term-document matrix internally.
# NB: max.words = 1 draws only the single most frequent term; raise it
# (e.g. to 100) for a fuller cloud. The palette name also needs ASCII quotes.
wordcloud(
  words = names(v),
  freq = v,
  scale = c(5, 0.5),
  max.words = 1,
  random.order = FALSE,
  rot.per = 0.35,
  use.r.layout = FALSE,
  colors = brewer.pal(8, "Dark2")
)

这里的结果看起来有些奇怪,您可以尝试调整 wordcloud 的参数。

在此处输入图像描述

于 2015-05-22T01:33:54.590 回答