# Dictionary look-up examples.
# NOTE(review): corpus_subset(), dictionary(), dfm() and
# data_corpus_inaugural are not defined in this snippet; presumably the
# providing package is already attached -- confirm before running standalone.

# Keep only the documents whose Year value is greater than 1900.
mycorpus <- corpus_subset(data_corpus_inaugural, subset = Year > 1900)

# Build a dictionary from a named list: one named entry per line, each
# holding the character value(s) supplied for that entry.
mydict <- dictionary(
  list(
    christmas  = c("Christmas", "Santa", "holiday"),
    opposition = c("Opposition", "reject", "notincorpus"),
    taxing     = "taxing",
    taxation   = "taxation",
    taxregex   = "tax*",
    country    = "america"
  )
)

# Show the head of the dfm built from the corpus with this dictionary.
head(dfm(mycorpus, dictionary = mydict))

# Alternative form: pass the entries directly as named arguments instead
# of wrapping them in a list.
mydict2 <- dictionary(
  christmas  = c("Christmas", "Santa", "holiday"),
  opposition = c("Opposition", "reject", "notincorpus")
)
dfm(mycorpus, dictionary = mydict2)
## Not run: ------------------------------------
# # import the Laver-Garry dictionary from http://bit.ly/1FH2nvf
# lgdict <- dictionary(file = "http://www.kenbenoit.net/courses/essex2014qta/LaverGarry.cat",
# format = "wordstat")
# head(dfm(data_corpus_inaugural, dictionary = lgdict))
#
# # import a LIWC-formatted dictionary from http://www.moralfoundations.org
# mfdict <- dictionary(file = "http://ow.ly/VMRkL", format = "LIWC")
# head(dfm(data_corpus_inaugural, dictionary = mfdict))
## ---------------------------------------------
# Run the code above in your browser using DataLab