# NOT RUN {
# Build the document-feature matrix used by the examples below.
# Tokenize explicitly: calling dfm() directly on a corpus is deprecated as of
# quanteda 3.0 (and dropped in later releases), while dfm(tokens(x)) is
# accepted by old and new versions alike.
# NOTE(review): data_corpus_irishbudget2010 appears to ship with
# quanteda.textmodels in quanteda >= 2.0 -- confirm that package is attached.
dfmat1 <- dfm(tokens(data_corpus_irishbudget2010))
# lemmatization: collapse every inflected form listed in `lis` onto the
# single feature "focus" (one replacement is supplied per pattern)
lis <- c(
  "foci", "focus", "focused", "focuses",
  "focusing", "focussed", "focusses"
)
lemma <- rep("focus", times = length(lis))
dfmat2 <- dfm_replace(
  dfmat1,
  pattern = lis,
  replacement = lemma
)
# list the feature names that still match any of the original forms
featnames(
  dfm_select(dfmat2, pattern = lis)
)
# stemming: replace each feature by its Porter stem via dfm_replace(), then
# compare the result with dfm_wordstem() applied to the same matrix
feat <- featnames(dfmat1)
featstem <- char_wordstem(feat, language = "porter")
dfmat3 <- dfm_replace(
  dfmat1,
  pattern = feat,
  replacement = featstem,
  case_insensitive = FALSE
)
identical(
  dfmat3,
  dfm_wordstem(dfmat1, language = "porter")
)
# }
# Run the code above in your browser using DataLab