# NOT RUN {
# Build a tokens object from a list of character vectors in which multi-word
# expressions are already joined with a custom concatenator ("-").
lis <- list(
  c(
    "The", "United-States", "has", "the", "Atlantic-Ocean",
    "and", "the", "Pacific-Ocean", "."
  )
)
toks <- as.tokens(lis, concatenator = "-")

# Look the tokens up against a dictionary whose multi-word values are
# written with spaces.
dict <- dictionary(
  list(
    country = "United States",
    sea = c("Atlantic Ocean", "Pacific Ocean")
  )
)
tokens_lookup(toks, dictionary = dict)

# Combine two tokens objects; both `+` and `c()` are applied to the same pair.
toks1 <- tokens(c(doc1 = "a b c d e", doc2 = "f g h"))
toks2 <- tokens(c(doc3 = "1 2 3"))
toks1 + toks2
c(toks1, toks2)
# }
# Run the code above in your browser using DataLab