# Make the REUTERS corpus from the RcppCWB package available.
use(pkg = "RcppCWB", corpus = "REUTERS")

# Single-token lookup ----
# The same query ("oil") is run against four kinds of input: the corpus name
# as a string, the object returned by corpus(), a subset of that object, and
# a partition.
cpos("REUTERS", query = "oil")

corpus("REUTERS") %>%
  cpos(query = "oil")

corpus("REUTERS") %>%
  subset(grepl("saudi-arabia", places)) %>%
  cpos(query = "oil")

partition("REUTERS", places = "saudi-arabia", regex = TRUE) %>%
  cpos(query = "oil")

# CQP query syntax ----
# A two-token query, again run against the same four kinds of input. The
# first two calls leave `cqp` unset; the last two pass cqp = TRUE explicitly.
cpos("REUTERS", query = '"Saudi" "Arabia"')

corpus("REUTERS") %>%
  cpos(query = '"Saudi" "Arabia"')

corpus("REUTERS") %>%
  subset(grepl("saudi-arabia", places)) %>%
  cpos(query = '"Saudi" "Arabia"', cqp = TRUE)

partition("REUTERS", places = "saudi-arabia", regex = TRUE) %>%
  cpos(query = '"Saudi" "Arabia"', cqp = TRUE)
# Run the code above in your browser using DataLab