# Decode the complete lexicon of the "word" p-attribute of the REUTERS corpus.

# Look up the registry directory once so both calls below use the same value.
registry_dir <- get_tmp_registry()

# Size of the lexicon for the p-attribute, as reported by cl_lexicon_size().
lexicon_size <- cl_lexicon_size(
  "REUTERS",
  p_attribute = "word",
  registry = registry_dir
)

# Ids run from 0 to lexicon_size - 1. seq_len() yields an empty vector when
# the size is 0, whereas seq.int(0, -1) would count down and produce the
# invalid id -1.
token_ids <- seq_len(lexicon_size) - 1L

# Map every id to its string; the result is left unassigned so that it is
# printed when the script is run at top level.
cl_id2str(
  "REUTERS",
  p_attribute = "word",
  id = token_ids,
  registry = registry_dir
)
# Run the code above in your browser using DataLab