# NOT RUN {
# Example: download a GermaParl topic model, load it, and list its terms.
#
# This example assumes that the directories used by the CWB do not yet exist,
# so temporary directories are created.
cwb_dirs <- cwbtools::create_cwb_directories(prefix = tempdir(), ask = FALSE)

# Settings shared by the download and the load step. They are defined once so
# that both calls are guaranteed to refer to the same model.
samplemode <- TRUE
corpus_id <- "GERMAPARLSAMPLE" # for full corpus: corpus_id <- "GERMAPARL"
lda_k <- 30L # lda_k <- 250L recommended for full GERMAPARL corpus

# Data directory of the corpus: the lower-cased corpus ID below the CWB corpus
# directory. Computed once and reused for creation and download.
data_dir <- file.path(cwb_dirs[["corpus_dir"]], tolower(corpus_id))

# Create the directory only if it is missing (re-running the example in the
# same session must not warn), and create missing parents as well.
if (!dir.exists(data_dir)) {
  dir.create(data_dir, recursive = TRUE)
}

# Download topic model
germaparl_download_lda(
  k = lda_k,
  data_dir = data_dir,
  sample = samplemode
)

# Load the topic model that has just been downloaded
lda <- germaparl_load_lda(
  k = lda_k,
  registry_dir = cwb_dirs[["registry_dir"]],
  sample = samplemode
)

# Extract terms from the model; the second argument (10) limits how many
# terms topicmodels::terms() returns per topic.
lda_terms <- topicmodels::terms(lda, 10)
# }
# Run the code above in your browser using DataLab