This function detects multi-word expressions (collocations) of specified sizes that appear at least a specified number of times in the provided tokens.
Examples
if (interactive()) {
  # Example pipeline; it only runs in an interactive R session.

  # Start from the SpecialEduTech object exported by TextAnalysisR.
  mydata <- TextAnalysisR::SpecialEduTech

  # Pass the title, keyword, and abstract variables to unite_cols();
  # the result is expected to carry a "united_texts" field, which the
  # next step reads (assumption based on the text_field argument below).
  united_tbl <- TextAnalysisR::unite_cols(
    mydata,
    listed_vars = c("title", "keyword", "abstract")
  )

  # Prepare tokens from the united text field.
  tokens <- TextAnalysisR::prep_texts(
    united_tbl,
    text_field = "united_texts"
  )

  # Detect multi-word expressions of sizes 2 through 5 that appear at
  # least twice in the tokens.
  collocations <- TextAnalysisR::detect_multi_words(
    tokens,
    size = 2:5,
    min_count = 2
  )

  print(collocations)
}
