Tokenize the text files in `path` in parallel using `n_workers` workers.
tokenize_folder(
path,
extensions = NULL,
folders = NULL,
output_dir = NULL,
skip_if_exists = TRUE,
output_names = NULL,
n_workers = 6,
rules = NULL,
tok = NULL,
encoding = "utf8"
)
path
extensions
folders
output_dir
skip_if_exists
output_names
n_workers: number of workers
rules
tok: tokenizer
encoding
Return value: None