src.corpora.auto.auto_detokenize

auto_detokenize(dataset_id: str, dataset: DatasetDict, preprocess_path: Path, preprocessing_num_proc: int = 4) → DatasetDict [source]