modelzoo.transformers.data_processing.slimpajama.preprocessing.filter.get_short_documents

modelzoo.transformers.data_processing.slimpajama.preprocessing.filter.get_short_documents(input_dir, threshold, n_proc, proc_idx, docs_queue, dataset_name) [source]