modelzoo.transformers.data_processing.slimpajama.dedup.to_hash.get_documents

modelzoo.transformers.data_processing.slimpajama.dedup.to_hash.get_documents(input_dir, index_start, index_end, output_dir, dataset_name)