cerebras.modelzoo.data_preparation.nlp.data_dedup.generate_duplicate_pairs.split_files

cerebras.modelzoo.data_preparation.nlp.data_dedup.generate_duplicate_pairs.split_files(input_dir, n_proc)