cerebras.modelzoo.data_preparation.nlp.slimpajama.dedup.generate_duplicate_pairs.lsh

cerebras.modelzoo.data_preparation.nlp.slimpajama.dedup.generate_duplicate_pairs.lsh(out_file, doc_queue, idx)