cerebras.modelzoo.data_preparation.nlp.data_dedup.generate_duplicate_pairs.lsh

cerebras.modelzoo.data_preparation.nlp.data_dedup.generate_duplicate_pairs.lsh(out_file, doc_queue, idx)