cerebras.modelzoo.data_preparation.nlp.slimpajama.dedup.generate_duplicate_pairs.split_files

cerebras.modelzoo.data_preparation.nlp.slimpajama.dedup.generate_duplicate_pairs.split_files(input_dir, n_proc)