path # lines of code # active days days since first update days since last update # commits # contributors first updated last updated first contributor last contributor training/mup.py 278 2 770 769 2 2 2023-05-23 2023-05-24 n.muennighoff@gmail.com teven.lescao@gmail.com utils/hub_sync.py 153 5 770 758 5 3 2023-05-23 2023-06-04 n.muennighoff@gmail.com n.muennighoff@gmail.com utils/hub_auth.py 12 2 770 769 2 2 2023-05-23 2023-05-24 n.muennighoff@gmail.com teven.lescao@gmail.com utils/hf_dataset_subsampling.py 71 3 925 889 7 2 2022-12-19 2023-01-24 teven.lescao@gmail.com ola.piktus@gmail.com utils/errornodes.py 35 2 770 769 2 2 2023-05-23 2023-05-24 n.muennighoff@gmail.com teven.lescao@gmail.com utils/flops-params_py.py 36 1 744 744 1 1 2023-06-18 2023-06-18 n.muennighoff@gmail.com n.muennighoff@gmail.com utils/merge_generative.py 79 2 770 769 2 2 2023-05-23 2023-05-24 n.muennighoff@gmail.com teven.lescao@gmail.com utils/cleandirs.py 10 2 770 769 2 2 2023-05-23 2023-05-24 n.muennighoff@gmail.com teven.lescao@gmail.com utils/csv_generative.py 46 2 770 769 2 2 2023-05-23 2023-05-24 n.muennighoff@gmail.com teven.lescao@gmail.com filtering/deduplication/save_rust_format.py 22 2 770 769 2 2 2023-05-23 2023-05-24 n.muennighoff@gmail.com teven.lescao@gmail.com filtering/deduplication/add_dedup_info.py 123 2 770 769 2 2 2023-05-23 2023-05-24 n.muennighoff@gmail.com teven.lescao@gmail.com filtering/deduplication/save_roots_sample.py 46 2 770 769 2 2 2023-05-23 2023-05-24 n.muennighoff@gmail.com teven.lescao@gmail.com filtering/deduplication/hf_dataset_to_file.py 71 2 770 769 2 2 2023-05-23 2023-05-24 n.muennighoff@gmail.com teven.lescao@gmail.com filtering/deduplication/suffix_dedup.py 22 2 770 769 2 2 2023-05-23 2023-05-24 n.muennighoff@gmail.com teven.lescao@gmail.com filtering/deduplication/save_dataset.py 9 2 770 769 2 2 2023-05-23 2023-05-24 n.muennighoff@gmail.com teven.lescao@gmail.com filtering/deduplication/download_oscar.py 15 2 770 769 2 2 2023-05-23 2023-05-24 n.muennighoff@gmail.com teven.lescao@gmail.com filtering/deduplication/dedup_oscar.py 26 2 770 769 2 2 2023-05-23 2023-05-24 n.muennighoff@gmail.com teven.lescao@gmail.com filtering/deduplication/filter_oscar_jsonl.py 23 2 770 769 2 2 2023-05-23 2023-05-24 n.muennighoff@gmail.com teven.lescao@gmail.com filtering/deduplication/save_dataset_sample.py 43 2 770 769 2 2 2023-05-23 2023-05-24 n.muennighoff@gmail.com teven.lescao@gmail.com filtering_notebooks/blindspots.ipynb 2462 2 770 769 2 2 2023-05-23 2023-05-24 n.muennighoff@gmail.com teven.lescao@gmail.com plotstables/filtering.ipynb 800 1 769 769 1 1 2023-05-24 2023-05-24 n.muennighoff@gmail.com n.muennighoff@gmail.com plotstables/repetition.ipynb 1376 2 769 762 2 1 2023-05-24 2023-05-31 n.muennighoff@gmail.com n.muennighoff@gmail.com