Path Lines of Code src/datatrove/pipeline/dedup/bloom_filter.py 143 src/datatrove/pipeline/dedup/exact_substrings.py 229 src/datatrove/pipeline/filters/gopher_quality_filter.py 76 src/datatrove/pipeline/readers/ipc.py 64 src/datatrove/pipeline/tokens/context_shuffler.py 46 src/datatrove/utils/perplexity.py 138