in filtering/deduplication/hf_dataset_to_file.py [0:0]
def sep():
    """Return the next separator byte string, advancing the global counter.

    Increments the module-level ``UID`` by one, then builds the result as
    ``pre_sep``, followed by the new ``UID`` packed as a little-endian
    4-byte unsigned integer, followed by ``post_sep``.

    Raises:
        struct.error: If the incremented ``UID`` does not fit in an
            unsigned 32-bit integer.
    """
    global UID
    UID += 1
    # "<I" = little-endian, standard-size (4-byte) unsigned int.
    packed_uid = struct.pack("<I", UID)
    # NOTE(review): pre_sep / post_sep are defined outside this block;
    # presumably bytes-like so they concatenate with the packed counter.
    return pre_sep + packed_uid + post_sep