in misc/precision_filtering/slurm_count_word.py [0:0]
def generate_tokenizer_identifier(row):
    """Build the identifier string for a tokenizer row.

    The identifier is the row's ``'type'`` entry and its ``'tok_code'``
    entry joined by a single hyphen, e.g. ``"bpe-en"``.

    Args:
        row: Any object supporting ``row[key]`` lookup for the keys
            ``'type'`` and ``'tok_code'``.

    Returns:
        The string ``"<type>-<tok_code>"``.
    """
    # Look up 'type' before 'tok_code' so a row missing both keys fails
    # on 'type' first.
    tokenizer_type = row['type']
    tokenizer_code = row['tok_code']
    return "{}-{}".format(tokenizer_type, tokenizer_code)