in training/train_amused.py [0:0]
def __init__( self, hf_dataset, tokenizer, image_key, prompt_key, prompt_prefix=None, size=512,