in florence2-VQA/src_train/train_mlflow.py [0:0]
def collate_fn(batch, processor):
    """Turn a batch of (question, answer, image) samples into model inputs.

    Args:
        batch: Iterable of samples; each sample is unpacked positionally as
            ``(question, answer, image)``.
        processor: Callable invoked with ``text``, ``images``,
            ``return_tensors`` and ``padding`` keyword arguments. Its result
            must expose a ``.to(...)`` method (presumably a Hugging Face
            style processor -- confirm against the caller).

    Returns:
        A 2-tuple ``(inputs, answers)``: the processor output after
        ``.to(device)``, and the answers as a tuple in batch order.

    Raises:
        ValueError: If ``batch`` is empty, because the three-way unpacking
            of ``zip(*batch)`` then has nothing to unpack.
    """
    # Transpose the per-sample triples into three parallel per-field tuples.
    question_col, answer_col, image_col = zip(*batch)

    encoded = processor(
        text=list(question_col),
        images=list(image_col),
        return_tensors="pt",
        padding=True,
    )

    # `device` is not a parameter; it is looked up in the enclosing module
    # scope at call time.
    # NOTE(review): if this runs inside data-loading worker processes, the
    # device transfer happens there too -- confirm that is intended.
    return encoded.to(device), answer_col