in data/datasets.py [0:0]
def _get_messages(self, item, image_count=0):
    """Build the chat-style message list for a single dataset item.

    Every entry of ``item['texts']`` contributes two messages, in order:
    a ``"user"`` message followed by an ``"assistant"`` message. When
    ``image_count`` is positive, the content of the very first message is
    prefixed with ``self.tokenizer.image_token`` repeated
    ``image_count * self.mp_image_token_length`` times.

    Args:
        item: Mapping with a ``'texts'`` iterable; each entry is indexed
            with the keys ``'user'`` and ``'assistant'``.
        image_count: Multiplier for the image-token prefix (presumably the
            number of images attached to the item -- confirm with the
            caller). Values ``<= 0`` leave the messages untouched.

    Returns:
        A list of ``{"role": ..., "content": ...}`` dicts in conversation
        order.

    Raises:
        IndexError: If ``image_count > 0`` but ``item['texts']`` is empty,
            since there is no first message to attach the prefix to.
    """
    conversation = []
    for turn in item['texts']:
        conversation.extend((
            {"role": "user", "content": turn['user']},
            {"role": "assistant", "content": turn['assistant']},
        ))

    if image_count > 0:
        # The image placeholders always go in front of the first message.
        image_prefix = (
            self.tokenizer.image_token * image_count * self.mp_image_token_length
        )
        opening = conversation[0]
        opening["content"] = image_prefix + opening["content"]

    return conversation