lm_eval/tasks/tmmluplus/default/utils.py (11 lines of code) (raw):

import datasets


def process_docs(dataset: datasets.Dataset) -> datasets.Dataset:
    """Convert every document of ``dataset`` to a multiple-choice record.

    Each document is passed through a per-document converter that builds a
    dict with three keys:

    * ``"questions"`` -- the value stored under the document's ``"question"``.
    * ``"choices"`` -- the values stored under ``"A"``, ``"B"``, ``"C"`` and
      ``"D"``, in that order.
    * ``"goal"`` -- the zero-based position of the document's ``"answer"``
      value within ``["A", "B", "C", "D"]``.

    Args:
        dataset: The dataset whose documents are converted.

    Returns:
        The result of ``dataset.map`` applied with the converter.

    Raises:
        ValueError: If a document's ``"answer"`` is not one of the four
            option labels (raised by ``list.index``).
        KeyError: If a document lacks one of the keys read above
            (assuming documents behave like plain dicts).
    """
    option_labels = ["A", "B", "C", "D"]

    def _to_multiple_choice(record):
        # Build the reshaped record for one document; fields are read in the
        # order question -> A..D -> answer.
        return {
            "questions": record["question"],
            "choices": [record[label] for label in option_labels],
            "goal": option_labels.index(record["answer"]),
        }

    return dataset.map(_to_multiple_choice)