lmms_eval/tasks/ai2d/ai2d.yaml (33 lines of code) (raw):
dataset_path: lmms-lab/ai2d
task: "ai2d"
dataset_kwargs:
token: True
test_split: test
output_type: generate_until
doc_to_visual: !function utils.ai2d_doc_to_visual
doc_to_text: !function utils.ai2d_doc_to_text
doc_to_target: !function utils.ai2d_doc_to_target
generation_kwargs:
max_new_tokens: 16
temperature: 0
do_sample: False
metric_list:
- metric: exact_match
aggregation: mean
higher_is_better: true
ignore_case: true
ignore_punctuation: true
metadata:
- version: 0.0
model_specific_prompt_kwargs:
default:
prompt_format: mcq
pre_prompt: ""
post_prompt: "\nAnswer with the option's letter from the given choices directly."
# qwen formulate ai2d as question answering instead of mcq
qwen_vl:
prompt_format: qa
pre_prompt: ""
post_prompt: " Answer:"
model_specific_target_kwargs:
default: "mcq"
qwen_vl: "qa"