# lm_eval/tasks/lambada_multilingual_stablelm/lambada_mt_stablelm_en.yaml (20 lines of code) (raw)
# Group(s) this task is listed under.
group:
  - lambada_multilingual_stablelm
# Name of this task.
task: lambada_openai_mt_stablelm_en
# Dataset identifier and the configuration (subset) to load from it.
# NOTE(review): presumably a Hugging Face Hub dataset id -- confirm.
dataset_path: marcob/lambada_multilingual
dataset_name: en
# NOTE(review): presumably the target is scored by its log-likelihood given
# the context -- confirm against the harness documentation.
output_type: loglikelihood
# Split used for evaluation.
test_split: test
# Context: `text` split on single spaces, with every piece except the last
# joined back together with single spaces.
doc_to_text: "{{text.split(' ')[:-1]|join(' ')}}"
# Target: a single leading space followed by the last space-separated piece
# of `text`.
doc_to_target: "{{' '+text.split(' ')[-1]}}"
# Decontamination is enabled; the complete `text` field is the query string.
should_decontaminate: true
doc_to_decontamination_query: "{{text}}"
# Metrics reported for this task. Each list item is one mapping holding the
# metric name, how it is aggregated, and whether a larger value is better.
# The `aggregation` and `higher_is_better` keys must be indented under their
# `- metric:` entry; at column 0 they would be parsed as top-level keys.
metric_list:
  - metric: perplexity
    aggregation: perplexity
    higher_is_better: false
  - metric: acc
    aggregation: mean
    higher_is_better: true
# Task metadata. `version` is nested under `metadata`; left at column 0 it
# would become a separate top-level key and `metadata` would be null.
metadata:
  version: 1.0