# lm_eval/tasks/lambada/lambada_standard.yaml (21 lines of code) (raw):
# LAMBADA (standard) task configuration.
# Each document's `text` field is split on single spaces: everything except the
# last token forms the context, and the last token (with one leading space)
# forms the target.
tag:
  - lambada
task: lambada_standard
dataset_path: lambada
dataset_name: null
output_type: loglikelihood
validation_split: validation
test_split: test
# Context: every space-separated token of `text` except the last, re-joined
# with single spaces.
doc_to_text: "{{text.split(' ')[:-1]|join(' ')}}"
# Target: the last space-separated token of `text`, prefixed with one space.
doc_to_target: "{{' '+text.split(' ')[-1]}}"
should_decontaminate: true
# The full `text` field is used as the decontamination query.
doc_to_decontamination_query: "{{text}}"
# Each list item is a single mapping: metric name, aggregation, and direction.
metric_list:
  - metric: perplexity
    aggregation: perplexity
    higher_is_better: false
  - metric: acc
    aggregation: mean
    higher_is_better: true
metadata:
  # NOTE(review): unquoted, so this loads as the float 1.0 rather than a
  # string; left unchanged because the consumer's expected type is not visible
  # in this file - confirm before quoting.
  version: 1.0