in evals/eval/evaluate.py [0:0]
def get_avg_scores(results):
    """Average the scores of each inner key across the middle level of *results*.

    Args:
        results: Three-level nested mapping,
            ``{lang_pair: {data: {tran: score}}}``. Scores must be numeric
            values accepted by ``statistics.mean``.
            NOTE(review): judging by the names, ``data`` is presumably a
            dataset and ``tran`` a translator/system -- confirm with callers.

    Returns:
        A dict ``{lang_pair: {tran: mean_score}}``. For each language pair,
        every ``tran`` is averaged over the entries in which it appears; an
        entry that lacks a given ``tran`` simply does not contribute to its
        mean. A language pair with no entries maps to an empty dict.
    """
    avg_by_pair = {}
    for lang_pair, datasets in results.items():
        # Collect scores per ``tran`` in a single pass. First-seen insertion
        # order is kept, so the output key order is deterministic.
        scores_by_tran = {}
        for trans in datasets.values():
            for tran, score in trans.items():
                scores_by_tran.setdefault(tran, []).append(score)
        # Every list holds at least one score, so statistics.mean cannot
        # raise StatisticsError for empty data here.
        avg_by_pair[lang_pair] = {
            tran: statistics.mean(tran_scores)
            for tran, tran_scores in scores_by_tran.items()
        }
    return avg_by_pair