def get_avg_scores()

in evals/eval/evaluate.py [0:0]


def get_avg_scores(results):
    """Average every ``tran``'s score across datasets, per language pair.

    Args:
        results: Nested mapping shaped like
            ``{lang_pair: {dataset: {tran: score}}}``. ``tran`` is presumably
            a translator/system identifier (confirm against the caller);
            scores must be numeric values accepted by ``statistics.mean``.

    Returns:
        A dict ``{lang_pair: {tran: mean_score}}``. Each mean is taken over
        the datasets in which that ``tran`` appears, so a ``tran`` missing
        from some datasets is averaged over fewer values. A language pair
        with no scores maps to an empty dict.
    """
    avg_by_pair = {}
    for lang_pair, datasets in results.items():
        # Collect all scores per tran across this pair's datasets; the
        # dataset names themselves are irrelevant to the average.
        scores_by_tran = {}
        for trans in datasets.values():
            for tran, score in trans.items():
                scores_by_tran.setdefault(tran, []).append(score)

        # Every list has at least one entry, so statistics.mean never sees
        # empty data here.
        avg_by_pair[lang_pair] = {
            tran: statistics.mean(tran_scores)
            for tran, tran_scores in scores_by_tran.items()
        }
    return avg_by_pair