in utils/compute_score.py [0:0]
def _report_mean_std(label, scores):
    """Print the mean and standard deviation of ``scores`` under ``label``.

    Uses ``np.std`` with its default ``ddof=0`` (population standard
    deviation).  The extra ``'\n'`` argument to ``print`` keeps a blank
    line between consecutive entries in the report.
    """
    print('%s mean: %s' % (label, np.mean(scores)), '\n')
    print('%s Std: %s' % (label, np.std(scores)), '\n')


def _report_sub_task(label, per_file_scores):
    """Print per-column mean and standard deviation of sub-task scores.

    ``per_file_scores`` holds one entry per result file and is loaded into
    a ``pandas.DataFrame``; presumably each entry maps sub-task name to
    score (TODO confirm against the ``compute_*`` helpers).

    NOTE: ``DataFrame.std`` defaults to ``ddof=1`` (sample standard
    deviation), unlike ``np.std`` used for the overall scores.  That
    difference is inherited from the original implementation.
    """
    frame = pd.DataFrame(per_file_scores)
    print('%s mean: %s' % (label, frame.mean()))
    print('%s std: %s' % (label, frame.std()))


def main(model, path):
    """Score every result file of ``model`` under ``path`` and print a report.

    Each directory entry whose name contains ``model`` is passed to the
    ``compute_*`` scoring helpers (defined outside this block).  Their
    results are collected per file, then the mean and standard deviation
    across files are printed for each task, followed by the per-sub-task
    breakdown for TG, TC and RE.

    Args:
        model: Substring used to select result files by file name.
        path: Directory containing the result files.

    Returns:
        None.  All results are written to stdout.
    """
    qa_list, qa_bert_list = [], []
    tg_list, tg_bert_list = [], []
    e2z_bleu_list, e2z_comet_list = [], []
    z2e_bleu_list, z2e_comet_list = [], []
    acc_list, f1_list = [], []
    sub_task_tg_list, sub_task_tg_bert_list = [], []
    sub_task_tc_list, sub_task_re_list = [], []

    for name in os.listdir(path):
        if model not in name:
            continue
        print('Model: %s' % model)
        file_path = os.path.join(path, name)

        # QA
        rouge_l, qa_bert = compute_finqa(file_path)
        qa_list.append(rouge_l)
        qa_bert_list.append(qa_bert)

        # TG
        rouge_l_tg, sub_task_tg, tg_bert, tg_sub_task_bert = compute_text_generation(file_path)
        tg_list.append(rouge_l_tg)
        sub_task_tg_list.append(sub_task_tg)
        tg_bert_list.append(tg_bert)
        sub_task_tg_bert_list.append(tg_sub_task_bert)

        # MT en -> zh
        bleu, comet = compute_nmt_en2zh(file_path)
        e2z_bleu_list.append(bleu)
        e2z_comet_list.append(comet)

        # MT zh -> en
        bleu, comet = compute_nmt_zh2en(file_path)
        z2e_bleu_list.append(bleu)
        z2e_comet_list.append(comet)

        # TC
        acc, sub_task_acc = compute_text_classification(file_path)
        acc_list.append(acc)
        sub_task_tc_list.append(sub_task_acc)

        # RE
        f1, sub_task_re = compute_extraction(file_path)
        f1_list.append(f1)
        sub_task_re_list.append(sub_task_re)

    # Every matched file appends exactly one QA score, so an empty list
    # means nothing matched; bail out instead of printing NaN statistics.
    if not qa_list:
        print('No result files matching model %r found in %s' % (model, path))
        return

    # Overall scores per task.
    _report_mean_std('QA', qa_list)
    _report_mean_std('QA bert', qa_bert_list)
    _report_mean_std('TG', tg_list)
    _report_mean_std('TG bert', tg_bert_list)
    _report_mean_std('EN2CH', e2z_bleu_list)
    _report_mean_std('EN2CH comet', e2z_comet_list)
    _report_mean_std('CH2EN', z2e_bleu_list)
    _report_mean_std('CH2EN comet', z2e_comet_list)
    # The original repeated the TG report here and never printed the
    # classification accuracy or extraction F1 it had collected.
    _report_mean_std('TC acc', acc_list)
    _report_mean_std('RE f1', f1_list)

    # Per-sub-task breakdown.
    _report_sub_task('TG sub task', sub_task_tg_list)
    _report_sub_task('TG sub task bert', sub_task_tg_bert_list)
    _report_sub_task('TC sub task', sub_task_tc_list)
    _report_sub_task('RE sub task', sub_task_re_list)