in DianJin-R1/src/evaluate/eval.py [0:0]
def eval_finqa(path):
    """Print the accuracy of judged FinQA results stored in a JSONL file.

    Every non-blank line of the file is parsed as a JSON object and its
    ``'output'`` field (the judge's evaluation text) is inspected. A record
    counts as correct when that text contains the literal marker
    ``boxed{{1}}``.

    Four lines are printed: a banner, the number of correct records, the
    number of records, and the accuracy (correct / total). An input with no
    records reports an accuracy of ``0.0`` instead of dividing by zero.

    Args:
        path: Path to the JSONL file, one JSON object per line.

    Raises:
        json.JSONDecodeError: If a non-blank line is not valid JSON.
        KeyError: If a record has no ``'output'`` field.
    """
    correct_cnt = 0
    total_cnt = 0
    # Read as UTF-8 explicitly so non-ASCII judge output does not depend on
    # the platform's locale encoding.
    with open(path, encoding="utf-8") as f:
        for line in f:
            line = line.strip()
            if not line:
                # Blank lines (e.g. a trailing newline) are not records;
                # skip them rather than counting them or failing to parse.
                continue
            total_cnt += 1
            item = json.loads(line)
            # Evaluation result produced by the judge (GPT-4o).
            response = item['output']
            # NOTE(review): this is a plain string, so the doubled braces are
            # matched literally. If the judge emits "\boxed{1}" (single
            # braces) this check never matches -- confirm against the judge
            # prompt before changing the marker.
            if "boxed{{1}}" in response:
                correct_cnt += 1

    # Guard the empty-input case: there is nothing to divide by.
    accuracy = correct_cnt / total_cnt if total_cnt else 0.0

    print("=" * 20 + " Accuracy " + "=" * 20)
    print(correct_cnt)
    print(total_cnt)
    print(accuracy)