in simpleqa_eval.py [0:0]
def grade_sample(self, question: str, target: str, predicted_answer: str) -> str:
    """Ask the grader model to grade one prediction and return its letter grade.

    The question, reference target and predicted answer are substituted into
    ``GRADER_TEMPLATE``; the resulting prompt is sent to ``self.grader_model``
    as a single user-role message, and the grade letter is extracted from the
    reply.

    Args:
        question: The question that was posed.
        target: The reference answer to grade against.
        predicted_answer: The answer being graded.

    Returns:
        One of ``"A"``, ``"B"`` or ``"C"``. Falls back to ``"C"``
        ("NOT_ATTEMPTED") when the reply contains none of those letters.
    """
    grader_prompt = GRADER_TEMPLATE.format(
        question=question,
        target=target,
        predicted_answer=predicted_answer,
    )
    prompt_messages = [
        self.grader_model._pack_message(content=grader_prompt, role="user")
    ]
    # NOTE(review): the reply is assumed to be a plain string, since it is
    # passed straight to ``re.search`` -- confirm against the sampler in use.
    grading_response = self.grader_model(prompt_messages)

    # Prefer a letter that stands on its own (e.g. "B", "(B)", "B."), so that
    # capitals inside ordinary words ("Correct", "Based on ...") are not
    # mistaken for the grade. If no standalone letter exists, fall back to the
    # first A/B/C anywhere in the reply, which keeps the previous behaviour
    # for such replies.
    match = re.search(r"\b[ABC]\b", grading_response) or re.search(
        r"[ABC]", grading_response
    )
    return match.group(0) if match else "C"  # Default to "NOT_ATTEMPTED" if no match