in human_eval/evaluation.py [0:0]
def evaluate_functional_correctness( sample_file: str, k: List[int] = [1, 10, 100], n_workers: int = 4, timeout: float = 3.0, problem_file: str = HUMAN_EVAL,