Path Lines of Code evals/data_test.py 35 evals/elsuite/already_said_that/test_distractors.py 170 evals/elsuite/basic/fuzzy_match_test.py 49 evals/elsuite/basic/includes_test.py 55 evals/elsuite/basic/json_match_test.py 74 evals/elsuite/basic/json_validator_test.py 46 evals/elsuite/basic/match_test.py 73 evals/elsuite/bluff/bluff/test_bluff_game.py 30 evals/elsuite/cant_do_that_anymore/chess/board_test.py 63 evals/elsuite/function_deduction/solvers_test.py 130 evals/elsuite/hr_ml_agent_bench/tests/test_actions.py 84 evals/elsuite/make_me_pay/makemepay_test.py 94 evals/elsuite/make_me_say/makemesay_test.py 715 evals/elsuite/skill_acquisition/test_skill_acquisition.py 98 evals/elsuite/test/match.py 28 evals/elsuite/twenty_questions/test_utils.py 22 evals/elsuite/utils_test.py 29 evals/record_test.py 26 evals/registry/data/stats-tests/samples.jsonl 3 evals/registry/data/test_comp_sci/questions.jsonl 3 evals/registry/data/test_english_pronunciations/samples.jsonl 3 evals/registry/data/test_fuzzy_match/samples.jsonl 3 evals/registry/data/test_japanese_english_numerals/samples.jsonl 3 evals/registry/data/test_japanese_radical/samples.jsonl 3 evals/registry/data/test_japanese_units/samples.jsonl 3 evals/registry/data/test_metaeval/joke_fruits_labeled.jsonl 3 evals/registry/data/test_modelgraded/humor_people_jp.jsonl 3 evals/registry/data/test_modelgraded/joke_fruits.jsonl 3 evals/registry/data/test_multiio/battles/joke_animals_vs_fruits.jsonl 3 evals/registry/data/test_multiio/battles/rap_animals_vs_fruits.jsonl 3 evals/registry/data/test_multiio/battles/rap_people_vs_fruits.jsonl 3 evals/registry/data/test_multiio/battles/rap_people_vs_people.jsonl 3 evals/registry/data/test_time_zone_conversion/samples.v0.jsonl 3 evals/registry/data/theory_of_mind/socialiqa/test.jsonl 3 evals/registry/data/theory_of_mind/tomi/test.jsonl 3 evals/registry/evals/logical_reasoning_letter_series_test.yaml 8 evals/registry/evals/number_series_test.yaml 7 evals/registry/evals/test_english_pronunciations.yaml 8 evals/registry/evals/test_japanese_english_numerals.yaml 8 evals/registry/evals/test_japanese_radical.yaml 8 evals/registry/evals/test_japanese_units.yaml 8 evals/registry_test.py 28 evals/solvers/postprocessors/postprocessors_test.py 55 evals/solvers/providers/anthropic/anthropic_solver_test.py 96 evals/solvers/providers/google/gemini_solver_test.py 47 evals/solvers/providers/openai/openai_assistants_solver_test.py 173 evals/solvers/providers/together/together_solver_test.py 98 evals/solvers/solver_test.py 55 evals/utils/test.py 17 tests/unit/evals/test_metrics.py 20