path # lines of code # active days days since first update days since last update # commits # contributors first updated last updated first contributor last contributor scripts/modelgraded_generator.py 185 6 781 481 9 5 2023-03-16 2024-01-10 shane@openai.com 140545726+ianmckenzie-oai@users.noreply.github.com scripts/pattern_identification_generator.py 48 6 782 481 6 6 2023-03-15 2024-01-10 jasonwei@openai.com 140545726+ianmckenzie-oai@users.noreply.github.com scripts/battle_generator.py 49 6 781 481 7 5 2023-03-16 2024-01-10 shane@openai.com 140545726+ianmckenzie-oai@users.noreply.github.com MANIFEST.in 4 3 767 754 4 3 2023-03-30 2023-04-12 jwang47@users.noreply.github.com 120423412+andrew-openai@users.noreply.github.com pyproject.toml 64 20 776 369 32 19 2023-03-21 2024-05-01 1520816+andremafei@users.noreply.github.com erik.t.ritter@gmail.com evals/base.py 51 5 777 587 5 4 2023-03-20 2023-09-26 343165+rlbayes@users.noreply.github.com lukevanseters@gmail.com evals/solvers/prompts/cot.py 4 2 543 403 2 2 2023-11-09 2024-03-28 junshern@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/solvers/prompts/hhh.py 99 4 543 418 4 3 2023-11-09 2024-03-13 junshern@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/solvers/postprocessors/base.py 6 1 418 418 1 1 2024-03-13 2024-03-13 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/solvers/postprocessors/postprocessors.py 20 1 418 418 1 1 2024-03-13 2024-03-13 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/solvers/solver.py 125 4 543 403 4 2 2023-11-09 2024-03-28 junshern@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/solvers/nested/fewshot_solver.py 91 2 462 418 2 2 2024-01-29 2024-03-13 junshern@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/solvers/nested/hhh_solver.py 33 2 462 418 2 2 2024-01-29 2024-03-13 junshern@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/solvers/nested/cot_solver.py 61 3 462 403 3 2 2024-01-29 2024-03-28 junshern@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/solvers/nested/self_consistency_solver.py 118 3 462 403 3 2 2024-01-29 2024-03-28 junshern@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/solvers/memory.py 50 1 403 403 1 1 2024-03-28 2024-03-28 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/solvers/utils.py 37 4 543 403 4 2 2023-11-09 2024-03-28 junshern@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/solvers/providers/together/together_solver.py 68 1 403 403 1 1 2024-03-28 2024-03-28 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/solvers/providers/google/gemini_solver.py 157 1 405 405 1 1 2024-03-26 2024-03-26 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/solvers/providers/openai/openai_assistants_solver.py 186 1 403 403 1 1 2024-03-28 2024-03-28 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/solvers/providers/openai/openai_solver.py 181 1 403 403 1 1 2024-03-28 2024-03-28 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/solvers/providers/anthropic/anthropic_solver.py 89 2 410 405 2 2 2024-03-21 2024-03-26 giulio.starace@gmail.com oliver.jaffe@hotmail.co.uk evals/solvers/human_cli_solver.py 29 4 543 418 4 3 2023-11-09 2024-03-13 junshern@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/task_state.py 13 1 543 543 1 1 2023-11-09 2023-11-09 junshern@users.noreply.github.com junshern@users.noreply.github.com evals/utils/log_utils.py 53 2 537 412 2 2 2023-11-15 2024-03-19 junshern@users.noreply.github.com giulio.starace@gmail.com evals/utils/misc.py 19 1 703 703 1 1 2023-06-02 2023-06-02 pan93412@gmail.com pan93412@gmail.com evals/utils/snowflake.py 100 1 744 744 1 1 2023-04-22 2023-04-22 max.rhodin@gmail.com max.rhodin@gmail.com evals/utils/api_utils.py 15 10 779 405 11 8 2023-03-18 2024-03-26 120423412+andrew-openai@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/__init__.py 14 2 755 700 2 2 2023-04-11 2023-06-05 73198383+hwchung27@users.noreply.github.com pan93412@gmail.com evals/elsuite/error_recovery/scripts/dataset_creation.py 106 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/error_recovery/scripts/make_plots.py 446 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/error_recovery/defaults.py 12 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/error_recovery/eval.py 204 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/lambada.py 39 2 703 587 2 2 2023-06-02 2023-09-26 jwang47@users.noreply.github.com bomarni@googlemail.com evals/elsuite/translate.py 66 2 755 587 2 2 2023-04-11 2023-09-26 73198383+hwchung27@users.noreply.github.com lukevanseters@gmail.com evals/elsuite/sandbagging/scripts/sandbagging_subset_plots.py 46 1 537 537 1 1 2023-11-15 2023-11-15 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/sandbagging/scripts/consistency_plots.py 88 1 537 537 1 1 2023-11-15 2023-11-15 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/sandbagging/scripts/sandbagging_all_plots.py 27 1 537 537 1 1 2023-11-15 2023-11-15 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/sandbagging/scripts/utils.py 100 1 537 537 1 1 2023-11-15 2023-11-15 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/sandbagging/solvers.py 152 3 537 462 3 3 2023-11-15 2024-01-29 oliver.jaffe@hotmail.co.uk junshern@users.noreply.github.com evals/elsuite/sandbagging/sandbagging_eval.py 68 2 537 481 2 2 2023-11-15 2024-01-10 oliver.jaffe@hotmail.co.uk 140545726+ianmckenzie-oai@users.noreply.github.com evals/elsuite/sandbagging/mmlu_eval.py 60 1 537 537 1 1 2023-11-15 2023-11-15 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/sandbagging/defaults.py 12 2 537 481 2 2 2023-11-15 2024-01-10 oliver.jaffe@hotmail.co.uk 140545726+ianmckenzie-oai@users.noreply.github.com evals/elsuite/sandbagging/utils.py 47 1 537 537 1 1 2023-11-15 2023-11-15 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/multistep_web_tasks/solvers/webarena_solvers/webarena_prompts.py 12 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/solvers/webarena_solvers/webarena_solvers.py 94 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/solvers/strong_solver/strong_solver.py 173 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/solvers/strong_solver/strong_prompts.py 4 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/session.py 416 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/constants.py 70 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/webarena/bash_browser_env/bash_browser_utils.py 11 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/webarena/bash_browser_env/bash_browser_env.py 89 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/webarena/bash_env/actions.py 17 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/webarena/bash_env/__init__.py 1 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/webarena/bash_env/bash_utils.py 15 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/webarena/bash_env/basic_bash_env.py 163 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/webarena/browser_env/processors.py 495 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/webarena/browser_env/actions.py 1014 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/webarena/browser_env/__init__.py 1 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/webarena/browser_env/browser_utils.py 78 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/webarena/browser_env/auto_login.py 100 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/webarena/browser_env/helper_functions.py 129 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/webarena/browser_env/env_config.py 29 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/webarena/browser_env/constants.py 282 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/webarena/browser_env/basic_browser_env.py 191 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/webarena/evaluation_harness/evaluators.py 273 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/webarena/evaluation_harness/__init__.py 1 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/webarena/evaluation_harness/helper_functions.py 110 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/webarena/core/playwright_api.py 279 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/webarena/core/env.py 75 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/webarena/core/utils.py 188 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/webarena/eval_run.py 277 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/webarena/task_description.py 2 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/eval.py 51 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/utils.py 33 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/reproducibility/run_environments.py 29 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/reproducibility/make_task_jsonl.py 38 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/reproducibility/make_plots.py 94 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/docker/flask-playwright/app.py 165 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/docker/homepage/templates/index.html 108 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/docker/homepage/templates/scratchpad.html 105 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/docker/homepage/templates/calculator.html 106 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/multistep_web_tasks/docker/homepage/app.py 16 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/theory_of_mind/scripts/data_generation.py 66 1 537 537 1 1 2023-11-15 2023-11-15 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/elsuite/theory_of_mind/scripts/make_plots.py 90 1 537 537 1 1 2023-11-15 2023-11-15 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/elsuite/multiple_choice.py 84 2 728 587 2 2 2023-05-08 2023-09-26 jwang47@users.noreply.github.com bomarni@googlemail.com evals/elsuite/bluff/strategy_solver.py 88 3 537 403 3 3 2023-11-15 2024-03-28 33967107+johny-b@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/elsuite/bluff/scripts/make_plots.py 103 1 537 537 1 1 2023-11-15 2023-11-15 33967107+johny-b@users.noreply.github.com 33967107+johny-b@users.noreply.github.com evals/elsuite/bluff/bluff/players.py 107 1 537 537 1 1 2023-11-15 2023-11-15 33967107+johny-b@users.noreply.github.com 33967107+johny-b@users.noreply.github.com evals/elsuite/bluff/bluff/cards.py 206 1 537 537 1 1 2023-11-15 2023-11-15 33967107+johny-b@users.noreply.github.com 33967107+johny-b@users.noreply.github.com evals/elsuite/bluff/bluff/__init__.py 1 1 537 537 1 1 2023-11-15 2023-11-15 33967107+johny-b@users.noreply.github.com 33967107+johny-b@users.noreply.github.com evals/elsuite/bluff/bluff/game.py 48 1 537 537 1 1 2023-11-15 2023-11-15 33967107+johny-b@users.noreply.github.com 33967107+johny-b@users.noreply.github.com evals/elsuite/bluff/bluff/round.py 37 1 537 537 1 1 2023-11-15 2023-11-15 33967107+johny-b@users.noreply.github.com 33967107+johny-b@users.noreply.github.com evals/elsuite/bluff/bluff/task_description.py 1 1 537 537 1 1 2023-11-15 2023-11-15 33967107+johny-b@users.noreply.github.com 33967107+johny-b@users.noreply.github.com evals/elsuite/bluff/solver_player.py 82 2 537 418 2 2 2023-11-15 2024-03-13 33967107+johny-b@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/elsuite/bluff/eval.py 164 2 537 511 2 2 2023-11-15 2023-12-11 33967107+johny-b@users.noreply.github.com erik.t.ritter@gmail.com evals/elsuite/bluff/prompts.py 6 1 537 537 1 1 2023-11-15 2023-11-15 33967107+johny-b@users.noreply.github.com 33967107+johny-b@users.noreply.github.com evals/elsuite/make_me_pay/solvers/lm_con_artist_solver.py 64 2 537 462 2 2 2023-11-15 2024-01-29 oliver.jaffe@hotmail.co.uk junshern@users.noreply.github.com evals/elsuite/make_me_pay/solvers/prompts.py 18 2 537 481 2 2 2023-11-15 2024-01-10 oliver.jaffe@hotmail.co.uk 140545726+ianmckenzie-oai@users.noreply.github.com evals/elsuite/make_me_pay/scripts/make_plots.py 102 2 537 418 2 1 2023-11-15 2024-03-13 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/make_me_pay/makemepay.py 222 2 594 537 2 2 2023-09-19 2023-11-15 140545726+ianmckenzie-oai@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/elsuite/make_me_pay/eval.py 126 3 594 418 3 2 2023-09-19 2024-03-13 140545726+ianmckenzie-oai@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/elsuite/make_me_pay/utils.py 47 3 594 517 3 3 2023-09-19 2023-12-05 140545726+ianmckenzie-oai@users.noreply.github.com erik.t.ritter@gmail.com evals/elsuite/make_me_pay/task_description.py 57 3 537 418 3 2 2023-11-15 2024-03-13 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/self_prompting/solvers/custom_cot_solver.py 57 2 537 462 2 1 2023-11-15 2024-01-29 junshern@users.noreply.github.com junshern@users.noreply.github.com evals/elsuite/self_prompting/solvers/baselines.py 45 2 537 462 2 1 2023-11-15 2024-01-29 junshern@users.noreply.github.com junshern@users.noreply.github.com evals/elsuite/self_prompting/scripts/dataset/compile_data.py 67 1 537 537 1 1 2023-11-15 2023-11-15 junshern@users.noreply.github.com junshern@users.noreply.github.com evals/elsuite/self_prompting/scripts/dataset/eval_list.py 52 1 537 537 1 1 2023-11-15 2023-11-15 junshern@users.noreply.github.com junshern@users.noreply.github.com evals/elsuite/self_prompting/scripts/make_plots.py 118 1 537 537 1 1 2023-11-15 2023-11-15 junshern@users.noreply.github.com junshern@users.noreply.github.com evals/elsuite/self_prompting/eval.py 210 1 537 537 1 1 2023-11-15 2023-11-15 junshern@users.noreply.github.com junshern@users.noreply.github.com evals/elsuite/self_prompting/task_description.py 2 1 537 537 1 1 2023-11-15 2023-11-15 junshern@users.noreply.github.com junshern@users.noreply.github.com evals/elsuite/already_said_that/scripts/gen_data.py 50 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/already_said_that/scripts/make_plots.py 263 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/already_said_that/solvers.py 29 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/already_said_that/eval.py 130 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/already_said_that/prompts.py 1 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/already_said_that/utils.py 104 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/already_said_that/distractors.py 81 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/ballots/scripts/make_plots.py 233 1 418 418 1 1 2024-03-13 2024-03-13 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/ballots/eval.py 161 3 594 502 3 2 2023-09-19 2023-12-20 140545726+ianmckenzie-oai@users.noreply.github.com 129281094+james-aung@users.noreply.github.com evals/elsuite/ballots/prompts.py 44 3 594 481 3 2 2023-09-19 2024-01-10 140545726+ianmckenzie-oai@users.noreply.github.com 140545726+ianmckenzie-oai@users.noreply.github.com evals/elsuite/ballots/utils.py 118 1 594 594 1 1 2023-09-19 2023-09-19 140545726+ianmckenzie-oai@users.noreply.github.com 140545726+ianmckenzie-oai@users.noreply.github.com evals/elsuite/basic/json_validator.py 41 4 752 693 4 2 2023-04-14 2023-06-12 120423412+andrew-openai@users.noreply.github.com 120423412+andrew-openai@users.noreply.github.com evals/elsuite/basic/includes.py 48 7 755 693 7 4 2023-04-11 2023-06-12 73198383+hwchung27@users.noreply.github.com 120423412+andrew-openai@users.noreply.github.com evals/elsuite/basic/json_match.py 77 1 556 556 1 1 2023-10-27 2023-10-27 vthorsteinsson@users.noreply.github.com vthorsteinsson@users.noreply.github.com evals/elsuite/basic/match.py 57 5 755 587 5 4 2023-04-11 2023-09-26 73198383+hwchung27@users.noreply.github.com lukevanseters@gmail.com evals/elsuite/basic/match_with_solvers.py 65 2 543 418 2 2 2023-11-09 2024-03-13 junshern@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/elsuite/basic/fuzzy_match.py 49 5 755 700 5 4 2023-04-11 2023-06-05 73198383+hwchung27@users.noreply.github.com jwang47@users.noreply.github.com evals/elsuite/cant_do_that_anymore/chess/notation.py 61 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/cant_do_that_anymore/chess/board.py 162 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/cant_do_that_anymore/chess/move_variants.py 113 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/cant_do_that_anymore/chess/pieces.py 203 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/cant_do_that_anymore/chess/utils.py 75 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/cant_do_that_anymore/scripts/dataset_creation.py 235 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/cant_do_that_anymore/scripts/diagonal_dataset_creation.py 216 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/cant_do_that_anymore/scripts/make_plots.py 100 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/cant_do_that_anymore/defaults.py 2 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/cant_do_that_anymore/eval.py 170 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/cant_do_that_anymore/utils.py 178 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/bugged_tools/tools.py 497 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/bugged_tools/scripts/plot_experiments.py 107 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/bugged_tools/bugged_tools.py 132 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/bugged_tools/eval.py 210 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/bugged_tools/utils.py 48 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/bugged_tools/task_description.py 9 2 412 403 2 1 2024-03-19 2024-03-28 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/identifying_variables/renderers/base.py 11 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/identifying_variables/renderers/__init__.py 10 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/identifying_variables/renderers/corrset.py 216 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/identifying_variables/renderers/templates.py 26 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/identifying_variables/renderers/tabular.py 125 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/identifying_variables/scripts/plotting_utils.py 128 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/identifying_variables/scripts/gen_data.py 319 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/identifying_variables/scripts/table_utils.py 36 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/identifying_variables/scripts/make_plots.py 325 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/identifying_variables/structs.py 18 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/identifying_variables/latent_funcs.py 30 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/identifying_variables/solvers.py 27 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/identifying_variables/constants.py 10 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/identifying_variables/metrics.py 54 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/identifying_variables/eval.py 227 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/identifying_variables/prompts.py 8 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/identifying_variables/utils.py 72 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/identifying_variables/graph_utils.py 130 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/steganography/scripts/dataset/custom_datasets.py 197 1 418 418 1 1 2024-03-13 2024-03-13 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/steganography/scripts/dataset/complexity_metrics.py 29 1 418 418 1 1 2024-03-13 2024-03-13 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/steganography/scripts/dataset/csv2jsonl.py 16 1 418 418 1 1 2024-03-13 2024-03-13 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/steganography/scripts/dataset/utils.py 29 1 418 418 1 1 2024-03-13 2024-03-13 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/steganography/scripts/dataset/dataset.py 106 1 418 418 1 1 2024-03-13 2024-03-13 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/steganography/scripts/make_plots.py 75 1 418 418 1 1 2024-03-13 2024-03-13 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/steganography/reconstruction_metrics.py 30 1 594 594 1 1 2023-09-19 2023-09-19 140545726+ianmckenzie-oai@users.noreply.github.com 140545726+ianmckenzie-oai@users.noreply.github.com evals/elsuite/steganography/steganography.py 84 2 594 481 2 1 2023-09-19 2024-01-10 140545726+ianmckenzie-oai@users.noreply.github.com 140545726+ianmckenzie-oai@users.noreply.github.com evals/elsuite/steganography/monitor.py 52 2 594 481 2 1 2023-09-19 2024-01-10 140545726+ianmckenzie-oai@users.noreply.github.com 140545726+ianmckenzie-oai@users.noreply.github.com evals/elsuite/steganography/eval.py 69 2 594 481 2 1 2023-09-19 2024-01-10 140545726+ianmckenzie-oai@users.noreply.github.com 140545726+ianmckenzie-oai@users.noreply.github.com evals/elsuite/steganography/prompts.py 55 1 594 594 1 1 2023-09-19 2023-09-19 140545726+ianmckenzie-oai@users.noreply.github.com 140545726+ianmckenzie-oai@users.noreply.github.com evals/elsuite/solver_tools_convo.py 181 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/hr_ml_agent_bench/solvers/baseline.py 90 2 410 403 2 2 2024-03-21 2024-03-28 danesherbs@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/elsuite/hr_ml_agent_bench/scripts/plot_experiments.py 307 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/scripts/run_experiments.py 60 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/actions.py 37 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/spaceship_titanic/scripts/prepare.py 22 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/spaceship_titanic/scripts/grade.py 26 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/spaceship_titanic/env/train.py 34 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/__init__.py 1 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/pong/scripts/grade.py 44 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/pong/env/train.py 28 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/pong/baselines/naive.py 28 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/pong/baselines/human.py 43 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/bipedal_walker/scripts/grade.py 31 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/bipedal_walker/env/train.py 27 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/bipedal_walker/baselines/naive.py 27 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/bipedal_walker/baselines/human.py 57 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/ogbn_arxiv/scripts/prepare.py 4 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/ogbn_arxiv/scripts/grade.py 53 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/ogbn_arxiv/env/train.py 126 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/parkinsons_disease/scripts/prepare.py 98 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/parkinsons_disease/scripts/grade.py 22 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/parkinsons_disease/env/train.py 124 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/vectorization/scripts/human_baseline.py 83 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/vectorization/scripts/grade.py 64 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/vectorization/env/train.py 118 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/house_price/scripts/prepare.py 20 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/house_price/scripts/grade.py 33 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/house_price/env/train.py 41 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/inverted_pendulum/scripts/grade.py 28 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/inverted_pendulum/env/train.py 28 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/inverted_pendulum/baselines/naive.py 28 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/inverted_pendulum/baselines/human.py 31 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/imdb/scripts/grade.py 27 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/imdb/env/train.py 21 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/pusher/scripts/grade.py 45 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/pusher/env/train.py 28 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/pusher/baselines/naive.py 28 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/pusher/baselines/human.py 29 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/feedback/scripts/prepare.py 24 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/feedback/scripts/grade.py 36 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/feedback/env/train.py 66 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/cartpole/scripts/grade.py 40 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/cartpole/env/train.py 27 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/cartpole/baselines/naive.py 27 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/cartpole/baselines/human.py 30 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/humanoid/scripts/grade.py 45 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/humanoid/env/train.py 28 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/humanoid/baselines/naive.py 28 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/humanoid/baselines/human.py 33 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/ant/scripts/grade.py 43 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/ant/env/train.py 28 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/ant/baselines/naive.py 28 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/ant/baselines/human.py 36 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/cifar10/scripts/prepare.py 5 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/cifar10/scripts/grade.py 35 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/benchmarks/cifar10/env/train.py 105 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/__init__.py 1 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/environment.py 283 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/high_level_actions.py 191 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/auto_marking.py 53 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/autoeval.py 172 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/schema.py 46 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/eval.py 91 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/prompts.py 26 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/utils.py 112 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/low_level_actions.py 304 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/hr_ml_agent_bench/prepare_task.py 40 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/elsuite/make_me_say/autoeval.py 116 4 594 517 4 4 2023-09-19 2023-12-05 140545726+ianmckenzie-oai@users.noreply.github.com erik.t.ritter@gmail.com evals/elsuite/make_me_say/defaults.py 34 2 594 481 2 1 2023-09-19 2024-01-10 140545726+ianmckenzie-oai@users.noreply.github.com 140545726+ianmckenzie-oai@users.noreply.github.com evals/elsuite/make_me_say/core.py 223 3 594 418 3 2 2023-09-19 2024-03-13 140545726+ianmckenzie-oai@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/elsuite/make_me_say/eval.py 48 3 594 403 3 2 2023-09-19 2024-03-28 140545726+ianmckenzie-oai@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/elsuite/make_me_say/utils.py 34 6 594 502 6 5 2023-09-19 2023-12-20 140545726+ianmckenzie-oai@users.noreply.github.com inwaves@users.noreply.github.com evals/elsuite/modelgraded/base.py 16 4 762 739 4 1 2023-04-04 2023-04-27 343165+rlbayes@users.noreply.github.com 343165+rlbayes@users.noreply.github.com evals/elsuite/modelgraded/classify.py 97 19 781 587 27 7 2023-03-16 2023-09-26 shane@openai.com bomarni@googlemail.com evals/elsuite/modelgraded/classify_utils.py 145 5 762 595 5 2 2023-04-04 2023-09-18 343165+rlbayes@users.noreply.github.com 97272807+sohenze@users.noreply.github.com evals/elsuite/incontext_rl/anti-cot_solver.py 29 1 412 412 1 1 2024-03-19 2024-03-19 129281094+james-aung@users.noreply.github.com 129281094+james-aung@users.noreply.github.com evals/elsuite/incontext_rl/scripts/plot_experiments.py 233 1 412 412 1 1 2024-03-19 2024-03-19 129281094+james-aung@users.noreply.github.com 129281094+james-aung@users.noreply.github.com evals/elsuite/incontext_rl/defaults.py 11 1 412 412 1 1 2024-03-19 2024-03-19 129281094+james-aung@users.noreply.github.com 129281094+james-aung@users.noreply.github.com evals/elsuite/incontext_rl/eval.py 246 1 412 412 1 1 2024-03-19 2024-03-19 129281094+james-aung@users.noreply.github.com 129281094+james-aung@users.noreply.github.com evals/elsuite/incontext_rl/env_setup.py 7 1 412 412 1 1 2024-03-19 2024-03-19 129281094+james-aung@users.noreply.github.com 129281094+james-aung@users.noreply.github.com evals/elsuite/incontext_rl/baselines.py 93 1 412 412 1 1 2024-03-19 2024-03-19 129281094+james-aung@users.noreply.github.com 129281094+james-aung@users.noreply.github.com evals/elsuite/track_the_stat/prompts/median.py 2 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/track_the_stat/prompts/__init__.py 11 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/track_the_stat/prompts/mode.py 2 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/track_the_stat/scripts/make_plots.py 235 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/track_the_stat/solvers.py 72 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/track_the_stat/eval.py 80 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/track_the_stat/utils.py 47 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/elsuite/utils.py 150 10 775 587 10 6 2023-03-22 2023-09-26 343165+rlbayes@users.noreply.github.com bomarni@googlemail.com evals/elsuite/skill_acquisition/scraping/scrape_distractor_articles.py 76 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/elsuite/skill_acquisition/scraping/scrape_miskito.py 106 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/elsuite/skill_acquisition/scripts/make_plots.py 157 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/elsuite/skill_acquisition/solvers.py 13 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/elsuite/skill_acquisition/eval.py 313 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/elsuite/skill_acquisition/utils.py 115 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/elsuite/skill_acquisition/task_description.py 1 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/elsuite/mmmu/eval.py 159 3 501 488 3 1 2023-12-21 2024-01-03 erik.t.ritter@gmail.com erik.t.ritter@gmail.com evals/elsuite/schelling_point/eval.py 73 2 594 507 2 2 2023-09-19 2023-12-15 140545726+ianmckenzie-oai@users.noreply.github.com 129281094+james-aung@users.noreply.github.com evals/elsuite/schelling_point/prompts.py 25 3 594 481 3 2 2023-09-19 2024-01-10 140545726+ianmckenzie-oai@users.noreply.github.com 140545726+ianmckenzie-oai@users.noreply.github.com evals/elsuite/schelling_point/utils.py 61 2 507 481 2 2 2023-12-15 2024-01-10 129281094+james-aung@users.noreply.github.com 140545726+ianmckenzie-oai@users.noreply.github.com evals/elsuite/text_compression/scripts/dataset/custom_datasets.py 119 1 418 418 1 1 2024-03-13 2024-03-13 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/text_compression/scripts/dataset/complexity_metrics.py 29 1 418 418 1 1 2024-03-13 2024-03-13 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/text_compression/scripts/dataset/csv2jsonl.py 16 1 418 418 1 1 2024-03-13 2024-03-13 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/text_compression/scripts/dataset/utils.py 29 1 418 418 1 1 2024-03-13 2024-03-13 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/text_compression/scripts/dataset/dataset.py 63 1 418 418 1 1 2024-03-13 2024-03-13 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/text_compression/scripts/make_plots.py 63 1 418 418 1 1 2024-03-13 2024-03-13 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/elsuite/text_compression/reconstruction_metrics.py 30 1 594 594 1 1 2023-09-19 2023-09-19 140545726+ianmckenzie-oai@users.noreply.github.com 140545726+ianmckenzie-oai@users.noreply.github.com evals/elsuite/text_compression/compression.py 83 1 594 594 1 1 2023-09-19 2023-09-19 140545726+ianmckenzie-oai@users.noreply.github.com 140545726+ianmckenzie-oai@users.noreply.github.com evals/elsuite/text_compression/eval.py 52 1 594 594 1 1 2023-09-19 2023-09-19 140545726+ianmckenzie-oai@users.noreply.github.com 140545726+ianmckenzie-oai@users.noreply.github.com evals/elsuite/text_compression/prompts.py 46 1 594 594 1 1 2023-09-19 2023-09-19 140545726+ianmckenzie-oai@users.noreply.github.com 140545726+ianmckenzie-oai@users.noreply.github.com evals/elsuite/twenty_questions/scripts/make_plots.py 111 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/elsuite/twenty_questions/eval.py 169 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/elsuite/twenty_questions/utils.py 47 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/elsuite/function_deduction/scripts/dataset/create_dataset.py 44 1 412 412 1 1 2024-03-19 2024-03-19 129281094+james-aung@users.noreply.github.com 129281094+james-aung@users.noreply.github.com evals/elsuite/function_deduction/scripts/make_plots.py 195 1 412 412 1 1 2024-03-19 2024-03-19 129281094+james-aung@users.noreply.github.com 129281094+james-aung@users.noreply.github.com evals/elsuite/function_deduction/solvers.py 140 2 412 403 2 2 2024-03-19 2024-03-28 129281094+james-aung@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/elsuite/function_deduction/eval.py 244 1 412 412 1 1 2024-03-19 2024-03-19 129281094+james-aung@users.noreply.github.com 129281094+james-aung@users.noreply.github.com evals/elsuite/function_deduction/prompts.py 6 2 412 403 2 2 2024-03-19 2024-03-28 129281094+james-aung@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/elsuite/function_deduction/baselines.py 91 1 412 412 1 1 2024-03-19 2024-03-19 129281094+james-aung@users.noreply.github.com 129281094+james-aung@users.noreply.github.com evals/data.py 148 9 780 398 10 10 2023-03-17 2024-04-02 343165+rlbayes@users.noreply.github.com 150190178+josnyder-2@users.noreply.github.com evals/registry.py 242 22 776 403 24 17 2023-03-21 2024-03-28 343165+rlbayes@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/registry/solvers/track_the_stat.yaml 75 2 412 403 2 2 2024-03-19 2024-03-28 giulio.starace@gmail.com oliver.jaffe@hotmail.co.uk evals/registry/solvers/function_deduction.yaml 174 2 412 403 2 2 2024-03-19 2024-03-28 129281094+james-aung@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/registry/solvers/bluff.yaml 80 2 462 403 2 2 2024-01-29 2024-03-28 junshern@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/registry/solvers/together.yaml 85 2 409 403 2 2 2024-03-22 2024-03-28 giulio.starace@gmail.com oliver.jaffe@hotmail.co.uk evals/registry/solvers/self_prompting.yaml 96 2 462 403 2 2 2024-01-29 2024-03-28 junshern@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/registry/solvers/skill_acquisition.yaml 267 2 412 403 2 2 2024-03-19 2024-03-28 inwaves@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/registry/solvers/twenty_questions.yaml 75 2 412 403 2 2 2024-03-19 2024-03-28 inwaves@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/registry/solvers/cant_do_that_anymore.yaml 16 2 412 403 2 1 2024-03-19 2024-03-28 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/registry/solvers/identifying_variables.yaml 4 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/registry/solvers/anthropic.yaml 90 1 410 410 1 1 2024-03-21 2024-03-21 giulio.starace@gmail.com giulio.starace@gmail.com evals/registry/solvers/hr-ml-agent-bench.yaml 37 2 410 403 2 2 2024-03-21 2024-03-28 danesherbs@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/registry/solvers/theory_of_mind.yaml 394 3 462 403 3 2 2024-01-29 2024-03-28 junshern@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/registry/solvers/multistep_web_tasks.yaml 56 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/solvers/already_said_that.yaml 75 2 412 403 2 2 2024-03-19 2024-03-28 giulio.starace@gmail.com oliver.jaffe@hotmail.co.uk evals/registry/solvers/error_recovery.yaml 33 2 412 403 2 1 2024-03-19 2024-03-28 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/registry/solvers/gemini.yaml 15 1 405 405 1 1 2024-03-26 2024-03-26 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/registry/solvers/sandbagging.yaml 109 1 462 462 1 1 2024-01-29 2024-01-29 junshern@users.noreply.github.com junshern@users.noreply.github.com evals/registry/solvers/incontext_rl.yaml 24 2 412 403 2 2 2024-03-19 2024-03-28 129281094+james-aung@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/registry/solvers/defaults.yaml 294 3 462 403 3 2 2024-01-29 2024-03-28 junshern@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/registry/solvers/make-me-pay.yaml 101 2 462 403 2 2 2024-01-29 2024-03-28 junshern@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/registry/data/hindi_words/samples.jsonl 3 1 710 710 1 1 2023-05-26 2023-05-26 36335769+0x34d@users.noreply.github.com 36335769+0x34d@users.noreply.github.com evals/registry/data/integer-sequence-predictions/obscure-sequences.jsonl 3 1 719 719 1 1 2023-05-17 2023-05-17 davehdorzback@gmail.com davehdorzback@gmail.com evals/registry/data/integer-sequence-predictions/misc-and-recent-sequences.jsonl 3 1 719 719 1 1 2023-05-17 2023-05-17 davehdorzback@gmail.com davehdorzback@gmail.com evals/registry/data/integer-sequence-predictions/samples.jsonl 3 1 719 719 1 1 2023-05-17 2023-05-17 davehdorzback@gmail.com davehdorzback@gmail.com evals/registry/data/integer-sequence-predictions/notable-sequences.jsonl 3 1 719 719 1 1 2023-05-17 2023-05-17 davehdorzback@gmail.com davehdorzback@gmail.com evals/registry/data/dutch-lexicon/samples.jsonl 3 2 744 698 2 2 2023-04-22 2023-06-07 riedel777@gmail.com laszlo.vandenhoek@gmail.com evals/registry/data/chinese-lantern-riddles/samples.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 50411747+chenzhao44@users.noreply.github.com 50411747+chenzhao44@users.noreply.github.com evals/registry/data/reasoning_with_contradictory_statements/samples.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 rishadzzzz@gmail.com rishadzzzz@gmail.com evals/registry/data/invert_word_wise/invert.jsonl 3 1 714 714 1 1 2023-05-22 2023-05-22 38587927+ach-in@users.noreply.github.com 38587927+ach-in@users.noreply.github.com evals/registry/data/next-val-series/next-val-series.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 36852564+hmzakhalid@users.noreply.github.com 36852564+hmzakhalid@users.noreply.github.com evals/registry/data/sort_numeric/samples.jsonl 3 1 740 740 1 1 2023-04-26 2023-04-26 albertgozzi@gmail.com albertgozzi@gmail.com evals/registry/data/thirty_six_stratagems/samples.jsonl 3 1 662 662 1 1 2023-07-13 2023-07-13 20484971+cookfish@users.noreply.github.com 20484971+cookfish@users.noreply.github.com evals/registry/data/korean_yaminjeongeum/samples.jsonl 3 1 700 700 1 1 2023-06-05 2023-06-05 penandlim@gmail.com penandlim@gmail.com evals/registry/data/shared_border/samples.jsonl 3 1 712 712 1 1 2023-05-24 2023-05-24 paulgb@gmail.com paulgb@gmail.com evals/registry/data/code_combination/samples.jsonl 3 1 700 700 1 1 2023-06-05 2023-06-05 psingley@gmail.com psingley@gmail.com evals/registry/data/non-compound-names/samples.jsonl 3 1 704 704 1 1 2023-06-01 2023-06-01 jeremym@allenai.org jeremym@allenai.org evals/registry/data/non-compound-names/samples_meta.jsonl 3 1 704 704 1 1 2023-06-01 2023-06-01 jeremym@allenai.org jeremym@allenai.org evals/registry/data/convert-hex-hsl-lightness/samples.jsonl 3 1 776 776 1 1 2023-03-21 2023-03-21 harley@hturan.com harley@hturan.com evals/registry/data/hebrew_plurals/samples.jsonl 3 1 671 671 1 1 2023-07-04 2023-07-04 59704420+relvok@users.noreply.github.com 59704420+relvok@users.noreply.github.com evals/registry/data/japanese_mahjong_discard_tile/samples.jsonl 3 1 677 677 1 1 2023-06-28 2023-06-28 mauryskull@gmail.com mauryskull@gmail.com evals/registry/data/shape_in_shape/shape_in_shape.jsonl 3 1 719 719 1 1 2023-05-17 2023-05-17 70836043+pawel-krzych@users.noreply.github.com 70836043+pawel-krzych@users.noreply.github.com evals/registry/data/icelandic-inflection-medium/samples.jsonl 3 1 556 556 1 1 2023-10-27 2023-10-27 vthorsteinsson@users.noreply.github.com vthorsteinsson@users.noreply.github.com evals/registry/data/error_recovery/medium.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/registry/data/error_recovery/small.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/registry/data/error_recovery/main.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/registry/data/decrypt_caesar_cipher/samples.jsonl 3 1 776 776 1 1 2023-03-21 2023-03-21 me@mattfalconer.com me@mattfalconer.com evals/registry/data/svg_alphabet/samples.jsonl 3 1 671 671 1 1 2023-07-04 2023-07-04 127973459+tudoratlumiai@users.noreply.github.com 127973459+tudoratlumiai@users.noreply.github.com evals/registry/data/belarusian_word_analogy_inflection/samples.jsonl 3 1 662 662 1 1 2023-07-13 2023-07-13 50818265+somerandomguyontheweb@users.noreply.github.com 50818265+somerandomguyontheweb@users.noreply.github.com evals/registry/data/medmcqa/convert.js 44 1 744 744 1 1 2023-04-22 2023-04-22 shuriken209master@googlemail.com shuriken209master@googlemail.com evals/registry/data/medmcqa/samples.jsonl 3 1 744 744 1 1 2023-04-22 2023-04-22 shuriken209master@googlemail.com shuriken209master@googlemail.com evals/registry/data/code_progress/samples.jsonl 3 1 677 677 1 1 2023-06-28 2023-06-28 danielstrizhevsky@gmail.com danielstrizhevsky@gmail.com evals/registry/data/finance_calc/samples.jsonl 3 1 662 662 1 1 2023-07-13 2023-07-13 gondek.christopher@gmail.com gondek.christopher@gmail.com evals/registry/data/recurrence-relation/samples.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 omarhishamk@gmail.com omarhishamk@gmail.com evals/registry/data/korean-postposition/samples.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 lena.h.hong@gmail.com lena.h.hong@gmail.com evals/registry/data/countries/samples.jsonl 3 1 706 706 1 1 2023-05-30 2023-05-30 76214963+rxfxt@users.noreply.github.com 76214963+rxfxt@users.noreply.github.com evals/registry/data/relative_orientations/samples.jsonl 3 1 671 671 1 1 2023-07-04 2023-07-04 dbautista.cs@gmail.com dbautista.cs@gmail.com evals/registry/data/vigenere/samples.jsonl 3 1 710 710 1 1 2023-05-26 2023-05-26 grahamzemel@gmail.com grahamzemel@gmail.com evals/registry/data/dutch-rhymes/samples.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 jonathan@verhe.es jonathan@verhe.es evals/registry/data/find-letter/samples.jsonl 3 1 713 713 1 1 2023-05-23 2023-05-23 u.sivasweatha@gmail.com u.sivasweatha@gmail.com evals/registry/data/rare-and-loanwords-dutch-lexicon/samples.jsonl 3 1 700 700 1 1 2023-06-05 2023-06-05 135169801+riskablebe@users.noreply.github.com 135169801+riskablebe@users.noreply.github.com evals/registry/data/food/samples.jsonl 3 1 711 711 1 1 2023-05-25 2023-05-25 christopherb737@gmail.com christopherb737@gmail.com evals/registry/data/spanish-lexicon/samples.jsonl 3 1 710 710 1 1 2023-05-26 2023-05-26 carlos@domintia.com carlos@domintia.com evals/registry/data/unsolvable_questions/convert.js 51 1 710 710 1 1 2023-05-26 2023-05-26 lucasklaassen@users.noreply.github.com lucasklaassen@users.noreply.github.com evals/registry/data/unsolvable_questions/findFailures.js 43 1 710 710 1 1 2023-05-26 2023-05-26 lucasklaassen@users.noreply.github.com lucasklaassen@users.noreply.github.com evals/registry/data/unsolvable_questions/samples.jsonl 3 1 710 710 1 1 2023-05-26 2023-05-26 lucasklaassen@users.noreply.github.com lucasklaassen@users.noreply.github.com evals/registry/data/coq-editing/samples.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 jasongross9@gmail.com jasongross9@gmail.com evals/registry/data/coq-editing/labeled-samples.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 jasongross9@gmail.com jasongross9@gmail.com evals/registry/data/medication_dose/samples.jsonl 3 1 698 698 1 1 2023-06-07 2023-06-07 130315355+mickaw2@users.noreply.github.com 130315355+mickaw2@users.noreply.github.com evals/registry/data/chinese_chu_ci/samples.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 arvinx@foxmail.com arvinx@foxmail.com evals/registry/data/nepali_numerals/samples.jsonl 3 1 677 677 1 1 2023-06-28 2023-06-28 nepalsamyok@gmail.com nepalsamyok@gmail.com evals/registry/data/matrix_mult_rows/samples.jsonl 3 1 710 710 1 1 2023-05-26 2023-05-26 71815905+javrtg@users.noreply.github.com 71815905+javrtg@users.noreply.github.com evals/registry/data/belarusian_russian_translation/samples.jsonl 3 1 700 700 1 1 2023-06-05 2023-06-05 50818265+somerandomguyontheweb@users.noreply.github.com 50818265+somerandomguyontheweb@users.noreply.github.com evals/registry/data/russian-verse/samples.jsonl 3 1 698 698 1 1 2023-06-07 2023-06-07 halonazar1997@gmail.com halonazar1997@gmail.com evals/registry/data/number_reading/number_reading.jsonl 3 1 768 768 1 1 2023-03-29 2023-03-29 benjaminliu.eecs@gmail.com benjaminliu.eecs@gmail.com evals/registry/data/chinese_hard_translations/samples.jsonl 3 1 691 691 1 1 2023-06-14 2023-06-14 nicognaw@outlook.com nicognaw@outlook.com evals/registry/data/product-ie/zeroshot/product_ie_zero_shot_samples.jsonl 3 1 634 634 1 1 2023-08-10 2023-08-10 4548970+abrinkmann@users.noreply.github.com 4548970+abrinkmann@users.noreply.github.com evals/registry/data/product-ie/fewshot/product_ie_one_shot_samples.jsonl 3 1 634 634 1 1 2023-08-10 2023-08-10 4548970+abrinkmann@users.noreply.github.com 4548970+abrinkmann@users.noreply.github.com evals/registry/data/financial-derivatives/questions.jsonl 3 1 706 706 1 1 2023-05-30 2023-05-30 hidemi@gmail.com hidemi@gmail.com evals/registry/data/map-electronic-component-part-to-fact/samples.jsonl 3 2 782 781 2 2 2023-03-15 2023-03-16 omattos@gmail.com 120423412+andrew-openai@users.noreply.github.com evals/registry/data/game_theory/samples.jsonl 3 1 704 704 1 1 2023-06-01 2023-06-01 phelps-sg@users.noreply.github.com phelps-sg@users.noreply.github.com evals/registry/data/german-part-of-speech/buildDataDe.py 69 2 704 587 2 2 2023-06-01 2023-09-26 vasco@piranhafleisch.de bomarni@googlemail.com evals/registry/data/german-part-of-speech/samples.jsonl 3 1 704 704 1 1 2023-06-01 2023-06-01 vasco@piranhafleisch.de vasco@piranhafleisch.de evals/registry/data/german-part-of-speech/parsePosDe.py 172 2 704 587 2 2 2023-06-01 2023-09-26 vasco@piranhafleisch.de bomarni@googlemail.com evals/registry/data/turkish-exams-qa/samples.jsonl 3 1 615 615 1 1 2023-08-29 2023-08-29 135200318+samta-kamboj@users.noreply.github.com 135200318+samta-kamboj@users.noreply.github.com evals/registry/data/probability_questions/probability_questions.jsonl 3 1 719 719 1 1 2023-05-17 2023-05-17 101657559+steven-luabase@users.noreply.github.com 101657559+steven-luabase@users.noreply.github.com evals/registry/data/macedonian-exams-qa/samples.jsonl 3 1 615 615 1 1 2023-08-29 2023-08-29 135200318+samta-kamboj@users.noreply.github.com 135200318+samta-kamboj@users.noreply.github.com evals/registry/data/bias_detection/samples.jsonl 3 1 662 662 1 1 2023-07-13 2023-07-13 131893786+domenicomireles@users.noreply.github.com 131893786+domenicomireles@users.noreply.github.com evals/registry/data/sandbagging/samples-all-large.jsonl 3 1 537 537 1 1 2023-11-15 2023-11-15 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/registry/data/sandbagging/samples-ast.jsonl 3 1 537 537 1 1 2023-11-15 2023-11-15 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/registry/data/sandbagging/samples-non-ast.jsonl 3 1 537 537 1 1 2023-11-15 2023-11-15 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/registry/data/sandbagging/samples-all.jsonl 3 1 537 537 1 1 2023-11-15 2023-11-15 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/registry/data/ascii-digit-recognition/samples.jsonl 3 1 691 691 1 1 2023-06-14 2023-06-14 52069185+dddraxxx@users.noreply.github.com 52069185+dddraxxx@users.noreply.github.com evals/registry/data/spanish-exams-qa/samples.jsonl 3 1 615 615 1 1 2023-08-29 2023-08-29 135200318+samta-kamboj@users.noreply.github.com 135200318+samta-kamboj@users.noreply.github.com evals/registry/data/complex-analogies-en-ru/samples.jsonl 3 1 705 705 1 1 2023-05-31 2023-05-31 karinageneraly@gmail.com karinageneraly@gmail.com evals/registry/data/brazilian_laws/samples.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 lucianosb@users.noreply.github.com lucianosb@users.noreply.github.com evals/registry/data/find-thirukkural/samples.jsonl 3 1 714 714 1 1 2023-05-22 2023-05-22 u.sivasweatha@gmail.com u.sivasweatha@gmail.com evals/registry/data/italian_big_math_expression/samples.jsonl 3 1 662 662 1 1 2023-07-13 2023-07-13 38102850+danielepoterti@users.noreply.github.com 38102850+danielepoterti@users.noreply.github.com evals/registry/data/tetris/tetris.jsonl 3 1 715 715 1 1 2023-05-21 2023-05-21 sandmann@codedata.solutions sandmann@codedata.solutions evals/registry/data/raven-matrices/symbolic/distribute_nine.jsonl 3 1 697 697 1 1 2023-06-08 2023-06-08 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/raven-matrices/symbolic/center_single.jsonl 3 1 697 697 1 1 2023-06-08 2023-06-08 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/raven-matrices/symbolic/up_center_single_down_center_single.jsonl 3 1 697 697 1 1 2023-06-08 2023-06-08 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/raven-matrices/symbolic/in_distribute_four_out_center_single.jsonl 3 1 697 697 1 1 2023-06-08 2023-06-08 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/raven-matrices/symbolic/distribute_four.jsonl 3 1 697 697 1 1 2023-06-08 2023-06-08 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/raven-matrices/symbolic/left_center_single_right_center_single.jsonl 3 1 697 697 1 1 2023-06-08 2023-06-08 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/raven-matrices/symbolic/in_center_single_out_center_single.jsonl 3 1 697 697 1 1 2023-06-08 2023-06-08 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/raven-matrices/text/distribute_nine.jsonl 3 1 697 697 1 1 2023-06-08 2023-06-08 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/raven-matrices/text/center_single.jsonl 3 1 697 697 1 1 2023-06-08 2023-06-08 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/raven-matrices/text/up_center_single_down_center_single.jsonl 3 1 697 697 1 1 2023-06-08 2023-06-08 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/raven-matrices/text/in_distribute_four_out_center_single.jsonl 3 1 697 697 1 1 2023-06-08 2023-06-08 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/raven-matrices/text/distribute_four.jsonl 3 1 697 697 1 1 2023-06-08 2023-06-08 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/raven-matrices/text/left_center_single_right_center_single.jsonl 3 1 697 697 1 1 2023-06-08 2023-06-08 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/raven-matrices/text/in_center_single_out_center_single.jsonl 3 1 697 697 1 1 2023-06-08 2023-06-08 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/raven-matrices/symbolic-open/distribute_nine.jsonl 3 1 697 697 1 1 2023-06-08 2023-06-08 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/raven-matrices/symbolic-open/center_single.jsonl 3 1 697 697 1 1 2023-06-08 2023-06-08 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/raven-matrices/symbolic-open/up_center_single_down_center_single.jsonl 3 1 697 697 1 1 2023-06-08 2023-06-08 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/raven-matrices/symbolic-open/in_distribute_four_out_center_single.jsonl 3 1 697 697 1 1 2023-06-08 2023-06-08 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/raven-matrices/symbolic-open/distribute_four.jsonl 3 1 697 697 1 1 2023-06-08 2023-06-08 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/raven-matrices/symbolic-open/left_center_single_right_center_single.jsonl 3 1 697 697 1 1 2023-06-08 2023-06-08 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/raven-matrices/symbolic-open/in_center_single_out_center_single.jsonl 3 1 697 697 1 1 2023-06-08 2023-06-08 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/raven-matrices/text-open/distribute_nine.jsonl 3 1 697 697 1 1 2023-06-08 2023-06-08 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/raven-matrices/text-open/center_single.jsonl 3 1 697 697 1 1 2023-06-08 2023-06-08 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/raven-matrices/text-open/up_center_single_down_center_single.jsonl 3 1 697 697 1 1 2023-06-08 2023-06-08 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/raven-matrices/text-open/in_distribute_four_out_center_single.jsonl 3 1 697 697 1 1 2023-06-08 2023-06-08 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/raven-matrices/text-open/distribute_four.jsonl 3 1 697 697 1 1 2023-06-08 2023-06-08 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/raven-matrices/text-open/left_center_single_right_center_single.jsonl 3 1 697 697 1 1 2023-06-08 2023-06-08 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/raven-matrices/text-open/in_center_single_out_center_single.jsonl 3 1 697 697 1 1 2023-06-08 2023-06-08 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/arithmetical_puzzles/arithmetical_puzzles.jsonl 3 1 710 710 1 1 2023-05-26 2023-05-26 l.malmqvist@gmail.com l.malmqvist@gmail.com evals/registry/data/hebrew_homophones/samples.jsonl 3 1 671 671 1 1 2023-07-04 2023-07-04 59704420+relvok@users.noreply.github.com 59704420+relvok@users.noreply.github.com evals/registry/data/music_theory_scale_modes/samples.jsonl 3 1 711 711 1 1 2023-05-25 2023-05-25 21stcenturydigitaljeff@gmail.com 21stcenturydigitaljeff@gmail.com evals/registry/data/superficialpatterns/samples.jsonl 3 1 712 712 1 1 2023-05-24 2023-05-24 hholt1@protonmail.com hholt1@protonmail.com evals/registry/data/beam_analysis/beam-analysis.jsonl 3 1 705 705 1 1 2023-05-31 2023-05-31 jamesphillipturpin@gmail.com jamesphillipturpin@gmail.com evals/registry/data/chess/match.jsonl 3 1 776 776 1 1 2023-03-21 2023-03-21 t.zehle@gmail.com t.zehle@gmail.com evals/registry/data/dna_melting_calculation/samples.jsonl 3 1 711 711 1 1 2023-05-25 2023-05-25 isaacbeing@gmail.com isaacbeing@gmail.com evals/registry/data/rhetorical_devices/samples.jsonl 3 1 706 706 1 1 2023-05-30 2023-05-30 sirwesleybarlow@gmail.com sirwesleybarlow@gmail.com evals/registry/data/stock_options/stock_options_iron_condor_spread.jsonl 3 1 770 770 1 1 2023-03-27 2023-03-27 troydcalandra@gmail.com troydcalandra@gmail.com evals/registry/data/stock_options/stock_options_bear_call_spread.jsonl 3 1 770 770 1 1 2023-03-27 2023-03-27 troydcalandra@gmail.com troydcalandra@gmail.com evals/registry/data/stock_options/stock_options_inverse_iron_condor_spread.jsonl 3 1 770 770 1 1 2023-03-27 2023-03-27 troydcalandra@gmail.com troydcalandra@gmail.com evals/registry/data/stock_options/stock_option_terms_iron_condor_spread.jsonl 3 1 770 770 1 1 2023-03-27 2023-03-27 troydcalandra@gmail.com troydcalandra@gmail.com evals/registry/data/stock_options/stock_option_terms_bull_call_spread.jsonl 3 1 770 770 1 1 2023-03-27 2023-03-27 troydcalandra@gmail.com troydcalandra@gmail.com evals/registry/data/stock_options/stock_options_bull_call_spread.jsonl 3 1 770 770 1 1 2023-03-27 2023-03-27 troydcalandra@gmail.com troydcalandra@gmail.com evals/registry/data/stock_options/stock_option_terms_iron_butterfly_spread.jsonl 3 1 770 770 1 1 2023-03-27 2023-03-27 troydcalandra@gmail.com troydcalandra@gmail.com evals/registry/data/stock_options/stock_options_inverse_iron_butterfly_spread.jsonl 3 1 770 770 1 1 2023-03-27 2023-03-27 troydcalandra@gmail.com troydcalandra@gmail.com evals/registry/data/stock_options/stock_options_iron_butterfly_spread.jsonl 3 1 770 770 1 1 2023-03-27 2023-03-27 troydcalandra@gmail.com troydcalandra@gmail.com evals/registry/data/stock_options/stock_option_terms_inverse_iron_condor_spread.jsonl 3 1 770 770 1 1 2023-03-27 2023-03-27 troydcalandra@gmail.com troydcalandra@gmail.com evals/registry/data/stock_options/stock_option_terms_inverse_iron_butterfly_spread.jsonl 3 1 770 770 1 1 2023-03-27 2023-03-27 troydcalandra@gmail.com troydcalandra@gmail.com evals/registry/data/stock_options/stock_option_terms_bear_call_spread.jsonl 3 1 770 770 1 1 2023-03-27 2023-03-27 troydcalandra@gmail.com troydcalandra@gmail.com evals/registry/data/korean-consonant-vowel-combination/samples.jsonl 3 1 712 712 1 1 2023-05-24 2023-05-24 dennis.hong@kakaocorp.com dennis.hong@kakaocorp.com evals/registry/data/abstract-causal-reasoning/symbolic_samples.jsonl 3 1 700 700 1 1 2023-06-05 2023-06-05 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/abstract-causal-reasoning/text_samples.jsonl 3 1 700 700 1 1 2023-06-05 2023-06-05 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/chinese_poem/samples.jsonl 3 1 710 710 1 1 2023-05-26 2023-05-26 bicheng.cao@gmail.com bicheng.cao@gmail.com evals/registry/data/sql/co_sql.jsonl 3 1 671 671 1 1 2023-07-04 2023-07-04 pybbae@gmail.com pybbae@gmail.com evals/registry/data/sql/spider_sql.jsonl 3 1 745 745 1 1 2023-04-21 2023-04-21 mark@haym.me mark@haym.me evals/registry/data/chess_piece_count/fuzzy_match.jsonl 3 1 781 781 2 2 2023-03-16 2023-03-16 120423412+andrew-openai@users.noreply.github.com jatinparab98@gmail.com evals/registry/data/chinese_homophonic/chinese_homophonic.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 124559520+hello-oscar@users.noreply.github.com 124559520+hello-oscar@users.noreply.github.com evals/registry/data/lunar_calendar/iso_to_lunar_calendar.jsonl 3 1 710 710 1 1 2023-05-26 2023-05-26 132530236+clearlyloc@users.noreply.github.com 132530236+clearlyloc@users.noreply.github.com evals/registry/data/lunar_calendar/lunar_calendar_to_iso.jsonl 3 1 710 710 1 1 2023-05-26 2023-05-26 132530236+clearlyloc@users.noreply.github.com 132530236+clearlyloc@users.noreply.github.com evals/registry/data/directions/samples.jsonl 3 1 712 712 1 1 2023-05-24 2023-05-24 rohan.m.kshirsagar@gmail.com rohan.m.kshirsagar@gmail.com evals/registry/data/pararule-plus-multi-step-deductive-reasoning/pararule-plus-multi-step-deductive-reasoning.jsonl 3 1 709 709 1 1 2023-05-27 2023-05-27 741150372@qq.com 741150372@qq.com evals/registry/data/numbers_game/samples.jsonl 3 1 706 706 1 1 2023-05-30 2023-05-30 134487556+ivafractal@users.noreply.github.com 134487556+ivafractal@users.noreply.github.com evals/registry/data/seating_arrangements/samples.jsonl 3 1 710 710 1 1 2023-05-26 2023-05-26 danielsj9@gmail.com danielsj9@gmail.com evals/registry/data/ascii_wordart/ascii_wordart.jsonl 3 1 721 721 1 1 2023-05-15 2023-05-15 61651096+derewah@users.noreply.github.com 61651096+derewah@users.noreply.github.com evals/registry/data/job_listing_title_for_a_caregiver_in_japan/samples.jsonl 3 1 744 744 1 1 2023-04-22 2023-04-22 tt@hcmj.biz tt@hcmj.biz evals/registry/data/rubiks-colors/samples.jsonl 3 1 717 717 1 1 2023-05-19 2023-05-19 zaidhaan03@gmail.com zaidhaan03@gmail.com evals/registry/data/chinese_zodiac/samples.jsonl 3 1 700 700 1 1 2023-06-05 2023-06-05 exjang0@gmail.com exjang0@gmail.com evals/registry/data/poker_hand_ranks/full_samples.jsonl 3 1 775 775 1 1 2023-03-22 2023-03-22 54050333+msilva-00@users.noreply.github.com 54050333+msilva-00@users.noreply.github.com evals/registry/data/polish-lexicon/samples.jsonl 3 1 705 705 1 1 2023-05-31 2023-05-31 rafalzawadzki@users.noreply.github.com rafalzawadzki@users.noreply.github.com evals/registry/data/bulgarian-lexicon/samples.jsonl 3 1 768 768 1 1 2023-03-29 2023-03-29 mdatsev@users.noreply.github.com mdatsev@users.noreply.github.com evals/registry/data/sindarin_fluency/sindarin_nouns.jsonl 3 1 698 698 1 1 2023-06-07 2023-06-07 aaron@aaronsmith.tv aaron@aaronsmith.tv evals/registry/data/GPT-model-text-detection/samples.jsonl 3 1 671 671 1 1 2023-07-04 2023-07-04 udaykumaradusumilli97@gmail.com udaykumaradusumilli97@gmail.com evals/registry/data/backgammon/generate_samples.ipynb 1349 1 683 683 1 1 2023-06-22 2023-06-22 bakebrain@gmail.com bakebrain@gmail.com evals/registry/data/backgammon/backgammon-can-hit.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 bakebrain@gmail.com bakebrain@gmail.com evals/registry/data/backgammon/backgammon-illegal-move.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 bakebrain@gmail.com bakebrain@gmail.com evals/registry/data/italian-new-words/samples.jsonl 3 1 706 706 1 1 2023-05-30 2023-05-30 sdiviney@gmail.com sdiviney@gmail.com evals/registry/data/belarusian_grammar/samples.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 50818265+somerandomguyontheweb@users.noreply.github.com 50818265+somerandomguyontheweb@users.noreply.github.com evals/registry/data/ru_rhyming_phrases/samples.jsonl 3 1 704 704 1 1 2023-06-01 2023-06-01 36363097+latand@users.noreply.github.com 36363097+latand@users.noreply.github.com evals/registry/data/brazilian-lexicon/samples.jsonl 3 1 755 755 1 1 2023-04-11 2023-04-11 32521301+mreismendes@users.noreply.github.com 32521301+mreismendes@users.noreply.github.com evals/registry/data/internal_representations/samples.jsonl 3 1 706 706 1 1 2023-05-30 2023-05-30 syn@zbeacon.org syn@zbeacon.org evals/registry/data/polish-exams-qa/samples.jsonl 3 1 615 615 1 1 2023-08-29 2023-08-29 135200318+samta-kamboj@users.noreply.github.com 135200318+samta-kamboj@users.noreply.github.com evals/registry/data/logic-riddles/samples.jsonl 3 1 700 700 1 1 2023-06-05 2023-06-05 55913678+cholotook@users.noreply.github.com 55913678+cholotook@users.noreply.github.com evals/registry/data/swedish_sat/samples.jsonl 3 1 710 710 1 1 2023-05-26 2023-05-26 justus.karlsson@hotmail.se justus.karlsson@hotmail.se evals/registry/data/reverse_string/reverse_string.jsonl 3 1 783 783 2 2 2023-03-14 2023-03-14 120423412+andrew-openai@users.noreply.github.com logan@openai.com evals/registry/data/cube-pack/samples.jsonl 3 2 782 781 3 2 2023-03-15 2023-03-16 emil@radix.ai emil@radix.ai evals/registry/data/vietnamese-exams-qa/samples.jsonl 3 1 615 615 1 1 2023-08-29 2023-08-29 135200318+samta-kamboj@users.noreply.github.com 135200318+samta-kamboj@users.noreply.github.com evals/registry/data/theory_of_mind/hitom/hitom-multiple-choice.jsonl 3 1 418 418 1 1 2024-03-13 2024-03-13 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/registry/data/theory_of_mind/hitom/hitom.jsonl 3 1 418 418 1 1 2024-03-13 2024-03-13 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/registry/data/russian-english-homonym-context-resolution/samples.jsonl 3 1 704 704 1 1 2023-06-01 2023-06-01 10080307+gradientsky@users.noreply.github.com 10080307+gradientsky@users.noreply.github.com evals/registry/data/italian-exams-qa/samples.jsonl 3 1 615 615 1 1 2023-08-29 2023-08-29 135200318+samta-kamboj@users.noreply.github.com 135200318+samta-kamboj@users.noreply.github.com evals/registry/data/aime_evaluation/samples.jsonl 3 1 718 718 1 1 2023-05-18 2023-05-18 emilymu@mit.edu emilymu@mit.edu evals/registry/data/viewport_to_grid_size/samples.jsonl 3 1 671 671 1 1 2023-07-04 2023-07-04 agoldsmith@alumni.scu.edu agoldsmith@alumni.scu.edu evals/registry/data/math_logic_operations/samples.jsonl 3 1 691 691 1 1 2023-06-14 2023-06-14 96959673+nathanstew7@users.noreply.github.com 96959673+nathanstew7@users.noreply.github.com evals/registry/data/portuguese-syllable-count/samples.jsonl 3 1 710 710 1 1 2023-05-26 2023-05-26 tucalipe@gmail.com tucalipe@gmail.com evals/registry/data/numerical-cabbala-casanova/samples.jsonl 3 1 677 677 1 1 2023-06-28 2023-06-28 giacomoran@gmail.com giacomoran@gmail.com evals/registry/data/compare-countries-area/samples.jsonl 3 1 744 744 1 1 2023-04-22 2023-04-22 69503759+yohei0731@users.noreply.github.com 69503759+yohei0731@users.noreply.github.com evals/registry/data/algebra_word_problems/samples.jsonl 3 1 745 745 1 1 2023-04-21 2023-04-21 alextraul@gmail.com alextraul@gmail.com evals/registry/data/reverse-polish-notation/questions.jsonl 3 1 711 711 1 1 2023-05-25 2023-05-25 andrew.prokhorenkov@gmail.com andrew.prokhorenkov@gmail.com evals/registry/data/date-calculator/samples.jsonl 3 1 706 706 1 1 2023-05-30 2023-05-30 45112646+leoliu-xingchi@users.noreply.github.com 45112646+leoliu-xingchi@users.noreply.github.com evals/registry/data/mazes/3x3-mazes.jsonl 3 1 691 691 1 1 2023-06-14 2023-06-14 douglas.monsky@gmail.com douglas.monsky@gmail.com evals/registry/data/mazes/nxn_maze_eval_generator.py 162 2 691 587 2 2 2023-06-14 2023-09-26 douglas.monsky@gmail.com bomarni@googlemail.com evals/registry/data/mazes/4x4-mazes.jsonl 3 1 691 691 1 1 2023-06-14 2023-06-14 douglas.monsky@gmail.com douglas.monsky@gmail.com evals/registry/data/mazes/4x4-mazes-singlemove.jsonl 3 1 691 691 1 1 2023-06-14 2023-06-14 douglas.monsky@gmail.com douglas.monsky@gmail.com evals/registry/data/mazes/3x3-mazes-singlemove.jsonl 3 1 691 691 1 1 2023-06-14 2023-06-14 douglas.monsky@gmail.com douglas.monsky@gmail.com evals/registry/data/mazes/10x10-mazes-singlemove.jsonl 3 1 691 691 1 1 2023-06-14 2023-06-14 douglas.monsky@gmail.com douglas.monsky@gmail.com evals/registry/data/mazes/10x10-mazes.jsonl 3 1 691 691 1 1 2023-06-14 2023-06-14 douglas.monsky@gmail.com douglas.monsky@gmail.com evals/registry/data/Japanese_onomatopoeia/samples.jsonl 3 1 691 691 1 1 2023-06-14 2023-06-14 sap-csd@a-c-japan.com sap-csd@a-c-japan.com evals/registry/data/swedish-spelling/samples.jsonl 3 1 755 755 1 1 2023-04-11 2023-04-11 129839173+eellofgren@users.noreply.github.com 129839173+eellofgren@users.noreply.github.com evals/registry/data/balance_chemical_equation/samples.jsonl 3 2 781 715 3 2 2023-03-16 2023-05-21 120423412+andrew-openai@users.noreply.github.com scruelt@hotmail.com evals/registry/data/which_is_heavier/which_is_heavier.jsonl 3 1 770 770 1 1 2023-03-27 2023-03-27 scottlanyon@gmail.com scottlanyon@gmail.com evals/registry/data/mapping_to_matricies/data_generator.py 30 2 698 587 2 2 2023-06-07 2023-09-26 danum7@gmail.com bomarni@googlemail.com evals/registry/data/mapping_to_matricies/samples.jsonl 3 1 698 698 1 1 2023-06-07 2023-06-07 danum7@gmail.com danum7@gmail.com evals/registry/data/hindi_upsc/samples.jsonl 3 1 745 745 1 1 2023-04-21 2023-04-21 shivamd1810@gmail.com shivamd1810@gmail.com evals/registry/data/math_equations/math_equations.jsonl 3 1 662 662 1 1 2023-07-13 2023-07-13 767683+raxityo@users.noreply.github.com 767683+raxityo@users.noreply.github.com evals/registry/data/tracking-shuffled-objects/samples.jsonl 3 1 713 713 1 1 2023-05-23 2023-05-23 google@mryao.org google@mryao.org evals/registry/data/chinese_homonym/samples.jsonl 3 1 698 698 1 1 2023-06-07 2023-06-07 yichenfeng66@gmail.com yichenfeng66@gmail.com evals/registry/data/heart-disease/samples.jsonl 3 1 755 755 1 1 2023-04-11 2023-04-11 nick@clyde.tech nick@clyde.tech evals/registry/data/japanese_driving_license/samples.jsonl 3 1 745 745 1 1 2023-04-21 2023-04-21 60774986+yji5212@users.noreply.github.com 60774986+yji5212@users.noreply.github.com evals/registry/data/osm_mapping/osm_mapping_one_way.jsonl 3 1 556 556 1 1 2023-10-27 2023-10-27 adrianmargin@users.noreply.github.com adrianmargin@users.noreply.github.com evals/registry/data/cricket_situations/samples.jsonl 3 1 705 705 1 1 2023-05-31 2023-05-31 134620553+ai-scale@users.noreply.github.com 134620553+ai-scale@users.noreply.github.com evals/registry/data/premature-conclusions/samples.jsonl 3 1 662 662 1 1 2023-07-13 2023-07-13 138718051+natanaelwf@users.noreply.github.com 138718051+natanaelwf@users.noreply.github.com evals/registry/data/dhammapada-reference/samples.jsonl 3 1 671 671 1 1 2023-07-04 2023-07-04 lance.miyamoto@gmail.com lance.miyamoto@gmail.com evals/registry/data/singapore_data_protection_decisions/samples.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 iamkaiwei@gmail.com iamkaiwei@gmail.com evals/registry/data/comprehensive-graph-reasoning/samples.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 42741744+edmundlaowang@users.noreply.github.com 42741744+edmundlaowang@users.noreply.github.com evals/registry/data/bulgarian-exams-qa/samples.jsonl 3 1 615 615 1 1 2023-08-29 2023-08-29 135200318+samta-kamboj@users.noreply.github.com 135200318+samta-kamboj@users.noreply.github.com evals/registry/data/portuguese-exams-qa/samples.jsonl 3 1 615 615 1 1 2023-08-29 2023-08-29 135200318+samta-kamboj@users.noreply.github.com 135200318+samta-kamboj@users.noreply.github.com evals/registry/data/ral_to_hex/samples.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 nikolasarmstrong@gmail.com nikolasarmstrong@gmail.com evals/registry/data/ner_finance/samples.jsonl 3 1 671 671 1 1 2023-07-04 2023-07-04 anthony@candlestick.ai anthony@candlestick.ai evals/registry/data/german-exams-qa/samples.jsonl 3 1 615 615 1 1 2023-08-29 2023-08-29 135200318+samta-kamboj@users.noreply.github.com 135200318+samta-kamboj@users.noreply.github.com evals/registry/data/formal_logic/formal_logic_expressions.jsonl 3 1 775 775 1 1 2023-03-22 2023-03-22 christopher@wolfram.com christopher@wolfram.com evals/registry/data/wkt_understanding/samples.jsonl 3 1 706 706 1 1 2023-05-30 2023-05-30 vinooganesh@users.noreply.github.com vinooganesh@users.noreply.github.com evals/registry/data/hebrew_talmud_suka/samples.jsonl 3 1 691 691 1 1 2023-06-14 2023-06-14 ysrael@reflectiz.com ysrael@reflectiz.com evals/registry/data/japanese_approval/samples.jsonl 3 1 677 677 1 1 2023-06-28 2023-06-28 omonaotab@gmail.com omonaotab@gmail.com evals/registry/data/infiniteloop-match/infiniteloop-match.jsonl 3 1 777 777 1 1 2023-03-20 2023-03-20 44745172+dottedant-dooz@users.noreply.github.com 44745172+dottedant-dooz@users.noreply.github.com evals/registry/data/manga-translation/pages.jsonl 3 1 768 768 1 1 2023-03-29 2023-03-29 mindful.jt@gmail.com mindful.jt@gmail.com evals/registry/data/manga-translation/panels.jsonl 3 1 768 768 1 1 2023-03-29 2023-03-29 mindful.jt@gmail.com mindful.jt@gmail.com evals/registry/data/manga-translation/bubbles.jsonl 3 1 768 768 1 1 2023-03-29 2023-03-29 mindful.jt@gmail.com mindful.jt@gmail.com evals/registry/data/points_on_line/eval_generator.py 73 1 700 700 1 1 2023-06-05 2023-06-05 aaron@aaronsmith.tv aaron@aaronsmith.tv evals/registry/data/points_on_line/points_on_line.jsonl 3 1 700 700 1 1 2023-06-05 2023-06-05 aaron@aaronsmith.tv aaron@aaronsmith.tv evals/registry/data/2d_movement/samples.jsonl 3 1 710 710 1 1 2023-05-26 2023-05-26 eugene.l.huang@gmail.com eugene.l.huang@gmail.com evals/registry/data/russian_sarcasm/samples.jsonl 3 1 699 699 1 1 2023-06-06 2023-06-06 vtolm@vtolm.com vtolm@vtolm.com evals/registry/data/abstract2title/samples.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 96370219+piupiupiuu@users.noreply.github.com 96370219+piupiupiuu@users.noreply.github.com evals/registry/data/norwegian-rhymes/samples.jsonl 3 1 677 677 1 1 2023-06-28 2023-06-28 137759176+monocle-pastels@users.noreply.github.com 137759176+monocle-pastels@users.noreply.github.com evals/registry/data/self_prompting/samples.jsonl 3 1 537 537 1 1 2023-11-15 2023-11-15 junshern@users.noreply.github.com junshern@users.noreply.github.com evals/registry/data/korean-honorific/samples.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 greenmon@kaist.ac.kr greenmon@kaist.ac.kr evals/registry/data/path_enclosed_area/samples.jsonl 3 1 691 691 1 1 2023-06-14 2023-06-14 ahmedallawi01@gmail.com ahmedallawi01@gmail.com evals/registry/data/imperial_date_to_string/samples.jsonl 3 1 769 769 1 1 2023-03-28 2023-03-28 dd@davisinfo.com dd@davisinfo.com evals/registry/data/russian-lexicon/samples.jsonl 3 1 706 706 1 1 2023-05-30 2023-05-30 gydronik@gmail.com gydronik@gmail.com evals/registry/data/nepali-song-singer/nepali-song-singer.jsonl 3 1 718 718 1 1 2023-05-18 2023-05-18 36022153+oshanoshu@users.noreply.github.com 36022153+oshanoshu@users.noreply.github.com evals/registry/data/hard_russian_computer_science_tasks/samples.jsonl 3 1 634 634 1 1 2023-08-10 2023-08-10 halonazar1997@gmail.com halonazar1997@gmail.com evals/registry/data/turkish_characters/samples.jsonl 3 1 705 705 1 1 2023-05-31 2023-05-31 130087573+cardwiz@users.noreply.github.com 130087573+cardwiz@users.noreply.github.com evals/registry/data/urdu-lexicon/samples.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 usama.anwar09@gmail.com usama.anwar09@gmail.com evals/registry/data/poker_analysis/samples.jsonl 3 1 700 700 1 1 2023-06-05 2023-06-05 douglas.monsky@gmail.com douglas.monsky@gmail.com evals/registry/data/poker_analysis/poker_analysis_sample_generator.py 95 2 700 587 2 2 2023-06-05 2023-09-26 douglas.monsky@gmail.com bomarni@googlemail.com evals/registry/data/determinant/samples.jsonl 3 1 776 776 1 1 2023-03-21 2023-03-21 80975912+vitoraqdev@users.noreply.github.com 80975912+vitoraqdev@users.noreply.github.com evals/registry/data/vintage_phone_keyboard_decode/samples.jsonl 3 1 714 714 1 1 2023-05-22 2023-05-22 touchtheus@gmail.com touchtheus@gmail.com evals/registry/data/day-of-week-from-date/samples.jsonl 3 1 719 719 1 1 2023-05-17 2023-05-17 john@drivecentric.com john@drivecentric.com evals/registry/data/diagrammatic_logic/samples.jsonl 3 1 775 775 1 1 2023-03-22 2023-03-22 freddie.nicholson123@gmail.com freddie.nicholson123@gmail.com evals/registry/data/3d_object_manipulation/samples.jsonl 3 1 662 662 1 1 2023-07-13 2023-07-13 pomichterstash@gmail.com pomichterstash@gmail.com evals/registry/data/anagrams/samples.jsonl 3 1 776 776 1 1 2023-03-21 2023-03-21 97240159+l-mutricy@users.noreply.github.com 97240159+l-mutricy@users.noreply.github.com evals/registry/data/anagrams/fewshot.jsonl 3 1 776 776 1 1 2023-03-21 2023-03-21 97240159+l-mutricy@users.noreply.github.com 97240159+l-mutricy@users.noreply.github.com evals/registry/data/logic-statements/logic-statements.jsonl 3 2 771 770 2 2 2023-03-26 2023-03-27 44057111+kasperkristiansen@users.noreply.github.com 117690718+joe-at-openai@users.noreply.github.com evals/registry/data/nutrition/facts.jsonl 3 1 710 710 1 1 2023-05-26 2023-05-26 blum.stephen@gmail.com blum.stephen@gmail.com evals/registry/data/rock-climbing/samples.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 gavin@meetsoci.com gavin@meetsoci.com evals/registry/data/iambic-pentameter/samples.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 790279+ianonavy@users.noreply.github.com 790279+ianonavy@users.noreply.github.com evals/registry/data/finnish-rhyme/samples.jsonl 3 1 706 706 1 1 2023-05-30 2023-05-30 130182869+ouztsa@users.noreply.github.com 130182869+ouztsa@users.noreply.github.com evals/registry/data/multi-step-equations/samples.jsonl 3 1 744 744 1 1 2023-04-22 2023-04-22 kara@voxel-fox.com kara@voxel-fox.com evals/registry/data/arabic-literature-qa/samples.jsonl 3 1 615 615 1 1 2023-08-29 2023-08-29 135200318+samta-kamboj@users.noreply.github.com 135200318+samta-kamboj@users.noreply.github.com evals/registry/data/belarusian_orthography/samples.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 50818265+somerandomguyontheweb@users.noreply.github.com 50818265+somerandomguyontheweb@users.noreply.github.com evals/registry/data/already_said_that/500_100.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/registry/data/irish_plural_nouns/samples.jsonl 3 1 662 662 1 1 2023-07-13 2023-07-13 68754265+aaronbrennan1@users.noreply.github.com 68754265+aaronbrennan1@users.noreply.github.com evals/registry/data/convert-bwt-num-and-chinese-num/n_to_c_upper_samples_few_shot.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 yichenfeng66@gmail.com yichenfeng66@gmail.com evals/registry/data/convert-bwt-num-and-chinese-num/n_to_c_lower_samples_few_shot.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 yichenfeng66@gmail.com yichenfeng66@gmail.com evals/registry/data/convert-bwt-num-and-chinese-num/c_lower_to_n_samples_few_shot.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 yichenfeng66@gmail.com yichenfeng66@gmail.com evals/registry/data/convert-bwt-num-and-chinese-num/c_upper_to_n_samples_few_shot.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 yichenfeng66@gmail.com yichenfeng66@gmail.com evals/registry/data/belarusian_antonyms/samples.jsonl 3 1 556 556 1 1 2023-10-27 2023-10-27 tanya.shagova@gmail.com tanya.shagova@gmail.com evals/registry/data/Chinese_character_riddles/samples.jsonl 3 1 662 662 1 1 2023-07-13 2023-07-13 71001519+tesla2678@users.noreply.github.com 71001519+tesla2678@users.noreply.github.com evals/registry/data/cardinal-directions/samples.jsonl 3 1 704 704 1 1 2023-06-01 2023-06-01 dbautista.cs@gmail.com dbautista.cs@gmail.com evals/registry/data/hindi_shuddha/samples.jsonl 3 1 710 710 1 1 2023-05-26 2023-05-26 36335769+0x34d@users.noreply.github.com 36335769+0x34d@users.noreply.github.com evals/registry/data/benjaminmoore_to_hex/samples.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 bryanvaz@users.noreply.github.com bryanvaz@users.noreply.github.com evals/registry/data/romanian_homonyms/samples.jsonl 3 1 662 662 1 1 2023-07-13 2023-07-13 mail@adrianapan.com mail@adrianapan.com evals/registry/data/korean-phonetics/samples.jsonl 3 1 693 693 1 1 2023-06-12 2023-06-12 136151309+jaiwonrhi2@users.noreply.github.com 136151309+jaiwonrhi2@users.noreply.github.com evals/registry/data/spanish_feminine_noun_masculine_article/samples.jsonl 3 1 712 712 1 1 2023-05-24 2023-05-24 21stcenturydigitaljeff@gmail.com 21stcenturydigitaljeff@gmail.com evals/registry/data/pattern_identification/samples.v0.jsonl 3 2 782 781 3 2 2023-03-15 2023-03-16 jasonwei@openai.com jasonwei@openai.com evals/registry/data/ballots/samples25.jsonl 3 2 594 507 2 2 2023-09-19 2023-12-15 140545726+ianmckenzie-oai@users.noreply.github.com 129281094+james-aung@users.noreply.github.com evals/registry/data/ballots/samples02.jsonl 3 2 594 507 2 2 2023-09-19 2023-12-15 140545726+ianmckenzie-oai@users.noreply.github.com 129281094+james-aung@users.noreply.github.com evals/registry/data/illinois-law/samples.jsonl 3 1 769 769 1 1 2023-03-28 2023-03-28 seancye@gmail.com seancye@gmail.com evals/registry/data/squares-gpt/square-samples.jsonl 3 1 714 714 1 1 2023-05-22 2023-05-22 38587927+ach-in@users.noreply.github.com 38587927+ach-in@users.noreply.github.com evals/registry/data/french_homonym_and_homograph/samples.jsonl 3 1 671 671 1 1 2023-07-04 2023-07-04 6842725+yannl@users.noreply.github.com 6842725+yannl@users.noreply.github.com evals/registry/data/word_association/related_words_5.jsonl 3 1 671 671 1 1 2023-07-04 2023-07-04 douglas.monsky@gmail.com douglas.monsky@gmail.com evals/registry/data/word_association/related_words_4.jsonl 3 1 671 671 1 1 2023-07-04 2023-07-04 douglas.monsky@gmail.com douglas.monsky@gmail.com evals/registry/data/word_association/corpus_tools/sample_generators.py 154 2 671 587 2 2 2023-07-04 2023-09-26 douglas.monsky@gmail.com bomarni@googlemail.com evals/registry/data/word_association/corpus_tools/logger_config.py 8 2 671 587 2 2 2023-07-04 2023-09-26 douglas.monsky@gmail.com bomarni@googlemail.com evals/registry/data/word_association/corpus_tools/corpus.py 58 2 671 587 2 2 2023-07-04 2023-09-26 douglas.monsky@gmail.com bomarni@googlemail.com evals/registry/data/word_association/corpus_tools/__init__.py 1 1 671 671 1 1 2023-07-04 2023-07-04 douglas.monsky@gmail.com douglas.monsky@gmail.com evals/registry/data/word_association/corpus_tools/validators.py 151 4 671 481 4 4 2023-07-04 2024-01-10 douglas.monsky@gmail.com 140545726+ianmckenzie-oai@users.noreply.github.com evals/registry/data/word_association/corpus_tools/pipelines.py 14 2 671 587 2 2 2023-07-04 2023-09-26 douglas.monsky@gmail.com bomarni@googlemail.com evals/registry/data/word_association/corpus_tools/related_words.py 64 2 671 587 2 2 2023-07-04 2023-09-26 douglas.monsky@gmail.com bomarni@googlemail.com evals/registry/data/word_association/corpus_tools/processor.py 36 2 671 587 2 2 2023-07-04 2023-09-26 douglas.monsky@gmail.com bomarni@googlemail.com evals/registry/data/word_association/related_words_2.jsonl 3 1 671 671 1 1 2023-07-04 2023-07-04 douglas.monsky@gmail.com douglas.monsky@gmail.com evals/registry/data/word_association/related_words_3.jsonl 3 1 671 671 1 1 2023-07-04 2023-07-04 douglas.monsky@gmail.com douglas.monsky@gmail.com evals/registry/data/canto_wu_pronunciation/samples_zero.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 timeroot.alex@gmail.com timeroot.alex@gmail.com evals/registry/data/canto_wu_pronunciation/samples_few.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 timeroot.alex@gmail.com timeroot.alex@gmail.com evals/registry/data/canto_wu_pronunciation/csv_to_json.py 55 2 703 587 2 2 2023-06-02 2023-09-26 timeroot.alex@gmail.com bomarni@googlemail.com evals/registry/data/simple-charting/samples.jsonl 3 1 662 662 1 1 2023-07-13 2023-07-13 daoduyducduong@gmail.com daoduyducduong@gmail.com evals/registry/data/music_theory/music_theory_chord_notes.jsonl 3 1 706 706 1 1 2023-05-30 2023-05-30 steventsao@me.com steventsao@me.com evals/registry/data/music_theory/music_theory_chord_names.jsonl 3 1 706 706 1 1 2023-05-30 2023-05-30 steventsao@me.com steventsao@me.com evals/registry/data/css-selectors/verbal.jsonl 3 1 662 662 1 1 2023-07-13 2023-07-13 ilanharel@gmail.com ilanharel@gmail.com evals/registry/data/css-selectors/explain.jsonl 3 1 662 662 1 1 2023-07-13 2023-07-13 ilanharel@gmail.com ilanharel@gmail.com evals/registry/data/body_movement/body_movement.jsonl 3 1 717 717 1 1 2023-05-19 2023-05-19 30339662+tescao@users.noreply.github.com 30339662+tescao@users.noreply.github.com evals/registry/data/logical_reasoning_letter_series_test/samples.jsonl 3 1 691 691 1 1 2023-06-14 2023-06-14 54538772+hussnainghani@users.noreply.github.com 54538772+hussnainghani@users.noreply.github.com evals/registry/data/naughty_strings/samples.jsonl 3 2 755 711 2 2 2023-04-11 2023-05-25 lucianosb@users.noreply.github.com christopherb737@gmail.com evals/registry/data/naughty_strings/security.jsonl 3 1 755 755 1 1 2023-04-11 2023-04-11 lucianosb@users.noreply.github.com lucianosb@users.noreply.github.com evals/registry/data/ukraine_gec/ukraine_gec_grammar_comparison.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 roman.mashta@gmail.com roman.mashta@gmail.com evals/registry/data/ukraine_gec/ukraine_gec_fluency_style.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 roman.mashta@gmail.com roman.mashta@gmail.com evals/registry/data/ukraine_gec/ukraine_gec_grammar_prep.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 roman.mashta@gmail.com roman.mashta@gmail.com evals/registry/data/ukraine_gec/ukraine_gec_fluency_other.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 roman.mashta@gmail.com roman.mashta@gmail.com evals/registry/data/ukraine_gec/ukraine_gec_grammar_partvoice.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 roman.mashta@gmail.com roman.mashta@gmail.com evals/registry/data/ukraine_gec/ukraine_gec_grammar_number.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 roman.mashta@gmail.com roman.mashta@gmail.com evals/registry/data/ukraine_gec/ukraine_gec_grammar_aspect.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 roman.mashta@gmail.com roman.mashta@gmail.com evals/registry/data/ukraine_gec/ukraine_gec_grammar_tense.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 roman.mashta@gmail.com roman.mashta@gmail.com evals/registry/data/ukraine_gec/ukraine_gec_grammar_ungrammaticalstructure.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 roman.mashta@gmail.com roman.mashta@gmail.com evals/registry/data/ukraine_gec/ukraine_gec_grammar_case.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 roman.mashta@gmail.com roman.mashta@gmail.com evals/registry/data/ukraine_gec/ukraine_gec_fluency_repetition.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 roman.mashta@gmail.com roman.mashta@gmail.com evals/registry/data/ukraine_gec/ukraine_gec_grammar_verbvoice.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 roman.mashta@gmail.com roman.mashta@gmail.com evals/registry/data/ukraine_gec/ukraine_gec_grammar_gender.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 roman.mashta@gmail.com roman.mashta@gmail.com evals/registry/data/ukraine_gec/ukraine_gec_grammar_other.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 roman.mashta@gmail.com roman.mashta@gmail.com evals/registry/data/ukraine_gec/ukraine_gec_grammar_verbaform.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 roman.mashta@gmail.com roman.mashta@gmail.com evals/registry/data/ukraine_gec/ukraine_gec_fluency_calque.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 roman.mashta@gmail.com roman.mashta@gmail.com evals/registry/data/ukraine_gec/ukraine_gec_grammar_conjunction.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 roman.mashta@gmail.com roman.mashta@gmail.com evals/registry/data/ukraine_gec/ukraine_gec_fluency_poorflow.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 roman.mashta@gmail.com roman.mashta@gmail.com evals/registry/data/portuguese-kinship-riddles/samples.jsonl 3 1 690 690 1 1 2023-06-15 2023-06-15 zbu@ezpapel.com zbu@ezpapel.com evals/registry/data/korean_date_counting/samples.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 127706211+jess-hwang@users.noreply.github.com 127706211+jess-hwang@users.noreply.github.com evals/registry/data/belarusian_lexicon/samples.jsonl 3 1 776 776 1 1 2023-03-21 2023-03-21 50818265+somerandomguyontheweb@users.noreply.github.com 50818265+somerandomguyontheweb@users.noreply.github.com evals/registry/data/atpl_exams/samples.jsonl 3 1 711 711 1 1 2023-05-25 2023-05-25 perrosnk@gmail.com perrosnk@gmail.com evals/registry/data/pure_korean/samples.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 68699959+soooim@users.noreply.github.com 68699959+soooim@users.noreply.github.com evals/registry/data/french-lexicon/samples.jsonl 3 1 709 709 1 1 2023-05-27 2023-05-27 mathieuhawry@gmail.com mathieuhawry@gmail.com evals/registry/data/color_theory/complementary.jsonl 3 1 713 713 1 1 2023-05-23 2023-05-23 penandlim@gmail.com penandlim@gmail.com evals/registry/data/consensus_summary/samples.jsonl 3 1 691 691 1 1 2023-06-14 2023-06-14 95278127+ali-consensus@users.noreply.github.com 95278127+ali-consensus@users.noreply.github.com evals/registry/data/greek_nt_manuscripts/codes-sigla-centuries.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 andy@honeyrunsoftware.com andy@honeyrunsoftware.com evals/registry/data/banking77/samples.jsonl 3 1 744 744 1 1 2023-04-22 2023-04-22 ouassim.fari@gmail.com ouassim.fari@gmail.com evals/registry/data/simple-knowledge-mongolian/samples.v0.jsonl 3 1 752 752 1 1 2023-04-14 2023-04-14 joseph.lelic@gmail.com joseph.lelic@gmail.com evals/registry/data/japanese-national-medical-exam02/japanese-national-medical-exam02.jsonl 3 1 704 704 1 1 2023-06-01 2023-06-01 93697462+nakata-daisuke-mb@users.noreply.github.com 93697462+nakata-daisuke-mb@users.noreply.github.com evals/registry/data/chinese_shi_jing/samples.jsonl 3 1 671 671 1 1 2023-07-04 2023-07-04 netsailer@gmail.com netsailer@gmail.com evals/registry/data/human-safety/human-safety.jsonl 3 1 700 700 1 1 2023-06-05 2023-06-05 46403813+bertod@users.noreply.github.com 46403813+bertod@users.noreply.github.com evals/registry/data/chinese-remainder-theorem/samples.jsonl 3 1 662 662 1 1 2023-07-13 2023-07-13 carlos.hellin@uah.es carlos.hellin@uah.es evals/registry/data/cant_do_that_anymore/diagonal_moves_dataset.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/registry/data/cant_do_that_anymore/special_moves_dataset.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/registry/data/cant_do_that_anymore/gpt-4-0314_dataset.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/registry/data/cant_do_that_anymore/gpt-4-0125-preview_dataset.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/registry/data/cant_do_that_anymore/gpt-3.5-turbo-instruct_dataset.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/registry/data/cant_do_that_anymore/gpt-3.5-turbo-0125_dataset.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/registry/data/security_guide/samples.jsonl 3 1 706 706 1 1 2023-05-30 2023-05-30 134000058+gpsandhu23@users.noreply.github.com 134000058+gpsandhu23@users.noreply.github.com evals/registry/data/taxes/samples.jsonl 3 1 770 770 1 1 2023-03-27 2023-03-27 andrewmlu3@gmail.com andrewmlu3@gmail.com evals/registry/data/guess_the_singer/samples.jsonl 3 1 713 713 1 1 2023-05-23 2023-05-23 130565081+yuryrudnitski@users.noreply.github.com 130565081+yuryrudnitski@users.noreply.github.com evals/registry/data/gpt-protocol-buffers/samples.jsonl 3 1 697 697 1 1 2023-06-08 2023-06-08 jdavis@pcprogramming.com jdavis@pcprogramming.com evals/registry/data/bugged_tools/main_small.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/registry/data/bugged_tools/main.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/registry/data/logic_and_probability/logic_and_probability.jsonl 3 1 698 698 1 1 2023-06-07 2023-06-07 135593135+hbvlmedia@users.noreply.github.com 135593135+hbvlmedia@users.noreply.github.com evals/registry/data/building_floorplan/samples.jsonl 3 1 714 714 1 1 2023-05-22 2023-05-22 sjknauer@gmail.com sjknauer@gmail.com evals/registry/data/norwegian-lexicon/samples.jsonl 3 1 706 706 1 1 2023-05-30 2023-05-30 info@dyar.no info@dyar.no evals/registry/data/identifying_variables/balanced_ctrl_vars.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/registry/data/identifying_variables/balanced_hypotheses.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/registry/data/jee-math/samples.jsonl 3 1 714 714 1 1 2023-05-22 2023-05-22 anant@kix.in anant@kix.in evals/registry/data/japanese-itpassport-exam01/japanese-itpassport-exam01.jsonl 3 1 710 710 1 1 2023-05-26 2023-05-26 azutake@users.noreply.github.com azutake@users.noreply.github.com evals/registry/data/logic-container/samples.jsonl 3 1 662 662 1 1 2023-07-13 2023-07-13 onder.secen@gmail.com onder.secen@gmail.com evals/registry/data/categorize_with_distractors/samples.jsonl 3 1 744 744 1 1 2023-04-22 2023-04-22 yuvalshirav@gmail.com yuvalshirav@gmail.com evals/registry/data/interlingual-homograph/samples.jsonl 3 1 677 677 1 1 2023-06-28 2023-06-28 53555762+y-nakamura-github@users.noreply.github.com 53555762+y-nakamura-github@users.noreply.github.com evals/registry/data/connect4/samples.jsonl 3 1 776 776 1 1 2023-03-21 2023-03-21 83553535+kierandon@users.noreply.github.com 83553535+kierandon@users.noreply.github.com evals/registry/data/korean_foreign_words/samples.jsonl 3 1 677 677 1 1 2023-06-28 2023-06-28 pringle0531@gmail.com pringle0531@gmail.com evals/registry/data/alternate_numeral_systems/samples.jsonl 3 1 700 700 1 1 2023-06-05 2023-06-05 matt.lavin@gmail.com matt.lavin@gmail.com evals/registry/data/track_objects/samples.jsonl 3 1 712 712 1 1 2023-05-24 2023-05-24 45925348+christophedc@users.noreply.github.com 45925348+christophedc@users.noreply.github.com evals/registry/data/chinese_ancient_poetry/samples.jsonl 3 1 662 662 1 1 2023-07-13 2023-07-13 jiahaoyu04@gmail.com jiahaoyu04@gmail.com evals/registry/data/count_intersections_polynomial/samples.jsonl 3 1 713 713 1 1 2023-05-23 2023-05-23 63267585+cauvmou@users.noreply.github.com 63267585+cauvmou@users.noreply.github.com evals/registry/data/simple_math/simple_math.jsonl 3 1 698 698 1 1 2023-06-07 2023-06-07 135593135+hbvlmedia@users.noreply.github.com 135593135+hbvlmedia@users.noreply.github.com evals/registry/data/russian_medical/samples.jsonl 3 1 745 745 1 1 2023-04-21 2023-04-21 gydronik@gmail.com gydronik@gmail.com evals/registry/data/japanese-national-medical-exam01/japanese-national-medical-exam01.jsonl 3 1 740 740 1 1 2023-04-26 2023-04-26 93697462+nakata-daisuke-mb@users.noreply.github.com 93697462+nakata-daisuke-mb@users.noreply.github.com evals/registry/data/hebrew_bible/samples.jsonl 3 1 704 704 1 1 2023-06-01 2023-06-01 ophir.ido@gmail.com ophir.ido@gmail.com evals/registry/data/context-free-grammar/samples.jsonl 3 1 698 698 1 1 2023-06-07 2023-06-07 135289321+horizonauto@users.noreply.github.com 135289321+horizonauto@users.noreply.github.com evals/registry/data/largest_country/samples.jsonl 3 1 718 718 1 1 2023-05-18 2023-05-18 36363097+latand@users.noreply.github.com 36363097+latand@users.noreply.github.com evals/registry/data/simple-visual-understanding/simple-visual-understanding.jsonl 3 1 710 710 1 1 2023-05-26 2023-05-26 felipe.castro@friday.ai felipe.castro@friday.ai evals/registry/data/portuguese-sarcasm/samples.jsonl 3 1 713 713 1 1 2023-05-23 2023-05-23 lucas.arki@gmail.com lucas.arki@gmail.com evals/registry/data/sarcasm/few_shot.jsonl 3 1 771 771 1 1 2023-03-26 2023-03-26 56776590+ronaldruckus@users.noreply.github.com 56776590+ronaldruckus@users.noreply.github.com evals/registry/data/sarcasm/samples.jsonl 3 1 771 771 1 1 2023-03-26 2023-03-26 56776590+ronaldruckus@users.noreply.github.com 56776590+ronaldruckus@users.noreply.github.com evals/registry/data/svg_understanding/samples.jsonl 3 1 742 742 1 1 2023-04-24 2023-04-24 joshuagruenstein@users.noreply.github.com joshuagruenstein@users.noreply.github.com evals/registry/data/chinese_modern_poem_identification/samples.jsonl 3 1 671 671 1 1 2023-07-04 2023-07-04 netsailer@gmail.com netsailer@gmail.com evals/registry/data/belarusian_rhyme/samples.jsonl 3 1 691 691 1 1 2023-06-14 2023-06-14 50818265+somerandomguyontheweb@users.noreply.github.com 50818265+somerandomguyontheweb@users.noreply.github.com evals/registry/data/asl-classifiers/samples.jsonl 3 1 700 700 1 1 2023-06-05 2023-06-05 135167270+docequity@users.noreply.github.com 135167270+docequity@users.noreply.github.com evals/registry/data/french-part-of-speech/samples.jsonl 3 1 709 709 1 1 2023-05-27 2023-05-27 vasco@piranhafleisch.de vasco@piranhafleisch.de evals/registry/data/croatian-exams-qa/samples.jsonl 3 1 615 615 1 1 2023-08-29 2023-08-29 135200318+samta-kamboj@users.noreply.github.com 135200318+samta-kamboj@users.noreply.github.com evals/registry/data/afrikaans-lexicon/samples.jsonl 3 1 719 719 1 1 2023-05-17 2023-05-17 richard.wooding@gmail.com richard.wooding@gmail.com evals/registry/data/regex-match/samples.jsonl 3 1 769 769 1 1 2023-03-28 2023-03-28 davidchen@gliacloud.com davidchen@gliacloud.com evals/registry/data/smiles_to_formula/samples.jsonl 3 1 671 671 1 1 2023-07-04 2023-07-04 33544440+glichtner@users.noreply.github.com 33544440+glichtner@users.noreply.github.com evals/registry/data/steganography/samples.jsonl 3 2 594 419 2 2 2023-09-19 2024-03-12 140545726+ianmckenzie-oai@users.noreply.github.com giulio.starace@gmail.com evals/registry/data/hebrew_grammar/samples.jsonl 3 1 642 642 1 1 2023-08-02 2023-08-02 idoyana@gmail.com idoyana@gmail.com evals/registry/data/corr2cause/corr2cause.jsonl 3 1 662 662 1 1 2023-07-13 2023-07-13 vasarmilan@gmail.com vasarmilan@gmail.com evals/registry/data/linear-regression/samples.jsonl 3 1 711 711 1 1 2023-05-25 2023-05-25 128815441+jonclar@users.noreply.github.com 128815441+jonclar@users.noreply.github.com evals/registry/data/linear-regression/labeled-samples.jsonl 3 1 711 711 1 1 2023-05-25 2023-05-25 128815441+jonclar@users.noreply.github.com 128815441+jonclar@users.noreply.github.com evals/registry/data/research-question-extraction/research-question-extraction-samples.jsonl 3 1 615 615 1 1 2023-08-29 2023-08-29 92821098+pancoaster@users.noreply.github.com 92821098+pancoaster@users.noreply.github.com evals/registry/data/actors-sequence/samples.jsonl 3 1 774 774 1 1 2023-03-23 2023-03-23 125162997+mcaledonensis@users.noreply.github.com 125162997+mcaledonensis@users.noreply.github.com evals/registry/data/logical-black-scholes/samples.jsonl 3 1 662 662 1 1 2023-07-13 2023-07-13 dsims21@gmail.com dsims21@gmail.com evals/registry/data/formal-grammar-to-regex/formal-grammar-to-regex.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 chatgpt@zyxcv.com chatgpt@zyxcv.com evals/registry/data/solve-for-variable/tools/solve.py 231 2 703 587 2 2 2023-06-02 2023-09-26 130226176+juan-de-salgado@users.noreply.github.com bomarni@googlemail.com evals/registry/data/solve-for-variable/tools/tester.py 94 2 703 587 2 2 2023-06-02 2023-09-26 130226176+juan-de-salgado@users.noreply.github.com bomarni@googlemail.com evals/registry/data/solve-for-variable/tools/template.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 130226176+juan-de-salgado@users.noreply.github.com 130226176+juan-de-salgado@users.noreply.github.com evals/registry/data/solve-for-variable/tools/main.py 65 2 703 587 2 2 2023-06-02 2023-09-26 130226176+juan-de-salgado@users.noreply.github.com bomarni@googlemail.com evals/registry/data/solve-for-variable/tools/problem.py 90 2 703 587 2 2 2023-06-02 2023-09-26 130226176+juan-de-salgado@users.noreply.github.com bomarni@googlemail.com evals/registry/data/solve-for-variable/samples.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 130226176+juan-de-salgado@users.noreply.github.com 130226176+juan-de-salgado@users.noreply.github.com evals/registry/data/qa/q_and_a.jsonl 3 1 744 744 1 1 2023-04-22 2023-04-22 43813768+keremnalbant@users.noreply.github.com 43813768+keremnalbant@users.noreply.github.com evals/registry/data/monthly_metric_comparison/samples.jsonl 3 1 700 700 1 1 2023-06-05 2023-06-05 6182673+robi-ng@users.noreply.github.com 6182673+robi-ng@users.noreply.github.com evals/registry/data/find_country_from_svg/samples.jsonl 3 1 713 713 1 1 2023-05-23 2023-05-23 lucasfougeras93@gmail.com lucasfougeras93@gmail.com evals/registry/data/islands/japanese_remote_island_to_prefecture.jsonl 3 1 713 713 1 1 2023-05-23 2023-05-23 nakagawa.mai@gmail.com nakagawa.mai@gmail.com evals/registry/data/csharp-linq/questions.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 6028199+joshdixon@users.noreply.github.com 6028199+joshdixon@users.noreply.github.com evals/registry/data/japanese_populer_video_game_title_and_the_publisher/samples.jsonl 3 1 712 712 1 1 2023-05-24 2023-05-24 snsk@users.noreply.github.com snsk@users.noreply.github.com evals/registry/data/polish-syllable-count/samples.jsonl 3 1 705 705 1 1 2023-05-31 2023-05-31 yaru.uvva@gmail.com yaru.uvva@gmail.com evals/registry/data/bigrams/samples.jsonl 3 1 777 777 1 1 2023-03-20 2023-03-20 oscar-king@users.noreply.github.com oscar-king@users.noreply.github.com evals/registry/data/iqbal-poetry-translation/samples.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 usama.anwar09@gmail.com usama.anwar09@gmail.com evals/registry/data/iqbal-poetry-translation/labeled-samples.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 usama.anwar09@gmail.com usama.anwar09@gmail.com evals/registry/data/number_series_test/samples.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 63540629+hammad-programmer@users.noreply.github.com 63540629+hammad-programmer@users.noreply.github.com evals/registry/data/unwanted-rhyming/samples.jsonl 3 1 710 710 1 1 2023-05-26 2023-05-26 forexdude1234@gmail.com forexdude1234@gmail.com evals/registry/data/syntax-check/samples.jsonl 3 1 718 718 1 1 2023-05-18 2023-05-18 aargoldsmith@gmail.com aargoldsmith@gmail.com evals/registry/data/korean_spelling/samples.jsonl 3 1 706 706 1 1 2023-05-30 2023-05-30 yjkimjunior@gmail.com yjkimjunior@gmail.com evals/registry/data/syllables_long_words/long_word_samples.jsonl 3 1 705 705 1 1 2023-05-31 2023-05-31 eschulma@gmail.com eschulma@gmail.com evals/registry/data/chinese_famous_novel/samples.jsonl 3 1 662 662 1 1 2023-07-13 2023-07-13 litonglitong@hotmail.com litonglitong@hotmail.com evals/registry/data/resource_id_extraction/samples.jsonl 3 1 698 698 1 1 2023-06-07 2023-06-07 andrewcemil@users.noreply.github.com andrewcemil@users.noreply.github.com evals/registry/data/korean_romanization/samples.jsonl 3 1 662 662 1 1 2023-07-13 2023-07-13 soo@novelastudio.com soo@novelastudio.com evals/registry/data/crepe/samples.jsonl 3 1 776 776 1 1 2023-03-21 2023-03-21 46582003+seacowx@users.noreply.github.com 46582003+seacowx@users.noreply.github.com evals/registry/data/japanese_city_name_pronunciation/samples.jsonl 3 1 711 711 1 1 2023-05-25 2023-05-25 679040+akazah@users.noreply.github.com 679040+akazah@users.noreply.github.com evals/registry/data/hr_ml_agent_bench/bipedal-walker.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/hr_ml_agent_bench/spaceship_titanic/spaceship-titanic.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/hr_ml_agent_bench/pong/gpu.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/hr_ml_agent_bench/pong/cpu.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/hr_ml_agent_bench/inverted-pendulum.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/hr_ml_agent_bench/ogbn_arxiv/ogbn-arxiv.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/hr_ml_agent_bench/parkinsons_disease/dataset/public_timeseries_testing_util.py 48 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/hr_ml_agent_bench/parkinsons_disease/parkinsons-disease.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/hr_ml_agent_bench/imdb.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/hr_ml_agent_bench/house_price/house-price.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/hr_ml_agent_bench/pusher.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/hr_ml_agent_bench/cartpole.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/hr_ml_agent_bench/vectorization.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/hr_ml_agent_bench/feedback/feedback.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/hr_ml_agent_bench/humanoid/gpu.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/hr_ml_agent_bench/humanoid/cpu.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/hr_ml_agent_bench/ant/gpu.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/hr_ml_agent_bench/ant/cpu.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/hr_ml_agent_bench/cifar10.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/european_date_format_challenge/samples.jsonl 3 1 712 712 1 1 2023-05-24 2023-05-24 yuvalshirav@gmail.com yuvalshirav@gmail.com evals/registry/data/complex_replace_characters/samples.jsonl 3 1 776 776 1 1 2023-03-21 2023-03-21 petrgazarov@gmail.com petrgazarov@gmail.com evals/registry/data/dice-rotation-sequence/samples.jsonl 3 1 745 745 1 1 2023-04-21 2023-04-21 g.h.garrett13@gmail.com g.h.garrett13@gmail.com evals/registry/data/count_token_freq_dna/samples.jsonl 3 1 710 710 1 1 2023-05-26 2023-05-26 zl432@cantab.ac.uk zl432@cantab.ac.uk evals/registry/data/sexagenary_cycle_calculation/samples.jsonl 3 1 720 720 1 1 2023-05-16 2023-05-16 dunedainstrider.a@gmail.com dunedainstrider.a@gmail.com evals/registry/data/utah_real_estate/samples.jsonl 3 1 691 691 1 1 2023-06-14 2023-06-14 42595698+thechaincollective@users.noreply.github.com 42595698+thechaincollective@users.noreply.github.com evals/registry/data/direct-speech-tag/samples.jsonl 3 1 706 706 1 1 2023-05-30 2023-05-30 mariusburtscheidt@gmail.com mariusburtscheidt@gmail.com evals/registry/data/make_me_say/medium.jsonl 3 1 594 594 1 1 2023-09-19 2023-09-19 140545726+ianmckenzie-oai@users.noreply.github.com 140545726+ianmckenzie-oai@users.noreply.github.com evals/registry/data/make_me_say/very-hard.jsonl 3 1 594 594 1 1 2023-09-19 2023-09-19 140545726+ianmckenzie-oai@users.noreply.github.com 140545726+ianmckenzie-oai@users.noreply.github.com evals/registry/data/make_me_say/medium-and-hard.jsonl 3 1 594 594 1 1 2023-09-19 2023-09-19 140545726+ianmckenzie-oai@users.noreply.github.com 140545726+ianmckenzie-oai@users.noreply.github.com evals/registry/data/make_me_say/easy.jsonl 3 1 594 594 1 1 2023-09-19 2023-09-19 140545726+ianmckenzie-oai@users.noreply.github.com 140545726+ianmckenzie-oai@users.noreply.github.com evals/registry/data/make_me_say/hard.jsonl 3 1 594 594 1 1 2023-09-19 2023-09-19 140545726+ianmckenzie-oai@users.noreply.github.com 140545726+ianmckenzie-oai@users.noreply.github.com evals/registry/data/music-theory/triads-few-shot.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 105930198+f7b5@users.noreply.github.com 105930198+f7b5@users.noreply.github.com evals/registry/data/music-theory/tetrads-samples.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 105930198+f7b5@users.noreply.github.com 105930198+f7b5@users.noreply.github.com evals/registry/data/music-theory/tetrads-few-shot.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 105930198+f7b5@users.noreply.github.com 105930198+f7b5@users.noreply.github.com evals/registry/data/music-theory/triads-samples.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 105930198+f7b5@users.noreply.github.com 105930198+f7b5@users.noreply.github.com evals/registry/data/fcc_amateur_extra/samples.jsonl 3 1 745 745 1 1 2023-04-21 2023-04-21 34941300+ckb2@users.noreply.github.com 34941300+ckb2@users.noreply.github.com evals/registry/data/polish-proverbs/samples.jsonl 3 1 662 662 1 1 2023-07-13 2023-07-13 kasiakloc00@gmail.com kasiakloc00@gmail.com evals/registry/data/adultery-state-laws/samples.jsonl 3 1 706 706 1 1 2023-05-30 2023-05-30 108371552+loadedmediainc@users.noreply.github.com 108371552+loadedmediainc@users.noreply.github.com evals/registry/data/mandaliof-table/samples.jsonl 3 1 712 712 1 1 2023-05-24 2023-05-24 ali.risheh876@gmail.com ali.risheh876@gmail.com evals/registry/data/emoji_riddle/fuzzy_match.jsonl 3 1 745 745 1 1 2023-04-21 2023-04-21 dib.amir@gmail.com dib.amir@gmail.com evals/registry/data/tricky-word-problems/samples.jsonl 3 1 671 671 1 1 2023-07-04 2023-07-04 jackurbs@gmail.com jackurbs@gmail.com evals/registry/data/passing-balls/passing-balls.jsonl 3 1 705 705 1 1 2023-05-31 2023-05-31 131498134+lucid-max@users.noreply.github.com 131498134+lucid-max@users.noreply.github.com evals/registry/data/tokyo-station-number/samples.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 torufuru@users.noreply.github.com torufuru@users.noreply.github.com evals/registry/data/reverse-shell/samples.jsonl 3 1 677 677 1 1 2023-06-28 2023-06-28 32207883+robinzixuan@users.noreply.github.com 32207883+robinzixuan@users.noreply.github.com evals/registry/data/first-letters/samples.jsonl 3 1 775 775 1 1 2023-03-22 2023-03-22 67751757+kallyaleksiev@users.noreply.github.com 67751757+kallyaleksiev@users.noreply.github.com evals/registry/data/crontab/samples.jsonl 3 1 706 706 1 1 2023-05-30 2023-05-30 google@mryao.org google@mryao.org evals/registry/data/base64_decode/base64_decode.jsonl 3 1 677 677 1 1 2023-06-28 2023-06-28 70709113+alessiogr@users.noreply.github.com 70709113+alessiogr@users.noreply.github.com evals/registry/data/json_patch_object/samples.jsonl 3 1 704 704 1 1 2023-06-01 2023-06-01 eugene@goforward.com eugene@goforward.com evals/registry/data/linear_equations/samples.jsonl 3 1 714 714 1 1 2023-05-22 2023-05-22 alexno0401@gmail.com alexno0401@gmail.com evals/registry/data/japanese_prime_minister/samples.jsonl 3 1 488 488 1 1 2024-01-03 2024-01-03 40705236+return-nil@users.noreply.github.com 40705236+return-nil@users.noreply.github.com evals/registry/data/product-matching/rules/samples.jsonl 3 1 704 704 1 1 2023-06-01 2023-06-01 26688318+rpeeters85@users.noreply.github.com 26688318+rpeeters85@users.noreply.github.com evals/registry/data/product-matching/zeroshot/samples.jsonl 3 1 704 704 1 1 2023-06-01 2023-06-01 26688318+rpeeters85@users.noreply.github.com 26688318+rpeeters85@users.noreply.github.com evals/registry/data/product-matching/fewshot/samples.jsonl 3 1 704 704 1 1 2023-06-01 2023-06-01 26688318+rpeeters85@users.noreply.github.com 26688318+rpeeters85@users.noreply.github.com evals/registry/data/urdu-transliteration/samples.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 usama.anwar09@gmail.com usama.anwar09@gmail.com evals/registry/data/isosceles-right-triangle/samples.jsonl 3 1 714 714 1 1 2023-05-22 2023-05-22 alexbuzanis@gmail.com alexbuzanis@gmail.com evals/registry/data/math_polish/samples.jsonl 3 1 691 691 1 1 2023-06-14 2023-06-14 krzycho@wapp.pl krzycho@wapp.pl evals/registry/data/indonesian_numbers/indonesian_numbers.jsonl 3 1 704 704 1 1 2023-06-01 2023-06-01 aarongpower@gmail.com aarongpower@gmail.com evals/registry/data/3d_globe_movement/samples.jsonl 3 1 698 698 1 1 2023-06-07 2023-06-07 travis.hairfield@gmail.com travis.hairfield@gmail.com evals/registry/data/cissp-study-questions/few_shot.jsonl 3 1 712 712 1 1 2023-05-24 2023-05-24 randy.lariar@gmail.com randy.lariar@gmail.com evals/registry/data/cissp-study-questions/samples.jsonl 3 1 712 712 1 1 2023-05-24 2023-05-24 randy.lariar@gmail.com randy.lariar@gmail.com evals/registry/data/override-system-instruction/samples.jsonl 3 1 705 705 1 1 2023-05-31 2023-05-31 mail@thooyavan.me mail@thooyavan.me evals/registry/data/loss_logic/samples.jsonl 3 1 745 745 1 1 2023-04-21 2023-04-21 temberature@gmail.com temberature@gmail.com evals/registry/data/korean_spaces/samples.jsonl 3 1 594 594 1 1 2023-09-19 2023-09-19 howon92@gmail.com howon92@gmail.com evals/registry/data/south-african-bands/south-african-bands.jsonl 3 1 717 717 1 1 2023-05-19 2023-05-19 richard.wooding@spandigital.com richard.wooding@spandigital.com evals/registry/data/icelandic-inflection-hard/samples.jsonl 3 1 556 556 1 1 2023-10-27 2023-10-27 vthorsteinsson@users.noreply.github.com vthorsteinsson@users.noreply.github.com evals/registry/data/utility_price_parsing/samples.jsonl 3 1 745 745 1 1 2023-04-21 2023-04-21 131423049+dz-pika@users.noreply.github.com 131423049+dz-pika@users.noreply.github.com evals/registry/data/incontext_rl/samples.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 129281094+james-aung@users.noreply.github.com 129281094+james-aung@users.noreply.github.com evals/registry/data/incontext_rl/samples_gymnasium_only.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 129281094+james-aung@users.noreply.github.com 129281094+james-aung@users.noreply.github.com evals/registry/data/incontext_rl/samples_dev.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 129281094+james-aung@users.noreply.github.com 129281094+james-aung@users.noreply.github.com evals/registry/data/ab/samples.jsonl 3 1 556 556 1 1 2023-10-27 2023-10-27 42742390+mmtmn@users.noreply.github.com 42742390+mmtmn@users.noreply.github.com evals/registry/data/moral_exceptQA/samples.jsonl 3 1 754 754 1 1 2023-04-12 2023-04-12 kblin@outlook.com kblin@outlook.com evals/registry/data/icelandic-sentences-gec/samples.jsonl 3 1 481 481 1 1 2024-01-10 2024-01-10 24214261+svanhvitlilja@users.noreply.github.com 24214261+svanhvitlilja@users.noreply.github.com evals/registry/data/unified_patch/samples.jsonl 3 1 745 745 1 1 2023-04-21 2023-04-21 me@andrebaltazar.com me@andrebaltazar.com evals/registry/data/hebrew_same_noun_gender/samples.jsonl 3 1 706 706 1 1 2023-05-30 2023-05-30 elisimhayev@gmail.com elisimhayev@gmail.com evals/registry/data/finger-tracking/samples.jsonl 3 1 662 662 1 1 2023-07-13 2023-07-13 chris@notus.ai chris@notus.ai evals/registry/data/russian-rhyme/samples.jsonl 3 1 744 744 1 1 2023-04-22 2023-04-22 tbs.micle@gmail.com tbs.micle@gmail.com evals/registry/data/blackfoot-numerals-modern/samples.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 george@orbitalimpact.com george@orbitalimpact.com evals/registry/data/soc_codes/samples.jsonl 3 1 693 693 1 1 2023-06-12 2023-06-12 21990717+lrperkins@users.noreply.github.com 21990717+lrperkins@users.noreply.github.com evals/registry/data/counterfactual-reasoning/counterfactual_reasoning_samples.jsonl 3 1 714 714 1 1 2023-05-22 2023-05-22 89385155+neolizhe@users.noreply.github.com 89385155+neolizhe@users.noreply.github.com evals/registry/data/geometry_puzzle/samples.jsonl 3 1 705 705 1 1 2023-05-31 2023-05-31 52676620+moeen-movahednia@users.noreply.github.com 52676620+moeen-movahednia@users.noreply.github.com evals/registry/data/shopping_discount_comparison/samples.jsonl 3 1 705 705 1 1 2023-05-31 2023-05-31 35208156+lillichoung@users.noreply.github.com 35208156+lillichoung@users.noreply.github.com evals/registry/data/logic-liar-paradox/samples.jsonl 3 1 727 727 1 1 2023-05-09 2023-05-09 robertbateman@users.noreply.github.com robertbateman@users.noreply.github.com evals/registry/data/pointer-value-retrieval/hard_many_examples.jsonl 3 1 699 699 1 1 2023-06-06 2023-06-06 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/pointer-value-retrieval/medium_many_examples.jsonl 3 1 699 699 1 1 2023-06-06 2023-06-06 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/pointer-value-retrieval/easy_many_examples.jsonl 3 1 699 699 1 1 2023-06-06 2023-06-06 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/pointer-value-retrieval/hard_few_examples.jsonl 3 1 699 699 1 1 2023-06-06 2023-06-06 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/pointer-value-retrieval/easy_few_examples.jsonl 3 1 699 699 1 1 2023-06-06 2023-06-06 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/pointer-value-retrieval/medium_few_examples.jsonl 3 1 699 699 1 1 2023-06-06 2023-06-06 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/data/korean_dialects/samples.jsonl 3 1 694 694 1 1 2023-06-11 2023-06-11 134977380+racheroni@users.noreply.github.com 134977380+racheroni@users.noreply.github.com evals/registry/data/chinese_tang_poetries/sample.jsonl 3 1 710 710 1 1 2023-05-26 2023-05-26 clvrobj@gmail.com clvrobj@gmail.com evals/registry/data/word_vector_over_reliance/word_vector_over_reliance_samples.jsonl 3 1 712 712 1 1 2023-05-24 2023-05-24 89385155+neolizhe@users.noreply.github.com 89385155+neolizhe@users.noreply.github.com evals/registry/data/astro_eval/samples.jsonl 3 1 662 662 1 1 2023-07-13 2023-07-13 andrerbreton@gmail.com andrerbreton@gmail.com evals/registry/data/italian_rhyme/samples.jsonl 3 1 706 706 1 1 2023-05-30 2023-05-30 webdaemon3@gmail.com webdaemon3@gmail.com evals/registry/data/simple-block-puzzles/block-puzzles.v1.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 bird.seanmichael@gmail.com bird.seanmichael@gmail.com evals/registry/data/arc/samples.jsonl 3 1 704 704 1 1 2023-06-01 2023-06-01 3322313+theo3@users.noreply.github.com 3322313+theo3@users.noreply.github.com evals/registry/data/serbian-exams-qa/samples.jsonl 3 1 615 615 1 1 2023-08-29 2023-08-29 135200318+samta-kamboj@users.noreply.github.com 135200318+samta-kamboj@users.noreply.github.com evals/registry/data/rot13/rot13.jsonl 3 1 771 771 1 1 2023-03-26 2023-03-26 greg@siteorigin.com greg@siteorigin.com evals/registry/data/split_chinese_characters/samples.jsonl 3 1 704 704 1 1 2023-06-01 2023-06-01 mzou@pisrc.com mzou@pisrc.com evals/registry/data/prompt-injection/samples.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 alianse777@users.noreply.github.com alianse777@users.noreply.github.com evals/registry/data/logic/samples.jsonl 3 1 767 767 1 1 2023-03-30 2023-03-30 dustin.wehr@gmail.com dustin.wehr@gmail.com evals/registry/data/simple_physics_engine/solver.py 90 1 703 703 1 1 2023-06-02 2023-06-02 ssansovich@gmail.com ssansovich@gmail.com evals/registry/data/simple_physics_engine/samples.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 ssansovich@gmail.com ssansovich@gmail.com evals/registry/data/simple_physics_engine/samples_generator.py 59 1 703 703 1 1 2023-06-02 2023-06-02 ssansovich@gmail.com ssansovich@gmail.com evals/registry/data/simple_physics_engine/wave_function_collapse.py 157 2 703 587 2 2 2023-06-02 2023-09-26 ssansovich@gmail.com bomarni@googlemail.com evals/registry/data/ambiguous-sentences/samples.jsonl 3 1 710 710 1 1 2023-05-26 2023-05-26 59383957+erauner12@users.noreply.github.com 59383957+erauner12@users.noreply.github.com evals/registry/data/emotional-intelligence/samples.jsonl 3 1 755 755 1 1 2023-04-11 2023-04-11 16432683+dpys@users.noreply.github.com 16432683+dpys@users.noreply.github.com evals/registry/data/aba_mrpc_true_false/samples.jsonl 3 1 776 776 1 1 2023-03-21 2023-03-21 avery@offerfit.ai avery@offerfit.ai evals/registry/data/tempo_to_measure_count/samples.jsonl 3 1 745 745 1 1 2023-04-21 2023-04-21 sam.lucyk@gmail.com sam.lucyk@gmail.com evals/registry/data/greek_vocabulary/samples.jsonl 3 1 744 744 1 1 2023-04-22 2023-04-22 99351112+0xacx@users.noreply.github.com 99351112+0xacx@users.noreply.github.com evals/registry/data/multistep-web-tasks/all_tasks.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/multistep-web-tasks/task_7.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/multistep-web-tasks/task_5.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/multistep-web-tasks/task_4.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/multistep-web-tasks/simple.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/multistep-web-tasks/task_3.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/multistep-web-tasks/medium_tasks.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/multistep-web-tasks/task_1.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/multistep-web-tasks/task_9.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/multistep-web-tasks/easy_tasks.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/multistep-web-tasks/task_8.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/multistep-web-tasks/task_2.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/multistep-web-tasks/task_6.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/multistep-web-tasks/hard_tasks.jsonl 3 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/data/reasoning/samples.jsonl 3 1 777 777 1 1 2023-03-20 2023-03-20 oscar-king@users.noreply.github.com oscar-king@users.noreply.github.com evals/registry/data/nfl-point-combinations/samples.jsonl 3 1 694 694 1 1 2023-06-11 2023-06-11 136047342+dougkwanna@users.noreply.github.com 136047342+dougkwanna@users.noreply.github.com evals/registry/data/nfl-point-combinations/combinations_generator.py 25 1 694 694 1 1 2023-06-11 2023-06-11 136047342+dougkwanna@users.noreply.github.com 136047342+dougkwanna@users.noreply.github.com evals/registry/data/proofreader/samples.jsonl 3 1 677 677 1 1 2023-06-28 2023-06-28 ramiel@users.noreply.github.com ramiel@users.noreply.github.com evals/registry/data/multistep-word-problems/samples.jsonl 3 1 711 711 1 1 2023-05-25 2023-05-25 forexdude1234@gmail.com forexdude1234@gmail.com evals/registry/data/belarusian_numerals/samples.jsonl 3 1 690 690 1 1 2023-06-15 2023-06-15 50818265+somerandomguyontheweb@users.noreply.github.com 50818265+somerandomguyontheweb@users.noreply.github.com evals/registry/data/list_comparison_missing_name/samples.jsonl 3 1 706 706 1 1 2023-05-30 2023-05-30 37917398+davidbeesley@users.noreply.github.com 37917398+davidbeesley@users.noreply.github.com evals/registry/data/invoice_due_date_leap_day_adjustment/samples.jsonl 3 1 719 719 1 1 2023-05-17 2023-05-17 132409761+techlocke@users.noreply.github.com 132409761+techlocke@users.noreply.github.com evals/registry/data/irrelevant-negative-diversion/irrelevant-negative-diversion.jsonl 3 1 655 655 1 1 2023-07-20 2023-07-20 anders@wangrask.com anders@wangrask.com evals/registry/data/ukraine_eit/samples.jsonl 3 1 769 769 1 1 2023-03-28 2023-03-28 badt@appar.at badt@appar.at evals/registry/data/born_first/born_first.jsonl 3 2 782 781 2 2 2023-03-15 2023-03-16 njbbaer@gmail.com 120423412+andrew-openai@users.noreply.github.com evals/registry/data/forth_stack_sim/detailed_samples.jsonl 3 1 768 768 1 1 2023-03-29 2023-03-29 gooseus@users.noreply.github.com gooseus@users.noreply.github.com evals/registry/data/forth_stack_sim/basic_samples.jsonl 3 1 768 768 1 1 2023-03-29 2023-03-29 gooseus@users.noreply.github.com gooseus@users.noreply.github.com evals/registry/data/forth_stack_sim/samples.jsonl 3 1 775 775 1 1 2023-03-22 2023-03-22 gooseus@users.noreply.github.com gooseus@users.noreply.github.com evals/registry/data/logic-grid/logic-grid.jsonl 3 1 704 704 1 1 2023-06-01 2023-06-01 austinstarnes@pm.me austinstarnes@pm.me evals/registry/data/math-derivatives/questions.jsonl 3 1 671 671 1 1 2023-07-04 2023-07-04 andrew.prokhorenkov@gmail.com andrew.prokhorenkov@gmail.com evals/registry/data/russian-nlp-tasks/samples.jsonl 3 1 770 770 1 1 2023-03-27 2023-03-27 hormold@gmail.com hormold@gmail.com evals/registry/data/chinese_ancient_masterpieces_dynasty/samples.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 136729222+meganjohnson96@users.noreply.github.com 136729222+meganjohnson96@users.noreply.github.com evals/registry/data/mate-in-one/samples.jsonl 3 1 712 712 1 1 2023-05-24 2023-05-24 90597795+mradul-kanugo@users.noreply.github.com 90597795+mradul-kanugo@users.noreply.github.com evals/registry/data/belarusian_syllable_count/samples.jsonl 3 1 700 700 1 1 2023-06-05 2023-06-05 50818265+somerandomguyontheweb@users.noreply.github.com 50818265+somerandomguyontheweb@users.noreply.github.com evals/registry/data/knot-theory/knot-theory-unknotting-numbers.jsonl 3 1 744 744 1 1 2023-04-22 2023-04-22 matthaigh27@gmail.com matthaigh27@gmail.com evals/registry/data/knot-theory/knot-theory-unknotting-problems.jsonl 3 1 744 744 1 1 2023-04-22 2023-04-22 matthaigh27@gmail.com matthaigh27@gmail.com evals/registry/data/knot-theory/knot-theory-code-conversions.jsonl 3 1 744 744 1 1 2023-04-22 2023-04-22 matthaigh27@gmail.com matthaigh27@gmail.com evals/registry/data/skill_acquisition/miskito/knowledge_base/human_rights_miskito.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/registry/data/skill_acquisition/miskito/knowledge_base/honduras.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/registry/data/skill_acquisition/miskito/knowledge_base/miskito_people.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/registry/data/skill_acquisition/miskito/knowledge_base/mosquito.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/registry/data/skill_acquisition/miskito/knowledge_base/miskito_language.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/registry/data/skill_acquisition/miskito/knowledge_base/nicaragua.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/registry/data/skill_acquisition/miskito/knowledge_base/miskito_lessons.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/registry/data/skill_acquisition/miskito/knowledge_base/mosquito_coast.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/registry/data/skill_acquisition/miskito/qa_pairs_by_lesson.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/registry/data/skill_acquisition/miskito/variants/miskito_test_translation_fewshot.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/registry/data/skill_acquisition/miskito/variants/miskito_test_manipulation_fewshot.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/registry/data/skill_acquisition/miskito/variants/miskito_test_all.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/registry/data/skill_acquisition/miskito/variants/miskito_test_all_fewshot.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/registry/data/skill_acquisition/miskito/variants/miskito_test_manipulation.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/registry/data/skill_acquisition/miskito/variants/miskito_train_translation.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/registry/data/skill_acquisition/miskito/variants/miskito_train_manipulation.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/registry/data/skill_acquisition/miskito/variants/miskito_test_translation.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/registry/data/skill_acquisition/miskito/variants/miskito_train_all.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/registry/data/marxist_philosophy_exam/fuzzy_match.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 cxjwin@users.noreply.github.com cxjwin@users.noreply.github.com evals/registry/data/math_for_5th-grader/samples.jsonl 3 1 662 662 1 1 2023-07-13 2023-07-13 42082942+mochisky@users.noreply.github.com 42082942+mochisky@users.noreply.github.com evals/registry/data/coq-proof-step/match.jsonl 3 1 662 662 1 1 2023-07-13 2023-07-13 amit9oct@gmail.com amit9oct@gmail.com evals/registry/data/historical-kana-orthography-reading/samples.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 135117004+hozen-ai@users.noreply.github.com 135117004+hozen-ai@users.noreply.github.com evals/registry/data/belarusian_synonyms/samples.jsonl 3 1 704 704 1 1 2023-06-01 2023-06-01 tanya.shagova@gmail.com tanya.shagova@gmail.com evals/registry/data/irony/samples.jsonl 3 1 706 706 1 1 2023-05-30 2023-05-30 scott@linfords.com scott@linfords.com evals/registry/data/icelandic-inflection-easy/samples.jsonl 3 1 556 556 1 1 2023-10-27 2023-10-27 vthorsteinsson@users.noreply.github.com vthorsteinsson@users.noreply.github.com evals/registry/data/logiqa/logiqa.jsonl 3 1 755 755 2 2 2023-04-11 2023-04-11 kondrich@openai.com 62553364+csitfun@users.noreply.github.com evals/registry/data/imo_exact_answers/samples.jsonl 3 1 296 296 1 1 2024-07-13 2024-07-13 justin@lin.bot justin@lin.bot evals/registry/data/schelling_point/owt_5.jsonl 3 1 594 594 1 1 2023-09-19 2023-09-19 140545726+ianmckenzie-oai@users.noreply.github.com 140545726+ianmckenzie-oai@users.noreply.github.com evals/registry/data/schelling_point/wikipedia_5.jsonl 3 1 594 594 1 1 2023-09-19 2023-09-19 140545726+ianmckenzie-oai@users.noreply.github.com 140545726+ianmckenzie-oai@users.noreply.github.com evals/registry/data/schelling_point/mix.jsonl 3 1 507 507 1 1 2023-12-15 2023-12-15 129281094+james-aung@users.noreply.github.com 129281094+james-aung@users.noreply.github.com evals/registry/data/schelling_point/random_numbers_10_3.jsonl 3 1 594 594 1 1 2023-09-19 2023-09-19 140545726+ianmckenzie-oai@users.noreply.github.com 140545726+ianmckenzie-oai@users.noreply.github.com evals/registry/data/schelling_point/random_words_10.jsonl 3 1 594 594 1 1 2023-09-19 2023-09-19 140545726+ianmckenzie-oai@users.noreply.github.com 140545726+ianmckenzie-oai@users.noreply.github.com evals/registry/data/belarusian_proverbs/samples.jsonl 3 1 700 700 1 1 2023-06-05 2023-06-05 130565081+yuryrudnitski@users.noreply.github.com 130565081+yuryrudnitski@users.noreply.github.com evals/registry/data/japanese-station/samples.jsonl 3 1 677 677 1 1 2023-06-28 2023-06-28 pabst2009@gmail.com pabst2009@gmail.com evals/registry/data/lithuanian-exams-qa/samples.jsonl 3 1 615 615 1 1 2023-08-29 2023-08-29 135200318+samta-kamboj@users.noreply.github.com 135200318+samta-kamboj@users.noreply.github.com evals/registry/data/french-exams-qa/samples.jsonl 3 1 615 615 1 1 2023-08-29 2023-08-29 135200318+samta-kamboj@users.noreply.github.com 135200318+samta-kamboj@users.noreply.github.com evals/registry/data/newsology/samples.jsonl 3 1 706 706 1 1 2023-05-30 2023-05-30 130502202+newsology@users.noreply.github.com 130502202+newsology@users.noreply.github.com evals/registry/data/kanji-idioms/samples.jsonl 3 1 710 710 1 1 2023-05-26 2023-05-26 peach921110@gmail.com peach921110@gmail.com evals/registry/data/text_compression/samples.jsonl 3 1 594 594 1 1 2023-09-19 2023-09-19 140545726+ianmckenzie-oai@users.noreply.github.com 140545726+ianmckenzie-oai@users.noreply.github.com evals/registry/data/three-pt-mapping/three_pt_mapping.jsonl 3 1 740 740 1 1 2023-04-26 2023-04-26 keke060114@163.com keke060114@163.com evals/registry/data/romanian-logic/romanian-logic.jsonl 3 1 662 662 1 1 2023-07-13 2023-07-13 marius.patru@gmail.com marius.patru@gmail.com evals/registry/data/missing_operators/samples.jsonl 3 1 710 710 1 1 2023-05-26 2023-05-26 kodamap0@gmail.com kodamap0@gmail.com evals/registry/data/mendelian_inheritance/samples.jsonl 3 1 770 770 1 1 2023-03-27 2023-03-27 constantin_goeldel@t-online.de constantin_goeldel@t-online.de evals/registry/data/hungarian-exams-qa/samples.jsonl 3 1 615 615 1 1 2023-08-29 2023-08-29 135200318+samta-kamboj@users.noreply.github.com 135200318+samta-kamboj@users.noreply.github.com evals/registry/data/japanese_romantic_context/samples.jsonl 3 1 655 655 1 1 2023-07-20 2023-07-20 115438292+missionteam@users.noreply.github.com 115438292+missionteam@users.noreply.github.com evals/registry/data/logical_counting/samples.jsonl 3 1 714 714 1 1 2023-05-22 2023-05-22 jocca1985@gmail.com jocca1985@gmail.com evals/registry/data/unique_combinations/samples.jsonl 3 1 714 714 1 1 2023-05-22 2023-05-22 50557586+sypherd@users.noreply.github.com 50557586+sypherd@users.noreply.github.com evals/registry/data/physics-interaction/samples.jsonl 3 1 715 715 1 1 2023-05-21 2023-05-21 jelgt2011@gmail.com jelgt2011@gmail.com evals/registry/data/rucola/few_shot.jsonl 3 1 762 762 1 1 2023-04-04 2023-04-04 alex@alexkuk.ru alex@alexkuk.ru evals/registry/data/rucola/samples.jsonl 3 1 762 762 1 1 2023-04-04 2023-04-04 alex@alexkuk.ru alex@alexkuk.ru evals/registry/data/ph_calculation/samples.jsonl 3 1 744 744 1 1 2023-04-22 2023-04-22 61839320+bilski311@users.noreply.github.com 61839320+bilski311@users.noreply.github.com evals/registry/data/detect-hshd/detect-hshd.jsonl 3 1 711 711 1 1 2023-05-25 2023-05-25 45504048+mysterious-progression@users.noreply.github.com 45504048+mysterious-progression@users.noreply.github.com evals/registry/data/japanese_number_reading/japanese_number_reading.jsonl 3 1 713 713 1 1 2023-05-23 2023-05-23 shunji.makino@gmail.com shunji.makino@gmail.com evals/registry/data/lat_long_identify/samples.jsonl 3 1 777 777 1 1 2023-03-20 2023-03-20 vishaal16119@iiitd.ac.in vishaal16119@iiitd.ac.in evals/registry/data/irish-lexicon/samples.jsonl 3 1 719 719 1 1 2023-05-17 2023-05-17 getintouchwithseanryan@gmail.com getintouchwithseanryan@gmail.com evals/registry/data/automata-and-complexity/samples.jsonl 3 1 677 677 1 1 2023-06-28 2023-06-28 peter@stakoun.com peter@stakoun.com evals/registry/data/seo_keywords/samples.jsonl 3 1 662 662 1 1 2023-07-13 2023-07-13 me+github@gerdemann.me me+github@gerdemann.me evals/registry/data/ukraine_electronic_petitions/samples.jsonl 3 1 705 705 1 1 2023-05-31 2023-05-31 yaru.uvva@gmail.com yaru.uvva@gmail.com evals/registry/data/partially_solved_crossword_clues/samples.jsonl 3 1 770 770 1 1 2023-03-27 2023-03-27 francois_lr@hotmail.fr francois_lr@hotmail.fr evals/registry/data/polish_rhymes_generation/samples.jsonl 3 1 710 710 1 1 2023-05-26 2023-05-26 9194961+r2d34@users.noreply.github.com 9194961+r2d34@users.noreply.github.com evals/registry/data/numeral-type-comparisons/samples.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 101950345+noahcdc@users.noreply.github.com 101950345+noahcdc@users.noreply.github.com evals/registry/data/confusing_korean/samples.jsonl 3 1 671 671 1 1 2023-07-04 2023-07-04 youngwook.kim@gmail.com youngwook.kim@gmail.com evals/registry/data/ordered-history-events/samples.jsonl 3 1 719 719 1 1 2023-05-17 2023-05-17 itc0r3@gmail.com itc0r3@gmail.com evals/registry/data/allergen-information/samples.jsonl 3 1 705 705 1 1 2023-05-31 2023-05-31 ophir.ido@gmail.com ophir.ido@gmail.com evals/registry/data/GOL/samples.jsonl 3 1 706 706 1 1 2023-05-30 2023-05-30 agoldsmith@alumni.scu.edu agoldsmith@alumni.scu.edu evals/registry/data/swap-words/samples.jsonl 3 1 713 713 1 1 2023-05-23 2023-05-23 pranavgade20@gmail.com pranavgade20@gmail.com evals/registry/data/python_list_comprehension/samples.jsonl 3 1 710 710 1 1 2023-05-26 2023-05-26 67437435+michailmelonas@users.noreply.github.com 67437435+michailmelonas@users.noreply.github.com evals/registry/data/arithmetic-expression/samples.jsonl 3 1 677 677 1 1 2023-06-28 2023-06-28 gustavo.santos@vortexa.com gustavo.santos@vortexa.com evals/registry/data/arithmetic-expression/labeled-samples.jsonl 3 1 677 677 1 1 2023-06-28 2023-06-28 gustavo.santos@vortexa.com gustavo.santos@vortexa.com evals/registry/data/escher_sentences/samples.jsonl 3 1 753 753 1 1 2023-04-13 2023-04-13 churchjohnr@protonmail.com churchjohnr@protonmail.com evals/registry/data/twenty_questions/dataset.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/registry/data/twenty_questions/lexicon_nouns.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/registry/data/invoices/match.jsonl 3 1 744 744 1 1 2023-04-22 2023-04-22 dpattersoncole@gmail.com dpattersoncole@gmail.com evals/registry/data/event_categories/samples.jsonl 3 1 721 721 1 1 2023-05-15 2023-05-15 javier@javier.nyc javier@javier.nyc evals/registry/data/gujarati_numerals/samples.jsonl 3 1 594 594 1 1 2023-09-19 2023-09-19 38771624+roshan-d@users.noreply.github.com 38771624+roshan-d@users.noreply.github.com evals/registry/data/rectangles/samples.jsonl 3 1 704 704 1 1 2023-06-01 2023-06-01 sam@samestep.com sam@samestep.com evals/registry/data/persian-kinship-riddles/samples.jsonl 3 1 677 677 1 1 2023-06-28 2023-06-28 137618076+evalevalian@users.noreply.github.com 137618076+evalevalian@users.noreply.github.com evals/registry/data/date-booking/samples.jsonl 3 1 706 706 1 1 2023-05-30 2023-05-30 popstas@gmail.com popstas@gmail.com evals/registry/data/bitwise/samples.jsonl 3 1 740 740 1 1 2023-04-26 2023-04-26 scottmortonashton@gmail.com scottmortonashton@gmail.com evals/registry/data/phonetics-identify-words-needing-missing-gpcs/samples.jsonl 3 1 704 704 1 1 2023-06-01 2023-06-01 31624048+climpyaardvark@users.noreply.github.com 31624048+climpyaardvark@users.noreply.github.com evals/registry/data/euler_problems/euler_problems.jsonl 3 1 705 705 1 1 2023-05-31 2023-05-31 pcashworth83@gmail.com pcashworth83@gmail.com evals/registry/data/arabic-exams-qa/samples.jsonl 3 1 615 615 1 1 2023-08-29 2023-08-29 135200318+samta-kamboj@users.noreply.github.com 135200318+samta-kamboj@users.noreply.github.com evals/registry/data/resistor_ohm_calculator/samples.jsonl 3 1 714 714 1 1 2023-05-22 2023-05-22 mfolnovic@gmail.com mfolnovic@gmail.com evals/registry/data/positive-binary-operations/samples.jsonl 3 1 745 745 1 1 2023-04-21 2023-04-21 106610412+omar-heshamr@users.noreply.github.com 106610412+omar-heshamr@users.noreply.github.com evals/registry/data/positive-binary-operations/fewshot.jsonl 3 2 745 595 2 2 2023-04-21 2023-09-18 106610412+omar-heshamr@users.noreply.github.com 133797909+jorge-openai@users.noreply.github.com evals/registry/data/accounting_audit/samples.jsonl 3 1 728 728 1 1 2023-05-08 2023-05-08 npedowitz@yahoo.com npedowitz@yahoo.com evals/registry/data/albanian-exams-qa/samples.jsonl 3 1 615 615 1 1 2023-08-29 2023-08-29 135200318+samta-kamboj@users.noreply.github.com 135200318+samta-kamboj@users.noreply.github.com evals/registry/data/finance/credit.jsonl 3 1 753 753 1 1 2023-04-13 2023-04-13 prenterjack@gmail.com prenterjack@gmail.com evals/registry/data/russe/few_shot.jsonl 3 1 744 744 1 1 2023-04-22 2023-04-22 alex@alexkuk.ru alex@alexkuk.ru evals/registry/data/russe/samples.jsonl 3 1 744 744 1 1 2023-04-22 2023-04-22 alex@alexkuk.ru alex@alexkuk.ru evals/registry/data/us_tort_law/few_shot.jsonl 3 1 771 771 1 1 2023-03-26 2023-03-26 jonathanagustin@gmail.com jonathanagustin@gmail.com evals/registry/data/us_tort_law/samples.jsonl 3 1 771 771 1 1 2023-03-26 2023-03-26 jonathanagustin@gmail.com jonathanagustin@gmail.com evals/registry/data/gregorian-to-hebrew-date/samples.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 orelbiton27@gmail.com orelbiton27@gmail.com evals/registry/data/cybersecurity/filepaths.jsonl 3 1 698 698 1 1 2023-06-07 2023-06-07 glmcdona@gmail.com glmcdona@gmail.com evals/registry/data/chinese_idioms/samples.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 32207883+robinzixuan@users.noreply.github.com 32207883+robinzixuan@users.noreply.github.com evals/registry/data/latin_grammar/samples.jsonl 3 1 662 662 1 1 2023-07-13 2023-07-13 125713831+d3287t328@users.noreply.github.com 125713831+d3287t328@users.noreply.github.com evals/registry/data/parable-to-moral-match/parable-to-moral-match-zh.jsonl 3 1 705 705 1 1 2023-05-31 2023-05-31 nlanesmith@gmail.com nlanesmith@gmail.com evals/registry/data/parable-to-moral-match/parable-to-moral-match-en.jsonl 3 1 705 705 1 1 2023-05-31 2023-05-31 nlanesmith@gmail.com nlanesmith@gmail.com evals/registry/data/reverse-sort-words-eng/samples.jsonl 3 1 703 703 1 1 2023-06-02 2023-06-02 112826784+bluefoxprime@users.noreply.github.com 112826784+bluefoxprime@users.noreply.github.com evals/registry/data/japanese-decimal-units/samples.jsonl 3 1 691 691 1 1 2023-06-14 2023-06-14 hiroaki.iwai@shaperon-inc.com hiroaki.iwai@shaperon-inc.com evals/registry/data/ordering_randomised_versionlist/samples.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 jiejie@live.nl jiejie@live.nl evals/registry/data/gears_rotation/samples.jsonl 3 1 683 683 1 1 2023-06-22 2023-06-22 0xh3xy@gmail.com 0xh3xy@gmail.com evals/registry/data/logiqa-logical-reasoning-plus/logiqav2-logical-reasoning-plus.jsonl 3 1 705 705 1 1 2023-05-31 2023-05-31 qbao775@aucklanduni.ac.nz qbao775@aucklanduni.ac.nz evals/registry/data/logiqa-logical-reasoning-plus/reclor-logical-reasoning-plus.jsonl 3 1 705 705 1 1 2023-05-31 2023-05-31 qbao775@aucklanduni.ac.nz qbao775@aucklanduni.ac.nz evals/registry/data/logiqa-logical-reasoning-plus/logiqa-logical-reasoning-plus.jsonl 3 1 705 705 1 1 2023-05-31 2023-05-31 qbao775@aucklanduni.ac.nz qbao775@aucklanduni.ac.nz evals/registry/data/svg_to_text/samples.jsonl 3 1 691 691 1 1 2023-06-14 2023-06-14 andrewcemil@gmail.com andrewcemil@gmail.com evals/registry/data/quartz/few_shot.jsonl 3 1 705 705 1 1 2023-05-31 2023-05-31 rodrigoga@users.noreply.github.com rodrigoga@users.noreply.github.com evals/registry/data/quartz/samples.jsonl 3 1 705 705 1 1 2023-05-31 2023-05-31 rodrigoga@users.noreply.github.com rodrigoga@users.noreply.github.com evals/registry/data/singlestore-vectorsearch/samples.jsonl 3 1 677 677 1 1 2023-06-28 2023-06-28 137553926+pvgenflowai@users.noreply.github.com 137553926+pvgenflowai@users.noreply.github.com evals/registry/data/function_deduction/data.jsonl 3 1 412 412 1 1 2024-03-19 2024-03-19 129281094+james-aung@users.noreply.github.com 129281094+james-aung@users.noreply.github.com evals/registry/data/last_word_nth/samples.jsonl 3 1 777 777 1 1 2023-03-20 2023-03-20 trevor.annedenise@icloud.com trevor.annedenise@icloud.com evals/registry/data/Unfamiliar-Chinese-Character/samples.jsonl 3 1 691 691 1 1 2023-06-14 2023-06-14 100397782+marc518@users.noreply.github.com 100397782+marc518@users.noreply.github.com evals/registry/data/diabetes/samples.jsonl 3 1 713 713 1 1 2023-05-23 2023-05-23 130139652+mooihi@users.noreply.github.com 130139652+mooihi@users.noreply.github.com evals/registry/data/number_pattern/samples.jsonl 3 1 770 770 1 1 2023-03-27 2023-03-27 scruelt@hotmail.com scruelt@hotmail.com evals/registry/data/population_span_extraction/samples.jsonl 3 1 697 697 1 1 2023-06-08 2023-06-08 94173501+iges-institut@users.noreply.github.com 94173501+iges-institut@users.noreply.github.com evals/registry/data/probabilities-word-problems/samples.jsonl 3 1 671 671 1 1 2023-07-04 2023-07-04 omarhishamk@gmail.com omarhishamk@gmail.com evals/registry/data/pantone_to_hex/samples.jsonl 3 1 694 694 1 1 2023-06-11 2023-06-11 bahar@getdigraph.com bahar@getdigraph.com evals/registry/data/chinese_song_ci/samples.jsonl 3 1 704 704 1 1 2023-06-01 2023-06-01 134827783+thomasnyderp@users.noreply.github.com 134827783+thomasnyderp@users.noreply.github.com evals/registry/data/hebrew_rhyme/samples.jsonl 3 1 774 774 1 1 2023-03-23 2023-03-23 ytsaig@gmail.com ytsaig@gmail.com evals/registry/modelgraded/research-question-extraction.yaml 19 1 615 615 1 1 2023-08-29 2023-08-29 92821098+pancoaster@users.noreply.github.com 92821098+pancoaster@users.noreply.github.com evals/registry/modelgraded/possible.yaml 18 1 683 683 1 1 2023-06-22 2023-06-22 rishadzzzz@gmail.com rishadzzzz@gmail.com evals/registry/modelgraded/best.yaml 10 4 777 595 4 2 2023-03-20 2023-09-18 343165+rlbayes@users.noreply.github.com 55913678+cholotook@users.noreply.github.com evals/registry/modelgraded/fact.yaml 19 1 775 775 1 1 2023-03-22 2023-03-22 343165+rlbayes@users.noreply.github.com 343165+rlbayes@users.noreply.github.com evals/registry/modelgraded/keywords.yaml 20 1 662 662 1 1 2023-07-13 2023-07-13 me+github@gerdemann.me me+github@gerdemann.me evals/registry/modelgraded/battle.yaml 21 1 775 775 1 1 2023-03-22 2023-03-22 343165+rlbayes@users.noreply.github.com 343165+rlbayes@users.noreply.github.com evals/registry/modelgraded/singlestore.yaml 24 1 677 677 1 1 2023-06-28 2023-06-28 137553926+pvgenflowai@users.noreply.github.com 137553926+pvgenflowai@users.noreply.github.com evals/registry/modelgraded/arithmetic-expression.yaml 24 1 677 677 1 1 2023-06-28 2023-06-28 gustavo.santos@vortexa.com gustavo.santos@vortexa.com evals/registry/modelgraded/diversity.yaml 13 2 775 739 2 1 2023-03-22 2023-04-27 343165+rlbayes@users.noreply.github.com 343165+rlbayes@users.noreply.github.com evals/registry/modelgraded/onomatopoeia.yaml 30 1 691 691 1 1 2023-06-14 2023-06-14 sap-csd@a-c-japan.com sap-csd@a-c-japan.com evals/registry/modelgraded/humor.yaml 17 2 775 760 2 1 2023-03-22 2023-04-06 343165+rlbayes@users.noreply.github.com 343165+rlbayes@users.noreply.github.com evals/registry/modelgraded/closedqa.yaml 21 2 775 742 2 1 2023-03-22 2023-04-24 343165+rlbayes@users.noreply.github.com 343165+rlbayes@users.noreply.github.com evals/registry/modelgraded/sql.yaml 24 3 745 706 3 2 2023-04-21 2023-05-30 mark@haym.me 133797909+jorge-openai@users.noreply.github.com evals/registry/modelgraded/iambic_pentameter.yaml 14 1 703 703 1 1 2023-06-02 2023-06-02 790279+ianonavy@users.noreply.github.com 790279+ianonavy@users.noreply.github.com evals/registry/modelgraded/translation.yaml 19 1 683 683 1 1 2023-06-22 2023-06-22 usama.anwar09@gmail.com usama.anwar09@gmail.com evals/registry/modelgraded/regression-equation.yaml 26 1 711 711 1 1 2023-05-25 2023-05-25 128815441+jonclar@users.noreply.github.com 128815441+jonclar@users.noreply.github.com evals/registry/modelgraded/security.yaml 14 1 755 755 1 1 2023-04-11 2023-04-11 lucianosb@users.noreply.github.com lucianosb@users.noreply.github.com evals/registry/modelgraded/rhyming.yaml 13 1 710 710 1 1 2023-05-26 2023-05-26 forexdude1234@gmail.com forexdude1234@gmail.com evals/registry/eval_sets/chinese-numbers.yaml 6 1 683 683 1 1 2023-06-22 2023-06-22 yichenfeng66@gmail.com yichenfeng66@gmail.com evals/registry/eval_sets/schelling_point.yaml 6 1 418 418 1 1 2024-03-13 2024-03-13 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/registry/eval_sets/mmmu.yaml 3 1 501 501 1 1 2023-12-21 2023-12-21 erik.t.ritter@gmail.com erik.t.ritter@gmail.com evals/registry/eval_sets/raven-matrices.yaml 30 1 697 697 1 1 2023-06-08 2023-06-08 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/eval_sets/exams-all.yaml 18 1 615 615 1 1 2023-08-29 2023-08-29 135200318+samta-kamboj@users.noreply.github.com 135200318+samta-kamboj@users.noreply.github.com evals/registry/eval_sets/test-basic.yaml 6 1 754 754 1 1 2023-04-12 2023-04-12 tony@rizkocircle.com tony@rizkocircle.com evals/registry/eval_sets/hr-ml-agent-bench.yaml 34 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/eval_sets/test-modelgraded.yaml 14 3 780 760 4 2 2023-03-17 2023-04-06 343165+rlbayes@users.noreply.github.com 343165+rlbayes@users.noreply.github.com evals/registry/eval_sets/coqa-ex.yaml 7 2 780 742 3 2 2023-03-17 2023-04-24 343165+rlbayes@users.noreply.github.com 343165+rlbayes@users.noreply.github.com evals/registry/eval_sets/stock-options.yaml 14 1 770 770 1 1 2023-03-27 2023-03-27 troydcalandra@gmail.com troydcalandra@gmail.com evals/registry/eval_sets/manga-translation.yaml 5 1 768 768 1 1 2023-03-29 2023-03-29 mindful.jt@gmail.com mindful.jt@gmail.com evals/registry/eval_sets/logiqa-logical-reasoning-plus.yaml 5 1 705 705 1 1 2023-05-31 2023-05-31 qbao775@aucklanduni.ac.nz qbao775@aucklanduni.ac.nz evals/registry/eval_sets/css-selectors.yaml 4 1 662 662 1 1 2023-07-13 2023-07-13 ilanharel@gmail.com ilanharel@gmail.com evals/registry/eval_sets/ukraine-gec.yaml 20 1 703 703 1 1 2023-06-02 2023-06-02 roman.mashta@gmail.com roman.mashta@gmail.com evals/registry/eval_sets/test-all.yaml 21 5 781 742 8 3 2023-03-16 2023-04-24 shane@openai.com 343165+rlbayes@users.noreply.github.com evals/registry/eval_sets/word-associations.yaml 6 1 671 671 1 1 2023-07-04 2023-07-04 douglas.monsky@gmail.com douglas.monsky@gmail.com evals/registry/eval_sets/pointer-value-retrieval.yaml 8 1 699 699 1 1 2023-06-06 2023-06-06 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/eval_sets/mazes.yaml 8 1 691 691 1 1 2023-06-14 2023-06-14 douglas.monsky@gmail.com douglas.monsky@gmail.com evals/registry/completion_fns/cot.yaml 16 2 755 595 2 2 2023-04-11 2023-09-18 73198383+hwchung27@users.noreply.github.com douglas.monsky@gmail.com evals/registry/completion_fns/langchain_chains.yaml 2 1 755 755 1 1 2023-04-11 2023-04-11 hw.chase.17@gmail.com hw.chase.17@gmail.com evals/registry/completion_fns/langchain_llms.yaml 24 3 755 501 3 3 2023-04-11 2023-12-21 73198383+hwchung27@users.noreply.github.com lorenzo.pacchiardi@stats.ox.ac.uk evals/registry/evals/language.yaml 15 2 728 703 2 1 2023-05-08 2023-06-02 jwang47@users.noreply.github.com jwang47@users.noreply.github.com evals/registry/evals/irrelevant-negative-diversion.yaml 3 1 655 655 1 1 2023-07-20 2023-07-20 anders@wangrask.com anders@wangrask.com evals/registry/evals/chinese_homonym.yaml 3 1 698 698 1 1 2023-06-07 2023-06-07 yichenfeng66@gmail.com yichenfeng66@gmail.com evals/registry/evals/infiniteloop-match.yaml 3 1 777 777 1 1 2023-03-20 2023-03-20 44745172+dottedant-dooz@users.noreply.github.com 44745172+dottedant-dooz@users.noreply.github.com evals/registry/evals/simple_math.yaml 8 1 698 698 1 1 2023-06-07 2023-06-07 135593135+hbvlmedia@users.noreply.github.com 135593135+hbvlmedia@users.noreply.github.com evals/registry/evals/chinese_song_ci.yaml 7 1 704 704 1 1 2023-06-01 2023-06-01 134827783+thomasnyderp@users.noreply.github.com 134827783+thomasnyderp@users.noreply.github.com evals/registry/evals/Unfamiliar-Chinese-Character.yaml 9 1 691 691 1 1 2023-06-14 2023-06-14 100397782+marc518@users.noreply.github.com 100397782+marc518@users.noreply.github.com evals/registry/evals/resource_id_extraction.yaml 8 1 698 698 1 1 2023-06-07 2023-06-07 andrewcemil@users.noreply.github.com andrewcemil@users.noreply.github.com evals/registry/evals/superficial-patterns.yaml 9 1 712 712 1 1 2023-05-24 2023-05-24 hholt1@protonmail.com hholt1@protonmail.com evals/registry/evals/actors-sequence.yaml 8 1 774 774 1 1 2023-03-23 2023-03-23 125162997+mcaledonensis@users.noreply.github.com 125162997+mcaledonensis@users.noreply.github.com evals/registry/evals/track_the_stat.yaml 20 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/registry/evals/reverse-sort-words-eng.yaml 8 1 703 703 1 1 2023-06-02 2023-06-02 112826784+bluefoxprime@users.noreply.github.com 112826784+bluefoxprime@users.noreply.github.com evals/registry/evals/svg_alphabet.yaml 8 1 671 671 1 1 2023-07-04 2023-07-04 127973459+tudoratlumiai@users.noreply.github.com 127973459+tudoratlumiai@users.noreply.github.com evals/registry/evals/dutch-lexicon.yaml 3 1 744 744 1 1 2023-04-22 2023-04-22 riedel777@gmail.com riedel777@gmail.com evals/registry/evals/emotional-intelligence.yaml 3 1 755 755 1 1 2023-04-11 2023-04-11 16432683+dpys@users.noreply.github.com 16432683+dpys@users.noreply.github.com evals/registry/evals/word-association.yaml 32 1 671 671 1 1 2023-07-04 2023-07-04 douglas.monsky@gmail.com douglas.monsky@gmail.com evals/registry/evals/cybersecurity-filepaths.yaml 8 1 698 698 1 1 2023-06-07 2023-06-07 glmcdona@gmail.com glmcdona@gmail.com evals/registry/evals/product-matching.yaml 46 1 704 704 1 1 2023-06-01 2023-06-01 26688318+rpeeters85@users.noreply.github.com 26688318+rpeeters85@users.noreply.github.com evals/registry/evals/islands.yaml 8 1 713 713 1 1 2023-05-23 2023-05-23 nakagawa.mai@gmail.com nakagawa.mai@gmail.com evals/registry/evals/rock-climbing.yaml 7 1 703 703 1 1 2023-06-02 2023-06-02 gavin@meetsoci.com gavin@meetsoci.com evals/registry/evals/tempo_to_measure_count.yaml 3 1 745 745 1 1 2023-04-21 2023-04-21 sam.lucyk@gmail.com sam.lucyk@gmail.com evals/registry/evals/greek-nt-manuscripts.yaml 3 1 703 703 1 1 2023-06-02 2023-06-02 andy@honeyrunsoftware.com andy@honeyrunsoftware.com evals/registry/evals/number-pattern.yaml 7 1 770 770 1 1 2023-03-27 2023-03-27 scruelt@hotmail.com scruelt@hotmail.com evals/registry/evals/spanish_feminine_noun_masculine_article.yaml 8 1 712 712 1 1 2023-05-24 2023-05-24 21stcenturydigitaljeff@gmail.com 21stcenturydigitaljeff@gmail.com evals/registry/evals/test-modelgraded-battle.yaml 36 5 781 742 6 3 2023-03-16 2023-04-24 shane@openai.com 343165+rlbayes@users.noreply.github.com evals/registry/evals/code_progress.yaml 8 1 677 677 1 1 2023-06-28 2023-06-28 danielstrizhevsky@gmail.com danielstrizhevsky@gmail.com evals/registry/evals/belarusian-rhyme.yaml 3 1 691 691 1 1 2023-06-14 2023-06-14 50818265+somerandomguyontheweb@users.noreply.github.com 50818265+somerandomguyontheweb@users.noreply.github.com evals/registry/evals/day-of-week-from-date.yaml 7 1 719 719 1 1 2023-05-17 2023-05-17 john@drivecentric.com john@drivecentric.com evals/registry/evals/research-question-extraction.yaml 11 1 615 615 1 1 2023-08-29 2023-08-29 92821098+pancoaster@users.noreply.github.com 92821098+pancoaster@users.noreply.github.com evals/registry/evals/finnish-rhyme.yaml 8 1 706 706 1 1 2023-05-30 2023-05-30 130182869+ouztsa@users.noreply.github.com 130182869+ouztsa@users.noreply.github.com evals/registry/evals/python_list_comprehension.yaml 8 1 710 710 1 1 2023-05-26 2023-05-26 67437435+michailmelonas@users.noreply.github.com 67437435+michailmelonas@users.noreply.github.com evals/registry/evals/geometry_puzzle.yaml 3 1 705 705 1 1 2023-05-31 2023-05-31 52676620+moeen-movahednia@users.noreply.github.com 52676620+moeen-movahednia@users.noreply.github.com evals/registry/evals/allergen-information.yaml 3 1 705 705 1 1 2023-05-31 2023-05-31 ophir.ido@gmail.com ophir.ido@gmail.com evals/registry/evals/bluff.yaml 39 1 537 537 1 1 2023-11-15 2023-11-15 33967107+johny-b@users.noreply.github.com 33967107+johny-b@users.noreply.github.com evals/registry/evals/phonetics-identify-words-needing-missing-gpcs.yaml 8 1 704 704 1 1 2023-06-01 2023-06-01 31624048+climpyaardvark@users.noreply.github.com 31624048+climpyaardvark@users.noreply.github.com evals/registry/evals/time-zone-conversion.yaml 8 1 714 714 1 1 2023-05-22 2023-05-22 alex@machinekoder.com alex@machinekoder.com evals/registry/evals/korean_date_counting.yaml 3 1 683 683 1 1 2023-06-22 2023-06-22 127706211+jess-hwang@users.noreply.github.com 127706211+jess-hwang@users.noreply.github.com evals/registry/evals/polish-proverbs.yaml 2 1 662 662 1 1 2023-07-13 2023-07-13 kasiakloc00@gmail.com kasiakloc00@gmail.com evals/registry/evals/russe.yaml 10 1 744 744 1 1 2023-04-22 2023-04-22 alex@alexkuk.ru alex@alexkuk.ru evals/registry/evals/rare-and-loanwords-dutch-lexicon.yaml 3 1 700 700 1 1 2023-06-05 2023-06-05 135169801+riskablebe@users.noreply.github.com 135169801+riskablebe@users.noreply.github.com evals/registry/evals/ner_finance.yaml 9 1 671 671 1 1 2023-07-04 2023-07-04 anthony@candlestick.ai anthony@candlestick.ai evals/registry/evals/belarusian-antonyms.yaml 3 1 556 556 1 1 2023-10-27 2023-10-27 tanya.shagova@gmail.com tanya.shagova@gmail.com evals/registry/evals/italian-rhyme.yaml 8 1 706 706 1 1 2023-05-30 2023-05-30 webdaemon3@gmail.com webdaemon3@gmail.com evals/registry/evals/indonesian_numbers.yaml 7 1 704 704 1 1 2023-06-01 2023-06-01 aarongpower@gmail.com aarongpower@gmail.com evals/registry/evals/russian-lexicon.yaml 3 1 706 706 1 1 2023-05-30 2023-05-30 gydronik@gmail.com gydronik@gmail.com evals/registry/evals/japanese_city_name_pronuciation.yaml 3 1 711 711 1 1 2023-05-25 2023-05-25 679040+akazah@users.noreply.github.com 679040+akazah@users.noreply.github.com evals/registry/evals/finance.yaml 3 1 753 753 1 1 2023-04-13 2023-04-13 prenterjack@gmail.com prenterjack@gmail.com evals/registry/evals/schelling_point.yaml 66 3 594 418 3 3 2023-09-19 2024-03-13 140545726+ianmckenzie-oai@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/registry/evals/self_prompting.yaml 19 2 537 418 2 2 2023-11-15 2024-03-13 junshern@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/registry/evals/gears_rotation.yaml 3 1 683 683 1 1 2023-06-22 2023-06-22 0xh3xy@gmail.com 0xh3xy@gmail.com evals/registry/evals/knot-theory.yaml 21 1 744 744 1 1 2023-04-22 2023-04-22 matthaigh27@gmail.com matthaigh27@gmail.com evals/registry/evals/portuguese-syllable-count.yaml 9 1 710 710 1 1 2023-05-26 2023-05-26 tucalipe@gmail.com tucalipe@gmail.com evals/registry/evals/simple-charting.yaml 3 1 662 662 1 1 2023-07-13 2023-07-13 daoduyducduong@gmail.com daoduyducduong@gmail.com evals/registry/evals/singlestore-vectorsearch.yaml 10 1 677 677 1 1 2023-06-28 2023-06-28 137553926+pvgenflowai@users.noreply.github.com 137553926+pvgenflowai@users.noreply.github.com evals/registry/evals/logic-grid-eval.yaml 11 1 704 704 1 1 2023-06-01 2023-06-01 austinstarnes@pm.me austinstarnes@pm.me evals/registry/evals/naughty_strings.yaml 36 1 755 755 1 1 2023-04-11 2023-04-11 lucianosb@users.noreply.github.com lucianosb@users.noreply.github.com evals/registry/evals/mandaliof-table.yaml 3 1 712 712 1 1 2023-05-24 2023-05-24 ali.risheh876@gmail.com ali.risheh876@gmail.com evals/registry/evals/prompt-injection.yaml 3 1 703 703 1 1 2023-06-02 2023-06-02 alianse777@users.noreply.github.com alianse777@users.noreply.github.com evals/registry/evals/numbers_game.yaml 3 1 706 706 1 1 2023-05-30 2023-05-30 134487556+ivafractal@users.noreply.github.com 134487556+ivafractal@users.noreply.github.com evals/registry/evals/building_floorplan.yaml 8 1 714 714 1 1 2023-05-22 2023-05-22 sjknauer@gmail.com sjknauer@gmail.com evals/registry/evals/count_intersections_polynomial.yaml 8 1 713 713 1 1 2023-05-23 2023-05-23 63267585+cauvmou@users.noreply.github.com 63267585+cauvmou@users.noreply.github.com evals/registry/evals/icelandic-inflection-medium.yaml 3 1 556 556 1 1 2023-10-27 2023-10-27 vthorsteinsson@users.noreply.github.com vthorsteinsson@users.noreply.github.com evals/registry/evals/numerical-cabbala-casanova.yaml 10 1 677 677 1 1 2023-06-28 2023-06-28 giacomoran@gmail.com giacomoran@gmail.com evals/registry/evals/adultery_state_laws.yaml 8 1 706 706 1 1 2023-05-30 2023-05-30 108371552+loadedmediainc@users.noreply.github.com 108371552+loadedmediainc@users.noreply.github.com evals/registry/evals/chinese_ancient_masterpieces_dynasty.yaml 8 1 683 683 1 1 2023-06-22 2023-06-22 136729222+meganjohnson96@users.noreply.github.com 136729222+meganjohnson96@users.noreply.github.com evals/registry/evals/hebrew_talmud_suka.yaml 8 1 691 691 1 1 2023-06-14 2023-06-14 ysrael@reflectiz.com ysrael@reflectiz.com evals/registry/evals/gpt-protocol-buffers.yaml 7 1 697 697 1 1 2023-06-08 2023-06-08 jdavis@pcprogramming.com jdavis@pcprogramming.com evals/registry/evals/skill_acquisition.yaml 94 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/registry/evals/nfl-point-combinations.yaml 3 1 694 694 1 1 2023-06-11 2023-06-11 136047342+dougkwanna@users.noreply.github.com 136047342+dougkwanna@users.noreply.github.com evals/registry/evals/bulgarian-lexicon.yaml 3 1 768 768 1 1 2023-03-29 2023-03-29 mdatsev@users.noreply.github.com mdatsev@users.noreply.github.com evals/registry/evals/human-safety.yaml 8 1 700 700 1 1 2023-06-05 2023-06-05 46403813+bertod@users.noreply.github.com 46403813+bertod@users.noreply.github.com evals/registry/evals/mmlu.yaml 399 1 728 728 1 1 2023-05-08 2023-05-08 jwang47@users.noreply.github.com jwang47@users.noreply.github.com evals/registry/evals/twenty_questions.yaml 54 1 412 412 1 1 2024-03-19 2024-03-19 inwaves@users.noreply.github.com inwaves@users.noreply.github.com evals/registry/evals/isosceles-right-triangle.yaml 7 1 714 714 1 1 2023-05-22 2023-05-22 alexbuzanis@gmail.com alexbuzanis@gmail.com evals/registry/evals/belarusian-grammar.yaml 3 1 703 703 1 1 2023-06-02 2023-06-02 50818265+somerandomguyontheweb@users.noreply.github.com 50818265+somerandomguyontheweb@users.noreply.github.com evals/registry/evals/abstract-causal-reasoning.yaml 16 1 700 700 1 1 2023-06-05 2023-06-05 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/evals/corr2cause.yaml 3 1 662 662 1 1 2023-07-13 2023-07-13 vasarmilan@gmail.com vasarmilan@gmail.com evals/registry/evals/anagrams.yaml 10 1 776 776 1 1 2023-03-21 2023-03-21 97240159+l-mutricy@users.noreply.github.com 97240159+l-mutricy@users.noreply.github.com evals/registry/evals/3d_object_manipulation.yaml 8 1 662 662 1 1 2023-07-13 2023-07-13 pomichterstash@gmail.com pomichterstash@gmail.com evals/registry/evals/finance_calc.yaml 8 1 662 662 1 1 2023-07-13 2023-07-13 gondek.christopher@gmail.com gondek.christopher@gmail.com evals/registry/evals/chinese-lantern-riddles.yaml 3 1 683 683 1 1 2023-06-22 2023-06-22 50411747+chenzhao44@users.noreply.github.com 50411747+chenzhao44@users.noreply.github.com evals/registry/evals/unsolvable_questions.yaml 7 1 710 710 1 1 2023-05-26 2023-05-26 lucasklaassen@users.noreply.github.com lucasklaassen@users.noreply.github.com evals/registry/evals/accounting_audit.yaml 7 1 662 662 1 1 2023-07-13 2023-07-13 55913678+cholotook@users.noreply.github.com 55913678+cholotook@users.noreply.github.com evals/registry/evals/utility_price_parsing.yaml 7 1 745 745 1 1 2023-04-21 2023-04-21 131423049+dz-pika@users.noreply.github.com 131423049+dz-pika@users.noreply.github.com evals/registry/evals/resistor-ohm-calculator.yaml 3 1 714 714 1 1 2023-05-22 2023-05-22 mfolnovic@gmail.com mfolnovic@gmail.com evals/registry/evals/partially_solved_crossword_clues.yaml 7 1 770 770 1 1 2023-03-27 2023-03-27 francois_lr@hotmail.fr francois_lr@hotmail.fr evals/registry/evals/arithmetical_puzzles.yaml 3 1 710 710 1 1 2023-05-26 2023-05-26 l.malmqvist@gmail.com l.malmqvist@gmail.com evals/registry/evals/russian_sarcasm.yaml 8 1 699 699 1 1 2023-06-06 2023-06-06 vtolm@vtolm.com vtolm@vtolm.com evals/registry/evals/word_vector_over_reliance.yaml 9 1 712 712 1 1 2023-05-24 2023-05-24 89385155+neolizhe@users.noreply.github.com 89385155+neolizhe@users.noreply.github.com evals/registry/evals/directions.yaml 8 1 712 712 1 1 2023-05-24 2023-05-24 rohan.m.kshirsagar@gmail.com rohan.m.kshirsagar@gmail.com evals/registry/evals/pure_korean.yaml 8 1 703 703 1 1 2023-06-02 2023-06-02 68699959+soooim@users.noreply.github.com 68699959+soooim@users.noreply.github.com evals/registry/evals/unified-patch.yaml 7 1 745 745 1 1 2023-04-21 2023-04-21 me@andrebaltazar.com me@andrebaltazar.com evals/registry/evals/coq-editing.yaml 3 1 683 683 1 1 2023-06-22 2023-06-22 jasongross9@gmail.com jasongross9@gmail.com evals/registry/evals/diagrammatic_logic.yaml 7 1 775 775 1 1 2023-03-22 2023-03-22 freddie.nicholson123@gmail.com freddie.nicholson123@gmail.com evals/registry/evals/marxist_philosophy_exam.yaml 3 1 683 683 1 1 2023-06-22 2023-06-22 cxjwin@users.noreply.github.com cxjwin@users.noreply.github.com evals/registry/evals/swedish-spelling.yaml 3 1 755 755 1 1 2023-04-11 2023-04-11 129839173+eellofgren@users.noreply.github.com 129839173+eellofgren@users.noreply.github.com evals/registry/evals/mmmu.yaml 390 1 501 501 1 1 2023-12-21 2023-12-21 erik.t.ritter@gmail.com erik.t.ritter@gmail.com evals/registry/evals/cant_do_that_anymore.yaml 20 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/registry/evals/utah_real_estate.yaml 8 1 691 691 1 1 2023-06-14 2023-06-14 42595698+thechaincollective@users.noreply.github.com 42595698+thechaincollective@users.noreply.github.com evals/registry/evals/dhammapada-reference.yaml 8 1 671 671 1 1 2023-07-04 2023-07-04 lance.miyamoto@gmail.com lance.miyamoto@gmail.com evals/registry/evals/brazilian_laws.yaml 8 1 703 703 1 1 2023-06-02 2023-06-02 lucianosb@users.noreply.github.com lucianosb@users.noreply.github.com evals/registry/evals/korean-consonant-vowel-combination.yaml 3 1 712 712 1 1 2023-05-24 2023-05-24 dennis.hong@kakaocorp.com dennis.hong@kakaocorp.com evals/registry/evals/decrypt-caesar-cipher.yaml 7 1 776 776 1 1 2023-03-21 2023-03-21 me@mattfalconer.com me@mattfalconer.com evals/registry/evals/nepali-song-singer.yaml 3 1 718 718 1 1 2023-05-18 2023-05-18 36022153+oshanoshu@users.noreply.github.com 36022153+oshanoshu@users.noreply.github.com evals/registry/evals/find-letter.yaml 7 1 713 713 1 1 2023-05-23 2023-05-23 u.sivasweatha@gmail.com u.sivasweatha@gmail.com evals/registry/evals/chinese_tang_poetries.yaml 4 1 710 710 1 1 2023-05-26 2023-05-26 clvrobj@gmail.com clvrobj@gmail.com evals/registry/evals/reasoning_with_contradictory_statements.yaml 9 1 683 683 1 1 2023-06-22 2023-06-22 rishadzzzz@gmail.com rishadzzzz@gmail.com evals/registry/evals/belarusian-proverbs.yaml 2 1 700 700 1 1 2023-06-05 2023-06-05 130565081+yuryrudnitski@users.noreply.github.com 130565081+yuryrudnitski@users.noreply.github.com evals/registry/evals/qa.yaml 3 1 744 744 1 1 2023-04-22 2023-04-22 43813768+keremnalbant@users.noreply.github.com 43813768+keremnalbant@users.noreply.github.com evals/registry/evals/points-on-line.yaml 3 1 700 700 1 1 2023-06-05 2023-06-05 aaron@aaronsmith.tv aaron@aaronsmith.tv evals/registry/evals/russian-english-homonym-context-resolution.yaml 7 1 704 704 1 1 2023-06-01 2023-06-01 10080307+gradientsky@users.noreply.github.com 10080307+gradientsky@users.noreply.github.com evals/registry/evals/korean_foreign_words.yaml 8 1 677 677 1 1 2023-06-28 2023-06-28 pringle0531@gmail.com pringle0531@gmail.com evals/registry/evals/stats-tests.yaml 7 1 704 704 1 1 2023-06-01 2023-06-01 61809814+jackaldenryan@users.noreply.github.com 61809814+jackaldenryan@users.noreply.github.com evals/registry/evals/portuguese-sarcasm.yaml 8 1 713 713 1 1 2023-05-23 2023-05-23 lucas.arki@gmail.com lucas.arki@gmail.com evals/registry/evals/parable-to-moral-match.yaml 14 1 705 705 1 1 2023-05-31 2023-05-31 nlanesmith@gmail.com nlanesmith@gmail.com evals/registry/evals/physics-interaction.yaml 3 1 715 715 1 1 2023-05-21 2023-05-21 jelgt2011@gmail.com jelgt2011@gmail.com evals/registry/evals/portuguese-kinship-riddles.yaml 8 1 690 690 1 1 2023-06-15 2023-06-15 zbu@ezpapel.com zbu@ezpapel.com evals/registry/evals/chinese_chu_ci.yaml 8 1 683 683 1 1 2023-06-22 2023-06-22 arvinx@foxmail.com arvinx@foxmail.com evals/registry/evals/override-system-instruction.yaml 7 1 705 705 1 1 2023-05-31 2023-05-31 mail@thooyavan.me mail@thooyavan.me evals/registry/evals/comprehensive-graph-reasoning.yaml 3 1 703 703 1 1 2023-06-02 2023-06-02 42741744+edmundlaowang@users.noreply.github.com 42741744+edmundlaowang@users.noreply.github.com evals/registry/evals/raven-matrices.yaml 224 1 697 697 1 1 2023-06-08 2023-06-08 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/evals/quartz.yaml 10 1 705 705 1 1 2023-05-31 2023-05-31 rodrigoga@users.noreply.github.com rodrigoga@users.noreply.github.com evals/registry/evals/norwegian-lexicon.yaml 3 1 706 706 1 1 2023-05-30 2023-05-30 info@dyar.no info@dyar.no evals/registry/evals/test-comp-sci.yaml 9 1 776 776 1 1 2023-03-21 2023-03-21 samennis127@gmail.com samennis127@gmail.com evals/registry/evals/logic-container.yaml 10 1 662 662 1 1 2023-07-13 2023-07-13 onder.secen@gmail.com onder.secen@gmail.com evals/registry/evals/iqbal-poetry-translation.yaml 24 1 683 683 1 1 2023-06-22 2023-06-22 usama.anwar09@gmail.com usama.anwar09@gmail.com evals/registry/evals/forth-stack-sim.yaml 19 2 775 768 2 1 2023-03-22 2023-03-29 gooseus@users.noreply.github.com gooseus@users.noreply.github.com evals/registry/evals/identifying_variables.yaml 123 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/registry/evals/korean-phonetics.yaml 8 1 693 693 1 1 2023-06-12 2023-06-12 136151309+jaiwonrhi2@users.noreply.github.com 136151309+jaiwonrhi2@users.noreply.github.com evals/registry/evals/icelandic-inflection-easy.yaml 3 1 556 556 1 1 2023-10-27 2023-10-27 vthorsteinsson@users.noreply.github.com vthorsteinsson@users.noreply.github.com evals/registry/evals/swedish_sat.yaml 3 1 710 710 1 1 2023-05-26 2023-05-26 justus.karlsson@hotmail.se justus.karlsson@hotmail.se evals/registry/evals/hebrew-homophones.yaml 8 1 671 671 1 1 2023-07-04 2023-07-04 59704420+relvok@users.noreply.github.com 59704420+relvok@users.noreply.github.com evals/registry/evals/medmcqa.yaml 7 1 744 744 1 1 2023-04-22 2023-04-22 shuriken209master@googlemail.com shuriken209master@googlemail.com evals/registry/evals/belarusian-syllable-count.yaml 3 1 700 700 1 1 2023-06-05 2023-06-05 50818265+somerandomguyontheweb@users.noreply.github.com 50818265+somerandomguyontheweb@users.noreply.github.com evals/registry/evals/poker_analysis.yaml 3 1 700 700 1 1 2023-06-05 2023-06-05 douglas.monsky@gmail.com douglas.monsky@gmail.com evals/registry/evals/regex-match.yaml 7 1 769 769 1 1 2023-03-28 2023-03-28 davidchen@gliacloud.com davidchen@gliacloud.com evals/registry/evals/japanese_driving_license.yaml 3 1 745 745 1 1 2023-04-21 2023-04-21 60774986+yji5212@users.noreply.github.com 60774986+yji5212@users.noreply.github.com evals/registry/evals/music-theory-chord-notes.yaml 3 1 706 706 1 1 2023-05-30 2023-05-30 steventsao@me.com steventsao@me.com evals/registry/evals/linear-regression.yaml 21 1 711 711 1 1 2023-05-25 2023-05-25 128815441+jonclar@users.noreply.github.com 128815441+jonclar@users.noreply.github.com evals/registry/evals/map-electronic-component-part-to-fact.yaml 7 2 782 781 2 2 2023-03-15 2023-03-16 omattos@gmail.com 120423412+andrew-openai@users.noreply.github.com evals/registry/evals/pantone_to_hex.yaml 7 1 694 694 1 1 2023-06-11 2023-06-11 bahar@getdigraph.com bahar@getdigraph.com evals/registry/evals/number-reading.yaml 3 1 768 768 1 1 2023-03-29 2023-03-29 benjaminliu.eecs@gmail.com benjaminliu.eecs@gmail.com evals/registry/evals/sexagenary-cycle-calculation.yaml 7 1 720 720 1 1 2023-05-16 2023-05-16 dunedainstrider.a@gmail.com dunedainstrider.a@gmail.com evals/registry/evals/taxes.yaml 7 1 770 770 1 1 2023-03-27 2023-03-27 andrewmlu3@gmail.com andrewmlu3@gmail.com evals/registry/evals/tricky-word-problems.yaml 3 1 671 671 1 1 2023-07-04 2023-07-04 jackurbs@gmail.com jackurbs@gmail.com evals/registry/evals/simple-block-puzzles.yaml 3 1 683 683 1 1 2023-06-22 2023-06-22 bird.seanmichael@gmail.com bird.seanmichael@gmail.com evals/registry/evals/syllables_long_words.yaml 7 1 705 705 1 1 2023-05-31 2023-05-31 eschulma@gmail.com eschulma@gmail.com evals/registry/evals/invoice_due_date_leap_day_adjustment.yaml 7 1 719 719 1 1 2023-05-17 2023-05-17 132409761+techlocke@users.noreply.github.com 132409761+techlocke@users.noreply.github.com evals/registry/evals/gregorian-to-hebrew-date.yaml 9 1 683 683 1 1 2023-06-22 2023-06-22 orelbiton27@gmail.com orelbiton27@gmail.com evals/registry/evals/multistep-word-problems.yaml 3 1 711 711 1 1 2023-05-25 2023-05-25 forexdude1234@gmail.com forexdude1234@gmail.com evals/registry/evals/south-african-bands.yaml 3 1 717 717 1 1 2023-05-19 2023-05-19 richard.wooding@spandigital.com richard.wooding@spandigital.com evals/registry/evals/italian_big_math_expression.yaml 3 1 662 662 1 1 2023-07-13 2023-07-13 38102850+danielepoterti@users.noreply.github.com 38102850+danielepoterti@users.noreply.github.com evals/registry/evals/monthly_metric_comparison.yaml 8 1 700 700 1 1 2023-06-05 2023-06-05 6182673+robi-ng@users.noreply.github.com 6182673+robi-ng@users.noreply.github.com evals/registry/evals/cricket_situations.yaml 8 1 705 705 1 1 2023-05-31 2023-05-31 134620553+ai-scale@users.noreply.github.com 134620553+ai-scale@users.noreply.github.com evals/registry/evals/greek-vocabulary.yaml 7 1 744 744 1 1 2023-04-22 2023-04-22 99351112+0xacx@users.noreply.github.com 99351112+0xacx@users.noreply.github.com evals/registry/evals/shopping_discount_comparison.yaml 3 1 705 705 1 1 2023-05-31 2023-05-31 35208156+lillichoung@users.noreply.github.com 35208156+lillichoung@users.noreply.github.com evals/registry/evals/japanese_populer_video_game_title_and_the_publisher.yaml 3 1 712 712 1 1 2023-05-24 2023-05-24 snsk@users.noreply.github.com snsk@users.noreply.github.com evals/registry/evals/internal_representations.yaml 7 1 706 706 1 1 2023-05-30 2023-05-30 syn@zbeacon.org syn@zbeacon.org evals/registry/evals/latin_grammar.yaml 3 1 662 662 1 1 2023-07-13 2023-07-13 125713831+d3287t328@users.noreply.github.com 125713831+d3287t328@users.noreply.github.com evals/registry/evals/cube-pack.yaml 7 2 782 781 3 2 2023-03-15 2023-03-16 emil@radix.ai 120423412+andrew-openai@users.noreply.github.com evals/registry/evals/korean-postposition.yaml 8 1 683 683 1 1 2023-06-22 2023-06-22 lena.h.hong@gmail.com lena.h.hong@gmail.com evals/registry/evals/ordering_randomised_versionlist.yaml 8 1 683 683 1 1 2023-06-22 2023-06-22 jiejie@live.nl jiejie@live.nl evals/registry/evals/moral_exceptQA.yaml 8 1 754 754 1 1 2023-04-12 2023-04-12 kblin@outlook.com kblin@outlook.com evals/registry/evals/illinois-law.yaml 3 1 769 769 1 1 2023-03-28 2023-03-28 seancye@gmail.com seancye@gmail.com evals/registry/evals/complex-analogies-en-ru.yaml 7 1 705 705 1 1 2023-05-31 2023-05-31 karinageneraly@gmail.com karinageneraly@gmail.com evals/registry/evals/connect-4.yaml 7 1 776 776 1 1 2023-03-21 2023-03-21 83553535+kierandon@users.noreply.github.com 83553535+kierandon@users.noreply.github.com evals/registry/evals/pattern_identification.yaml 7 2 782 781 2 2 2023-03-15 2023-03-16 jasonwei@openai.com 120423412+andrew-openai@users.noreply.github.com evals/registry/evals/hindi_words.yaml 7 1 710 710 1 1 2023-05-26 2023-05-26 36335769+0x34d@users.noreply.github.com 36335769+0x34d@users.noreply.github.com evals/registry/evals/thirty_six_stratagems.yaml 3 1 662 662 1 1 2023-07-13 2023-07-13 20484971+cookfish@users.noreply.github.com 20484971+cookfish@users.noreply.github.com evals/registry/evals/hebrew-rhyme.yaml 8 1 774 774 1 1 2023-03-23 2023-03-23 ytsaig@gmail.com ytsaig@gmail.com evals/registry/evals/proofreader.yaml 8 1 677 677 1 1 2023-06-28 2023-06-28 ramiel@users.noreply.github.com ramiel@users.noreply.github.com evals/registry/evals/logic-liar-paradox.yaml 3 1 727 727 1 1 2023-05-09 2023-05-09 robertbateman@users.noreply.github.com robertbateman@users.noreply.github.com evals/registry/evals/convert-hex-hsl-lightness.yaml 8 1 776 776 1 1 2023-03-21 2023-03-21 harley@hturan.com harley@hturan.com evals/registry/evals/food.yaml 7 1 711 711 1 1 2023-05-25 2023-05-25 christopherb737@gmail.com christopherb737@gmail.com evals/registry/evals/sort-numeric.yaml 8 1 740 740 1 1 2023-04-26 2023-04-26 albertgozzi@gmail.com albertgozzi@gmail.com evals/registry/evals/simple-knowledge-mongolian.yaml 3 1 752 752 1 1 2023-04-14 2023-04-14 joseph.lelic@gmail.com joseph.lelic@gmail.com evals/registry/evals/population_span_extraction.yaml 10 1 697 697 1 1 2023-06-08 2023-06-08 94173501+iges-institut@users.noreply.github.com 94173501+iges-institut@users.noreply.github.com evals/registry/evals/ral_to_hex.yaml 7 1 683 683 1 1 2023-06-22 2023-06-22 nikolasarmstrong@gmail.com nikolasarmstrong@gmail.com evals/registry/evals/ru_rhymes.yaml 11 1 704 704 1 1 2023-06-01 2023-06-01 36363097+latand@users.noreply.github.com 36363097+latand@users.noreply.github.com evals/registry/evals/norwegian-rhymes.yaml 8 1 677 677 1 1 2023-06-28 2023-06-28 137759176+monocle-pastels@users.noreply.github.com 137759176+monocle-pastels@users.noreply.github.com evals/registry/evals/aba-mrpc-true-false.yaml 7 1 776 776 1 1 2023-03-21 2023-03-21 avery@offerfit.ai avery@offerfit.ai evals/registry/evals/persian-kinship-riddles.yaml 8 1 677 677 1 1 2023-06-28 2023-06-28 137618076+evalevalian@users.noreply.github.com 137618076+evalevalian@users.noreply.github.com evals/registry/evals/unwanted-rhyming.yaml 9 1 710 710 1 1 2023-05-26 2023-05-26 forexdude1234@gmail.com forexdude1234@gmail.com evals/registry/evals/invert_word_wise.yaml 8 1 714 714 1 1 2023-05-22 2023-05-22 38587927+ach-in@users.noreply.github.com 38587927+ach-in@users.noreply.github.com evals/registry/evals/vigenere.yaml 3 1 710 710 1 1 2023-05-26 2023-05-26 grahamzemel@gmail.com grahamzemel@gmail.com evals/registry/evals/code_combination.yaml 3 1 700 700 1 1 2023-06-05 2023-06-05 psingley@gmail.com psingley@gmail.com evals/registry/evals/dice-rotation-sequence.yaml 3 1 745 745 1 1 2023-04-21 2023-04-21 g.h.garrett13@gmail.com g.h.garrett13@gmail.com evals/registry/evals/next-val-series.yaml 3 1 703 703 1 1 2023-06-02 2023-06-02 36852564+hmzakhalid@users.noreply.github.com 36852564+hmzakhalid@users.noreply.github.com evals/registry/evals/test-basic.yaml 32 2 754 719 2 2 2023-04-12 2023-05-17 tony@rizkocircle.com jwang47@users.noreply.github.com evals/registry/evals/guess-the-singer.yaml 2 1 713 713 1 1 2023-05-23 2023-05-23 130565081+yuryrudnitski@users.noreply.github.com 130565081+yuryrudnitski@users.noreply.github.com evals/registry/evals/italian-new-words.yaml 3 1 706 706 1 1 2023-05-30 2023-05-30 sdiviney@gmail.com sdiviney@gmail.com evals/registry/evals/atpl_exams.yaml 7 1 711 711 1 1 2023-05-25 2023-05-25 perrosnk@gmail.com perrosnk@gmail.com evals/registry/evals/steganography.yaml 3 2 594 418 2 2 2023-09-19 2024-03-13 140545726+ianmckenzie-oai@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/registry/evals/alternate-numeral-systems.yaml 3 1 700 700 1 1 2023-06-05 2023-06-05 matt.lavin@gmail.com matt.lavin@gmail.com evals/registry/evals/music-theory-chord-names.yaml 3 1 706 706 1 1 2023-05-30 2023-05-30 steventsao@me.com steventsao@me.com evals/registry/evals/logical-black-scholes.yaml 8 1 662 662 1 1 2023-07-13 2023-07-13 dsims21@gmail.com dsims21@gmail.com evals/registry/evals/wkt_understanding.yaml 8 1 706 706 1 1 2023-05-30 2023-05-30 vinooganesh@users.noreply.github.com vinooganesh@users.noreply.github.com evals/registry/evals/passing-balls.yaml 3 1 705 705 1 1 2023-05-31 2023-05-31 131498134+lucid-max@users.noreply.github.com 131498134+lucid-max@users.noreply.github.com evals/registry/evals/spanish-lexicon.yaml 3 1 710 710 1 1 2023-05-26 2023-05-26 carlos@domintia.com carlos@domintia.com evals/registry/evals/tokyo-station-number.yaml 8 1 683 683 1 1 2023-06-22 2023-06-22 torufuru@users.noreply.github.com torufuru@users.noreply.github.com evals/registry/evals/hr-ml-agent-bench.yaml 137 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/evals/japanese_romantic_context.yaml 7 1 655 655 1 1 2023-07-20 2023-07-20 115438292+missionteam@users.noreply.github.com 115438292+missionteam@users.noreply.github.com evals/registry/evals/ukraine-eit.yaml 7 1 769 769 1 1 2023-03-28 2023-03-28 badt@appar.at badt@appar.at evals/registry/evals/convert_bwt_num_and_chinese_num.yaml 32 1 683 683 1 1 2023-06-22 2023-06-22 yichenfeng66@gmail.com yichenfeng66@gmail.com evals/registry/evals/irish-lexicon.yaml 3 1 719 719 1 1 2023-05-17 2023-05-17 getintouchwithseanryan@gmail.com getintouchwithseanryan@gmail.com evals/registry/evals/reverse-polish-notation.yaml 3 1 711 711 1 1 2023-05-25 2023-05-25 andrew.prokhorenkov@gmail.com andrew.prokhorenkov@gmail.com evals/registry/evals/gujarati_numerals.yaml 3 1 594 594 1 1 2023-09-19 2023-09-19 38771624+roshan-d@users.noreply.github.com 38771624+roshan-d@users.noreply.github.com evals/registry/evals/test-modelgraded.yaml 81 7 777 595 7 3 2023-03-20 2023-09-18 343165+rlbayes@users.noreply.github.com 55913678+cholotook@users.noreply.github.com evals/registry/evals/imperial_date_to_string.yaml 7 1 769 769 1 1 2023-03-28 2023-03-28 dd@davisinfo.com dd@davisinfo.com evals/registry/evals/cardinal-directions.yaml 7 1 704 704 1 1 2023-06-01 2023-06-01 dbautista.cs@gmail.com dbautista.cs@gmail.com evals/registry/evals/belarusian-synonyms.yaml 3 1 704 704 1 1 2023-06-01 2023-06-01 tanya.shagova@gmail.com tanya.shagova@gmail.com evals/registry/evals/automata-and-complexity.yaml 3 1 677 677 1 1 2023-06-28 2023-06-28 peter@stakoun.com peter@stakoun.com evals/registry/evals/astro_eval.yaml 8 1 662 662 1 1 2023-07-13 2023-07-13 andrerbreton@gmail.com andrerbreton@gmail.com evals/registry/evals/belarusian-lexicon.yaml 3 1 776 776 1 1 2023-03-21 2023-03-21 50818265+somerandomguyontheweb@users.noreply.github.com 50818265+somerandomguyontheweb@users.noreply.github.com evals/registry/evals/japanese_onomatopoeia.yaml 9 1 691 691 1 1 2023-06-14 2023-06-14 sap-csd@a-c-japan.com sap-csd@a-c-japan.com evals/registry/evals/coqa-ex.yaml 55 4 780 742 5 3 2023-03-17 2023-04-24 343165+rlbayes@users.noreply.github.com 343165+rlbayes@users.noreply.github.com evals/registry/evals/syntax-check.yaml 3 1 718 718 1 1 2023-05-18 2023-05-18 aargoldsmith@gmail.com aargoldsmith@gmail.com evals/registry/evals/test-modelgraded-generated.yaml 9 3 781 770 4 2 2023-03-16 2023-03-27 shane@openai.com 343165+rlbayes@users.noreply.github.com evals/registry/evals/seo_keywords.yaml 3 1 662 662 1 1 2023-07-13 2023-07-13 me+github@gerdemann.me me+github@gerdemann.me evals/registry/evals/ascii-digit-recognition.yaml 8 1 691 691 1 1 2023-06-14 2023-06-14 52069185+dddraxxx@users.noreply.github.com 52069185+dddraxxx@users.noreply.github.com evals/registry/evals/ab.yaml 3 1 556 556 1 1 2023-10-27 2023-10-27 42742390+mmtmn@users.noreply.github.com 42742390+mmtmn@users.noreply.github.com evals/registry/evals/chinese_hard_translations.yaml 4 1 691 691 1 1 2023-06-14 2023-06-14 nicognaw@outlook.com nicognaw@outlook.com evals/registry/evals/theory_of_mind.yaml 48 2 482 418 2 1 2024-01-09 2024-03-13 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/registry/evals/body-movement.yaml 3 1 717 717 1 1 2023-05-19 2023-05-19 30339662+tescao@users.noreply.github.com 30339662+tescao@users.noreply.github.com evals/registry/evals/german-part-of-speech.yaml 3 1 704 704 1 1 2023-06-01 2023-06-01 vasco@piranhafleisch.de vasco@piranhafleisch.de evals/registry/evals/exams.yaml 112 1 615 615 1 1 2023-08-29 2023-08-29 135200318+samta-kamboj@users.noreply.github.com 135200318+samta-kamboj@users.noreply.github.com evals/registry/evals/singapore_data_protection_decisions.yaml 8 1 683 683 1 1 2023-06-22 2023-06-22 iamkaiwei@gmail.com iamkaiwei@gmail.com evals/registry/evals/soc_codes.yaml 10 1 693 693 1 1 2023-06-12 2023-06-12 21990717+lrperkins@users.noreply.github.com 21990717+lrperkins@users.noreply.github.com evals/registry/evals/swap-words.yaml 7 1 713 713 1 1 2023-05-23 2023-05-23 pranavgade20@gmail.com pranavgade20@gmail.com evals/registry/evals/security_guide.yaml 10 1 706 706 1 1 2023-05-30 2023-05-30 134000058+gpsandhu23@users.noreply.github.com 134000058+gpsandhu23@users.noreply.github.com evals/registry/evals/jee-math.yaml 7 1 714 714 1 1 2023-05-22 2023-05-22 anant@kix.in anant@kix.in evals/registry/evals/multistep_web_tasks.yaml 60 1 410 410 1 1 2024-03-21 2024-03-21 danesherbs@users.noreply.github.com danesherbs@users.noreply.github.com evals/registry/evals/mendelian_inheritance.yaml 7 1 770 770 1 1 2023-03-27 2023-03-27 constantin_goeldel@t-online.de constantin_goeldel@t-online.de evals/registry/evals/iambic-pentameter.yaml 10 1 703 703 1 1 2023-06-02 2023-06-02 790279+ianonavy@users.noreply.github.com 790279+ianonavy@users.noreply.github.com evals/registry/evals/solve-for-variable.yaml 8 1 703 703 1 1 2023-06-02 2023-06-02 130226176+juan-de-salgado@users.noreply.github.com 130226176+juan-de-salgado@users.noreply.github.com evals/registry/evals/logic.yaml 9 1 770 770 1 1 2023-03-27 2023-03-27 343165+rlbayes@users.noreply.github.com 343165+rlbayes@users.noreply.github.com evals/registry/evals/banking77.yaml 8 1 744 744 1 1 2023-04-22 2023-04-22 ouassim.fari@gmail.com ouassim.fari@gmail.com evals/registry/evals/shared-borders.yaml 8 1 712 712 1 1 2023-05-24 2023-05-24 paulgb@gmail.com paulgb@gmail.com evals/registry/evals/already_said_that.yaml 45 1 412 412 1 1 2024-03-19 2024-03-19 giulio.starace@gmail.com giulio.starace@gmail.com evals/registry/evals/finger-tracking.yaml 8 1 662 662 1 1 2023-07-13 2023-07-13 chris@notus.ai chris@notus.ai evals/registry/evals/invoices.yaml 3 1 744 744 1 1 2023-04-22 2023-04-22 dpattersoncole@gmail.com dpattersoncole@gmail.com evals/registry/evals/korean-honorific.yaml 8 1 683 683 1 1 2023-06-22 2023-06-22 greenmon@kaist.ac.kr greenmon@kaist.ac.kr evals/registry/evals/newsology.yaml 8 1 706 706 1 1 2023-05-30 2023-05-30 130502202+newsology@users.noreply.github.com 130502202+newsology@users.noreply.github.com evals/registry/evals/find_country_from_svg.yaml 3 1 713 713 1 1 2023-05-23 2023-05-23 lucasfougeras93@gmail.com lucasfougeras93@gmail.com evals/registry/evals/asl-classifiers.yaml 3 1 700 700 1 1 2023-06-05 2023-06-05 135167270+docequity@users.noreply.github.com 135167270+docequity@users.noreply.github.com evals/registry/evals/us-tort-law.yaml 11 1 771 771 1 1 2023-03-26 2023-03-26 jonathanagustin@gmail.com jonathanagustin@gmail.com evals/registry/evals/hebrew_grammar.yaml 8 1 642 642 1 1 2023-08-02 2023-08-02 idoyana@gmail.com idoyana@gmail.com evals/registry/evals/bias_detection.yaml 3 1 662 662 1 1 2023-07-13 2023-07-13 131893786+domenicomireles@users.noreply.github.com 131893786+domenicomireles@users.noreply.github.com evals/registry/evals/complex-replace-characters.yaml 8 1 776 776 1 1 2023-03-21 2023-03-21 petrgazarov@gmail.com petrgazarov@gmail.com evals/registry/evals/bigrams.yaml 7 1 777 777 1 1 2023-03-20 2023-03-20 oscar-king@users.noreply.github.com oscar-king@users.noreply.github.com evals/registry/evals/balance-chemical-equation.yaml 7 1 781 781 2 2 2023-03-16 2023-03-16 120423412+andrew-openai@users.noreply.github.com scruelt@hotmail.com evals/registry/evals/sarcasm.yaml 10 1 771 771 1 1 2023-03-26 2023-03-26 56776590+ronaldruckus@users.noreply.github.com 56776590+ronaldruckus@users.noreply.github.com evals/registry/evals/job_listing_title_for_a_caregiver_in_japan.yaml 9 1 744 744 1 1 2023-04-22 2023-04-22 tt@hcmj.biz tt@hcmj.biz evals/registry/evals/squares-gpt.yaml 4 1 714 714 1 1 2023-05-22 2023-05-22 38587927+ach-in@users.noreply.github.com 38587927+ach-in@users.noreply.github.com evals/registry/evals/arithmetic-expression.yaml 21 1 677 677 1 1 2023-06-28 2023-06-28 gustavo.santos@vortexa.com gustavo.santos@vortexa.com evals/registry/evals/gol.yaml 3 1 706 706 1 1 2023-05-30 2023-05-30 agoldsmith@alumni.scu.edu agoldsmith@alumni.scu.edu evals/registry/evals/chinese_ancient_poetry.yaml 3 1 662 662 1 1 2023-07-13 2023-07-13 jiahaoyu04@gmail.com jiahaoyu04@gmail.com evals/registry/evals/japanese-itpassport-exam01.yaml 8 1 710 710 1 1 2023-05-26 2023-05-26 azutake@users.noreply.github.com azutake@users.noreply.github.com evals/registry/evals/polish-lexicon.yaml 3 1 705 705 1 1 2023-05-31 2023-05-31 rafalzawadzki@users.noreply.github.com rafalzawadzki@users.noreply.github.com evals/registry/evals/music_theory_scale_modes.yaml 3 1 711 711 1 1 2023-05-25 2023-05-25 21stcenturydigitaljeff@gmail.com 21stcenturydigitaljeff@gmail.com evals/registry/evals/blackfoot-numerals-modern.yaml 3 1 683 683 1 1 2023-06-22 2023-06-22 george@orbitalimpact.com george@orbitalimpact.com evals/registry/evals/lunar-calendar.yaml 20 1 710 710 1 1 2023-05-26 2023-05-26 132530236+clearlyloc@users.noreply.github.com 132530236+clearlyloc@users.noreply.github.com evals/registry/evals/icelandic-sentences-gec.yaml 3 1 481 481 1 1 2024-01-10 2024-01-10 24214261+svanhvitlilja@users.noreply.github.com 24214261+svanhvitlilja@users.noreply.github.com evals/registry/evals/nepali-numerals.yaml 3 1 677 677 1 1 2023-06-28 2023-06-28 nepalsamyok@gmail.com nepalsamyok@gmail.com evals/registry/evals/crepe.yaml 7 1 776 776 1 1 2023-03-21 2023-03-21 46582003+seacowx@users.noreply.github.com 46582003+seacowx@users.noreply.github.com evals/registry/evals/math_equations.yaml 3 1 662 662 1 1 2023-07-13 2023-07-13 767683+raxityo@users.noreply.github.com 767683+raxityo@users.noreply.github.com evals/registry/evals/dutch-rhymes.yaml 8 1 683 683 1 1 2023-06-22 2023-06-22 jonathan@verhe.es jonathan@verhe.es evals/registry/evals/determinant.yaml 7 1 776 776 1 1 2023-03-21 2023-03-21 80975912+vitoraqdev@users.noreply.github.com 80975912+vitoraqdev@users.noreply.github.com evals/registry/evals/urdu-transliteration.yaml 3 1 683 683 1 1 2023-06-22 2023-06-22 usama.anwar09@gmail.com usama.anwar09@gmail.com evals/registry/evals/compare-countries-area.yaml 3 1 744 744 1 1 2023-04-22 2023-04-22 69503759+yohei0731@users.noreply.github.com 69503759+yohei0731@users.noreply.github.com evals/registry/evals/chess-piece-count.yaml 3 1 781 781 3 2 2023-03-16 2023-03-16 120423412+andrew-openai@users.noreply.github.com jatinparab98@gmail.com evals/registry/evals/algebra-word-problems.yaml 9 1 745 745 1 1 2023-04-21 2023-04-21 alextraul@gmail.com alextraul@gmail.com evals/registry/evals/japanese-national-medical-exam02.yaml 7 1 704 704 1 1 2023-06-01 2023-06-01 93697462+nakata-daisuke-mb@users.noreply.github.com 93697462+nakata-daisuke-mb@users.noreply.github.com evals/registry/evals/sindarin-fluency.yaml 3 1 698 698 1 1 2023-06-07 2023-06-07 aaron@aaronsmith.tv aaron@aaronsmith.tv evals/registry/evals/relative-orientations.yaml 7 1 671 671 1 1 2023-07-04 2023-07-04 dbautista.cs@gmail.com dbautista.cs@gmail.com evals/registry/evals/korean_dialects.yaml 3 1 694 694 1 1 2023-06-11 2023-06-11 134977380+racheroni@users.noreply.github.com 134977380+racheroni@users.noreply.github.com evals/registry/evals/japanese-decimal-units.yaml 8 1 691 691 1 1 2023-06-14 2023-06-14 hiroaki.iwai@shaperon-inc.com hiroaki.iwai@shaperon-inc.com evals/registry/evals/interlingual-homograph.yaml 3 1 677 677 1 1 2023-06-28 2023-06-28 53555762+y-nakamura-github@users.noreply.github.com 53555762+y-nakamura-github@users.noreply.github.com evals/registry/evals/chinese_homophonic.yaml 9 1 683 683 1 1 2023-06-22 2023-06-22 124559520+hello-oscar@users.noreply.github.com 124559520+hello-oscar@users.noreply.github.com evals/registry/evals/math-derivatives.yaml 3 1 671 671 1 1 2023-07-04 2023-07-04 andrew.prokhorenkov@gmail.com andrew.prokhorenkov@gmail.com evals/registry/evals/canto_wu_pronunciation_fewshot.yaml 3 1 703 703 1 1 2023-06-02 2023-06-02 timeroot.alex@gmail.com timeroot.alex@gmail.com evals/registry/evals/ascii-wordart.yaml 3 1 721 721 1 1 2023-05-15 2023-05-15 61651096+derewah@users.noreply.github.com 61651096+derewah@users.noreply.github.com evals/registry/evals/chinese_zodiac.yaml 7 1 700 700 1 1 2023-06-05 2023-06-05 exjang0@gmail.com exjang0@gmail.com evals/registry/evals/math_for_5th-grader.yaml 3 1 662 662 1 1 2023-07-13 2023-07-13 42082942+mochisky@users.noreply.github.com 42082942+mochisky@users.noreply.github.com evals/registry/evals/rot13.yaml 3 1 771 771 1 1 2023-03-26 2023-03-26 greg@siteorigin.com greg@siteorigin.com evals/registry/evals/stock-options.yaml 96 1 770 770 1 1 2023-03-27 2023-03-27 troydcalandra@gmail.com troydcalandra@gmail.com evals/registry/evals/math_logic_operations.yaml 3 1 691 691 1 1 2023-06-14 2023-06-14 96959673+nathanstew7@users.noreply.github.com 96959673+nathanstew7@users.noreply.github.com evals/registry/evals/ballots.yaml 34 3 594 418 3 3 2023-09-19 2024-03-13 140545726+ianmckenzie-oai@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/registry/evals/error_recovery.yaml 31 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/registry/evals/logic-riddles.yaml 9 1 700 700 1 1 2023-06-05 2023-06-05 55913678+cholotook@users.noreply.github.com 55913678+cholotook@users.noreply.github.com evals/registry/evals/japanese_approval.yaml 8 1 677 677 1 1 2023-06-28 2023-06-28 omonaotab@gmail.com omonaotab@gmail.com evals/registry/evals/Chinese_character_riddles.yaml 3 1 662 662 1 1 2023-07-13 2023-07-13 71001519+tesla2678@users.noreply.github.com 71001519+tesla2678@users.noreply.github.com evals/registry/evals/sandbagging.yaml 54 1 537 537 1 1 2023-11-15 2023-11-15 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/registry/evals/music-theory.yaml 20 1 703 703 1 1 2023-06-02 2023-06-02 105930198+f7b5@users.noreply.github.com 105930198+f7b5@users.noreply.github.com evals/registry/evals/ambiguous-sentences.yaml 8 1 710 710 1 1 2023-05-26 2023-05-26 59383957+erauner12@users.noreply.github.com 59383957+erauner12@users.noreply.github.com evals/registry/evals/hard_russian_computer_science_tasks.yaml 10 1 634 634 1 1 2023-08-10 2023-08-10 halonazar1997@gmail.com halonazar1997@gmail.com evals/registry/evals/loss-logic.yaml 9 2 745 744 2 2 2023-04-21 2023-04-22 temberature@gmail.com 120423412+andrew-openai@users.noreply.github.com evals/registry/evals/rubiks-colors.yaml 8 1 717 717 1 1 2023-05-19 2023-05-19 zaidhaan03@gmail.com zaidhaan03@gmail.com evals/registry/evals/premature-conclusions.yaml 3 1 662 662 1 1 2023-07-13 2023-07-13 138718051+natanaelwf@users.noreply.github.com 138718051+natanaelwf@users.noreply.github.com evals/registry/evals/counterfactual-reasoning.yaml 8 1 714 714 1 1 2023-05-22 2023-05-22 89385155+neolizhe@users.noreply.github.com 89385155+neolizhe@users.noreply.github.com evals/registry/evals/arc.yaml 7 1 704 704 1 1 2023-06-01 2023-06-01 3322313+theo3@users.noreply.github.com 3322313+theo3@users.noreply.github.com evals/registry/evals/irish-plural-nouns.yaml 3 1 662 662 1 1 2023-07-13 2023-07-13 68754265+aaronbrennan1@users.noreply.github.com 68754265+aaronbrennan1@users.noreply.github.com evals/registry/evals/french-lexicon.yaml 3 1 709 709 1 1 2023-05-27 2023-05-27 mathieuhawry@gmail.com mathieuhawry@gmail.com evals/registry/evals/missing-operators.yaml 9 1 710 710 1 1 2023-05-26 2023-05-26 kodamap0@gmail.com kodamap0@gmail.com evals/registry/evals/incontext_rl.yaml 53 1 412 412 1 1 2024-03-19 2024-03-19 129281094+james-aung@users.noreply.github.com 129281094+james-aung@users.noreply.github.com evals/registry/evals/context-free-grammar.yaml 8 1 698 698 1 1 2023-06-07 2023-06-07 135289321+horizonauto@users.noreply.github.com 135289321+horizonauto@users.noreply.github.com evals/registry/evals/bugged_tools.yaml 28 1 412 412 1 1 2024-03-19 2024-03-19 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/registry/evals/first-letters.yaml 7 1 775 775 1 1 2023-03-22 2023-03-22 67751757+kallyaleksiev@users.noreply.github.com 67751757+kallyaleksiev@users.noreply.github.com evals/registry/evals/financial-derivatives.yaml 8 1 706 706 1 1 2023-05-30 2023-05-30 hidemi@gmail.com hidemi@gmail.com evals/registry/evals/afrikaans-lexicon.yaml 3 1 719 719 1 1 2023-05-17 2023-05-17 richard.wooding@gmail.com richard.wooding@gmail.com evals/registry/evals/diabetes.yaml 7 1 713 713 1 1 2023-05-23 2023-05-23 130139652+mooihi@users.noreply.github.com 130139652+mooihi@users.noreply.github.com evals/registry/evals/coq-proof-step.yaml 4 1 662 662 1 1 2023-07-13 2023-07-13 amit9oct@gmail.com amit9oct@gmail.com evals/registry/evals/function-deduction.yaml 4 1 412 412 1 1 2024-03-19 2024-03-19 129281094+james-aung@users.noreply.github.com 129281094+james-aung@users.noreply.github.com evals/registry/evals/simple_physics_engine.yaml 3 1 703 703 1 1 2023-06-02 2023-06-02 ssansovich@gmail.com ssansovich@gmail.com evals/registry/evals/historical-kana-orthography-reading.yaml 3 1 703 703 1 1 2023-06-02 2023-06-02 135117004+hozen-ai@users.noreply.github.com 135117004+hozen-ai@users.noreply.github.com evals/registry/evals/romanian-logic.yaml 3 1 662 662 1 1 2023-07-13 2023-07-13 marius.patru@gmail.com marius.patru@gmail.com evals/registry/evals/event-categories.yaml 10 2 721 709 2 2 2023-05-15 2023-05-27 javier@javier.nyc 133797909+jorge-openai@users.noreply.github.com evals/registry/evals/find-thirukkural.yaml 8 2 714 662 2 2 2023-05-22 2023-07-13 u.sivasweatha@gmail.com 55913678+cholotook@users.noreply.github.com evals/registry/evals/pararule-plus-multi-step-deductive-reasoning.yaml 8 1 709 709 1 1 2023-05-27 2023-05-27 741150372@qq.com 741150372@qq.com evals/registry/evals/belarusian-orthography.yaml 3 1 683 683 1 1 2023-06-22 2023-06-22 50818265+somerandomguyontheweb@users.noreply.github.com 50818265+somerandomguyontheweb@users.noreply.github.com evals/registry/evals/date-booking.yaml 7 1 706 706 1 1 2023-05-30 2023-05-30 popstas@gmail.com popstas@gmail.com evals/registry/evals/game-theory.yaml 9 1 704 704 1 1 2023-06-01 2023-06-01 phelps-sg@users.noreply.github.com phelps-sg@users.noreply.github.com evals/registry/evals/brazilian-lexicon.yaml 3 1 755 755 1 1 2023-04-11 2023-04-11 32521301+mreismendes@users.noreply.github.com 32521301+mreismendes@users.noreply.github.com evals/registry/evals/direct-speech-tag.yaml 7 1 706 706 1 1 2023-05-30 2023-05-30 mariusburtscheidt@gmail.com mariusburtscheidt@gmail.com evals/registry/evals/russian_medical.yaml 7 1 745 745 1 1 2023-04-21 2023-04-21 gydronik@gmail.com gydronik@gmail.com evals/registry/evals/manga-translation.yaml 21 1 768 768 1 1 2023-03-29 2023-03-29 mindful.jt@gmail.com mindful.jt@gmail.com evals/registry/evals/vintage_phone_keyboard_decode.yaml 8 1 714 714 1 1 2023-05-22 2023-05-22 touchtheus@gmail.com touchtheus@gmail.com evals/registry/evals/benjaminmoore_to_hex.yaml 7 1 683 683 1 1 2023-06-22 2023-06-22 bryanvaz@users.noreply.github.com bryanvaz@users.noreply.github.com evals/registry/evals/mate-in-one.yaml 8 1 712 712 1 1 2023-05-24 2023-05-24 90597795+mradul-kanugo@users.noreply.github.com 90597795+mradul-kanugo@users.noreply.github.com evals/registry/evals/logiqa-logical-reasoning-plus.yaml 24 1 705 705 1 1 2023-05-31 2023-05-31 qbao775@aucklanduni.ac.nz qbao775@aucklanduni.ac.nz evals/registry/evals/consensus_summary.yaml 3 1 691 691 1 1 2023-06-14 2023-06-14 95278127+ali-consensus@users.noreply.github.com 95278127+ali-consensus@users.noreply.github.com evals/registry/evals/numeral-type-comparisons.yaml 3 1 703 703 1 1 2023-06-02 2023-06-02 101950345+noahcdc@users.noreply.github.com 101950345+noahcdc@users.noreply.github.com evals/registry/evals/confusing_korean.yaml 3 1 671 671 1 1 2023-07-04 2023-07-04 youngwook.kim@gmail.com youngwook.kim@gmail.com evals/registry/evals/positive-binary-operations.yaml 10 1 745 745 1 1 2023-04-21 2023-04-21 106610412+omar-heshamr@users.noreply.github.com 106610412+omar-heshamr@users.noreply.github.com evals/registry/evals/GPT-model-text-detection.yaml 4 1 671 671 1 1 2023-07-04 2023-07-04 udaykumaradusumilli97@gmail.com udaykumaradusumilli97@gmail.com evals/registry/evals/russian-rhyme.yaml 8 1 744 744 1 1 2023-04-22 2023-04-22 tbs.micle@gmail.com tbs.micle@gmail.com evals/registry/evals/russian-verse.yaml 8 1 698 698 1 1 2023-06-07 2023-06-07 halonazar1997@gmail.com halonazar1997@gmail.com evals/registry/evals/korean_spaces.yaml 3 1 594 594 1 1 2023-09-19 2023-09-19 howon92@gmail.com howon92@gmail.com evals/registry/evals/chinese_poem.yaml 7 1 710 710 1 1 2023-05-26 2023-05-26 bicheng.cao@gmail.com bicheng.cao@gmail.com evals/registry/evals/belarusian-russian-translation.yaml 3 1 700 700 1 1 2023-06-05 2023-06-05 50818265+somerandomguyontheweb@users.noreply.github.com 50818265+somerandomguyontheweb@users.noreply.github.com evals/registry/evals/svg_understanding.yaml 8 1 742 742 1 1 2023-04-24 2023-04-24 joshuagruenstein@users.noreply.github.com joshuagruenstein@users.noreply.github.com evals/registry/evals/chinese_modern_poem_identification.yaml 7 1 671 671 1 1 2023-07-04 2023-07-04 netsailer@gmail.com netsailer@gmail.com evals/registry/evals/probability_questions.yaml 3 1 719 719 1 1 2023-05-17 2023-05-17 101657559+steven-luabase@users.noreply.github.com 101657559+steven-luabase@users.noreply.github.com evals/registry/evals/logic_and_probability.yaml 8 1 698 698 1 1 2023-06-07 2023-06-07 135593135+hbvlmedia@users.noreply.github.com 135593135+hbvlmedia@users.noreply.github.com evals/registry/evals/chinese_shi_jing.yaml 7 1 671 671 1 1 2023-07-04 2023-07-04 netsailer@gmail.com netsailer@gmail.com evals/registry/evals/css-selectors.yaml 3 1 662 662 1 1 2023-07-13 2023-07-13 ilanharel@gmail.com ilanharel@gmail.com evals/registry/evals/which-is-heavier.yaml 3 1 770 770 1 1 2023-03-27 2023-03-27 scottlanyon@gmail.com scottlanyon@gmail.com evals/registry/evals/hebrew-same-noun-gender.yaml 8 1 706 706 1 1 2023-05-30 2023-05-30 elisimhayev@gmail.com elisimhayev@gmail.com evals/registry/evals/formal_logic.yaml 3 1 775 775 1 1 2023-03-22 2023-03-22 christopher@wolfram.com christopher@wolfram.com evals/registry/evals/viewport_to_grid_size.yaml 8 1 671 671 1 1 2023-07-04 2023-07-04 agoldsmith@alumni.scu.edu agoldsmith@alumni.scu.edu evals/registry/evals/french_homonym_and_homograph.yaml 8 1 671 671 1 1 2023-07-04 2023-07-04 6842725+yannl@users.noreply.github.com 6842725+yannl@users.noreply.github.com evals/registry/evals/osm_mapping_one_way.yaml 3 1 556 556 1 1 2023-10-27 2023-10-27 adrianmargin@users.noreply.github.com adrianmargin@users.noreply.github.com evals/registry/evals/russian-nlp-tasks.yaml 7 1 770 770 1 1 2023-03-27 2023-03-27 hormold@gmail.com hormold@gmail.com evals/registry/evals/csharp-linq.yaml 8 1 683 683 1 1 2023-06-22 2023-06-22 6028199+joshdixon@users.noreply.github.com 6028199+joshdixon@users.noreply.github.com evals/registry/evals/ukraine-gec.yaml 180 1 703 703 1 1 2023-06-02 2023-06-02 roman.mashta@gmail.com roman.mashta@gmail.com evals/registry/evals/list_comparison_missing_name.yaml 3 1 706 706 1 1 2023-05-30 2023-05-30 37917398+davidbeesley@users.noreply.github.com 37917398+davidbeesley@users.noreply.github.com evals/registry/evals/last-word-nth.yaml 3 1 777 777 1 1 2023-03-20 2023-03-20 trevor.annedenise@icloud.com trevor.annedenise@icloud.com evals/registry/evals/hebrew_plurals.yaml 8 1 671 671 1 1 2023-07-04 2023-07-04 59704420+relvok@users.noreply.github.com 59704420+relvok@users.noreply.github.com evals/registry/evals/belarusian-numerals.yaml 3 1 690 690 1 1 2023-06-15 2023-06-15 50818265+somerandomguyontheweb@users.noreply.github.com 50818265+somerandomguyontheweb@users.noreply.github.com evals/registry/evals/sql.yaml 5 2 745 709 2 2 2023-04-21 2023-05-27 mark@haym.me 133797909+jorge-openai@users.noreply.github.com evals/registry/evals/heart-disease.yaml 3 1 755 755 1 1 2023-04-11 2023-04-11 nick@clyde.tech nick@clyde.tech evals/registry/evals/chess.yaml 3 1 776 776 1 1 2023-03-21 2023-03-21 t.zehle@gmail.com t.zehle@gmail.com evals/registry/evals/urdu-lexicon.yaml 3 1 683 683 1 1 2023-06-22 2023-06-22 usama.anwar09@gmail.com usama.anwar09@gmail.com evals/registry/evals/simple-visual-understanding.yaml 3 1 710 710 1 1 2023-05-26 2023-05-26 felipe.castro@friday.ai felipe.castro@friday.ai evals/registry/evals/json_patch_object.yaml 3 1 704 704 1 1 2023-06-01 2023-06-01 eugene@goforward.com eugene@goforward.com evals/registry/evals/chinese_famous_novel.yaml 8 1 662 662 1 1 2023-07-13 2023-07-13 litonglitong@hotmail.com litonglitong@hotmail.com evals/registry/evals/tetris.yaml 8 1 715 715 1 1 2023-05-21 2023-05-21 sandmann@codedata.solutions sandmann@codedata.solutions evals/registry/evals/multi-step-equations.yaml 7 1 744 744 1 1 2023-04-22 2023-04-22 kara@voxel-fox.com kara@voxel-fox.com evals/registry/evals/formal-grammar-to-regex.yaml 7 1 703 703 1 1 2023-06-02 2023-06-02 chatgpt@zyxcv.com chatgpt@zyxcv.com evals/registry/evals/make-me-say.yaml 25 1 594 594 1 1 2023-09-19 2023-09-19 140545726+ianmckenzie-oai@users.noreply.github.com 140545726+ianmckenzie-oai@users.noreply.github.com evals/registry/evals/mapping_to_matricies.yaml 7 1 698 698 1 1 2023-06-07 2023-06-07 danum7@gmail.com danum7@gmail.com evals/registry/evals/japanese_prime_minister.yaml 7 1 488 488 1 1 2024-01-03 2024-01-03 40705236+return-nil@users.noreply.github.com 40705236+return-nil@users.noreply.github.com evals/registry/evals/logic-statements.yaml 7 2 771 770 2 2 2023-03-26 2023-03-27 44057111+kasperkristiansen@users.noreply.github.com 117690718+joe-at-openai@users.noreply.github.com evals/registry/evals/count_token_freq_dna.yaml 3 1 710 710 1 1 2023-05-26 2023-05-26 zl432@cantab.ac.uk zl432@cantab.ac.uk evals/registry/evals/euler_problems.yaml 10 1 705 705 1 1 2023-05-31 2023-05-31 pcashworth83@gmail.com pcashworth83@gmail.com evals/registry/evals/hindi_upsc.yaml 7 1 745 745 1 1 2023-04-21 2023-04-21 shivamd1810@gmail.com shivamd1810@gmail.com evals/registry/evals/fcc_amateur_extra.yaml 9 1 745 745 1 1 2023-04-21 2023-04-21 34941300+ckb2@users.noreply.github.com 34941300+ckb2@users.noreply.github.com evals/registry/evals/countries.yaml 7 1 706 706 1 1 2023-05-30 2023-05-30 76214963+rxfxt@users.noreply.github.com 76214963+rxfxt@users.noreply.github.com evals/registry/evals/co-sql.yaml 4 1 671 671 1 1 2023-07-04 2023-07-04 pybbae@gmail.com pybbae@gmail.com evals/registry/evals/rucola.yaml 10 1 762 762 1 1 2023-04-04 2023-04-04 alex@alexkuk.ru alex@alexkuk.ru evals/registry/evals/medication_dose.yaml 3 1 698 698 1 1 2023-06-07 2023-06-07 130315355+mickaw2@users.noreply.github.com 130315355+mickaw2@users.noreply.github.com evals/registry/evals/recurrence-relation.yaml 8 1 683 683 1 1 2023-06-22 2023-06-22 omarhishamk@gmail.com omarhishamk@gmail.com evals/registry/evals/chinese_idioms.yaml 3 1 683 683 1 1 2023-06-22 2023-06-22 32207883+robinzixuan@users.noreply.github.com 32207883+robinzixuan@users.noreply.github.com evals/registry/evals/emoji-riddle.yaml 3 1 745 745 1 1 2023-04-21 2023-04-21 dib.amir@gmail.com dib.amir@gmail.com evals/registry/evals/polish_rhymes_generation.yaml 8 1 710 710 1 1 2023-05-26 2023-05-26 9194961+r2d34@users.noreply.github.com 9194961+r2d34@users.noreply.github.com evals/registry/evals/kanji-idioms.yaml 3 1 710 710 1 1 2023-05-26 2023-05-26 peach921110@gmail.com peach921110@gmail.com evals/registry/evals/seating_arrangements.yaml 3 1 710 710 1 1 2023-05-26 2023-05-26 danielsj9@gmail.com danielsj9@gmail.com evals/registry/evals/belarusian-word-analogy-inflection.yaml 3 1 662 662 1 1 2023-07-13 2023-07-13 50818265+somerandomguyontheweb@users.noreply.github.com 50818265+somerandomguyontheweb@users.noreply.github.com evals/registry/evals/bitwise.yaml 3 1 740 740 1 1 2023-04-26 2023-04-26 scottmortonashton@gmail.com scottmortonashton@gmail.com evals/registry/evals/product-ie.yaml 28 1 634 634 1 1 2023-08-10 2023-08-10 4548970+abrinkmann@users.noreply.github.com 4548970+abrinkmann@users.noreply.github.com evals/registry/evals/hindi_shuddha.yaml 7 1 710 710 1 1 2023-05-26 2023-05-26 36335769+0x34d@users.noreply.github.com 36335769+0x34d@users.noreply.github.com evals/registry/evals/abstract2title.yaml 4 1 683 683 1 1 2023-06-22 2023-06-22 96370219+piupiupiuu@users.noreply.github.com 96370219+piupiupiuu@users.noreply.github.com evals/registry/evals/reverse-string.yaml 3 1 783 783 2 2 2023-03-14 2023-03-14 120423412+andrew-openai@users.noreply.github.com logan@openai.com evals/registry/evals/smiles_to_formula.yaml 7 1 671 671 1 1 2023-07-04 2023-07-04 33544440+glichtner@users.noreply.github.com 33544440+glichtner@users.noreply.github.com evals/registry/evals/canto_wu_pronunciation.yaml 3 1 703 703 1 1 2023-06-02 2023-06-02 timeroot.alex@gmail.com timeroot.alex@gmail.com evals/registry/evals/matrix-mult-rows.yaml 3 1 710 710 1 1 2023-05-26 2023-05-26 71815905+javrtg@users.noreply.github.com 71815905+javrtg@users.noreply.github.com evals/registry/evals/ph_calculation.yaml 3 1 744 744 1 1 2023-04-22 2023-04-22 61839320+bilski311@users.noreply.github.com 61839320+bilski311@users.noreply.github.com evals/registry/evals/born-first.yaml 3 2 782 781 2 2 2023-03-15 2023-03-16 njbbaer@gmail.com 120423412+andrew-openai@users.noreply.github.com evals/registry/evals/color_theory_complementary.yaml 3 1 713 713 1 1 2023-05-23 2023-05-23 penandlim@gmail.com penandlim@gmail.com evals/registry/evals/ukraine_electronic_petitions.yaml 9 1 705 705 1 1 2023-05-31 2023-05-31 yaru.uvva@gmail.com yaru.uvva@gmail.com evals/registry/evals/three-pt-mapping.yaml 3 1 740 740 1 1 2023-04-26 2023-04-26 keke060114@163.com keke060114@163.com evals/registry/evals/imo_exact_answers.yaml 8 1 296 296 1 1 2024-07-13 2024-07-13 justin@lin.bot justin@lin.bot evals/registry/evals/icelandic-inflection-hard.yaml 3 1 556 556 1 1 2023-10-27 2023-10-27 vthorsteinsson@users.noreply.github.com vthorsteinsson@users.noreply.github.com evals/registry/evals/date-calculator.yaml 7 1 706 706 1 1 2023-05-30 2023-05-30 45112646+leoliu-xingchi@users.noreply.github.com 45112646+leoliu-xingchi@users.noreply.github.com evals/registry/evals/path_enclosed_area.yaml 8 1 691 691 1 1 2023-06-14 2023-06-14 ahmedallawi01@gmail.com ahmedallawi01@gmail.com evals/registry/evals/european-date-format-challenge.yaml 3 1 712 712 1 1 2023-05-24 2023-05-24 yuvalshirav@gmail.com yuvalshirav@gmail.com evals/registry/evals/nutrition.yaml 3 1 710 710 1 1 2023-05-26 2023-05-26 blum.stephen@gmail.com blum.stephen@gmail.com evals/registry/evals/korean_spelling.yaml 7 1 706 706 1 1 2023-05-30 2023-05-30 yjkimjunior@gmail.com yjkimjunior@gmail.com evals/registry/evals/cissp-study-questions.yaml 10 1 712 712 1 1 2023-05-24 2023-05-24 randy.lariar@gmail.com randy.lariar@gmail.com evals/registry/evals/2d_movement.yaml 3 1 710 710 1 1 2023-05-26 2023-05-26 eugene.l.huang@gmail.com eugene.l.huang@gmail.com evals/registry/evals/categorize_with_distractors.yaml 3 1 744 744 1 1 2023-04-22 2023-04-22 yuvalshirav@gmail.com yuvalshirav@gmail.com evals/registry/evals/poker_hand_ranks.yaml 7 1 775 775 1 1 2023-03-22 2023-03-22 54050333+msilva-00@users.noreply.github.com 54050333+msilva-00@users.noreply.github.com evals/registry/evals/crontab.yaml 7 1 706 706 1 1 2023-05-30 2023-05-30 google@mryao.org google@mryao.org evals/registry/evals/lat_long_identify.yaml 7 1 777 777 1 1 2023-03-20 2023-03-20 vishaal16119@iiitd.ac.in vishaal16119@iiitd.ac.in evals/registry/evals/polish-syllable-count.yaml 7 1 705 705 1 1 2023-05-31 2023-05-31 yaru.uvva@gmail.com yaru.uvva@gmail.com evals/registry/evals/rectangles.yaml 7 1 704 704 1 1 2023-06-01 2023-06-01 sam@samestep.com sam@samestep.com evals/registry/evals/math_polish.yaml 3 1 691 691 1 1 2023-06-14 2023-06-14 krzycho@wapp.pl krzycho@wapp.pl evals/registry/evals/svg_to_text.yaml 8 1 691 691 1 1 2023-06-14 2023-06-14 andrewcemil@gmail.com andrewcemil@gmail.com evals/registry/evals/korean_yaminjeongeum.yaml 8 1 700 700 1 1 2023-06-05 2023-06-05 penandlim@gmail.com penandlim@gmail.com evals/registry/evals/unique_combinations.yaml 8 1 714 714 1 1 2023-05-22 2023-05-22 50557586+sypherd@users.noreply.github.com 50557586+sypherd@users.noreply.github.com evals/registry/evals/largest_country.yaml 8 1 718 718 1 1 2023-05-18 2023-05-18 36363097+latand@users.noreply.github.com 36363097+latand@users.noreply.github.com evals/registry/evals/japanese-station.yaml 7 1 677 677 1 1 2023-06-28 2023-06-28 pabst2009@gmail.com pabst2009@gmail.com evals/registry/evals/japanese-national-medical-exam01.yaml 7 1 740 740 1 1 2023-04-26 2023-04-26 93697462+nakata-daisuke-mb@users.noreply.github.com 93697462+nakata-daisuke-mb@users.noreply.github.com evals/registry/evals/probabilities-word-problems.yaml 3 1 671 671 1 1 2023-07-04 2023-07-04 omarhishamk@gmail.com omarhishamk@gmail.com evals/registry/evals/romanian_homonyms.yaml 3 1 662 662 1 1 2023-07-13 2023-07-13 mail@adrianapan.com mail@adrianapan.com evals/registry/evals/3d_globe_movement.yaml 3 1 698 698 1 1 2023-06-07 2023-06-07 travis.hairfield@gmail.com travis.hairfield@gmail.com evals/registry/evals/japanese_mahjong_discard_tile.yaml 3 1 677 677 1 1 2023-06-28 2023-06-28 mauryskull@gmail.com mauryskull@gmail.com evals/registry/evals/escher-sentences.yaml 7 1 753 753 1 1 2023-04-13 2023-04-13 churchjohnr@protonmail.com churchjohnr@protonmail.com evals/registry/evals/irony.yaml 8 1 706 706 1 1 2023-05-30 2023-05-30 scott@linfords.com scott@linfords.com evals/registry/evals/french-part-of-speech.yaml 3 1 709 709 1 1 2023-05-27 2023-05-27 vasco@piranhafleisch.de vasco@piranhafleisch.de evals/registry/evals/rhetorical-devices.yaml 3 1 706 706 1 1 2023-05-30 2023-05-30 sirwesleybarlow@gmail.com sirwesleybarlow@gmail.com evals/registry/evals/turkish_characters.yaml 8 1 705 705 1 1 2023-05-31 2023-05-31 130087573+cardwiz@users.noreply.github.com 130087573+cardwiz@users.noreply.github.com evals/registry/evals/reverse-shell.yaml 3 1 677 677 1 1 2023-06-28 2023-06-28 32207883+robinzixuan@users.noreply.github.com 32207883+robinzixuan@users.noreply.github.com evals/registry/evals/logical_counting.yaml 7 1 714 714 1 1 2023-05-22 2023-05-22 jocca1985@gmail.com jocca1985@gmail.com evals/registry/evals/make-me-pay.yaml 59 3 594 418 3 2 2023-09-19 2024-03-13 140545726+ianmckenzie-oai@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/registry/evals/logiqa.yaml 7 1 755 755 1 1 2023-04-11 2023-04-11 62553364+csitfun@users.noreply.github.com 62553364+csitfun@users.noreply.github.com evals/registry/evals/text_compression.yaml 3 1 594 594 1 1 2023-09-19 2023-09-19 140545726+ianmckenzie-oai@users.noreply.github.com 140545726+ianmckenzie-oai@users.noreply.github.com evals/registry/evals/beam-analysis.yaml 3 1 705 705 1 1 2023-05-31 2023-05-31 jamesphillipturpin@gmail.com jamesphillipturpin@gmail.com evals/registry/evals/backgammon.yaml 16 1 683 683 1 1 2023-06-22 2023-06-22 bakebrain@gmail.com bakebrain@gmail.com evals/registry/evals/tracking-shuffled-objects.yaml 7 1 713 713 1 1 2023-05-23 2023-05-23 google@mryao.org google@mryao.org evals/registry/evals/chinese-remainder-theorem.yaml 3 1 662 662 1 1 2023-07-13 2023-07-13 carlos.hellin@uah.es carlos.hellin@uah.es evals/registry/evals/dna-melting-calculation.yaml 3 1 711 711 1 1 2023-05-25 2023-05-25 isaacbeing@gmail.com isaacbeing@gmail.com evals/registry/evals/hebrew-bible.yaml 8 1 704 704 1 1 2023-06-01 2023-06-01 ophir.ido@gmail.com ophir.ido@gmail.com evals/registry/evals/linear-equations.yaml 7 1 714 714 1 1 2023-05-22 2023-05-22 alexno0401@gmail.com alexno0401@gmail.com evals/registry/evals/base64-decode.yaml 3 1 677 677 1 1 2023-06-28 2023-06-28 70709113+alessiogr@users.noreply.github.com 70709113+alessiogr@users.noreply.github.com evals/registry/evals/pointer-value-retrieval.yaml 48 1 699 699 1 1 2023-06-06 2023-06-06 44269117+ggendro@users.noreply.github.com 44269117+ggendro@users.noreply.github.com evals/registry/evals/split_chinese_characters.yaml 7 1 704 704 1 1 2023-06-01 2023-06-01 mzou@pisrc.com mzou@pisrc.com evals/registry/evals/integer-sequence-predictions.yaml 28 1 719 719 1 1 2023-05-17 2023-05-17 davehdorzback@gmail.com davehdorzback@gmail.com evals/registry/evals/arabic-literature-qa.yaml 7 1 615 615 1 1 2023-08-29 2023-08-29 135200318+samta-kamboj@users.noreply.github.com 135200318+samta-kamboj@users.noreply.github.com evals/registry/evals/detect-hshd.yaml 7 1 711 711 1 1 2023-05-25 2023-05-25 45504048+mysterious-progression@users.noreply.github.com 45504048+mysterious-progression@users.noreply.github.com evals/registry/evals/aime_evaluation.yaml 3 1 718 718 1 1 2023-05-18 2023-05-18 emilymu@mit.edu emilymu@mit.edu evals/registry/evals/korean_romanization.yaml 3 1 662 662 1 1 2023-07-13 2023-07-13 soo@novelastudio.com soo@novelastudio.com evals/registry/evals/shape-in-shape.yaml 3 2 719 662 2 2 2023-05-17 2023-07-13 70836043+pawel-krzych@users.noreply.github.com 55913678+cholotook@users.noreply.github.com evals/registry/evals/mazes.yaml 48 2 691 662 2 2 2023-06-14 2023-07-13 douglas.monsky@gmail.com 55913678+cholotook@users.noreply.github.com evals/registry/evals/ordered-history-events.yaml 7 1 719 719 1 1 2023-05-17 2023-05-17 itc0r3@gmail.com itc0r3@gmail.com evals/registry/evals/track_objects.yaml 3 1 712 712 1 1 2023-05-24 2023-05-24 45925348+christophedc@users.noreply.github.com 45925348+christophedc@users.noreply.github.com evals/registry/evals/japanese_number_reading.yaml 3 1 713 713 1 1 2023-05-23 2023-05-23 shunji.makino@gmail.com shunji.makino@gmail.com evals/cli/oaievalset.py 111 5 776 481 5 4 2023-03-21 2024-01-10 343165+rlbayes@users.noreply.github.com 140545726+ianmckenzie-oai@users.noreply.github.com evals/cli/oaieval.py 253 19 779 217 22 18 2023-03-18 2024-09-30 120423412+andrew-openai@users.noreply.github.com steven@openai.com evals/metrics.py 52 3 703 587 3 3 2023-06-02 2023-09-26 21045365+kjbilton@users.noreply.github.com bomarni@googlemail.com evals/prompt/base.py 64 4 768 418 4 3 2023-03-29 2024-03-13 343165+rlbayes@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/eval.py 170 9 777 403 10 9 2023-03-20 2024-03-28 2406911+zhangmarvin@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/completion_fns/langchain_math.py 21 3 755 517 4 4 2023-04-11 2023-12-05 jwang47@users.noreply.github.com erik.t.ritter@gmail.com evals/completion_fns/retrieval.py 68 3 754 481 3 3 2023-04-12 2024-01-10 120423412+andrew-openai@users.noreply.github.com 140545726+ianmckenzie-oai@users.noreply.github.com evals/completion_fns/cot.py 47 1 755 755 2 2 2023-04-11 2023-04-11 jwang47@users.noreply.github.com 73198383+hwchung27@users.noreply.github.com evals/completion_fns/__init__.py 1 1 755 755 1 1 2023-04-11 2023-04-11 73198383+hwchung27@users.noreply.github.com 73198383+hwchung27@users.noreply.github.com evals/completion_fns/solver_completion_fn.py 47 1 403 403 1 1 2024-03-28 2024-03-28 oliver.jaffe@hotmail.co.uk oliver.jaffe@hotmail.co.uk evals/completion_fns/openai.py 147 5 755 405 6 6 2023-04-11 2024-03-26 jwang47@users.noreply.github.com oliver.jaffe@hotmail.co.uk evals/completion_fns/langchain_llm.py 70 3 755 488 4 4 2023-04-11 2024-01-03 jwang47@users.noreply.github.com z@hyperf.io evals/record.py 450 13 781 465 15 9 2023-03-16 2024-01-26 shane@openai.com 140545726+ianmckenzie-oai@users.noreply.github.com evals/api.py 61 5 769 697 5 4 2023-03-28 2023-06-08 jwang47@users.noreply.github.com 131678108+wingsdrafterwork@users.noreply.github.com