evals/registry/solvers/defaults.yaml (294 lines of code) (raw):

# ------------------ # Human input # ------------------ human_cli: class: evals.solvers.human_cli_solver:HumanCliSolver # ------------------ # gpt-3.5-turbo # ------------------ # generation tasks generation/direct/gpt-3.5-turbo: class: evals.solvers.providers.openai.openai_solver:OpenAISolver args: completion_fn_options: model: gpt-3.5-turbo extra_options: temperature: 1 max_tokens: 512 generation/cot/gpt-3.5-turbo: class: evals.solvers.nested.cot_solver:CoTSolver args: cot_solver: class: evals.solvers.providers.openai.openai_solver:OpenAISolver args: completion_fn_options: model: gpt-3.5-turbo extra_options: temperature: 1 max_tokens: 512 extract_solver: class: evals.solvers.providers.openai.openai_solver:OpenAISolver args: completion_fn_options: model: gpt-3.5-turbo extra_options: temperature: 1 max_tokens: 512 # classification tasks classification/direct/gpt-3.5-turbo: class: evals.solvers.providers.openai.openai_solver:OpenAISolver args: completion_fn_options: model: gpt-3.5-turbo extra_options: temperature: 0 max_tokens: 1 valid_answers: ["A", "B", "C", "D"] classification/cot/gpt-3.5-turbo: class: evals.solvers.nested.cot_solver:CoTSolver args: cot_solver: class: evals.solvers.providers.openai.openai_solver:OpenAISolver args: completion_fn_options: model: gpt-3.5-turbo extra_options: temperature: 1 max_tokens: 512 extract_solver: class: evals.solvers.providers.openai.openai_solver:OpenAISolver args: completion_fn_options: model: gpt-3.5-turbo extra_options: temperature: 0 max_tokens: 1 valid_answers: ["A", "B", "C", "D"] # ------------------ # gpt-4 # ------------------ # generation tasks generation/direct/gpt-4: class: evals.solvers.providers.openai.openai_solver:OpenAISolver args: completion_fn_options: model: gpt-4 extra_options: temperature: 1 max_tokens: 512 generation/cot/gpt-4: class: evals.solvers.nested.cot_solver:CoTSolver args: cot_solver: class: evals.solvers.providers.openai.openai_solver:OpenAISolver args: completion_fn_options: model: gpt-4 extra_options: temperature: 1 max_tokens: 512 extract_solver: class: evals.solvers.providers.openai.openai_solver:OpenAISolver args: completion_fn_options: model: gpt-4 extra_options: temperature: 1 max_tokens: 512 # classification tasks classification/direct/gpt-4: class: evals.solvers.providers.openai.openai_solver:OpenAISolver args: completion_fn_options: model: gpt-4 extra_options: temperature: 0 max_tokens: 1 valid_answers: ["A", "B", "C", "D"] classification/cot/gpt-4: class: evals.solvers.nested.cot_solver:CoTSolver args: cot_solver: class: evals.solvers.providers.openai.openai_solver:OpenAISolver args: completion_fn_options: model: gpt-4 extra_options: temperature: 1 max_tokens: 512 extract_solver: class: evals.solvers.providers.openai.openai_solver:OpenAISolver args: completion_fn_options: model: gpt-4 extra_options: temperature: 0 max_tokens: 1 valid_answers: ["A", "B", "C", "D"] # ------------------ # gpt-4-turbo-preview # ------------------ # generation tasks generation/direct/gpt-4-turbo-preview: class: evals.solvers.providers.openai.openai_solver:OpenAISolver args: completion_fn_options: model: gpt-4-turbo-preview extra_options: temperature: 1 max_tokens: 512 generation/cot/gpt-4-turbo-preview: class: evals.solvers.nested.cot_solver:CoTSolver args: cot_solver: class: evals.solvers.providers.openai.openai_solver:OpenAISolver args: completion_fn_options: model: gpt-4-turbo-preview extra_options: temperature: 1 max_tokens: 512 extract_solver: class: evals.solvers.providers.openai.openai_solver:OpenAISolver args: completion_fn_options: model: gpt-4-turbo-preview extra_options: temperature: 1 max_tokens: 512 # classification tasks classification/direct/gpt-4-turbo-preview: class: evals.solvers.providers.openai.openai_solver:OpenAISolver args: completion_fn_options: model: gpt-4-turbo-preview extra_options: temperature: 0 max_tokens: 1 valid_answers: ["A", "B", "C", "D"] classification/cot/gpt-4-turbo-preview: class: evals.solvers.nested.cot_solver:CoTSolver args: cot_solver: class: evals.solvers.providers.openai.openai_solver:OpenAISolver args: completion_fn_options: model: gpt-4-turbo-preview extra_options: temperature: 1 max_tokens: 512 extract_solver: class: evals.solvers.providers.openai.openai_solver:OpenAISolver args: completion_fn_options: model: gpt-4-turbo-preview extra_options: temperature: 0 max_tokens: 1 valid_answers: ["A", "B", "C", "D"] # ------------------ # gpt-4-base # ------------------ # generation tasks generation/hhh/gpt-4-base: class: evals.solvers.nested.hhh_solver:HHHSolver args: solver: class: evals.solvers.providers.openai.openai_solver:OpenAISolver args: completion_fn_options: model: gpt-4-base extra_options: temperature: 1 max_tokens: 512 generation/cot_hhh/gpt-4-base: class: evals.solvers.nested.cot_solver:CoTSolver args: cot_solver: class: evals.solvers.nested.hhh_solver:HHHSolver args: solver: class: evals.solvers.providers.openai.openai_solver:OpenAISolver args: completion_fn_options: model: gpt-4-base extra_options: temperature: 1 max_tokens: 512 extract_solver: class: evals.solvers.nested.hhh_solver:HHHSolver args: solver: class: evals.solvers.providers.openai.openai_solver:OpenAISolver args: completion_fn_options: model: gpt-4-base extra_options: temperature: 1 max_tokens: 512 # classification tasks classification/hhh/gpt-4-base: class: evals.solvers.nested.hhh_solver:HHHSolver args: solver: class: evals.solvers.providers.openai.openai_solver:OpenAISolver args: completion_fn_options: model: gpt-4-base extra_options: temperature: 0 max_tokens: 1 valid_answers: ["A", "B", "C", "D"] classification/cot_hhh/gpt-4-base: class: evals.solvers.nested.cot_solver:CoTSolver args: cot_solver: class: evals.solvers.nested.hhh_solver:HHHSolver args: solver: class: evals.solvers.providers.openai.openai_solver:OpenAISolver args: completion_fn_options: model: gpt-4-base extra_options: temperature: 1 max_tokens: 512 extract_solver: class: evals.solvers.nested.hhh_solver:HHHSolver args: solver: class: evals.solvers.providers.openai.openai_solver:OpenAISolver args: completion_fn_options: model: gpt-4-base extra_options: temperature: 0 max_tokens: 1 valid_answers: ["A", "B", "C", "D"] # ------------------ # Assistants API # ------------------ generation/assistants/gpt-3.5-turbo: class: evals.solvers.openai_assistants_solver:OpenAIAssistantsSolver args: tools: - type: code_interpreter - type: retrieval model: gpt-3.5-turbo generation/cot_assistant/gpt-3.5-turbo: class: evals.solvers.nested.cot_solver:CoTSolver args: cot_solver: class: evals.solvers.openai_assistants_solver:OpenAIAssistantsSolver args: tools: - type: code_interpreter - type: retrieval model: gpt-3.5-turbo extract_solver: class: evals.solvers.providers.openai.openai_solver:OpenAISolver args: completion_fn_options: model: gpt-3.5-turbo extra_options: temperature: 1 max_tokens: 512 generation/assistants/gpt-4-turbo-preview: class: evals.solvers.openai_assistants_solver:OpenAIAssistantsSolver args: tools: - type: code_interpreter - type: retrieval model: gpt-4-turbo-preview generation/cot_assistant/gpt-4-turbo-preview: class: evals.solvers.nested.cot_solver:CoTSolver args: cot_solver: class: evals.solvers.openai_assistants_solver:OpenAIAssistantsSolver args: tools: - type: code_interpreter - type: retrieval model: gpt-4-turbo-preview extract_solver: class: evals.solvers.providers.openai.openai_solver:OpenAISolver args: completion_fn_options: model: gpt-4-turbo-preview extra_options: temperature: 1 max_tokens: 512