evals/registry/solvers/track_the_stat.yaml (75 lines of code) (raw):
# ExplicitStateSolver wrapping a GeminiSolver configured for `gemini-pro`.
# NOTE(review): nesting was reconstructed from a flattened source. `state_role`
# is placed as an argument of ExplicitStateSolver (sibling of
# `underlying_solver`), not of GeminiSolver — confirm against the solver
# constructors.
track_the_stat/explicit_state/gemini-pro:
  class: evals.elsuite.track_the_stat.solvers:ExplicitStateSolver
  args:
    underlying_solver:
      class: evals.solvers.providers.google.gemini_solver:GeminiSolver
      args:
        model_name: gemini-pro
    state_role: "user"
# ExplicitStateSolver wrapping a TogetherSolver for Llama-2-70b-chat.
# NOTE(review): nesting was reconstructed from a flattened source — confirm
# that `extra_options` belongs under `completion_fn_options`.
track_the_stat/explicit_state/llama-2-70b-chat:
  class: evals.elsuite.track_the_stat.solvers:ExplicitStateSolver
  args:
    underlying_solver:
      class: evals.solvers.providers.together.together_solver:TogetherSolver
      args:
        completion_fn_options:
          model: meta-llama/Llama-2-70b-chat-hf
          extra_options:
            temperature: 1
            max_tokens: 512
# ExplicitStateSolver wrapping a TogetherSolver for Mixtral-8x7B-Instruct.
# NOTE(review): nesting was reconstructed from a flattened source — confirm
# that `extra_options` belongs under `completion_fn_options`.
track_the_stat/explicit_state/mixtral-8x7b-instruct:
  class: evals.elsuite.track_the_stat.solvers:ExplicitStateSolver
  args:
    underlying_solver:
      class: evals.solvers.providers.together.together_solver:TogetherSolver
      args:
        completion_fn_options:
          model: mistralai/Mixtral-8x7B-Instruct-v0.1
          extra_options:
            temperature: 1
            max_tokens: 512
# ExplicitStateSolver wrapping an OpenAISolver for gpt-3.5-turbo.
# NOTE(review): nesting was reconstructed from a flattened source — confirm
# that `extra_options` belongs under `completion_fn_options`.
track_the_stat/explicit_state/gpt-3.5-turbo:
  class: evals.elsuite.track_the_stat.solvers:ExplicitStateSolver
  args:
    underlying_solver:
      class: evals.solvers.providers.openai.openai_solver:OpenAISolver
      args:
        completion_fn_options:
          model: gpt-3.5-turbo
          extra_options:
            temperature: 1
            max_tokens: 512
# ExplicitStateSolver wrapping an OpenAISolver for gpt-4-turbo-preview.
# NOTE(review): nesting was reconstructed from a flattened source — confirm
# that `extra_options` belongs under `completion_fn_options`.
track_the_stat/explicit_state/gpt-4-turbo-preview:
  class: evals.elsuite.track_the_stat.solvers:ExplicitStateSolver
  args:
    underlying_solver:
      class: evals.solvers.providers.openai.openai_solver:OpenAISolver
      args:
        completion_fn_options:
          model: gpt-4-turbo-preview
          extra_options:
            temperature: 1
            max_tokens: 512
# ExplicitStateSolver wrapping an HHHSolver, which in turn wraps an
# OpenAISolver for gpt-4-base.
# NOTE(review): the three-level nesting was reconstructed from a flattened
# source — confirm against the solver constructors.
track_the_stat/explicit_state/hhh/gpt-4-base:
  class: evals.elsuite.track_the_stat.solvers:ExplicitStateSolver
  args:
    underlying_solver:
      class: evals.solvers.nested.hhh_solver:HHHSolver
      args:
        solver:
          class: evals.solvers.providers.openai.openai_solver:OpenAISolver
          args:
            completion_fn_options:
              model: gpt-4-base
              extra_options:
                temperature: 1
                max_tokens: 512
# TrackTheStatHuman solver wrapping a HumanCliSolver.
# NOTE(review): nesting was reconstructed from a flattened source; `registry`
# is placed as an argument of HumanCliSolver and explicitly set to null —
# confirm.
track_the_stat/human_cli:
  class: evals.elsuite.track_the_stat.solvers:TrackTheStatHuman
  args:
    human_cli_solver:
      class: evals.solvers.human_cli_solver:HumanCliSolver
      args:
        registry: null
# RandomBaselineSolver entry; no arguments are configured.
track_the_stat/random_baseline:
  class: evals.elsuite.track_the_stat.solvers:RandomBaselineSolver