# Source: evals/registry/solvers/bluff.yaml
# Recommended strategic solvers
# Bluff strategy solver configured with the OpenAI solver (gpt-4) as its base
# solver; temperature is pinned to 0.
bluff/strategy/gpt-4:
  class: evals.elsuite.bluff.strategy_solver:BluffStrategySolver
  args:
    base_solver_class: evals.solvers.providers.openai.openai_solver:OpenAISolver
    # Arguments for base_solver_class (presumably handed to its constructor —
    # TODO confirm against BluffStrategySolver).
    base_solver_args:
      completion_fn_options:
        model: gpt-4
        extra_options:
          temperature: 0
# Bluff strategy solver configured with the OpenAI solver (gpt-3.5-turbo-16k)
# as its base solver; temperature is pinned to 0.
bluff/strategy/gpt-3.5-turbo-16k:
  class: evals.elsuite.bluff.strategy_solver:BluffStrategySolver
  args:
    base_solver_class: evals.solvers.providers.openai.openai_solver:OpenAISolver
    # Arguments for base_solver_class (presumably handed to its constructor —
    # TODO confirm against BluffStrategySolver).
    base_solver_args:
      completion_fn_options:
        model: gpt-3.5-turbo-16k
        extra_options:
          temperature: 0
# Bluff strategy solver whose base solver is HHHSolver, which in turn is
# configured with the OpenAI solver for gpt-4-base.
# NOTE(review): the HHH wrapper is presumably there because gpt-4-base is not
# a chat-tuned model — confirm.
bluff/strategy/gpt-4-base:
  class: evals.elsuite.bluff.strategy_solver:BluffStrategySolver
  args:
    base_solver_class: evals.solvers.nested.hhh_solver:HHHSolver
    base_solver_args:
      # Inner solver spec: its own class/args pair, nested one level deeper.
      solver:
        class: evals.solvers.providers.openai.openai_solver:OpenAISolver
        args:
          completion_fn_options:
            model: gpt-4-base
            extra_options:
              temperature: 0
              max_tokens: 512
# Bluff strategy solver whose base solver is HHHSolver, which in turn is
# configured with the OpenAI solver for code-davinci-002.
# NOTE(review): the HHH wrapper is presumably there because code-davinci-002
# is not a chat-tuned model — confirm.
bluff/strategy/code-davinci-002:
  class: evals.elsuite.bluff.strategy_solver:BluffStrategySolver
  args:
    base_solver_class: evals.solvers.nested.hhh_solver:HHHSolver
    base_solver_args:
      # Inner solver spec: its own class/args pair, nested one level deeper.
      solver:
        class: evals.solvers.providers.openai.openai_solver:OpenAISolver
        args:
          completion_fn_options:
            model: code-davinci-002
            extra_options:
              temperature: 0
              max_tokens: 512
# Other solvers: the same underlying models without the strategy wrapper,
# with temperature set to 0.
# Plain OpenAI solver for gpt-4 (no BluffStrategySolver wrapper); temperature
# is pinned to 0.
bluff/gpt-4:
  class: evals.solvers.providers.openai.openai_solver:OpenAISolver
  args:
    completion_fn_options:
      model: gpt-4
      extra_options:
        temperature: 0
# Plain OpenAI solver for gpt-3.5-turbo-16k (no BluffStrategySolver wrapper);
# temperature is pinned to 0.
bluff/gpt-3.5-turbo-16k:
  class: evals.solvers.providers.openai.openai_solver:OpenAISolver
  args:
    completion_fn_options:
      model: gpt-3.5-turbo-16k
      extra_options:
        temperature: 0
# HHHSolver configured with the OpenAI solver for gpt-4-base (no
# BluffStrategySolver wrapper); temperature 0 and max_tokens 512.
bluff/gpt-4-base:
  class: evals.solvers.nested.hhh_solver:HHHSolver
  args:
    # Inner solver spec: its own class/args pair, nested one level deeper.
    solver:
      class: evals.solvers.providers.openai.openai_solver:OpenAISolver
      args:
        completion_fn_options:
          model: gpt-4-base
          extra_options:
            temperature: 0
            max_tokens: 512
# HHHSolver configured with the OpenAI solver for code-davinci-002 (no
# BluffStrategySolver wrapper); temperature 0 and max_tokens 512.
bluff/code-davinci-002:
  class: evals.solvers.nested.hhh_solver:HHHSolver
  args:
    # Inner solver spec: its own class/args pair, nested one level deeper.
    solver:
      class: evals.solvers.providers.openai.openai_solver:OpenAISolver
      args:
        completion_fn_options:
          model: code-davinci-002
          extra_options:
            temperature: 0
            max_tokens: 512