# evals/registry/solvers/make-me-pay.yaml
# Baseline make-me-pay solver for gpt-3.5-turbo-16k: LMConArtistSolver with a
# plain OpenAISolver as its base solver (no nested CoT solver).
# NOTE(review): nesting restored from a copy whose indentation was lost —
# confirm against the LMConArtistSolver / OpenAISolver constructors.
make-me-pay/baseline/gpt-3.5-turbo-16k:
  class: evals.elsuite.make_me_pay.solvers.lm_con_artist_solver:LMConArtistSolver
  args:
    base_solver_class: evals.solvers.providers.openai.openai_solver:OpenAISolver
    # Arguments for base_solver_class.
    base_solver_args:
      completion_fn_options:
        model: gpt-3.5-turbo-16k
        extra_options:
          temperature: 1.0
          max_tokens: 1000
# Baseline make-me-pay solver for gpt-4: LMConArtistSolver with a plain
# OpenAISolver as its base solver (no nested CoT solver).
# NOTE(review): nesting restored from a copy whose indentation was lost —
# confirm against the LMConArtistSolver / OpenAISolver constructors.
make-me-pay/baseline/gpt-4:
  class: evals.elsuite.make_me_pay.solvers.lm_con_artist_solver:LMConArtistSolver
  args:
    base_solver_class: evals.solvers.providers.openai.openai_solver:OpenAISolver
    # Arguments for base_solver_class.
    base_solver_args:
      completion_fn_options:
        model: gpt-4
        extra_options:
          temperature: 1.0
          max_tokens: 1000
# Baseline make-me-pay solver for gpt-4-32k: LMConArtistSolver with a plain
# OpenAISolver as its base solver (no nested CoT solver).
# NOTE(review): nesting restored from a copy whose indentation was lost —
# confirm against the LMConArtistSolver / OpenAISolver constructors.
make-me-pay/baseline/gpt-4-32k:
  class: evals.elsuite.make_me_pay.solvers.lm_con_artist_solver:LMConArtistSolver
  args:
    base_solver_class: evals.solvers.providers.openai.openai_solver:OpenAISolver
    # Arguments for base_solver_class.
    base_solver_args:
      completion_fn_options:
        model: gpt-4-32k
        extra_options:
          temperature: 1.0
          max_tokens: 1000
# make-me-pay solver for gpt-3.5-turbo-16k: LMConArtistSolver with a CoTSolver
# as its base solver. The CoTSolver is given two OpenAISolver instances
# (cot_solver and extract_solver), both on the same model and options.
# NOTE(review): nesting restored from a copy whose indentation was lost —
# confirm against the LMConArtistSolver / CoTSolver / OpenAISolver constructors.
make-me-pay/gpt-3.5-turbo-16k:
  class: evals.elsuite.make_me_pay.solvers.lm_con_artist_solver:LMConArtistSolver
  args:
    base_solver_class: evals.solvers.nested.cot_solver:CoTSolver
    # Arguments for base_solver_class.
    base_solver_args:
      # presumably the solver that produces the reasoning pass — confirm
      cot_solver:
        class: evals.solvers.providers.openai.openai_solver:OpenAISolver
        args:
          completion_fn_options:
            model: gpt-3.5-turbo-16k
            extra_options:
              temperature: 1
              max_tokens: 1000
      # presumably the solver that extracts the final answer — confirm
      extract_solver:
        class: evals.solvers.providers.openai.openai_solver:OpenAISolver
        args:
          completion_fn_options:
            model: gpt-3.5-turbo-16k
            extra_options:
              temperature: 1
              max_tokens: 1000
    # NOTE(review): placed as LMConArtistSolver args (siblings of
    # base_solver_args); verify against the LMConArtistSolver signature.
    lm_system_prompt: true
    time_reminder: true
# make-me-pay solver for gpt-4: LMConArtistSolver with a CoTSolver as its base
# solver. The CoTSolver is given two OpenAISolver instances (cot_solver and
# extract_solver), both on the same model and options.
# NOTE(review): nesting restored from a copy whose indentation was lost —
# confirm against the LMConArtistSolver / CoTSolver / OpenAISolver constructors.
make-me-pay/gpt-4:
  class: evals.elsuite.make_me_pay.solvers.lm_con_artist_solver:LMConArtistSolver
  args:
    base_solver_class: evals.solvers.nested.cot_solver:CoTSolver
    # Arguments for base_solver_class.
    base_solver_args:
      # presumably the solver that produces the reasoning pass — confirm
      cot_solver:
        class: evals.solvers.providers.openai.openai_solver:OpenAISolver
        args:
          completion_fn_options:
            model: gpt-4
            extra_options:
              temperature: 1
              max_tokens: 1000
      # presumably the solver that extracts the final answer — confirm
      extract_solver:
        class: evals.solvers.providers.openai.openai_solver:OpenAISolver
        args:
          completion_fn_options:
            model: gpt-4
            extra_options:
              temperature: 1
              max_tokens: 1000
    # NOTE(review): placed as LMConArtistSolver args (siblings of
    # base_solver_args); verify against the LMConArtistSolver signature.
    lm_system_prompt: true
    time_reminder: true
# make-me-pay solver for gpt-4-32k: LMConArtistSolver with a CoTSolver as its
# base solver. The CoTSolver is given two OpenAISolver instances (cot_solver
# and extract_solver), both on the same model and options.
# NOTE(review): nesting restored from a copy whose indentation was lost —
# confirm against the LMConArtistSolver / CoTSolver / OpenAISolver constructors.
make-me-pay/gpt-4-32k:
  class: evals.elsuite.make_me_pay.solvers.lm_con_artist_solver:LMConArtistSolver
  args:
    base_solver_class: evals.solvers.nested.cot_solver:CoTSolver
    # Arguments for base_solver_class.
    base_solver_args:
      # presumably the solver that produces the reasoning pass — confirm
      cot_solver:
        class: evals.solvers.providers.openai.openai_solver:OpenAISolver
        args:
          completion_fn_options:
            model: gpt-4-32k
            extra_options:
              temperature: 1
              max_tokens: 1000
      # presumably the solver that extracts the final answer — confirm
      extract_solver:
        class: evals.solvers.providers.openai.openai_solver:OpenAISolver
        args:
          completion_fn_options:
            model: gpt-4-32k
            extra_options:
              temperature: 1
              max_tokens: 1000
    # NOTE(review): placed as LMConArtistSolver args (siblings of
    # base_solver_args); verify against the LMConArtistSolver signature.
    lm_system_prompt: true
    time_reminder: true
# CLI entry: resolves to HumanCliSolver and passes it no args.
# presumably lets a person supply the replies interactively — confirm
make-me-pay/cli:
  class: evals.solvers.human_cli_solver:HumanCliSolver