in data/generate_dpo.py [0:0]
def process(self, inputs: StepInput) -> "StepOutput":
    """Attach a ``generated_conversation`` to each usable row, then yield the batch.

    For every row whose ``generation`` and ``conversation`` are both truthy:

    * ``generated_conversation`` is set to the conversation without its last
      message, followed by a new ``assistant`` message whose content is the
      row's ``generation``.
    * ``conversation`` is rebuilt so that each message keeps only its
      ``role`` and ``content`` keys.

    Rows where either field is empty/``None`` are left untouched; they stay
    in the yielded batch and do not receive a ``generated_conversation`` key.

    Args:
        inputs: Batch of row dicts. Each row must have ``generation`` and
            ``conversation`` keys; rows are modified in place.

    Yields:
        The same ``inputs`` object, once, after every row has been visited.

    Raises:
        KeyError: If a row lacks ``generation``/``conversation``, or a
            message in a processed conversation lacks ``role``/``content``.
    """
    # ``row`` rather than ``input`` so the builtin ``input()`` is not shadowed.
    for row in inputs:
        # ``generation`` is checked first; ``conversation`` is only read when
        # the generation is usable.
        if not row["generation"] or not row["conversation"]:
            continue

        # Built from the original conversation *before* it is normalised
        # below: drop the last message and substitute the new generation as
        # the assistant turn.
        row["generated_conversation"] = [
            {"role": message["role"], "content": message["content"]}
            for message in row["conversation"][:-1]
        ] + [{"role": "assistant", "content": row["generation"]}]

        # Strip any extra per-message keys so both conversations share the
        # same ``role``/``content`` schema (fresh dicts, no aliasing).
        row["conversation"] = [
            {"role": message["role"], "content": message["content"]}
            for message in row["conversation"]
        ]

    yield inputs