// Undirected weighted graph between source files of the `trl` package.
// Each edge carries an integer label; in this file a larger label comes with
// a thicker stroke (penwidth) and a more opaque colour (alpha byte of the
// #RRGGBBAA value).
// NOTE(review): the meaning of the label number (e.g. a coupling or co-change
// count) is not stated in this file -- confirm with the generating tool.
graph G {
    // ---- Graph-level attributes -------------------------------------------
    compound="true";
    rankdir="TB";
    bgcolor="white";
    fontname="Tahoma";

    // ---- Default node appearance: filled boxes, white outline -------------
    node [
        fixedsize="false"
        fontname="Tahoma"
        color="white"
        fillcolor="deepskyblue2"
        fontcolor="black"
        shape="box"
        style="filled"
        penwidth="1.0"
    ];

    // ---- Default edge appearance -------------------------------------------
    // Every edge below overrides penwidth and color; the remaining defaults
    // (fonts, arrowsize) are inherited as-is.
    edge [
        fontname="Arial"
        color="#00688b"
        fontcolor="black"
        fontsize="12"
        arrowsize="0.5"
        penwidth="1.0"
    ];

    // ---- Label 44: penwidth 10, fully opaque (alpha FF) ---------------------
    "[trl/trainer/grpo_trainer.py]" -- "[trl/trainer/grpo_config.py]" [label=" 44 ", penwidth="10", color="#00688bFF"];

    // ---- Labels 14-16: penwidth 3, alpha 82 ---------------------------------
    "[trl/trainer/sft_config.py]" -- "[trl/trainer/sft_trainer.py]" [label=" 16 ", penwidth="3", color="#00688b82"];
    "[trl/trainer/kto_trainer.py]" -- "[trl/trainer/bco_trainer.py]" [label=" 15 ", penwidth="3", color="#00688b82"];
    "[trl/trainer/dpo_trainer.py]" -- "[trl/trainer/bco_trainer.py]" [label=" 14 ", penwidth="3", color="#00688b82"];
    "[trl/trainer/kto_trainer.py]" -- "[trl/trainer/dpo_trainer.py]" [label=" 14 ", penwidth="3", color="#00688b82"];
    "[trl/trainer/orpo_trainer.py]" -- "[trl/trainer/bco_trainer.py]" [label=" 14 ", penwidth="3", color="#00688b82"];
    "[trl/trainer/orpo_trainer.py]" -- "[trl/trainer/dpo_trainer.py]" [label=" 14 ", penwidth="3", color="#00688b82"];
    "[trl/trainer/orpo_trainer.py]" -- "[trl/trainer/kto_trainer.py]" [label=" 14 ", penwidth="3", color="#00688b82"];
    "[trl/trainer/orpo_trainer.py]" -- "[trl/trainer/cpo_trainer.py]" [label=" 14 ", penwidth="3", color="#00688b82"];

    // ---- Labels 12-13: penwidth 2, alpha 70 ---------------------------------
    "[trl/trainer/cpo_trainer.py]" -- "[trl/trainer/bco_trainer.py]" [label=" 13 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/kto_trainer.py]" -- "[trl/trainer/cpo_trainer.py]" [label=" 13 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/dpo_trainer.py]" -- "[trl/trainer/cpo_trainer.py]" [label=" 13 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/utils.py]" -- "[trl/trainer/grpo_trainer.py]" [label=" 12 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/sft_config.py]" -- "[trl/trainer/dpo_config.py]" [label=" 12 ", penwidth="2", color="#00688b70"];

    // ---- Label 10: penwidth 2, alpha 70 -------------------------------------
    "[trl/trainer/rloo_trainer.py]" -- "[trl/trainer/ppo_trainer.py]" [label=" 10 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/cpo_config.py]" -- "[trl/trainer/bco_config.py]" [label=" 10 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/dpo_trainer.py]" -- "[trl/trainer/grpo_trainer.py]" [label=" 10 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/gkd_trainer.py]" -- "[trl/trainer/sft_trainer.py]" [label=" 10 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/dpo_trainer.py]" -- "[trl/trainer/sft_trainer.py]" [label=" 10 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/sft_config.py]" -- "[trl/trainer/utils.py]" [label=" 10 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/dpo_config.py]" -- "[trl/trainer/cpo_config.py]" [label=" 10 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/orpo_config.py]" -- "[trl/trainer/kto_config.py]" [label=" 10 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/orpo_config.py]" -- "[trl/trainer/dpo_config.py]" [label=" 10 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/dpo_config.py]" -- "[trl/trainer/bco_config.py]" [label=" 10 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/utils.py]" -- "[trl/trainer/grpo_config.py]" [label=" 10 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/dpo_trainer.py]" -- "[trl/trainer/dpo_config.py]" [label=" 10 ", penwidth="2", color="#00688b70"];
    "[setup.py]" -- "[trl/__init__.py]" [label=" 10 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/orpo_config.py]" -- "[trl/trainer/bco_config.py]" [label=" 10 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/kto_config.py]" -- "[trl/trainer/dpo_config.py]" [label=" 10 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/kto_config.py]" -- "[trl/trainer/cpo_config.py]" [label=" 10 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/kto_config.py]" -- "[trl/trainer/bco_config.py]" [label=" 10 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/orpo_config.py]" -- "[trl/trainer/cpo_config.py]" [label=" 10 ", penwidth="2", color="#00688b70"];
    "[trl/data_utils.py]" -- "[trl/trainer/sft_trainer.py]" [label=" 10 ", penwidth="2", color="#00688b70"];

    // ---- Label 9: penwidth 2, alpha 70 --------------------------------------
    "[trl/trainer/sft_config.py]" -- "[trl/trainer/kto_config.py]" [label=" 9 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/online_dpo_config.py]" -- "[trl/trainer/kto_config.py]" [label=" 9 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/reward_config.py]" -- "[trl/trainer/orpo_config.py]" [label=" 9 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/reward_config.py]" -- "[trl/trainer/kto_config.py]" [label=" 9 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/sft_trainer.py]" -- "[trl/trainer/utils.py]" [label=" 9 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/reward_config.py]" -- "[trl/trainer/bco_config.py]" [label=" 9 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/online_dpo_config.py]" -- "[trl/trainer/bco_config.py]" [label=" 9 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/reward_config.py]" -- "[trl/trainer/prm_config.py]" [label=" 9 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/reward_config.py]" -- "[trl/trainer/online_dpo_config.py]" [label=" 9 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/reward_config.py]" -- "[trl/trainer/cpo_config.py]" [label=" 9 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/orpo_config.py]" -- "[trl/trainer/online_dpo_config.py]" [label=" 9 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/xpo_trainer.py]" -- "[trl/trainer/nash_md_trainer.py]" [label=" 9 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/online_dpo_config.py]" -- "[trl/trainer/cpo_config.py]" [label=" 9 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/sft_config.py]" -- "[trl/trainer/bco_config.py]" [label=" 9 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/sft_config.py]" -- "[trl/trainer/reward_config.py]" [label=" 9 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/reward_config.py]" -- "[trl/trainer/dpo_config.py]" [label=" 9 ", penwidth="2", color="#00688b70"];
    "[trl/trainer/sft_config.py]" -- "[trl/trainer/orpo_config.py]" [label=" 9 ", penwidth="2", color="#00688b70"];
}