in weak_to_strong/datasets.py [0:0]
def format_anthropic_hh(ex, rng):
    """Build a text / binary-label example from a chosen-vs-rejected record.

    A single draw from ``rng.random()`` decides the label: values strictly
    below 0.5 yield label 1 and the ``"chosen"`` text, anything else yields
    label 0 and the ``"rejected"`` text.

    Args:
        ex: Mapping indexed by ``"chosen"`` or ``"rejected"``. Only the key
            matching the drawn label is read.
        rng: Object exposing a zero-argument ``random()`` method whose result
            can be compared against 0.5 (presumably a ``random.Random``-like
            generator; confirm against the caller).

    Returns:
        A dict with ``txt`` (the selected text) and ``hard_label`` (int 0/1).
    """
    picked_chosen = rng.random() < 0.5

    # Look up only the selected field so a record missing the other key
    # does not raise.
    if picked_chosen:
        field = "chosen"
    else:
        field = "rejected"

    return {"txt": ex[field], "hard_label": int(picked_chosen)}