def __init__()

in cached_classes.py [0:0]


    def __init__(self, rm_size="large"):
        """Build in-memory score lookups for the train and test splits.

        For each split, ``CACHED_REWARD_MODEL_SCORES`` is formatted with
        ``rm_size`` and the split name, and the result is handed to
        ``read_jsonl``. The returned records are then indexed into
        ``self.train_data`` and ``self.test_data``.

        Args:
            rm_size: Value substituted for the ``rm_size`` field of
                ``CACHED_REWARD_MODEL_SCORES``. Defaults to ``"large"``.
        """
        def _score_lookup(records):
            # Items are hashed by (prompt, completion) pairs. tuple() makes
            # the key usable in a dict (presumably it arrives as a list from
            # the JSONL decoding -- confirm against read_jsonl).
            table = {}
            for entry in records:
                pair = tuple(entry['prompt_completion'])
                # A repeated pair overwrites the earlier score (last one wins).
                table[pair] = entry['rm_score']
            return table

        # Both splits are read (train first, then test) before any indexing.
        train_records, test_records = (
            read_jsonl(CACHED_REWARD_MODEL_SCORES.format(rm_size=rm_size, split=split_name))
            for split_name in ('train', 'test')
        )

        self.train_data = _score_lookup(train_records)
        self.test_data = _score_lookup(test_records)