in cached_classes.py [0:0]
def __init__(self, rm_size="large"):
    """Load cached reward-model scores for the train and test splits.

    Each split is read with ``read_jsonl`` from the path obtained by
    formatting ``CACHED_REWARD_MODEL_SCORES`` with ``rm_size`` and the
    split name. The records are then indexed into lookup tables stored
    on ``self.train_data`` and ``self.test_data``.

    Args:
        rm_size: Value substituted for ``rm_size`` in the cache path
            template (defaults to ``"large"``).
    """
    # Read both splits up front, before any indexing is done.
    train_records = read_jsonl(
        CACHED_REWARD_MODEL_SCORES.format(rm_size=rm_size, split='train')
    )
    test_records = read_jsonl(
        CACHED_REWARD_MODEL_SCORES.format(rm_size=rm_size, split='test')
    )

    def index_scores(records):
        # Items are hashed by (prompt, completion) pairs. The field is
        # converted to a tuple so it can serve as a dict key (presumably
        # it arrives as a JSON list -- verify against the cache format).
        # A later record with the same key overwrites an earlier one.
        scores = {}
        for record in records:
            key = tuple(record['prompt_completion'])
            scores[key] = record['rm_score']
        return scores

    self.train_data = index_scores(train_records)
    self.test_data = index_scores(test_records)