in rbr_weight_fitter.py [0:0]
def add_base_reward(self, base_reward: float):
    """Record ``base_reward`` on this instance.

    The value is stored unchanged in the ``base_reward`` attribute,
    replacing any value that was there before. No validation or
    conversion is applied.

    Args:
        base_reward: Value to keep as ``self.base_reward``.
    """
    self.base_reward = base_reward