in env_humanoid_base.py [0:0]
def inspect_end_of_episode_per_agent(self, idx):
    """Collect the early-termination reasons that currently hold for one agent.

    Only the checks whose ``Env.EarlyTermChoice`` member is present in
    ``self._early_term_choices`` are evaluated, in the fixed order
    Falldown, SimDiv, SimWindow, LowReward.

    Args:
        idx: Index into ``self._sim_agent`` (and ``self._rew_queue``)
            selecting the agent to inspect.

    Returns:
        A list of strings of the form ``'[<agent name>] <reason>'``, one per
        triggered check; empty when no enabled check fires.
    """
    agent = self._sim_agent[idx]
    agent_name = agent.get_name()
    choices = self._early_term_choices
    reasons = []

    # Each condition short-circuits so a check only runs when it is enabled.
    if (Env.EarlyTermChoice.Falldown in choices
            and self._base_env.check_falldown(agent)):
        reasons.append('[%s] falldown' % agent_name)

    if (Env.EarlyTermChoice.SimDiv in choices
            and self._base_env.is_sim_div(agent)):
        reasons.append('[%s] sim_div' % agent_name)

    if (Env.EarlyTermChoice.SimWindow in choices
            and self.get_elapsed_time() > self._sim_window_time):
        reasons.append('[%s] sim_window' % agent_name)

    if Env.EarlyTermChoice.LowReward in choices:
        # Mean of this agent's queued rewards versus a fraction of the
        # maximum reward reported by reward_max().
        mean_reward = np.mean(list(self._rew_queue[idx]))
        threshold = self._et_low_reward_thres * self.reward_max()
        if mean_reward < threshold:
            reasons.append('[%s] low_rewards' % agent_name)

    return reasons