def inspect_end_of_episode_per_agent()

in env_humanoid_base.py [0:0]


    def inspect_end_of_episode_per_agent(self, idx):
        """Collect the early-termination reasons that currently apply to one agent.

        A criterion is evaluated only when its ``Env.EarlyTermChoice`` member
        is present in ``self._early_term_choices``; criteria that are not
        enabled are skipped without running their check.

        Args:
            idx: Index used to look up the agent in ``self._sim_agent`` and
                its rewards in ``self._rew_queue``.

        Returns:
            A list of strings of the form ``'[<agent name>] <reason>'``, in
            the fixed order falldown, sim_div, sim_window, low_rewards. The
            list is empty when no enabled criterion fires.
        """
        agent = self._sim_agent[idx]
        tag = agent.get_name()
        enabled = self._early_term_choices
        choice = Env.EarlyTermChoice
        reasons = []

        # The agent is reported as fallen by the base environment.
        if choice.Falldown in enabled and self._base_env.check_falldown(agent):
            reasons.append('[%s] falldown' % tag)

        # The base environment reports a simulation divergence for the agent.
        if choice.SimDiv in enabled and self._base_env.is_sim_div(agent):
            reasons.append('[%s] sim_div' % tag)

        # The elapsed time has gone past the configured simulation window.
        if choice.SimWindow in enabled:
            if self.get_elapsed_time() > self._sim_window_time:
                reasons.append('[%s] sim_window' % tag)

        # The mean of the queued rewards is below the threshold, which is
        # expressed relative to reward_max().
        if choice.LowReward in enabled:
            mean_reward = np.mean(list(self._rew_queue[idx]))
            cutoff = self._et_low_reward_thres * self.reward_max()
            if mean_reward < cutoff:
                reasons.append('[%s] low_rewards' % tag)

        return reasons