in gym3/interactive.py [0:0]
def _act(self, ac: Any) -> None:
self._env.act(ac)
batch_rew, batch_obs, batch_first = self._env.observe()
self._last_rew = batch_rew[0]
self._last_ob = batch_obs
self._last_ac = ac
first = batch_first[0]
info = copy.copy(self._env.get_info()[0])
for k in list(info.keys()):
if isinstance(info[k], np.ndarray):
del info[k]
self._episode_return += self._last_rew
self._steps += 1
self._episode_steps += 1
self._last_info = dict(
episode_steps=self._episode_steps,
episode_return=self._episode_return,
**info,
)
np.set_printoptions(precision=2)
return first