in ddppo_agents.py [0:0]
def reset(self) -> None:
    """Replace the agent's cached rollout tensors with fresh zero tensors.

    Three attributes are overwritten, each allocated on ``self.device``:

    * ``test_recurrent_hidden_states`` -- zeros of shape
      ``(1, num_recurrent_layers, hidden_size)`` in torch's default dtype.
    * ``not_done_masks`` -- a ``(1, 1)`` boolean tensor, i.e. all ``False``.
    * ``prev_actions`` -- a ``(1, 1)`` ``torch.long`` tensor holding ``0``.

    Returns:
        None. The method only mutates ``self``.
    """
    # NOTE(review): the leading 1 in every shape is presumably a batch of a
    # single environment -- confirm against the code that consumes these.
    num_layers = self.actor_critic.net.num_recurrent_layers
    hidden_shape = (1, num_layers, self.hidden_size)
    target_device = self.device
    step_shape = (1, 1)

    self.test_recurrent_hidden_states = torch.zeros(
        hidden_shape, device=target_device
    )
    self.not_done_masks = torch.zeros(
        step_shape, dtype=torch.bool, device=target_device
    )
    self.prev_actions = torch.zeros(
        step_shape, dtype=torch.long, device=target_device
    )