in lib/policy.py [0:0]
def forward(self, ob, state_in, context):
    """Run the image trunk, optional recurrence and output head.

    Args:
        ob: Mapping that holds the image input under the ``"img"`` key.
        state_in: Recurrent state handed to ``self.recurrent_layer``. It is
            returned unchanged when no recurrent layer is configured.
        context: Mapping that holds the ``"first"`` value forwarded to the
            recurrent layer (presumably episode-start flags -- confirm
            against the caller).

    Returns:
        A pair ``((pi_latent, None), state_out)``. ``pi_latent`` is the
        output of ``self.final_ln`` applied to the ``self.lastlayer``
        projection; the second slot of the inner tuple is always ``None``.
    """
    first = context["first"]

    x = self.img_preprocess(ob["img"])

    # Conv3D Prior to Impala
    if self.conv3d_layer is not None:
        x = self._conv3d_forward(x)

    # Impala Stack
    x = self.img_process(x)

    if self.recurrent_layer is not None:
        x, state_out = self.recurrent_layer(x, first, state_in)
    else:
        # Without recurrence there is nothing to update, so hand the state
        # back as-is instead of leaving state_out unbound at the return.
        state_out = state_in

    x = F.relu(x, inplace=False)

    # Normalise the projection itself rather than its input, so that the
    # lastlayer output actually reaches the returned latent.
    pi_latent = self.lastlayer(x)
    pi_latent = self.final_ln(pi_latent)

    return (pi_latent, None), state_out