in replay_buffer.py [0:0]
def add(self, time_step):
    """Buffer one time step and flush the episode when it is the last step.

    For every spec in ``self._data_specs`` the field ``time_step[spec.name]``
    is read, a scalar is expanded to an array of ``spec.shape`` and
    ``spec.dtype``, and the result is checked against the spec. All fields
    are checked before any of them is buffered, so a rejected time step
    leaves ``self._current_episode`` untouched.

    When ``time_step.last()`` is true, the buffered values of each spec are
    converted to a single array of ``spec.dtype``, the buffer is reset to an
    empty ``defaultdict(list)``, and the resulting dict is passed to
    ``self._store_episode``.

    Args:
        time_step: Object indexable by spec name that exposes ``last()``.

    Raises:
        AssertionError: If a field's shape or dtype does not match its spec.
    """
    # Pass 1: read and validate every field without touching the buffer, so
    # a failure cannot leave per-key lists with different lengths.
    checked = []
    for spec in self._data_specs:
        value = time_step[spec.name]
        if np.isscalar(value):
            value = np.full(spec.shape, value, spec.dtype)
        if not (spec.shape == value.shape and spec.dtype == value.dtype):
            # Raised explicitly (rather than via `assert`) so the check is
            # not stripped under `python -O`; the exception type is kept.
            raise AssertionError(
                f"{spec.name!r}: expected shape {spec.shape} and dtype "
                f"{spec.dtype}, got shape {value.shape} and dtype "
                f"{value.dtype}"
            )
        checked.append((spec.name, value))

    # Pass 2: the whole step is valid, commit it.
    for name, value in checked:
        self._current_episode[name].append(value)

    if time_step.last():
        episode = {
            spec.name: np.array(self._current_episode[spec.name], spec.dtype)
            for spec in self._data_specs
        }
        # Reset before storing, matching the original statement order.
        self._current_episode = defaultdict(list)
        self._store_episode(episode)