in maddpg/common/distributions.py [0:0]
def sample(self):
    """Sample every categorical and offset the stacked result by ``self.low``.

    Each element of ``self.categoricals`` is asked for one ``sample()``; the
    individual results are stacked along a new trailing axis, cast to
    ``tf.int32`` and added to ``self.low``.

    Returns:
        The sum of ``self.low`` and the int32-cast stack of samples.
    """
    # Read the offset first so attribute access order matches the
    # left-to-right evaluation of ``self.low + ...``.
    offset = self.low
    draws = [categorical.sample() for categorical in self.categoricals]
    stacked = tf.stack(draws, axis=-1)
    as_int = tf.cast(stacked, tf.int32)
    return offset + as_int