in exp/testgui.py [0:0]
def tick():
    """Advance the environment by one step and redraw the viewer.

    Operates entirely on module-level state: the ``step`` counter and the
    latest observation ``obs`` are globals, and ``env`` / ``vw`` are
    looked up from the enclosing module.

    On each call:
      * if ``step`` is 0, the environment is reset first;
      * an action is sampled from ``env.action_space`` and zeroed in place;
      * the environment is stepped with that action;
      * once ``step`` exceeds 200 or the environment reports done, the last
        reward and the step count are printed and ``step`` is rewound to 0
        so the next call resets the environment;
      * the call sleeps for 0.05 s and then renders via ``vw``.
    """
    global step, obs

    # A counter of zero marks the start of a fresh episode.
    if step == 0:
        obs = env.reset()
        # env.p.named.data.qvel['ball'][0:3] = [10, 3, 4]

    # Sample, then multiply by zero in place: the resulting action keeps
    # whatever container type the action space produced but is all zeros.
    action = env.action_space.sample()
    action *= 0

    # Disabled scripted action sequence, kept for reference:
    #   if step < 1:
    #       action[2] = 1
    #   elif step < 100:
    #       action[0] = 1
    #   else:
    #       action[2] = -1

    # NOTE(review): unpacking assumes env.step returns a 4-tuple
    # (observation, reward, done, info) -- confirm against the env in use.
    obs, reward, done, _info = env.step(action)
    step += 1

    # End the episode after more than 200 steps or when the env says so.
    if step > 200 or done:
        print(reward)
        print(f'reset after {step} steps')
        step = 0

    # Fixed delay before each redraw.
    time.sleep(0.05)
    vw.render()