step-based counting
This commit is contained in:
2
tools.py
2
tools.py
@@ -161,7 +161,7 @@ def simulate(agent, envs, steps=0, episodes=0, state=None):
|
||||
done = np.stack(done)
|
||||
episode += int(done.sum())
|
||||
length += 1
|
||||
- step += (done * length).sum()
|
||||
+ step += len(envs)
|
||||
length *= 1 - done
|
||||
|
||||
return (step - steps, episode - episodes, done, length, obs, agent_state, reward)
|
||||
|
||||
Reference in New Issue
Block a user