From 0e13913816544abcdfff81d0ca4b13ef38c3217d Mon Sep 17 00:00:00 2001 From: Erik Nygren <erik.nygren@sbb.ch> Date: Mon, 13 May 2019 17:37:00 +0200 Subject: [PATCH] fixed missing loop over agent when episode is solved --- examples/training_navigation.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/examples/training_navigation.py b/examples/training_navigation.py index ee360a1..dabeafe 100644 --- a/examples/training_navigation.py +++ b/examples/training_navigation.py @@ -161,7 +161,8 @@ for trials in range(1, n_trials + 1): obs = next_obs.copy() if done['__all__']: env_done = 1 - agent.step(final_obs[a], final_action_dict[a], all_rewards[a], final_obs_next[a], done[a]) + for a in range(env.get_num_agents()): + agent.step(final_obs[a], final_action_dict[a], all_rewards[a], final_obs_next[a], done[a]) break # Epsilon decay eps = max(eps_end, eps_decay * eps) # decrease epsilon -- GitLab