From a2da7c285ff2350193b1f32325ce5ce1c77ed2df Mon Sep 17 00:00:00 2001 From: Erik Nygren <erik.nygren@sbb.ch> Date: Sun, 1 Sep 2019 19:07:33 -0400 Subject: [PATCH] fixed reward bug --- torch_training/training_navigation.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/torch_training/training_navigation.py b/torch_training/training_navigation.py index 3ed4840..c97f1f5 100644 --- a/torch_training/training_navigation.py +++ b/torch_training/training_navigation.py @@ -163,7 +163,7 @@ def main(argv): if not done[a]: if agent_obs_buffer[a] is not None and register_action_state[a]: agent_delayed_next = agent_obs[a].copy() - agent.step(agent_obs_buffer[a], agent_action_buffer[a], cummulated_reward[a], + agent.step(agent_obs_buffer[a], agent_action_buffer[a], all_rewards[a], agent_delayed_next, done[a]) cummulated_reward[a] = 0. if register_action_state[a]: -- GitLab