diff --git a/torch_training/training_navigation.py b/torch_training/training_navigation.py index 3ed48408de20216d30a0cae3a0a7e714f497ddf9..c97f1f5df2e171410f05f482a594d2b840c42dbc 100644 --- a/torch_training/training_navigation.py +++ b/torch_training/training_navigation.py @@ -163,7 +163,7 @@ def main(argv): if not done[a]: if agent_obs_buffer[a] is not None and register_action_state[a]: agent_delayed_next = agent_obs[a].copy() - agent.step(agent_obs_buffer[a], agent_action_buffer[a], cummulated_reward[a], + agent.step(agent_obs_buffer[a], agent_action_buffer[a], all_rewards[a], agent_delayed_next, done[a]) cummulated_reward[a] = 0. if register_action_state[a]: