From 2d8e4556fe1a240fa630eb498a44d2289986be66 Mon Sep 17 00:00:00 2001 From: hagrid67 <jdhwatson@gmail.com> Date: Wed, 29 Jul 2020 12:13:10 +0100 Subject: [PATCH] fixed reward/penalty tests - malfunction step penalty was being applied twice --- flatland/envs/rail_env.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/flatland/envs/rail_env.py b/flatland/envs/rail_env.py index 1fa69f8a..3412ff6e 100644 --- a/flatland/envs/rail_env.py +++ b/flatland/envs/rail_env.py @@ -742,7 +742,8 @@ class RailEnv(Environment): # full step penalty in this case if agent.malfunction_data['malfunction'] > 0: self.motionCheck.addAgent(i_agent, agent.position, agent.position) - self.rewards_dict[i_agent] += self.step_penalty * agent.speed_data['speed'] + # agent will get penalty in step_agent2_cf + #self.rewards_dict[i_agent] += self.step_penalty * agent.speed_data['speed'] return # Is the agent at the beginning of the cell? Then, it can take an action. -- GitLab