From 2d8e4556fe1a240fa630eb498a44d2289986be66 Mon Sep 17 00:00:00 2001
From: hagrid67 <jdhwatson@gmail.com>
Date: Wed, 29 Jul 2020 12:13:10 +0100
Subject: [PATCH] fixed reward/penalty tests - malfunction step penalty was
 being applied twice

---
 flatland/envs/rail_env.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/flatland/envs/rail_env.py b/flatland/envs/rail_env.py
index 1fa69f8a..3412ff6e 100644
--- a/flatland/envs/rail_env.py
+++ b/flatland/envs/rail_env.py
@@ -742,7 +742,8 @@ class RailEnv(Environment):
         # full step penalty in this case
         if agent.malfunction_data['malfunction'] > 0:
             self.motionCheck.addAgent(i_agent, agent.position, agent.position)
-            self.rewards_dict[i_agent] += self.step_penalty * agent.speed_data['speed']
+            # No step penalty here: the agent gets it in step_agent2_cf, so adding it here too would apply it twice.
+            #self.rewards_dict[i_agent] += self.step_penalty * agent.speed_data['speed']
             return
 
         # Is the agent at the beginning of the cell? Then, it can take an action.
-- 
GitLab