From 36714e2c3f025acfc3f9b89f2f5186d594a0405f Mon Sep 17 00:00:00 2001 From: Erik Nygren <erik.nygren@sbb.ch> Date: Mon, 13 May 2019 17:10:51 +0200 Subject: [PATCH] fixed bug in reward function when all agents terminate --- flatland/envs/rail_env.py | 1 + 1 file changed, 1 insertion(+) diff --git a/flatland/envs/rail_env.py b/flatland/envs/rail_env.py index 3135e9e..40e4ab7 100644 --- a/flatland/envs/rail_env.py +++ b/flatland/envs/rail_env.py @@ -180,6 +180,7 @@ class RailEnv(Environment): self.rewards_dict[iAgent] = 0 if self.dones["__all__"]: + self.rewards_dict = {handle: reward + global_reward for handle, reward in self.rewards_dict.items()} return self._get_observations(), self.rewards_dict, self.dones, {} # for i in range(len(self.agents_handles)): -- GitLab