Skip to content
Snippets Groups Projects
Commit 320dabf7 authored by Egli Adrian (IT-SCI-API-PFI)
Browse files

.

parent c20d4638
No related branches found
Tags submission-v7.1
No related merge requests found
...@@ -474,7 +474,7 @@ def eval_policy(env, tree_observation, policy, train_params, obs_params): ...@@ -474,7 +474,7 @@ def eval_policy(env, tree_observation, policy, train_params, obs_params):
if __name__ == "__main__": if __name__ == "__main__":
parser = ArgumentParser() parser = ArgumentParser()
parser.add_argument("-n", "--n_episodes", help="number of episodes to run", default=2500, type=int) parser.add_argument("-n", "--n_episodes", help="number of episodes to run", default=12500, type=int)
parser.add_argument("-t", "--training_env_config", help="training config id (eg 0 for Test_0)", default=2, type=int) parser.add_argument("-t", "--training_env_config", help="training config id (eg 0 for Test_0)", default=2, type=int)
parser.add_argument("-e", "--evaluation_env_config", help="evaluation config id (eg 0 for Test_0)", default=0, parser.add_argument("-e", "--evaluation_env_config", help="evaluation config id (eg 0 for Test_0)", default=0,
type=int) type=int)
...@@ -482,8 +482,8 @@ if __name__ == "__main__": ...@@ -482,8 +482,8 @@ if __name__ == "__main__":
parser.add_argument("--checkpoint_interval", help="checkpoint interval", default=100, type=int) parser.add_argument("--checkpoint_interval", help="checkpoint interval", default=100, type=int)
parser.add_argument("--eps_start", help="max exploration", default=1.0, type=float) parser.add_argument("--eps_start", help="max exploration", default=1.0, type=float)
parser.add_argument("--eps_end", help="min exploration", default=0.01, type=float) parser.add_argument("--eps_end", help="min exploration", default=0.01, type=float)
parser.add_argument("--eps_decay", help="exploration decay", default=0.99, type=float) parser.add_argument("--eps_decay", help="exploration decay", default=0.998, type=float)
parser.add_argument("--buffer_size", help="replay buffer size", default=int(1e5), type=int) parser.add_argument("--buffer_size", help="replay buffer size", default=int(1e7), type=int)
parser.add_argument("--buffer_min_size", help="min buffer size to start training", default=0, type=int) parser.add_argument("--buffer_min_size", help="min buffer size to start training", default=0, type=int)
parser.add_argument("--restore_replay_buffer", help="replay buffer to restore", default="", type=str) parser.add_argument("--restore_replay_buffer", help="replay buffer to restore", default="", type=str)
parser.add_argument("--save_replay_buffer", help="save replay buffer at each evaluation interval", default=False, parser.add_argument("--save_replay_buffer", help="save replay buffer at each evaluation interval", default=False,
......
...@@ -25,7 +25,7 @@ from reinforcement_learning.dddqn_policy import DDDQNPolicy ...@@ -25,7 +25,7 @@ from reinforcement_learning.dddqn_policy import DDDQNPolicy
VERBOSE = True VERBOSE = True
# Checkpoint to use (remember to push it!) # Checkpoint to use (remember to push it!)
checkpoint = "./checkpoints/201103180606-1400.pth" checkpoint = "./checkpoints/201103221432-3000.pth"
# Use last action cache # Use last action cache
USE_ACTION_CACHE = True USE_ACTION_CACHE = True
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment