From b905b1e29aa43142ea0658f61b5e63cd3cd96e7a Mon Sep 17 00:00:00 2001
From: Guillaume Mollard <guillaume.mollard2@gmail.com>
Date: Fri, 28 Jun 2019 18:10:26 +0200
Subject: [PATCH] last training set up before freeze

---
Review notes (free-form text in this region is ignored when the patch is applied):

  * This patch creates one new file, config_example/config.gin, containing 25
    lines of gin bindings; nothing else is touched.
  * n_agents: the text after '#' on that line is a gin comment, so the
    effective value is the literal 7; the {"grid_search": [...]} sweep is
    commented out, not active.
  * policy_folder_name: the string literal closes right after
    "..._n_agents_{config[n_agents]}_"; the trailing '#_map_size_...' part is a
    comment, so the effective name ends with an underscore. The
    {config[...]} placeholder is presumably expanded by the training script --
    TODO confirm against the code that consumes run_experiment.
  * obs_builder / predictor use the '@Name()' form, i.e. (per gin syntax) the
    configurable is called and its result is passed. This assumes
    TreeObsForRailEnv and ShortestPathPredictorForRailEnv are registered as
    gin configurables by the consuming code -- verify.
  * num_iterations = 1002 together with save_every = 100: NOTE(review) the
    reason for 1002 rather than 1000 is not visible from this patch -- confirm
    with the author before changing it.

 .../config_example/config.gin | 25 +++++++++++++++++++
 1 file changed, 25 insertions(+)
 create mode 100644 RLLib_training/experiment_configs/config_example/config.gin

diff --git a/RLLib_training/experiment_configs/config_example/config.gin b/RLLib_training/experiment_configs/config_example/config.gin
new file mode 100644
index 0000000..7a4c7c1
--- /dev/null
+++ b/RLLib_training/experiment_configs/config_example/config.gin
@@ -0,0 +1,25 @@
+run_experiment.name = "experiment_example"
+run_experiment.num_iterations = 1002
+run_experiment.save_every = 100
+run_experiment.hidden_sizes = [32, 32]
+
+run_experiment.map_width = 20
+run_experiment.map_height = 20
+run_experiment.n_agents = 7#{"grid_search": [3, 4, 5, 6, 7, 8]}
+run_experiment.rail_generator = "complex_rail_generator"
+run_experiment.nr_extra = 5
+run_experiment.policy_folder_name = "ppo_policy_two_obs_with_predictions_n_agents_{config[n_agents]}_"#_map_size_{config[map_width]}"
+
+run_experiment.seed = 123
+
+run_experiment.conv_model = False
+
+run_experiment.obs_builder = @TreeObsForRailEnv()
+TreeObsForRailEnv.predictor = @ShortestPathPredictorForRailEnv()
+TreeObsForRailEnv.max_depth = 2
+
+run_experiment.entropy_coeff = 0.001
+run_experiment.kl_coeff = 0.2
+run_experiment.lambda_gae = 0.9
+run_experiment.step_memory = 2
+run_experiment.min_dist = 10
--
GitLab