Commit cf8a93b7 authored by nilabha

Merge branch 'flatland-paper-baselines' into 'master'

Add CCPPO checkpoints and results

See merge request !19
parents d8bfd096 8abfda27
Pipeline #5776 failed with stage
in 2 minutes and 56 seconds
This source diff could not be displayed because it is stored in LFS. You can view the blob instead.
This source diff could not be displayed because it is stored in LFS. You can view the blob instead.
This source diff could not be displayed because it is stored in LFS. You can view the blob instead.
This source diff could not be displayed because it is stored in LFS. You can view the blob instead.
This source diff could not be displayed because it is stored in LFS. You can view the blob instead.
This source diff could not be displayed because it is stored in LFS. You can view the blob instead.
......@@ -82,11 +82,21 @@ echo "===================="
echo "CPPO"
echo "===================="
# Evaluate three saved checkpoints (ccppo-tree-obs-0/1/2) by invoking rollout.py
# once per checkpoint. Every invocation passes the same flags:
#   --run CcTransformer, --no-render, --episodes 50, --env 'flatland_sparse'
# and the same --config JSON; only the checkpoint path differs between lines.
# The JSON selects custom_model "cc_transformer", the "tree" observation
# (max_depth 2), generator_config "small_v0", a fixed seed of 1000000000, and
# sets sparse_reward/done_reward/not_finished_reward in env_config.
# NOTE(review): the banner says "CPPO" while the checkpoint directories are
# named "ccppo-*" -- confirm whether the label should read "CCPPO".
# NOTE(review): these "ccppo-tree-obs-*" checkpoints are run with CcTransformer,
# while the "ccppo-transformer-tree-obs-*" checkpoints in the next section are
# run with CcConcatenate -- confirm the directory/algorithm pairing is intended.
python rollout.py baselines/checkpoints/ccppo-tree-obs-0/checkpoint_6084/checkpoint-6084 --run CcTransformer --no-render --episodes 50 --env 'flatland_sparse' --config '{"env_config": {"sparse_reward":"True","done_reward":1, "not_finished_reward": -1, "seed":1000000000,"generator": "sparse_rail_generator", "generator_config": "small_v0", "observation": "tree", "observation_config": {"max_depth": 2, "shortest_path_max_depth": 30}}, "model": {"custom_model": "cc_transformer","fcnet_activation": "relu", "fcnet_hiddens":[512,512,512],"vf_share_layers": "True" , "custom_options": {"max_num_agents": 15,"actor":{"activation_fn": "relu","hidden_layers": [512,512,512]},"critic":{"centralized": "True", "embedding_size": 32, "num_heads": 4, "d_model": 32, "use_scale": "True", "activation_fn": "relu","hidden_layers": [512,512,512]},"embedding":{"activation_fn": "relu","hidden_layers": [512,512,512]}}}}'
python rollout.py baselines/checkpoints/ccppo-tree-obs-1/checkpoint_5740/checkpoint-5740 --run CcTransformer --no-render --episodes 50 --env 'flatland_sparse' --config '{"env_config": {"sparse_reward":"True","done_reward":1, "not_finished_reward": -1, "seed":1000000000,"generator": "sparse_rail_generator", "generator_config": "small_v0", "observation": "tree", "observation_config": {"max_depth": 2, "shortest_path_max_depth": 30}}, "model": {"custom_model": "cc_transformer","fcnet_activation": "relu", "fcnet_hiddens":[512,512,512],"vf_share_layers": "True" , "custom_options": {"max_num_agents": 15,"actor":{"activation_fn": "relu","hidden_layers": [512,512,512]},"critic":{"centralized": "True", "embedding_size": 32, "num_heads": 4, "d_model": 32, "use_scale": "True", "activation_fn": "relu","hidden_layers": [512,512,512]},"embedding":{"activation_fn": "relu","hidden_layers": [512,512,512]}}}}'
python rollout.py baselines/checkpoints/ccppo-tree-obs-2/checkpoint_5820/checkpoint-5820 --run CcTransformer --no-render --episodes 50 --env 'flatland_sparse' --config '{"env_config": {"sparse_reward":"True","done_reward":1, "not_finished_reward": -1, "seed":1000000000,"generator": "sparse_rail_generator", "generator_config": "small_v0", "observation": "tree", "observation_config": {"max_depth": 2, "shortest_path_max_depth": 30}}, "model": {"custom_model": "cc_transformer","fcnet_activation": "relu", "fcnet_hiddens":[512,512,512],"vf_share_layers": "True" , "custom_options": {"max_num_agents": 15,"actor":{"activation_fn": "relu","hidden_layers": [512,512,512]},"critic":{"centralized": "True", "embedding_size": 32, "num_heads": 4, "d_model": 32, "use_scale": "True", "activation_fn": "relu","hidden_layers": [512,512,512]},"embedding":{"activation_fn": "relu","hidden_layers": [512,512,512]}}}}'
# Section: "CPPO Base". Evaluates three saved checkpoints
# (ccppo-transformer-tree-obs-0/1/2) by invoking rollout.py once per checkpoint.
# Every invocation passes the same flags:
#   --run CcConcatenate, --no-render, --episodes 50, --env 'flatland_sparse'
# and the same --config JSON; only the checkpoint path differs between lines.
# The JSON selects custom_model "cc_concatenate", the "tree" observation
# (max_depth 2), generator_config "small_v0" and a fixed seed of 1000000000.
# NOTE(review): the checkpoint directories are named "ccppo-transformer-*" but
# are run with CcConcatenate / "cc_concatenate" -- confirm this pairing is
# intended and not swapped with the CcTransformer runs in the "CPPO" section.
# NOTE(review): env_config here omits the sparse_reward / done_reward /
# not_finished_reward keys that the "CPPO" section's commands pass -- confirm
# the difference is deliberate.
echo "===================="
echo "CPPO Base"
echo "===================="
python rollout.py baselines/checkpoints/ccppo-transformer-tree-obs-0/checkpoint_5933/checkpoint-5933 --run CcConcatenate --no-render --episodes 50 --env 'flatland_sparse' --config '{"env_config": {"seed":1000000000,"generator": "sparse_rail_generator", "generator_config": "small_v0", "observation": "tree", "observation_config": {"max_depth": 2, "shortest_path_max_depth": 30}}, "model": {"custom_model": "cc_concatenate","fcnet_activation": "relu", "fcnet_hiddens":[512,512,512],"vf_share_layers": "True" , "custom_options": {"max_num_agents": 15,"actor":{"activation_fn": "relu","hidden_layers": [512,512,512]},"critic":{"centralized": "True", "embedding_size": 32, "num_heads": 4, "d_model": 32, "use_scale": "True", "activation_fn": "relu","hidden_layers": [512,512,512]},"embedding":{"activation_fn": "relu","hidden_layers": [512,512,512]}}}}'
python rollout.py baselines/checkpoints/ccppo-transformer-tree-obs-1/checkpoint_5914/checkpoint-5914 --run CcConcatenate --no-render --episodes 50 --env 'flatland_sparse' --config '{"env_config": {"seed":1000000000,"generator": "sparse_rail_generator", "generator_config": "small_v0", "observation": "tree", "observation_config": {"max_depth": 2, "shortest_path_max_depth": 30}}, "model": {"custom_model": "cc_concatenate","fcnet_activation": "relu", "fcnet_hiddens":[512,512,512],"vf_share_layers": "True" , "custom_options": {"max_num_agents": 15,"actor":{"activation_fn": "relu","hidden_layers": [512,512,512]},"critic":{"centralized": "True", "embedding_size": 32, "num_heads": 4, "d_model": 32, "use_scale": "True", "activation_fn": "relu","hidden_layers": [512,512,512]},"embedding":{"activation_fn": "relu","hidden_layers": [512,512,512]}}}}'
python rollout.py baselines/checkpoints/ccppo-transformer-tree-obs-2/checkpoint_5847/checkpoint-5847 --run CcConcatenate --no-render --episodes 50 --env 'flatland_sparse' --config '{"env_config": {"seed":1000000000,"generator": "sparse_rail_generator", "generator_config": "small_v0", "observation": "tree", "observation_config": {"max_depth": 2, "shortest_path_max_depth": 30}}, "model": {"custom_model": "cc_concatenate","fcnet_activation": "relu", "fcnet_hiddens":[512,512,512],"vf_share_layers": "True" , "custom_options": {"max_num_agents": 15,"actor":{"activation_fn": "relu","hidden_layers": [512,512,512]},"critic":{"centralized": "True", "embedding_size": 32, "num_heads": 4, "d_model": 32, "use_scale": "True", "activation_fn": "relu","hidden_layers": [512,512,512]},"embedding":{"activation_fn": "relu","hidden_layers": [512,512,512]}}}}'
echo "===================="
echo "PPO MASK TREE OBS"
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment