Commit e6c5b194 authored by umbra99

compare configs

parent d63fba40
Pipeline #4951 failed with stage
in 4 minutes and 18 seconds
...@@ -10,8 +10,6 @@ flatland-random-sparse-small-tree-fc-cctransformer: ...@@ -10,8 +10,6 @@ flatland-random-sparse-small-tree-fc-cctransformer:
config: config:
clip_rewards: True clip_rewards: True
clip_param: 0.1 clip_param: 0.1
vf_clip_param: 500.0
entropy_coeff: 0.01
# effective batch_size: train_batch_size * num_agents_in_each_environment [5, 10] # effective batch_size: train_batch_size * num_agents_in_each_environment [5, 10]
# see https://github.com/ray-project/ray/issues/4628 # see https://github.com/ray-project/ray/issues/4628
train_batch_size: 1000 # 5000 train_batch_size: 1000 # 5000
...@@ -20,16 +18,16 @@ flatland-random-sparse-small-tree-fc-cctransformer: ...@@ -20,16 +18,16 @@ flatland-random-sparse-small-tree-fc-cctransformer:
num_sgd_iter: 10 num_sgd_iter: 10
num_workers: 2 num_workers: 2
num_envs_per_worker: 5 num_envs_per_worker: 5
batch_mode: truncate_episodes batch_mode: complete_episodes
observation_filter: NoFilter
vf_share_layers: True vf_share_layers: True
lr: 0.0001
vf_loss_coeff: 0.000001
num_gpus: 1 num_gpus: 1
env_config: env_config:
observation: tree observation: tree
resolve_deadlocks: false sparse_reward: True
done_reward: 1
not_finished_reward: -1
observation_config: observation_config:
max_depth: 2 max_depth: 2
shortest_path_max_depth: 30 shortest_path_max_depth: 30
...@@ -70,5 +68,5 @@ flatland-random-sparse-small-tree-fc-cctransformer: ...@@ -70,5 +68,5 @@ flatland-random-sparse-small-tree-fc-cctransformer:
- 512 - 512
- 512 - 512
fcnet_activation: relu fcnet_activation: relu
fcnet_hiddens: [256, 256] fcnet_hiddens: [512, 512,512]
vf_share_layers: True # False vf_share_layers: True # False
...@@ -23,18 +23,19 @@ flatland-random-sparse-small-tree-fc-cctransformer: ...@@ -23,18 +23,19 @@ flatland-random-sparse-small-tree-fc-cctransformer:
num_gpus: 1 num_gpus: 1
env_config: env_config:
observation: tree observation: tree
resolve_deadlocks: True
observation_config: observation_config:
max_depth: 2 max_depth: 2
shortest_path_max_depth: 30 shortest_path_max_depth: 30
# skip_no_choice_cells: True
# accumulate_skipped_rewards: True
generator: sparse_rail_generator generator: sparse_rail_generator
generator_config: small_v0 generator_config: small_v0
wandb: wandb:
project: flatland project: flatland
entity: entity: masterscrat
tags: ["small_v0", "tree_obs"] # TODO should be set programmatically tags: ["small_v0", "tree_obs", "ccppo", "transformer"] # TODO should be set programmatically
model: model:
custom_model: cc_concatenate custom_model: cc_concatenate
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment