Commit 850e912b authored by Dipam Chakraborty
Browse files
parents 49af838c 11d40811
......@@ -45,17 +45,17 @@ procgen-ppo:
no_done_at_end: False
# Custom switches
skips: 9
n_pi: 9
skips: 0
n_pi: 18
num_retunes: 100
retune_epochs: 6
retune_epochs: 3
standardize_rewards: True
aux_mbsize: 4
augment_buffer: True
scale_reward: 1.0
reset_returns: False
flattened_buffer: True
augment_randint_num: 3 ## Hacky name fix later
augment_randint_num: 6 ## Hacky name fix later
aux_lr: 5.0e-4
value_lr: 1.0e-3
same_lr_everywhere: False
......
......@@ -62,7 +62,7 @@ procgen-ppo:
# Memory management, if batch size overflow, batch splitting is done to handle it
max_minibatch_size: 2048
updates_per_batch: 3
updates_per_batch: 8
normalize_actions: False
clip_rewards: null
......@@ -81,11 +81,11 @@ procgen-ppo:
depths: [32, 64, 64]
nlatents: 512
use_layernorm: True
diff_framestack: False
diff_framestack: True
d2rl: True
num_workers: 7
num_envs_per_worker: 9
num_envs_per_worker: 16
rollout_fragment_length: 256
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment