Commit 68e70de1 authored by Dipam Chakraborty
Browse files

ppg ent sched

parent b830f2f2
......@@ -120,7 +120,7 @@ class RetuneSelector:
self.ac_space = ac_space
self.ob_space = ob_space
- self.cooldown_counter = 0
+ self.cooldown_counter = skips
self.replay_index = 0
self.flat_buffer = flat_buffer
......
......@@ -62,7 +62,7 @@ procgen-ppo:
final_lr: 5.0e-5
lr_schedule: 'linear'
final_entropy_coeff: 0.002
- entropy_schedule: False
+ entropy_schedule: True
# Memory management, if batch size overflow, batch splitting is done to handle it
max_minibatch_size: 2048
......
......@@ -6,8 +6,8 @@ set -e
#########################################
# export EXPERIMENT_DEFAULT="experiments/impala-baseline.yaml"
- export EXPERIMENT_DEFAULT="experiments/custom-torch-ppo.yaml"
- # export EXPERIMENT_DEFAULT="experiments/custom-ppg.yaml"
+ # export EXPERIMENT_DEFAULT="experiments/custom-torch-ppo.yaml"
+ export EXPERIMENT_DEFAULT="experiments/custom-ppg.yaml"
export EXPERIMENT=${EXPERIMENT:-$EXPERIMENT_DEFAULT}
if [[ -z $AICROWD_IS_GRADING ]]; then
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment