Skip to content

Commit 7a99b3b

Browse files
authored
Merge pull request #418 from kywch/quick
Small changes to pufferl
2 parents 23babab + f1b08e6 commit 7a99b3b

File tree

3 files changed: +5 -3 lines changed

pufferlib/config/default.ini

Lines changed: 1 addition & 1 deletion
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| | | `@@ -29,7 +29,7 @@ precision = float32` |
| 29 | 29 | `total_timesteps = 10_000_000` |
| 30 | 30 | `learning_rate = 0.015` |
| 31 | 31 | `anneal_lr = True` |
| 32 | | `- min_learning_rate = 0.0` |
| | 32 | `+ min_lr_ratio = 0.0` |
| 33 | 33 | `gamma = 0.995` |
| 34 | 34 | `gae_lambda = 0.90` |
| 35 | 35 | `update_epochs = 1` |

pufferlib/config/ocean/g2048.ini

Lines changed: 1 addition & 1 deletion
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| | | `@@ -26,7 +26,7 @@ snake_reward_weight = 0.0005` |
| 26 | 26 | `# 512 hidden: https://wandb.ai/kywch/pufferlib/runs/5thsjr61?nw=nwuserkywch` |
| 27 | 27 | `total_timesteps = 6_767_676_767` |
| 28 | 28 | `anneal_lr = True` |
| 29 | | `- min_learning_rate = 0.00005` |
| | 29 | `+ min_lr_ratio = 0.15` |
| 30 | 30 | `batch_size = auto` |
| 31 | 31 | `bptt_horizon = 64` |
| 32 | 32 | `minibatch_size = 32768` |

pufferlib/pufferl.py

Lines changed: 3 additions & 1 deletion
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| | | `@@ -184,8 +184,9 @@ def __init__(self, config, vecenv, policy, logger=None):` |
| 184 | 184 | |
| 185 | 185 | `# Learning rate scheduler` |
| 186 | 186 | `epochs = config['total_timesteps'] // config['batch_size']` |
| | 187 | `+ eta_min = config['learning_rate'] * config['min_lr_ratio']` |
| 187 | 188 | `self.scheduler = torch.optim.lr_scheduler.CosineAnnealingLR(` |
| 188 | | `- optimizer, T_max=epochs, eta_min=config['min_learning_rate'])` |
| | 189 | `+ optimizer, T_max=epochs, eta_min=eta_min)` |
| 189 | 190 | `self.total_epochs = epochs` |
| 190 | 191 | |
| 191 | 192 | `# Automatic mixed precision` |
| | | `@@ -879,6 +880,7 @@ def __init__(self, args, load_id=None, resume='allow'):` |
| 879 | 880 | `resume=resume,` |
| 880 | 881 | `config=args,` |
| 881 | 882 | `tags = [args['tag']] if args['tag'] is not None else [],` |
| | 883 | `+ settings=wandb.Settings(console="off"), # stop sending dashboard to wandb` |
| 882 | 884 | `)` |
| 883 | 885 | `self.wandb = wandb` |
| 884 | 886 | `self.run_id = wandb.run.id` |

0 commit comments

Comments
 (0)