We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent f9f12bd, commit 54220e2 (Copy full SHA for 54220e2)
emerging_optimizers/psgd/psgd.py
@@ -200,9 +200,7 @@ def _update_precond_procrustes(
200   q_list: List of Kronecker factors.
201   lip_const_list: List of Lipschitz constants for the Kronecker factors.
202   """
203 - dampened_momentum = exp_avg + (
204 - damping_noise_scale + torch.finfo(exp_avg.dtype).eps * exp_avg.abs()
205 - ) * torch.randn_like(exp_avg)
    + dampened_momentum = exp_avg + (damping_noise_scale + 1e-7 * exp_avg.abs()) * torch.randn_like(exp_avg)
206   pg = apply_preconditioner(q_list, dampened_momentum)
207   total_numel = pg.numel()
208   updated_q_list: List[torch.Tensor] = []
0 commit comments