|
22 | 22 | DiffRGrad, |
23 | 23 | Lamb, |
24 | 24 | Nero, |
| 25 | + NovoGrad, |
25 | 26 | RAdam, |
26 | 27 | RaLamb, |
27 | 28 | Ranger, |
|
68 | 69 | 'dadaptadam', |
69 | 70 | 'adams', |
70 | 71 | 'adafactor', |
| 72 | + 'novograd', |
71 | 73 | ] |
72 | 74 |
|
73 | 75 | VALID_LR_SCHEDULER_NAMES: List[str] = [ |
|
158 | 160 | (Apollo, {'lr': 5e-1, 'weight_decay': 1e-3}, 10), |
159 | 161 | (Apollo, {'lr': 5e-1, 'weight_decay': 1e-3, 'rebound': 'belief'}, 10), |
160 | 162 | (Apollo, {'lr': 5e-1, 'weight_decay': 1e-3, 'weight_decay_type': 'stable', 'warmup_steps': 0}, 50), |
| 163 | + (NovoGrad, {'lr': 5e-1, 'weight_decay': 1e-3, 'grad_averaging': True}, 50), |
161 | 164 | ] |
162 | 165 | ADAMD_SUPPORTED_OPTIMIZERS: List[Tuple[Any, Dict[str, Union[float, bool, int]], int]] = [ |
163 | 166 | (build_lookahead, {'lr': 5e-1, 'weight_decay': 1e-3, 'adamd_debias_term': True}, 10), |
|
172 | 175 | (Ranger21, {'lr': 5e-1, 'weight_decay': 1e-3, 'adamd_debias_term': True, 'num_iterations': 200}, 200), |
173 | 176 | (AdaPNM, {'lr': 3e-1, 'weight_decay': 1e-3, 'adamd_debias_term': True}, 50), |
174 | 177 | (AdamS, {'lr': 2e1, 'weight_decay': 1e-3, 'adamd_debias_term': True}, 50), |
| 178 | + (NovoGrad, {'lr': 5e-1, 'weight_decay': 1e-3, 'adamd_debias_term': True}, 50), |
175 | 179 | ] |