|
563 | 563 | (FOCUS, {'lr': 1e-1, 'weight_decay': 1e-3}, 5), |
564 | 564 | (Kron, {'lr': 1e0, 'weight_decay': 1e-3}, 3), |
565 | 565 | (EXAdam, {'lr': 1e-1, 'weight_decay': 1e-3}, 5), |
566 | | - (Ranger25, {'lr': 5e-2}, 5), |
567 | | - (Ranger25, {'lr': 5e-2, 't_alpha_beta3': 5}, 5), |
568 | | - (Ranger25, {'lr': 5e-2, 'stable_adamw': False, 'orthograd': False, 'eps': None}, 5), |
| 566 | + (Ranger25, {'lr': 1e-1}, 3), |
| 567 | + (Ranger25, {'lr': 1e-1, 't_alpha_beta3': 5}, 3), |
| 568 | + (Ranger25, {'lr': 5e-2, 'stable_adamw': False, 'orthograd': False, 'eps': None}, 3), |
569 | 569 | ] |
570 | 570 | ADANORM_SUPPORTED_OPTIMIZERS: List[Tuple[Any, Dict[str, Union[float, bool, int]], int]] = [ |
571 | 571 | (AdaBelief, {'lr': 5e-1, 'weight_decay': 1e-3, 'adanorm': True}, 10), |
|
0 commit comments