|
565 | 565 | (FOCUS, {'lr': 1e-1, 'weight_decay': 1e-3}, 5), |
566 | 566 | (Kron, {'lr': 1e0, 'weight_decay': 1e-3}, 3), |
567 | 567 | (EXAdam, {'lr': 1e-1, 'weight_decay': 1e-3}, 5), |
568 | | - (SCION, {'lr': 5e-1, 'constraint': False, 'weight_decay': 1e-3}, 10), |
569 | | - (SCION, {'lr': 1e-1, 'constraint': True}, 10), |
| 568 | + (SCION, {'lr': 5e-1, 'constraint': False, 'weight_decay': 1e-3}, 5), |
| 569 | + (SCION, {'lr': 1e-1, 'constraint': True, 'lmo_type': 'col_norm'}, 10), |
570 | 570 | (Ranger25, {'lr': 1e-1}, 3), |
571 | 571 | (Ranger25, {'lr': 1e-1, 't_alpha_beta3': 5}, 3), |
572 | 572 | (Ranger25, {'lr': 5e-2, 'stable_adamw': False, 'orthograd': False, 'eps': None, 'lookahead_merge_time': 2}, 3), |
|
0 commit comments