diff --git a/emerging_optimizers/orthogonalized_optimizers/muon_utils.py b/emerging_optimizers/orthogonalized_optimizers/muon_utils.py index 79bd4f2..10775f7 100644 --- a/emerging_optimizers/orthogonalized_optimizers/muon_utils.py +++ b/emerging_optimizers/orthogonalized_optimizers/muon_utils.py @@ -38,14 +38,14 @@ ], "polar_express": [ # Polar Express iteration from: https://arxiv.org/abs/2505.16932 - (7.2086, -15.5131, 9.0178), - (3.9623, -2.5813, 0.4542), - (3.9466, -2.5765, 0.4544), - (3.8991, -2.5671, 0.4566), - (3.7186, -2.5308, 0.4653), - (3.1390, -2.3073, 0.4733), - (2.1715, -1.5246, 0.3885), - (1.8648, -1.2224, 0.3577), + (8.2051, -22.9019, 16.4607), + (4.0664, -2.8612, 0.5184), + (3.9096, -2.8234, 0.5250), + (3.2856, -2.4153, 0.4853), + (2.2779, -1.6198, 0.3985), + (1.8726, -1.2307, 0.3585), + (1.8564, -1.2132, 0.3568), + (1.8750, -1.2500, 0.3750), ], "aol": [ # from https://github.com/thib-s/flash-newton-schulz/blob/main/newton_schulz_triton.py#L511