ops: Fix vanilla-fp8 loaded lora quality (#12390)

rattus128 · web-flow · commit 123a7874a97c · 2026-02-10T13:38:28.000-05:00
The vanilla-fp8 path was missing the stochastic rounding required for the fp8
downcast, leaving it inconsistent with model_patcher.patch_weight_to_device.

Missed in testing as I spent too much time with quantized tensors
and overlooked the simpler ones.
diff --git a/comfy/ops.py b/comfy/ops.py
@@ -169,8 +169,8 @@ def to_dequant(tensor, dtype):
                 if orig.dtype == dtype and len(fns) == 0:
                     #The layer actually wants our freshly saved QT
                     x = y
-            else:
-                y = x
+            elif update_weight:
+                y = comfy.float.stochastic_rounding(x, orig.dtype, seed = comfy.utils.string_to_seed(s.seed_key))
             if update_weight:
                 orig.copy_(y)
         for f in fns: