Fix flake8 and pyright errors

horasal · horasal · commit b175e6a10932 · 2025-10-28T07:25:16.000+09:00
diff --git a/gguf-py/gguf/quants.py b/gguf-py/gguf/quants.py
@@ -10,11 +10,13 @@
 
 import numpy as np
 
+
 # see ggml_e8m0_to_fp32_half in ggml-impl.h
 def e8m0_to_fp32_half(x: np.ndarray) -> np.ndarray:
     bits = np.where(x < 2, np.uint32(0x00200000) << np.uint32(x), np.uint32(x - 1) << np.uint32(23))
     return bits.view(np.float32)
 
+
 def quant_shape_to_byte_shape(shape: Sequence[int], quant_type: GGMLQuantizationType) -> tuple[int, ...]:
     block_size, type_size = GGML_QUANT_SIZES[quant_type]
     if shape[-1] % block_size != 0:
@@ -662,6 +664,10 @@ class MXFP4(__Quant, qtype=GGMLQuantizationType.MXFP4):
     # ref: https://www.opencompute.org/documents/ocp-microscaling-formats-mx-v1-0-spec-final-pdf
     kvalues = (0, 1, 2, 3, 4, 6, 8, 12, 0, -1, -2, -3, -4, -6, -8, -12)
 
+    @classmethod
+    def __e8m0_to_fp32_half(cls, x: np.ndarray) -> np.ndarray:
+        return e8m0_to_fp32_half(x)  # forward the module-level helper's result; without `return` callers receive None
+
     @classmethod
     def quantize_blocks(cls, blocks: np.ndarray) -> np.ndarray:
         n_blocks = blocks.shape[0]
@@ -671,7 +677,7 @@ def quantize_blocks(cls, blocks: np.ndarray) -> np.ndarray:
         with np.errstate(divide="ignore"):
             e = np.where(d > 0, np.floor(np.log2(d)) - 2 + 127, 0).astype(np.uint8)
 
-        d = cls.e8m0_to_fp32_half(e)
+        d = cls.__e8m0_to_fp32_half(e)
 
         kvalues = np.array(cls.kvalues, dtype=np.int8).reshape((1, 1, 16))
 
@@ -691,7 +697,7 @@ def dequantize_blocks(cls, blocks: np.ndarray) -> np.ndarray:
 
         e, qs = np.hsplit(blocks, [1])
 
-        d = cls.e8m0_to_fp32_half(e)
+        d = cls.__e8m0_to_fp32_half(e)
 
         qs = qs.reshape((n_blocks, 1, cls.block_size // 2)) >> np.array([0, 4], dtype=np.uint8).reshape((1, 2, 1))
         qs = (qs & np.uint8(0x0F)).view(np.int8)
@@ -701,6 +707,7 @@ def dequantize_blocks(cls, blocks: np.ndarray) -> np.ndarray:
 
         return (d * qs.astype(np.float32))
 
+
 class MXFP6E3M2(__Quant, qtype=GGMLQuantizationType.MXFP6_E3M2):
     # e3m2 values (origin * 16)
     # ref: https://www.opencompute.org/documents/ocp-microscaling-formats-mx-v1-0-spec-final-pdf
@@ -713,6 +720,10 @@ class MXFP6E3M2(__Quant, qtype=GGMLQuantizationType.MXFP6_E3M2):
         -48, -56, -64, -80, -96, -112, -128, -160, -192, -224, -256, -320, -384, -448,
     )
 
+    @classmethod
+    def __e8m0_to_fp32_half(cls, x: np.ndarray) -> np.ndarray:
+        return e8m0_to_fp32_half(x)  # forward the module-level helper's result; without `return` callers receive None
+
     @classmethod
     def quantize_blocks(cls, blocks: np.ndarray) -> np.ndarray:
         n_blocks = blocks.shape[0]
@@ -726,7 +737,7 @@ def quantize_blocks(cls, blocks: np.ndarray) -> np.ndarray:
             )
 
         # d is float of above e8m0
-        d = cls.e8m0_to_fp32_half(e)
+        d = cls.__e8m0_to_fp32_half(e)
 
         kvalues = np.array(cls.kvalues, dtype=np.int16).reshape((1, 1, 64))
 
@@ -763,7 +774,7 @@ def dequantize_blocks(cls, blocks: np.ndarray) -> np.ndarray:
 
         e, qs = np.hsplit(blocks, [1])
 
-        d = cls.e8m0_to_fp32_half(e).astype(np.float32)
+        d = cls.__e8m0_to_fp32_half(e).astype(np.float32)
 
         qs_groups = qs.reshape((n_blocks, -1, 3))
         b0 = qs_groups[..., 0]
@@ -796,6 +807,10 @@ class MXFP6E2M3(__Quant, qtype=GGMLQuantizationType.MXFP6_E2M3):
         -22, -24, -26, -28, -30, -32, -36, -40, -44, -48, -52, -56, -60,
     )
 
+    @classmethod
+    def __e8m0_to_fp32_half(cls, x: np.ndarray) -> np.ndarray:
+        return e8m0_to_fp32_half(x)  # forward the module-level helper's result; without `return` callers receive None
+
     @classmethod
     def quantize_blocks(cls, blocks: np.ndarray) -> np.ndarray:
         n_blocks = blocks.shape[0]
@@ -809,7 +824,7 @@ def quantize_blocks(cls, blocks: np.ndarray) -> np.ndarray:
             )
 
         # d is float of above e8m0
-        d = cls.e8m0_to_fp32_half(e)
+        d = cls.__e8m0_to_fp32_half(e)
 
         kvalues = np.array(cls.kvalues, dtype=np.int16).reshape((1, 1, 64))
 
@@ -846,7 +861,7 @@ def dequantize_blocks(cls, blocks: np.ndarray) -> np.ndarray:
 
         e, qs = np.hsplit(blocks, [1])
 
-        d = cls.e8m0_to_fp32_half(e).astype(np.float32)
+        d = cls.__e8m0_to_fp32_half(e).astype(np.float32)
 
         qs_groups = qs.reshape((n_blocks, -1, 3))
         b0 = qs_groups[..., 0]