@@ -1,10 +1,11 @@
+# flake8: noqa: F821, F841
 import torch
-aten = torch.ops.aten
-
-import pytest
+import pytest
 
 import triton
-import triton.language as tl
+import triton.language as tl
+
+aten = torch.ops.aten
 
 
 def patch_kernel(template, to_replace):
@@ -13,25 +14,27 @@ def patch_kernel(template, to_replace):
         kernel.src = kernel.src.replace(key, value)
     return kernel
 
+
 @pytest.mark.parametrize("float_div", [True, False])
 @pytest.mark.parametrize("floor", [True, False])
 @pytest.mark.parametrize("trunc", [True, False])
 def test_divide(float_div, floor, trunc, device):
-    # regression test for various division cases
+    # regression test for various division cases
 
-    @triton.jit
+    @triton.jit
     def divide_kernel(a, b, out_ptr0, out_ptr1, out_ptr2, out_ptr3, out_ptr4, xnumel, XBLOCK: tl.constexpr):
         xoffset = tl.program_id(0) * XBLOCK
         xindex = xoffset + tl.arange(0, XBLOCK)[:]
         xmask = xindex < xnumel
         x0 = xindex
         tmp0 = tl.load(a + (x0), xmask)
         tmp2 = tl.load(b + (x0), xmask)
-        # custom bits
+        # custom bits
         tmp1 = tmp0.to(tl.float32)
         tmp3 = tmp2.to(tl.float32)
         tmp4 = tmp1 / tmp3
-        tmp5 = tl.where((tmp0 < 0) != (tmp2 < 0), tl.where(tmp0 % tmp2 != 0, tmp0 // tmp2 - 1, tmp0 // tmp2), tmp0 // tmp2)
+        tmp5 = tl.where((tmp0 < 0) != (tmp2 < 0), tl.where(tmp0 % tmp2 != 0, tmp0 // tmp2 - 1, tmp0 // tmp2),
+                        tmp0 // tmp2)
         tmp6 = tmp0 // tmp2
         GENERATE_OUTPUTS_HERE
 
@@ -41,7 +44,8 @@ def divide_kernel(a, b, out_ptr0, out_ptr1, out_ptr2, out_ptr3, out_ptr4, xnumel
     outputs_floor = "\n        tl.store(out_ptr1 + (x0), tmp5, xmask)\n        tl.store(out_ptr4 + (x0), tmp5, xmask)" if floor is True else ""
     outputs_trunc = "\n        tl.store(out_ptr2 + (x0), tmp6, xmask)" if trunc is True else ""
 
-    divide_kernel = patch_kernel(divide_kernel, {"GENERATE_OUTPUTS_HERE": f"{outputs_float_div}\n{outputs_floor}\n{outputs_trunc}"})
+    divide_kernel = patch_kernel(divide_kernel,
+                                 {"GENERATE_OUTPUTS_HERE": f"{outputs_float_div}\n{outputs_floor}\n{outputs_trunc}"})
 
     def launch_triton(a, b):
         output0 = torch.zeros_like(a)
@@ -57,15 +61,15 @@ def launch_triton(a, b):
         divide_kernel[grid](a, b, output0, output1, output2, output3, output4, n_elements, XBLOCK=128)
 
         return (output0, output1, output2, output3, output4)
-
+
     def launch_torch(a, b):
-        return (
-            aten.div(a, b, rounding_mode=None) if float_div is True else torch.zeros_like(a),
-            aten.div(a, b, rounding_mode="floor") if floor is True else torch.zeros_like(a),
-            aten.div(a, b, rounding_mode="trunc") if trunc is True else torch.zeros_like(a),
-            a / b if float_div is True else torch.zeros_like(a),
-            a // b if floor is True else torch.zeros_like(a),
-        )
+        return (
+            aten.div(a, b, rounding_mode=None) if float_div is True else torch.zeros_like(a),
+            aten.div(a, b, rounding_mode="floor") if floor is True else torch.zeros_like(a),
+            aten.div(a, b, rounding_mode="trunc") if trunc is True else torch.zeros_like(a),
+            a / b if float_div is True else torch.zeros_like(a),
+            a // b if floor is True else torch.zeros_like(a),
+        )
 
     a = torch.randint(2**32, 2**40, [100, 100], device=device)
     b = torch.randint(-10, -1, [100, 100], device=device)
@@ -75,6 +79,6 @@ def launch_torch(a, b):
     torch_result = launch_torch(a, b)
 
     for i in range(5):
-        torch.testing.assert_close(triton_result[i], torch_result[i], check_dtype=False, msg=lambda msg: f"Float: {float_div}, Floor: {floor}, Trunc: {trunc}\nIteration {iter}, {i} failed\n{msg}")
-
-
+        torch.testing.assert_close(
+            triton_result[i], torch_result[i], check_dtype=False, msg=lambda msg:
+            f"Float: {float_div}, Floor: {floor}, Trunc: {trunc}\nIteration {iter}, {i} failed\n{msg}")