@@ -341,7 +341,7 @@ def local_shapes(self):
             return self._nccl_local_shapes(False)
         else:
             return self._allgather(self.base_comm,
-                                    self.base_comm_nccl,
+                                    self.base_comm_nccl,
                                     self.local_shape)

     @property
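For orientation (not part of the commit itself): local_shapes gathers every rank's local_shape tuple. The MPI branch above is conceptually similar to the following standalone sketch using plain mpi4py; the shapes and script name are hypothetical, and this is not the pylops-mpi API.

# Sketch only: gather each rank's local shape with plain mpi4py
# (run with e.g. `mpiexec -n 4 python sketch.py`).
from mpi4py import MPI

comm = MPI.COMM_WORLD
local_shape = (10 + comm.Get_rank(), 5)      # hypothetical per-rank shape
local_shapes = comm.allgather(local_shape)   # list of tuples, one per rank
if comm.Get_rank() == 0:
    print(local_shapes)                      # e.g. [(10, 5), (11, 5), (12, 5), (13, 5)]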
@@ -383,7 +383,7 @@ def asarray(self, masked: bool = False):
             final_array = self._allgather_subcomm(self.local_array)
         else:
             final_array = self._allgather(self.base_comm,
-                                          self.base_comm_nccl,
+                                          self.base_comm_nccl,
                                           self.local_array,
                                           engine=self.engine)
         return np.concatenate(final_array, axis=self.axis)
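As a reference for the hunk above: asarray gathers each rank's local chunk and concatenates the pieces along the distributed axis. A minimal sketch of that gather-and-concatenate step with plain mpi4py/NumPy (hypothetical data, not the library call itself):

# Sketch only: reproduce the gather-and-concatenate step of asarray.
import numpy as np
from mpi4py import MPI

comm = MPI.COMM_WORLD
axis = 0                                         # axis along which data is split
local_array = np.full((2, 3), comm.Get_rank())   # hypothetical local chunk
pieces = comm.allgather(local_array)             # list of ndarrays, one per rank
global_array = np.concatenate(pieces, axis=axis) # identical result on every rank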
@@ -484,7 +484,7 @@ def _nccl_local_shapes(self, masked: bool):
             all_tuples = self._allgather_subcomm(self.local_shape).get()
         else:
             all_tuples = self._allgather(self.base_comm,
-                                         self.base_comm_nccl,
+                                         self.base_comm_nccl,
                                          self.local_shape).get()
         # NCCL returns the flat array that packs every tuple as 1-dimensional array
         # unpack each tuple from each rank
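The comment above notes that the NCCL-style allgather returns one flat buffer packing every rank's shape tuple. A host-side sketch of the unpacking it describes, with hypothetical values and no NCCL dependency:

# Sketch only: unpack a flat allgather result of nranks * ndim entries
# back into one shape tuple per rank.
import numpy as np

nranks, ndim = 3, 2
flat = np.array([10, 5, 11, 5, 12, 5])   # packed shapes from 3 ranks (hypothetical)
local_shapes = [tuple(int(v) for v in row) for row in flat.reshape(nranks, ndim)]
print(local_shapes)                       # [(10, 5), (11, 5), (12, 5)]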
@@ -625,12 +625,12 @@ def _compute_vector_norm(self, local_array: NDArray,
                 # CuPy + non-CUDA-aware MPI: This will call non-buffered communication
                 # which return a list of object - must be copied back to a GPU memory.
                 recv_buf = self._allreduce_subcomm(self.sub_comm, self.base_comm_nccl,
-                                                   send_buf.get(), recv_buf.get(),
+                                                   send_buf.get(), recv_buf.get(),
                                                    op=MPI.MAX, engine=self.engine)
                 recv_buf = ncp.asarray(ncp.squeeze(recv_buf, axis=axis))
             else:
                 recv_buf = self._allreduce_subcomm(self.sub_comm, self.base_comm_nccl,
-                                                   send_buf, recv_buf, op=MPI.MAX,
+                                                   send_buf, recv_buf, op=MPI.MAX,
                                                    engine=self.engine)
             # TODO (tharitt): In current implementation, there seems to be a semantic difference between Buffered MPI and NCCL
             # the (1, size) is collapsed to (size, ) with buffered MPI while NCCL retains it.
@@ -643,18 +643,18 @@ def _compute_vector_norm(self, local_array: NDArray,
             send_buf = ncp.min(ncp.abs(local_array), axis=axis).astype(ncp.float64)
             if self.engine == "cupy" and self.base_comm_nccl is None and not deps.cuda_aware_mpi_enabled:
                 recv_buf = self._allreduce_subcomm(self.sub_comm, self.base_comm_nccl,
-                                                   send_buf.get(), recv_buf.get(),
+                                                   send_buf.get(), recv_buf.get(),
                                                    op=MPI.MIN, engine=self.engine)
                 recv_buf = ncp.asarray(ncp.squeeze(recv_buf, axis=axis))
             else:
                 recv_buf = self._allreduce_subcomm(self.sub_comm, self.base_comm_nccl,
-                                                   send_buf, recv_buf,
+                                                   send_buf, recv_buf,
                                                    op=MPI.MIN, engine=self.engine)
                 if self.base_comm_nccl:
                     recv_buf = ncp.asarray(ncp.squeeze(recv_buf, axis=axis))
         else:
             recv_buf = self._allreduce_subcomm(self.sub_comm, self.base_comm_nccl,
-                                               ncp.sum(ncp.abs(ncp.float_power(local_array, ord)), axis=axis),
+                                               ncp.sum(ncp.abs(ncp.float_power(local_array, ord)), axis=axis),
                                                engine=self.engine)
             recv_buf = ncp.power(recv_buf, 1.0 / ord)
         return recv_buf
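For context on the hunk above: the norm computation reduces per-rank partial results across workers, using MAX for the inf-norm, MIN for the -inf-norm, and a SUM of |x|**ord followed by a 1/ord power otherwise. A CPU-only sketch of that reduction pattern with plain mpi4py/NumPy (no CuPy/NCCL branches; the data and the ord_ variable are hypothetical):

# Sketch only: distributed vector-norm reduction pattern.
import numpy as np
from mpi4py import MPI

comm = MPI.COMM_WORLD
local_array = np.random.default_rng(comm.Get_rank()).standard_normal(100)
ord_ = 2

if ord_ == np.inf:
    norm = comm.allreduce(np.max(np.abs(local_array)), op=MPI.MAX)
elif ord_ == -np.inf:
    norm = comm.allreduce(np.min(np.abs(local_array)), op=MPI.MIN)
else:
    partial = np.sum(np.abs(local_array) ** ord_)            # local sum of |x|^ord
    norm = comm.allreduce(partial, op=MPI.SUM) ** (1.0 / ord_)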