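Optimise hook removal: use non-recursive removal in group offloading, drop gc.collect() from remove_hook, and keep an existing group offloading hook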

a-r-r-o-w · a-r-r-o-w · commit 5ea3d8af549c · 2025-01-26T16:48:39.000+01:00
diff --git a/src/diffusers/hooks/group_offloading.py b/src/diffusers/hooks/group_offloading.py
@@ -218,10 +218,10 @@ def post_forward(self, module, output):
         registries = [submodule._diffusers_hook for _, submodule in self.execution_order]
 
         for i in range(num_executed):
-            registries[i].remove_hook(_LAYER_EXECUTION_TRACKER)
+            registries[i].remove_hook(_LAYER_EXECUTION_TRACKER, recurse=False)
 
         # Remove the current lazy prefetch group offloading hook so that it doesn't interfere with the next forward pass
-        base_module_registry.remove_hook(_LAZY_PREFETCH_GROUP_OFFLOADING)
+        base_module_registry.remove_hook(_LAZY_PREFETCH_GROUP_OFFLOADING, recurse=False)
 
         # Apply lazy prefetching by setting required attributes
         group_offloading_hooks = [registry.get_hook(_GROUP_OFFLOADING) for registry in registries]
@@ -536,7 +536,10 @@ def _apply_lazy_group_offloading_hook(
     hook = GroupOffloadingHook(group, offload_on_init, next_group)
     lazy_prefetch_hook = LazyPrefetchGroupOffloadingHook()
     registry = HookRegistry.check_if_exists_or_initialize(module)
-    registry.register_hook(hook, _GROUP_OFFLOADING)
+    # We may have already registered a group offloading hook if the module had a torch.nn.Parameter whose parent
+    # is the current module. In such cases, we don't want to overwrite the existing group offloading hook.
+    if registry.get_hook(_GROUP_OFFLOADING) is None:
+        registry.register_hook(hook, _GROUP_OFFLOADING)
     registry.register_hook(lazy_prefetch_hook, _LAZY_PREFETCH_GROUP_OFFLOADING)
 
 
diff --git a/src/diffusers/hooks/hooks.py b/src/diffusers/hooks/hooks.py
@@ -13,7 +13,6 @@
 # limitations under the License.
 
 import functools
-import gc
 from typing import Any, Dict, Optional, Tuple
 
 import torch
@@ -187,8 +186,6 @@ def remove_hook(self, name: str, recurse: bool = True) -> None:
                 if hasattr(module, "_diffusers_hook"):
                     module._diffusers_hook.remove_hook(name, recurse=False)
 
-        gc.collect()
-
     def reset_stateful_hooks(self, recurse: bool = True) -> None:
         for hook_name in reversed(self._hook_order):
             hook = self.hooks[hook_name]