NVIDIA-NeMo · ananthsub · Jun 5, 2025 · Jun 4, 2025 · Jun 4, 2025 · Jun 4, 2025
diff --git a/nemo_lm/peft/walk_utils.py b/nemo_lm/peft/walk_utils.py
@@ -0,0 +1,353 @@
+# Copyright (c) 2025, NVIDIA CORPORATION.  All rights reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+"""
+Walking utilities for PyTorch module transformation.
+
+This module provides utilities for recursively applying transformations to PyTorch modules,
+handling complex hierarchies including lists, dictionaries, and nested structures.
+These utilities are copied from NeMo's fn/base.py to provide independent module traversal
+capabilities without external dependencies.
+
+Examples:
+    Basic module transformation:
+        >>> def add_tag(module, name=None, **kwargs):
+        ...     module.tag = f"transformed_{name}"
+        ...     return module
+        >>>
+        >>> model = nn.Sequential(nn.Linear(10, 5), nn.ReLU())
+        >>> transformed = walk(model, add_tag)
+
+    Conditional transformation:
+        >>> def freeze_linear(module, **kwargs):
+        ...     if isinstance(module, nn.Linear):
+        ...         for param in module.parameters():
+        ...             param.requires_grad = False
+        ...     return module
+        >>>
+        >>> frozen_model = walk(model, freeze_linear)
+"""
+
+import inspect
+from typing import Callable, Iterable, Protocol, TypeVar, Union, runtime_checkable
+
+import torch.nn as nn
+
+
+@runtime_checkable
+class HasBool(Protocol):
+    """Structural type for any object that defines ``__bool__``.
+
+    Because the protocol is runtime-checkable, an ``isinstance`` check against it
+    only verifies that a ``__bool__`` method is present on the object.
+    """
+
+    def __bool__(self) -> bool:
+        ...
+
+
+# Type variable bound to ``nn.Module`` so helpers can be annotated as returning
+# the same module type they were given.
+_TModule = TypeVar("_TModule", bound=nn.Module)
+# A transformation: takes a module and returns a module (the same one or a replacement).
+ModuleFunc = Callable[[nn.Module], nn.Module]
+# A check on a module whose result is a ``bool`` or any object defining ``__bool__``.
+ModulePredicate = Callable[[nn.Module], Union[bool, HasBool]]
+
+
+def map(  # noqa: A001
+    module: _TModule,
+    func: ModuleFunc,
+    leaf_only: bool = False,
+    **kwargs,
+) -> _TModule:
+    """Apply ``func`` to a module or to a container of modules.
+
+    Dispatch order:
+
+    1. If ``module`` exposes its own ``map`` attribute, that method is called and its
+       result returned. Passing ``_skip_map=True`` disables this step; the flag is
+       consumed here and never forwarded.
+    2. If ``module`` is iterable and has ``items``, ``values`` and ``keys`` attributes,
+       it is handled as a mapping of modules.
+    3. Any other iterable (for example ``nn.Sequential`` or ``nn.ModuleList``) is
+       handled as a sequence of modules.
+    4. Everything else is handled as a single module.
+
+    Note:
+        The helpers this function delegates to also visit the children/members of
+        whatever they are given.
+
+    Args:
+        module: The module or container of modules to transform.
+        func: Callable taking a module as its first argument and returning the
+            transformed module. Only keyword arguments whose names appear in the
+            signature of ``func`` are passed to it.
+        leaf_only: Forwarded to the helpers. When True, they skip ``func`` for
+            containers and apply it only to modules that directly own parameters
+            (``module.parameters(recurse=False)`` is non-empty). Defaults to False.
+        **kwargs: Extra keyword arguments forwarded to the selected helper (or to the
+            module's own ``map``) and, when they match its signature, to ``func``.
+
+    Returns:
+        The transformed module or container of modules.
+
+    Examples:
+        >>> import torch.nn as nn
+        >>> from nemo_lm.peft.walk_utils import map
+
+        # Example: Adding a custom attribute to all modules
+        >>> model = nn.Sequential(nn.Linear(10, 20), nn.ReLU(), nn.Linear(20, 10))
+        >>> def add_id(m, module_id=0):
+        ...     m.custom_id = module_id
+        ...     return m
+        >>> model = map(model, add_id, module_id=42)
+    """
+    # Always consume the private flag so it is never forwarded downstream.
+    use_custom_map = not kwargs.pop("_skip_map", False)
+    if use_custom_map and hasattr(module, "map"):
+        return module.map(func, leaf_only=leaf_only, **kwargs)
+
+    if not isinstance(module, Iterable):
+        return _map_module(module, func, leaf_only=leaf_only, **kwargs)
+
+    # Duck-type mapping containers by the presence of the usual dict accessors.
+    looks_like_mapping = all(hasattr(module, attr) for attr in ("items", "values", "keys"))
+    handler = _map_module_dict if looks_like_mapping else _map_module_list
+    return handler(module, func, leaf_only=leaf_only, **kwargs)
+
+
+def walk(
+    module: _TModule,
+    func: ModuleFunc,
+    leaf_only: bool = False,
+    **kwargs,
+) -> _TModule:
+    """Apply ``func`` to a module or container and to everything nested inside it.
+
+    This is a thin wrapper that calls ``map`` with ``recurse=True``.
+
+    Args:
+        module: The module or container of modules to traverse.
+        func: Callable taking a module as its first argument and returning the
+            transformed module.
+        leaf_only: When True, ``func`` is skipped for containers and applied only to
+            modules that directly own parameters. Defaults to False.
+        **kwargs: Extra keyword arguments forwarded to ``map``. Passing ``recurse``
+            here raises ``TypeError`` because this function already sets it.
+
+    Returns:
+        The transformed module or container.
+
+    Examples:
+        >>> import torch.nn as nn
+        >>> from nemo_lm.peft.walk_utils import walk
+
+        # Example: Freezing all parameters in a model
+        >>> model = nn.Sequential(nn.Linear(10, 20), nn.ReLU(), nn.Linear(20, 10))
+        >>> def freeze_params(m):
+        ...     for param in m.parameters(recurse=False):
+        ...         param.requires_grad = False
+        ...     return m
+        >>> frozen_model = walk(model, freeze_params)
+    """
+    return map(module, func, leaf_only=leaf_only, recurse=True, **kwargs)
+
+
+def forall(module: nn.Module, func: ModulePredicate, recurse: bool = False) -> bool:
+    """Check whether a predicate holds for a module and, optionally, all its descendants.
+
+    Evaluation stops at the first module for which the predicate is falsy, so ``func``
+    is not guaranteed to be called on every module.
+
+    Args:
+        module (nn.Module): The root module to check.
+        func (ModulePredicate): A predicate that takes a module and returns a boolean
+            or an object that can be evaluated as a boolean.
+        recurse (bool): If True, the predicate is checked on every module yielded by
+            ``module.modules()`` (the root included). If False, only the root module
+            is checked. Defaults to False.
+
+    Returns:
+        bool: True if every checked module satisfies the predicate, False otherwise.
+
+    Examples:
+        >>> import torch.nn as nn
+        >>> from nemo_lm.peft.walk_utils import forall
+
+        >>> model = nn.Sequential(nn.Linear(10, 20), nn.ReLU(), nn.Linear(20, 10))
+        >>> predicate = lambda m: isinstance(m, (nn.Linear, nn.Sequential, nn.ReLU))
+        >>> print(forall(model, predicate, recurse=True))
+        True
+    """
+    candidates = module.modules() if recurse else (module,)
+
+    # ``bool(...)`` normalises predicate results that only implement ``__bool__``;
+    # the generator lets ``all`` short-circuit instead of materialising every result.
+    return all(bool(func(candidate)) for candidate in candidates)
+
+
+def _map_module(
+    module: _TModule, func: ModuleFunc, recurse=False, leaf_only=False, transformed_modules=None, **kwargs
+) -> _TModule:
+    """
+    Applies a transformation function to a module and then to each of its direct children.
+
+    Each child is re-attached to the transformed module under its original name after
+    being processed through ``map``. Children receive ``i`` (their position), ``name``
+    (their attribute name) and ``prefix`` (the dotted path of this module) as extra
+    keyword arguments.
+
+    NOTE(review): ``recurse`` is forwarded to the children but is not consulted here;
+    children are visited regardless of its value.
+
+    Parameters:
+        module : nn.Module
+            The module to which the function will be applied.
+        func : ModuleFunc
+            The function that will be applied to the module.
+        recurse : bool, optional
+            Forwarded unchanged to the ``map`` call made for every child.
+        leaf_only : bool, optional
+            When True, the function is applied only if the module directly owns
+            parameters (``module.parameters(recurse=False)`` is non-empty).
+        transformed_modules : set, optional
+            Ids of modules that were already produced by this traversal; a module
+            whose id is in the set is returned untouched.
+        **kwargs : dict
+            Additional keyword arguments; those matching the signature of ``func``
+            are passed to it.
+
+    Returns:
+        nn.Module
+            The transformed module.
+    """
+    seen = set() if transformed_modules is None else transformed_modules
+    if id(module) in seen:
+        return module
+
+    # Resolve the accepted kwargs before deciding whether ``func`` applies at all.
+    call_kwargs = _get_func_kwargs(func, **kwargs)
+    applies = not leaf_only or list(module.parameters(recurse=False))
+    result = func(module, **call_kwargs) if applies else module
+
+    # The prefix handed to children is this module's own dotted path.
+    if kwargs.get("prefix", ""):
+        child_prefix = f"{kwargs['prefix']}.{kwargs['name']}"
+    else:
+        child_prefix = kwargs.get("name", "")
+
+    # These three are re-supplied per child below, so drop the inherited values.
+    for consumed in ("i", "name", "prefix"):
+        kwargs.pop(consumed, None)
+
+    # Children are read from the original module and attached to the result.
+    for index, (child_name, child) in enumerate(module.named_children()):
+        mapped_child = map(
+            child,
+            func,
+            recurse=recurse,
+            leaf_only=leaf_only,
+            transformed_modules=seen,
+            i=index,
+            name=child_name,
+            prefix=child_prefix,
+            **kwargs,
+        )
+        setattr(result, child_name, mapped_child)
+
+    seen.add(id(result))
+    return result
+
+
+def _map_module_list(
+    module_list: _TModule, func: ModuleFunc, recurse=False, leaf_only=False, transformed_modules=None, **kwargs
+) -> _TModule:
+    """
+    Applies a transformation function to a sequence container and to each of its members.
+
+    Unless ``leaf_only`` is set, ``func`` is first applied to the container itself.
+    Every member is then processed through ``map`` with ``i`` set to its index,
+    ``name`` set to the index as a string and ``prefix`` set to the dotted path of
+    the container. The mapped members are finally packed into a new container of
+    the same type.
+
+    Parameters:
+        module_list : iterable of modules
+            The container whose members will be transformed.
+        func : ModuleFunc
+            The function that will be applied.
+        recurse : bool, optional
+            Forwarded unchanged to the ``map`` call made for every member.
+        leaf_only : bool, optional
+            When True, ``func`` is not applied to the container itself.
+        transformed_modules : set, optional
+            Shared set of already-transformed module ids, forwarded to every member.
+        **kwargs : dict
+            Additional keyword arguments; those matching the signature of ``func``
+            are passed to it.
+
+    Returns:
+        A new container of the same type holding the transformed members.
+    """
+    seen = set() if transformed_modules is None else transformed_modules
+
+    call_kwargs = _get_func_kwargs(func, **kwargs)
+    if not leaf_only:
+        module_list = func(module_list, **call_kwargs)
+
+    # The prefix handed to members is this container's own dotted path.
+    if kwargs.get("prefix", ""):
+        member_prefix = f"{kwargs['prefix']}.{kwargs['name']}"
+    else:
+        member_prefix = kwargs.get("name", "")
+
+    # These three are re-supplied per member below, so drop the inherited values.
+    for consumed in ("i", "name", "prefix"):
+        kwargs.pop(consumed, None)
+
+    mapped_members = [
+        map(
+            member,
+            func,
+            recurse=recurse,
+            leaf_only=leaf_only,
+            transformed_modules=seen,
+            i=index,
+            name=str(index),
+            prefix=member_prefix,
+            **kwargs,
+        )
+        for index, member in enumerate(module_list)
+    ]
+
+    return _create_list_wrapper(module_list, mapped_members)
+
+
+def _map_module_dict(
+    module_dict: _TModule,
+    func: ModuleFunc,
+    recurse: bool = False,
+    leaf_only: bool = False,
+    transformed_modules=None,
+    **kwargs,
+) -> _TModule:
+    """
+    Applies a transformation function to a ModuleDict of modules.
+
+    Unless ``leaf_only`` is set, ``func`` is first applied to the container itself.
+    Every entry is then processed through ``map`` with ``i`` set to its position,
+    ``name`` set to its key and ``prefix`` set to the dotted path of the container,
+    matching what the module and list helpers pass to their children.
+
+    Parameters:
+        module_dict : nn.ModuleDict
+            The ModuleDict of modules to which the function will be applied.
+        func : ModuleFunc
+            The function that will be applied to the modules.
+        recurse : bool, optional
+            Forwarded unchanged to the ``map`` call made for every entry.
+        leaf_only : bool, optional
+            When True, ``func`` is not applied to the container itself.
+        transformed_modules : set, optional
+            Shared set of already-transformed module ids, forwarded to every entry.
+        **kwargs : dict
+            Additional keyword arguments; those matching the signature of ``func``
+            are passed to it.
+
+    Returns:
+        nn.ModuleDict
+            A new container of the same type holding the transformed modules.
+    """
+    if transformed_modules is None:
+        transformed_modules = set()
+
+    f_kwargs = _get_func_kwargs(func, **kwargs)
+    if not leaf_only:
+        module_dict = func(module_dict, **f_kwargs)
+
+    # Build the prefix for the entries from this container's own position in the
+    # hierarchy, and drop the inherited per-call values so they are re-supplied below.
+    parent_prefix = kwargs.pop("prefix", "")
+    own_name = kwargs.pop("name", "")
+    kwargs.pop("i", None)
+    if parent_prefix and own_name:
+        prefix = f"{parent_prefix}.{own_name}"
+    else:
+        prefix = parent_prefix or own_name
+
+    mapped_modules = {
+        name: map(
+            module,
+            func,
+            recurse=recurse,
+            leaf_only=leaf_only,
+            transformed_modules=transformed_modules,
+            i=i,
+            name=name,
+            prefix=prefix,
+            **kwargs,
+        )
+        for i, (name, module) in enumerate(module_dict.items())
+    }
+
+    return type(module_dict)(mapped_modules)
+
+
+def _create_list_wrapper(module_list, to_add):
+    """Create a new container of the same type as ``module_list`` holding ``to_add``.
+
+    Args:
+        module_list: The original container; only its type is used.
+        to_add: The transformed members, in order.
+
+    Returns:
+        A new instance of ``type(module_list)`` built from ``to_add``.
+    """
+    container_type = type(module_list)
+
+    # Built-in ``list``/``tuple`` report a generic ``(*args, **kwargs)`` signature for
+    # ``__init__`` although they accept a single iterable, so the signature check
+    # below would unpack the members and raise ``TypeError``.
+    if container_type is list or container_type is tuple:
+        return container_type(to_add)
+
+    # Constructors declaring ``*args`` (e.g. ``nn.Sequential``) take members positionally.
+    init_params = inspect.signature(container_type.__init__).parameters
+    if "args" in init_params:
+        return container_type(*to_add)
+
+    # Otherwise pass the members as one iterable (e.g. ``nn.ModuleList``).
+    return container_type(to_add)
+
+
+def _get_func_kwargs(func, **kwargs):
+    """Return the subset of ``kwargs`` whose names are parameters of ``func``.
+
+    Matching is by parameter name only, so a ``**kwargs`` parameter on ``func`` does
+    not cause unrelated keyword arguments to be kept.
+    """
+    accepted = inspect.signature(func).parameters
+    selected = {}
+    for key, value in kwargs.items():
+        if key in accepted:
+            selected[key] = value
+    return selected