openvinotoolkit
diff --git a/‎examples/pruning/torch/resnet18/README.md‎
Lines changed: 2 additions & 0 deletions b/‎examples/pruning/torch/resnet18/README.md‎
Lines changed: 2 additions & 0 deletions
diff --git a/‎examples/pruning/torch/resnet18/main.py‎
Lines changed: 89 additions & 94 deletions b/‎examples/pruning/torch/resnet18/main.py‎
Lines changed: 89 additions & 94 deletions
diff --git a/‎src/nncf/parameters.py‎
Lines changed: 1 addition & 0 deletions b/‎src/nncf/parameters.py‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎src/nncf/pruning/prune_model.py‎
Lines changed: 2 additions & 2 deletions b/‎src/nncf/pruning/prune_model.py‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎…cf/torch/function_hook/prune/__init__.py‎ ‎…/torch/function_hook/pruning/__init__.py‎src/nncf/torch/function_hook/prune/__init__.py renamed to src/nncf/torch/function_hook/pruning/__init__.py b/‎…cf/torch/function_hook/prune/__init__.py‎ ‎…/torch/function_hook/pruning/__init__.py‎src/nncf/torch/function_hook/prune/__init__.py renamed to src/nncf/torch/function_hook/pruning/__init__.py
diff --git a/‎…unction_hook/prune/magnitude/__init__.py‎ ‎…ction_hook/pruning/magnitude/__init__.py‎src/nncf/torch/function_hook/prune/magnitude/__init__.py renamed to src/nncf/torch/function_hook/pruning/magnitude/__init__.py b/‎…unction_hook/prune/magnitude/__init__.py‎ ‎…ction_hook/pruning/magnitude/__init__.py‎src/nncf/torch/function_hook/prune/magnitude/__init__.py renamed to src/nncf/torch/function_hook/pruning/magnitude/__init__.py
diff --git a/‎…ch/function_hook/prune/magnitude/algo.py‎ ‎…/function_hook/pruning/magnitude/algo.py‎src/nncf/torch/function_hook/prune/magnitude/algo.py renamed to src/nncf/torch/function_hook/pruning/magnitude/algo.py
Lines changed: 3 additions & 3 deletions b/‎…ch/function_hook/prune/magnitude/algo.py‎ ‎…/function_hook/pruning/magnitude/algo.py‎src/nncf/torch/function_hook/prune/magnitude/algo.py renamed to src/nncf/torch/function_hook/pruning/magnitude/algo.py
Lines changed: 3 additions & 3 deletions
diff --git a/‎…function_hook/prune/magnitude/modules.py‎ ‎…nction_hook/pruning/magnitude/modules.py‎src/nncf/torch/function_hook/prune/magnitude/modules.py renamed to src/nncf/torch/function_hook/pruning/magnitude/modules.py b/‎…function_hook/prune/magnitude/modules.py‎ ‎…nction_hook/pruning/magnitude/modules.py‎src/nncf/torch/function_hook/prune/magnitude/modules.py renamed to src/nncf/torch/function_hook/pruning/magnitude/modules.py
@@ -32,4 +32,6 @@ It's pretty simple. The example does not require additional preparation. It will
 
 ```bash
 python main.py
+# Or, to run regularization-based (RB) pruning:
+python main.py --mode rb
 ```
@@ -11,49 +11,54 @@
 
 import os
 import warnings
+from argparse import ArgumentParser
 from pathlib import Path
+from typing import Optional
 
 import openvino as ov
 import torch
-import torch.optim
-import torch.utils.data
-import torch.utils.data.distributed
-import torchvision.datasets as datasets
-import torchvision.models as models
-import torchvision.transforms as transforms
 from fastdownload import FastDownload
 from rich.progress import track
 from torch import nn
 from torch.jit import TracerWarning
 from torch.utils.data import DataLoader
+from torchvision import datasets
+from torchvision import transforms
+from torchvision.models import resnet18
 
 import nncf
-import nncf.parameters
-import nncf.torch
-import nncf.torch.function_hook
-import nncf.torch.function_hook.prune
-import nncf.torch.function_hook.prune.prune_model
 from nncf.parameters import PruneMode
-from nncf.torch.function_hook.prune.magnitude.schedulers import MultiStepMagnitudePruningScheduler
+from nncf.torch.function_hook.pruning.magnitude.schedulers import MultiStepMagnitudePruningScheduler
+from nncf.torch.function_hook.pruning.rb.losses import RBLoss
+from nncf.torch.function_hook.pruning.rb.schedulers import MultiStepRBPruningScheduler
 
 warnings.filterwarnings("ignore", category=TracerWarning)
 warnings.filterwarnings("ignore", category=UserWarning)
 
 BASE_MODEL_NAME = "resnet18"
 IMAGE_SIZE = 64
 BATCH_SIZE = 128
-TRAINING_EPOCHS = 2
 
 
 ROOT = Path(__file__).parent.resolve()
-BEST_CKPT_NAME = "resnet18_int8_best.pt"
 CHECKPOINT_URL = (
     "https://storage.openvinotoolkit.org/repositories/nncf/openvino_notebook_ckpts/302_resnet18_fp32_v1.pth"
 )
 DATASET_URL = "http://cs231n.stanford.edu/tiny-imagenet-200.zip"
 DATASET_PATH = Path().home() / ".cache" / "nncf" / "datasets"
 
 
+def get_argument_parser() -> ArgumentParser:
+    """
+    Build the command-line parser for this example.
+
+    The only option is ``--mode``, which accepts ``magnitude`` (the default) or ``rb``.
+
+    :return: The configured argument parser.
+    """
+    parser = ArgumentParser()
+    parser.add_argument(
+        "--mode",
+        type=str,
+        choices=["magnitude", "rb"],
+        default="magnitude",
+        help="Pruning mode to use. Choices are: magnitude, rb. Default is magnitude.",
+    )
+    return parser
+
+
 def download_dataset() -> Path:
     downloader = FastDownload(base=DATASET_PATH.resolve(), archive="downloaded", data="extracted")
     return downloader.get(DATASET_URL)
@@ -66,10 +71,10 @@ def load_checkpoint(model: nn.Module) -> tuple[nn.Module, float]:
 
 
 def get_resnet18_model(device: torch.device) -> nn.Module:
-    num_classes = 200  # 200 is for Tiny ImageNet, default is 1000 for ImageNet
-    model = models.resnet18(weights=None)
+    model = resnet18(weights=None)
     # Update the last FC layer for Tiny ImageNet number of classes.
-    model.fc = nn.Linear(in_features=512, out_features=num_classes, bias=True)
+    # 200 is for Tiny ImageNet, default is 1000 for ImageNet
+    model.fc = nn.Linear(in_features=512, out_features=200, bias=True)
     model.to(device)
     return model
 
@@ -78,6 +83,7 @@ def train_epoch(
     train_loader: DataLoader,
     model: nn.Module,
     criterion: nn.Module,
+    rb_loss: Optional[RBLoss],  # None disables the extra regularization term (magnitude mode passes None)
     optimizer: torch.optim.Optimizer,
     device: torch.device,
 ):
@@ -91,50 +97,34 @@ def train_epoch(
         # Compute output.
         output = model(images)
         loss = criterion(output, target)
-
+        if rb_loss is not None:
+            loss += rb_loss()
         # Compute gradient and do opt step.
         optimizer.zero_grad()
         loss.backward()
         optimizer.step()
 
 
-def validate(val_loader: DataLoader, model: nn.Module, device: torch.device) -> float:
-    top1_sum = 0.0
-
+@torch.no_grad()
+def validate(val_loader: DataLoader, model: nn.Module, device: torch.device) -> float:
+    """
+    Compute the top-1 accuracy of the model on the validation data.
+
+    :param val_loader: Loader yielding ``(images, target)`` batches.
+    :param model: Model to evaluate; it is switched to evaluation mode.
+    :param device: Device the batches are moved to before the forward pass.
+    :return: Top-1 accuracy in percent, i.e. ``100 * correct / total`` over all samples.
+    """
     # Switch to evaluate mode.
     model.eval()
 
-    with torch.no_grad():
-        for images, target in track(val_loader, total=len(val_loader), description="Validation:"):
-            images = images.to(device)
-            target = target.to(device)
-
-            # Compute output.
-            output = model(images)
-
-            # Measure accuracy and record loss.
-            [acc1] = accuracy(output, target, topk=(1,))
-            top1_sum += acc1.item()
-
-        num_samples = len(val_loader)
-        top1_avg = top1_sum / num_samples
-    return top1_avg
+    correct = 0
+    total = 0
 
+    for images, target in track(val_loader, total=len(val_loader), description="Validation:"):
+        images = images.to(device)
+        target = target.to(device)
 
-def accuracy(output: torch.Tensor, target: torch.tensor, topk: tuple[int, ...] = (1,)):
-    with torch.no_grad():
-        maxk = max(topk)
-        batch_size = target.size(0)
+        output = model(images)
 
-        _, pred = output.topk(maxk, 1, True, True)
-        pred = pred.t()
-        correct = pred.eq(target.view(1, -1).expand_as(pred))
+        _, preds = output.max(1)
+        correct += preds.eq(target).sum().item()
+        total += target.size(0)
 
-        res = []
-        for k in topk:
-            correct_k = correct[:k].reshape(-1).float().sum(0, keepdim=True)
-            res.append(correct_k.mul_(100.0 / batch_size))
-        return res
+    accuracy1 = 100.0 * correct / total
+    return accuracy1
 
 
 def create_data_loaders() -> tuple[DataLoader, DataLoader]:
@@ -151,23 +141,12 @@ def create_data_loaders() -> tuple[DataLoader, DataLoader]:
     train_dataset = datasets.ImageFolder(
         train_dir,
         transforms.Compose(
-            [
-                transforms.Resize(IMAGE_SIZE),
-                transforms.RandomHorizontalFlip(),
-                transforms.ToTensor(),
-                normalize,
-            ]
+            [transforms.Resize(IMAGE_SIZE), transforms.RandomHorizontalFlip(), transforms.ToTensor(), normalize]
         ),
     )
     val_dataset = datasets.ImageFolder(
         val_dir,
-        transforms.Compose(
-            [
-                transforms.Resize(IMAGE_SIZE),
-                transforms.ToTensor(),
-                normalize,
-            ]
-        ),
+        transforms.Compose([transforms.Resize(IMAGE_SIZE), transforms.ToTensor(), normalize]),
     )
 
     train_loader = DataLoader(
@@ -200,7 +179,10 @@ def prepare_tiny_imagenet_200(dataset_dir: Path) -> None:
     val_images_dir.rmdir()
 
 
-def main():
+def main() -> float:
+    args = get_argument_parser().parse_args()
+    pruning_mode = args.mode
+
     torch.manual_seed(0)
     device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
     print(f"Using {device} device")
@@ -212,51 +194,64 @@ def main():
     model = get_resnet18_model(device)
     model, acc1_fp32 = load_checkpoint(model)
 
-    print(f"Accuracy@1 of original FP32 model: {acc1_fp32}")
+    print(f"Accuracy@1 of original FP32 model: {acc1_fp32:.2f}")
 
     train_loader, val_loader = create_data_loaders()
     example_input = torch.rand(1, 3, IMAGE_SIZE, IMAGE_SIZE).to(device)
 
     ###############################################################################
     # Step 2: Prune model
-    print(os.linesep + "[Step 2] Prune model")
-
-    # Unstructured pruning with 70% sparsity ratio
-    pruned_model = nncf.prune(
-        model,
-        mode=PruneMode.UNSTRUCTURED_MAGNITUDE_GLOBAL,
-        ratio=0.7,
-        ignored_scope=nncf.IgnoredScope(),
-        examples_inputs=example_input,
-    )
-
-    acc1_init = validate(val_loader, pruned_model, device)
-
-    print(f"Accuracy@1 of pruned model with 0.7 pruning ratio without fine-tuning: {acc1_init:.3f}")
-
-    ###############################################################################
-    # Step 3: Fine tune with multi step sparsity scheduler
-    print(os.linesep + "[Step 3] Fine tune with multi step sparsity scheduler")
+    print(os.linesep + "[Step 2]: Prune model and specify training parameters")
+
+    if pruning_mode == "magnitude":
+        pruned_model = nncf.prune(
+            model,
+            mode=PruneMode.UNSTRUCTURED_MAGNITUDE_GLOBAL,
+            ratio=0.7,
+            ignored_scope=nncf.IgnoredScope(),
+            examples_inputs=example_input,
+        )
+        num_epochs = 2
+        rb_loss = None
+        # Build the scheduler on pruned_model, the same object that is optimized, trained and validated below.
+        scheduler = MultiStepMagnitudePruningScheduler(
+            model=pruned_model, mode=PruneMode.UNSTRUCTURED_MAGNITUDE_GLOBAL, steps={0: 0.5, 1: 0.7}
+        )
+        optimizer = torch.optim.Adam(pruned_model.parameters(), lr=1e-5)
+    else:
+        pruned_model = nncf.prune(
+            model,
+            mode=PruneMode.UNSTRUCTURED_REGULARIZATION_BASED,
+            ignored_scope=nncf.IgnoredScope(),
+            examples_inputs=example_input,
+        )
+        num_epochs = 30
+        rb_loss = RBLoss(pruned_model, target_ratio=0.7, p=0.1).to(device)
+        scheduler = MultiStepRBPruningScheduler(rb_loss, steps={0: 0.3, 5: 0.5, 10: 0.7})
+
+        # Set higher lr for mask parameters to achieve the target pruning ratio faster
+        mask_params = [p for n, p in pruned_model.named_parameters() if "mask" in n]
+        model_params = [p for n, p in pruned_model.named_parameters() if "mask" not in n]
+        optimizer = torch.optim.Adam(
+            [
+                {"params": model_params, "lr": 1e-5},
+                {"params": mask_params, "lr": 1e-2, "weight_decay": 0.0},
+            ]
+        )
 
-    # Define loss function (criterion) and optimizer.
     criterion = nn.CrossEntropyLoss().to(device)
-    compression_lr = 1e-5
-    optimizer = torch.optim.Adam(pruned_model.parameters(), lr=compression_lr)
 
-    # Create prune scheduler with multi steps strategy
-    pruning_scheduler = MultiStepMagnitudePruningScheduler(
-        pruned_model, mode=PruneMode.UNSTRUCTURED_MAGNITUDE_GLOBAL, steps={0: 0.6, 1: 0.7}
-    )
+    ###############################################################################
+    # Step 3: Fine tune
+    print(os.linesep + "[Step 3] Fine tune with multi step pruning ratio scheduler")
 
-    for epoch in range(2):
+    for epoch in range(num_epochs):
         print(os.linesep + f"Train epoch: {epoch}")
+        scheduler.step()
+        train_epoch(train_loader, pruned_model, criterion, rb_loss, optimizer, device=device)
 
-        pruning_scheduler.step()
-
-        train_epoch(train_loader, pruned_model, criterion, optimizer, device=device)
         acc1 = validate(val_loader, pruned_model, device)
-        # Show statistics of pruning
-        print(f"Accuracy@1 of pruned model after {epoch} epoch ratio {pruning_scheduler.current_ratio}: {acc1:.3f}")
+        print(f"Current pruning ratio: {scheduler.current_ratio:.3f}")
+        print(f"Accuracy@1 of pruned model after {epoch} epoch: {acc1:.3f}")
 
     ###############################################################################
     # Step 4: Export models
 
@@ -221,3 +221,4 @@ class QuantizationMode(StrEnum):
 class PruneMode(StrEnum):
     UNSTRUCTURED_MAGNITUDE_LOCAL = auto()
     UNSTRUCTURED_MAGNITUDE_GLOBAL = auto()
+    UNSTRUCTURED_REGULARIZATION_BASED = auto()
@@ -23,7 +23,7 @@ def prune(
     model: TModel,
     *,
     mode: PruneMode,
-    ratio: float,
+    ratio: Optional[float] = None,
     ignored_scope: Optional[IgnoredScope] = None,
     examples_inputs: Optional[Any] = None,
 ) -> TModel:
@@ -40,7 +40,7 @@ def prune(
     """
     backend = get_backend(model)
     if backend == BackendType.TORCH:
-        from nncf.torch.function_hook.prune.prune_model import prune
+        from nncf.torch.function_hook.pruning.prune_model import prune
 
         model = prune(model, mode, ratio, ignored_scope, examples_inputs)
     else:
 
@@ -15,7 +15,7 @@
 import nncf
 from nncf.parameters import PruneMode
 from nncf.torch.function_hook.hook_storage import decode_hook_name
-from nncf.torch.function_hook.prune.magnitude.modules import UnstructuredPruningMask
+from nncf.torch.function_hook.pruning.magnitude.modules import UnstructuredPruningMask
 from nncf.torch.function_hook.wrapper import get_hook_storage
 from nncf.torch.function_hook.wrapper import register_post_function_hook
 from nncf.torch.model_graph_manager import get_const_data_by_name
@@ -114,7 +114,7 @@ def update_pruning_ratio(
             new_mask = (abs_data > threshold).to(dtype=torch.bool)
 
             # Set new mask
-            hook.binary_mask = new_mask
+            hook.binary_mask.copy_(new_mask)
 
     elif mode == PruneMode.UNSTRUCTURED_MAGNITUDE_GLOBAL:
         # Get threshold value for all normalized weights
@@ -135,7 +135,7 @@ def update_pruning_ratio(
             new_mask = (norm_data > threshold_val).to(dtype=torch.bool)
 
             # Set new mask
-            hook.binary_mask = new_mask
+            hook.binary_mask.copy_(new_mask)
     else:
         msg = f"Unsupported pruning mode: {mode}"
         raise nncf.InternalError(msg)