1 change: 0 additions & 1 deletion requirements.txt
@@ -1,5 +1,4 @@
 celluloid>=0.2.0
-deepspeed>=0.12.4
 librosa>=0.10.1
 matplotlib>=3.8.1
 numpy>=1.26.2
14 changes: 4 additions & 10 deletions resemble_enhance/denoiser/inference.py
@@ -4,23 +4,17 @@
 import torch

 from ..inference import inference
-from .train import Denoiser, HParams
+from .safetensors_loader import load_denoiser_model, create_default_denoiser
+from .hparams import HParams

 logger = logging.getLogger(__name__)


 @cache
 def load_denoiser(run_dir, device):
     if run_dir is None:
-        return Denoiser(HParams())
-    hp = HParams.load(run_dir)
-    denoiser = Denoiser(hp)
-    path = run_dir / "ds" / "G" / "default" / "mp_rank_00_model_states.pt"
-    state_dict = torch.load(path, map_location="cpu")["module"]
-    denoiser.load_state_dict(state_dict)
-    denoiser.eval()
-    denoiser.to(device)
-    return denoiser
+        return create_default_denoiser(device)
+    return load_denoiser_model(run_dir, device)


 @torch.inference_mode()
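
For review context, a minimal sketch of how the reworked load_denoiser behaves (the run directory name here is illustrative, not fixed by this PR):

    from pathlib import Path
    from resemble_enhance.denoiser.inference import load_denoiser

    # run_dir=None -> untrained model with default hyperparameters
    model = load_denoiser(None, "cpu")

    # A run_dir containing model.safetensors + config.json takes the new
    # safetensors path; one containing ds/G/... falls back to the legacy
    # DeepSpeed checkpoint loader.
    model = load_denoiser(Path("model_repo/denoiser"), "cuda")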
247 changes: 247 additions & 0 deletions resemble_enhance/denoiser/safetensors_loader.py
@@ -0,0 +1,247 @@
"""
Enhanced model loader for denoiser with safetensors support and JSON configs.
Provides efficient loading without state_dict filtering when using safetensors.
"""
import json
import logging
from pathlib import Path
from typing import Dict, Any, Union

import torch
from safetensors.torch import load_file

from .denoiser import Denoiser
from .hparams import HParams

logger = logging.getLogger(__name__)


class JSONConfig:
"""Simple config class that works with JSON files instead of OmegaConf."""

def __init__(self, config_dict: Dict[str, Any]):
self._config = config_dict
# Set attributes for easy access
for key, value in config_dict.items():
if isinstance(value, dict):
setattr(self, key, JSONConfig(value))
else:
setattr(self, key, value)

@classmethod
def load(cls, json_path: Union[str, Path]) -> 'JSONConfig':
"""Load config from JSON file."""
with open(json_path, 'r') as f:
config_dict = json.load(f)
return cls(config_dict)

def get(self, key: str, default=None):
"""Get config value with default."""
return getattr(self, key, default)

def to_dict(self) -> Dict[str, Any]:
"""Convert back to dictionary."""
return self._config
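
# Illustrative usage of JSONConfig (the keys shown are hypothetical examples,
# not a required schema):
#     cfg = JSONConfig.load("config.json")  # e.g. {"wav_rate": 44100, "distort": {"p": 0.2}}
#     cfg.wav_rate                 # 44100 -- nested dicts become JSONConfig attributes
#     cfg.distort.p                # 0.2
#     cfg.get("missing_key", 0.5)  # 0.5  -- default when the key is absent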


def load_denoiser_from_safetensors(model_dir: Union[str, Path], device: str = "cpu") -> Denoiser:
"""Load denoiser model from safetensors format.

Args:
model_dir: Directory containing model.safetensors and config.json
device: Device to load the model on

Returns:
Loaded Denoiser model
"""
model_path = Path(model_dir)

# Load config
config_path = model_path / "config.json"
if not config_path.exists():
raise FileNotFoundError(f"Config file not found: {config_path}")

config = JSONConfig.load(config_path)

# Create HParams with default values, then update from config
hp = HParams()

# For frozen dataclasses, we need to use object.__setattr__
config_dict = config.to_dict()
for key, value in config_dict.items():
if hasattr(hp, key):
try:
object.__setattr__(hp, key, value)
except Exception:
logger.warning(f"Could not set {key}={value} on HParams")

# Create model
model = Denoiser(hp)

# Load weights from safetensors
weights_path = model_path / "model.safetensors"
if not weights_path.exists():
raise FileNotFoundError(f"Model weights not found: {weights_path}")

state_dict = load_file(weights_path, device=device)

# No filtering needed - safetensors already contains only denoiser weights
model.load_state_dict(state_dict)
model.eval()
model.to(device)

logger.info(f"Loaded denoiser model from safetensors: {model_path}")
return model
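
# On-disk layout this loader expects (the directory name is illustrative):
#     <model_dir>/
#         config.json          # flat JSON of HParams fields
#         model.safetensors    # denoiser-only weights, so no prefix filtering
# Usage: model = load_denoiser_from_safetensors("model_repo/denoiser", device="cuda")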


def load_denoiser_model(run_dir: Union[str, Path, None], device: str = "cpu") -> Denoiser:
"""Load denoiser model from either safetensors or DeepSpeed checkpoint.

Args:
run_dir: Path to model directory (safetensors) or checkpoint directory (DeepSpeed)
device: Device to load the model on

Returns:
Loaded Denoiser model
"""
if run_dir is None:
return create_default_denoiser(device)

run_dir = Path(run_dir)

# Check if this is a safetensors model directory
if (run_dir / "model.safetensors").exists() and (run_dir / "config.json").exists():
logger.info("Loading denoiser from safetensors format")
return load_denoiser_from_safetensors(run_dir, device)

# Fall back to DeepSpeed checkpoint loading
logger.info("Loading denoiser from DeepSpeed checkpoint format")
return load_denoiser_from_deepspeed(run_dir, device)


def load_denoiser_from_deepspeed(run_dir: Path, device: str = "cpu") -> Denoiser:
"""Load denoiser model from DeepSpeed checkpoint (legacy format).

Args:
run_dir: Path to the model checkpoint directory
device: Device to load the model on

Returns:
Loaded Denoiser model ready for inference
"""
# Load hparams
hparams_path = run_dir / "hparams.yaml"
if not hparams_path.exists():
logger.warning(f"hparams.yaml not found in {run_dir}, using defaults")
hp = HParams()
else:
hp = HParams.load(run_dir)

# Create model
model = Denoiser(hp)

# Load the state dict from DeepSpeed checkpoint
ckpt_path = run_dir / "ds" / "G" / "default" / "mp_rank_00_model_states.pt"
if not ckpt_path.exists():
logger.warning(f"Model checkpoint not found at {ckpt_path}, returning default model")
return create_default_denoiser(device)

state_dict = torch.load(ckpt_path, map_location="cpu")["module"]
model.load_state_dict(state_dict)
model.eval()
model.to(device)

logger.info(f"Loaded denoiser model from DeepSpeed checkpoint: {run_dir}")
return model
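
# Legacy checkpoint layout this fallback reads (paths taken from the code above):
#     run_dir/
#         hparams.yaml                               # optional; defaults used if absent
#         ds/G/default/mp_rank_00_model_states.pt    # dict holding the state_dict under "module"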


def load_denoiser_from_enhancer_checkpoint(run_dir: Union[str, Path, None], device: str = "cpu") -> Denoiser:
"""Load denoiser model from an enhancer checkpoint.

This extracts the denoiser weights from an enhancer checkpoint that contains
both enhancer and denoiser weights.

Args:
run_dir: Path to the enhancer checkpoint directory (None for default model)
device: Device to load the model on

Returns:
Loaded Denoiser model ready for inference
"""
# If no run_dir provided, create default model
if run_dir is None:
return create_default_denoiser(device)

run_dir = Path(run_dir)

    # Check for a sibling safetensors denoiser directory next to the enhancer run.
    # (Path.parent is never falsy, so no separate guard is needed.)
    denoiser_safetensors_dir = run_dir.parent / "denoiser"
    if ((denoiser_safetensors_dir / "model.safetensors").exists() and
            (denoiser_safetensors_dir / "config.json").exists()):
logger.info("Loading denoiser from separate safetensors directory")
return load_denoiser_from_safetensors(denoiser_safetensors_dir, device)

# Try to load denoiser hparams first, fall back to enhancer hparams
denoiser_hp_path = run_dir / "denoiser_hparams.yaml"
if denoiser_hp_path.exists():
hp = HParams.load(denoiser_hp_path)
else:
# Load enhancer hparams and use denoiser settings from it
from ..enhancer.hparams import HParams as EnhancerHParams
enhancer_hp_path = run_dir / "hparams.yaml"
if enhancer_hp_path.exists():
enhancer_hp = EnhancerHParams.load(run_dir)

# Create denoiser hparams from enhancer config
hp = HParams()
# Copy relevant settings if they exist
if hasattr(enhancer_hp, 'denoiser_run_dir') and enhancer_hp.denoiser_run_dir:
denoiser_run_dir = Path(enhancer_hp.denoiser_run_dir)
if (denoiser_run_dir / "hparams.yaml").exists():
hp = HParams.load(denoiser_run_dir)
else:
# No hparams found, use default
hp = HParams()

model = Denoiser(hp)

# Load the state dict from enhancer checkpoint
ckpt_path = run_dir / "ds" / "G" / "default" / "mp_rank_00_model_states.pt"
if not ckpt_path.exists():
# No checkpoint found, return default model
return create_default_denoiser(device)

state_dict = torch.load(ckpt_path, map_location="cpu")["module"]

# Extract only denoiser weights
denoiser_state_dict = {k.replace('denoiser.', '', 1): v for k, v in state_dict.items() if k.startswith('denoiser.')}

if not denoiser_state_dict:
# No denoiser weights found, return default model
logger.warning("No denoiser weights found in enhancer checkpoint, using default model")
return create_default_denoiser(device)

model.load_state_dict(denoiser_state_dict)
model.eval()
model.to(device)

logger.info(f"Loaded denoiser from enhancer checkpoint: {run_dir}")
return model
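
# Prefix handling above, by example (the key names are illustrative):
#     "denoiser.unet.conv1.weight" -> kept as "unet.conv1.weight"
#     "lcfm.ae.enc.weight"         -> skipped (no "denoiser." prefix)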


def create_default_denoiser(device: str = "cpu") -> Denoiser:
"""Create a default denoiser model with default hyperparameters.

Args:
device: Device to create the model on

Returns:
Default Denoiser model (not trained)
"""
hp = HParams()
model = Denoiser(hp)
model.eval()
model.to(device)
logger.info("Created default denoiser model")
return model
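
For reviewers, a minimal sketch (not part of this PR) of how a model directory in the layout load_denoiser_from_safetensors expects might be produced from a DeepSpeed checkpoint. The helper name is hypothetical; it assumes HParams is a dataclass and that enhancer checkpoints use the "denoiser." prefix handled above:

    import json
    from dataclasses import asdict
    from pathlib import Path

    import torch
    from safetensors.torch import save_file

    def export_denoiser_safetensors(ckpt_path, hp, out_dir):
        """Write model.safetensors + config.json from a DeepSpeed checkpoint."""
        state_dict = torch.load(ckpt_path, map_location="cpu")["module"]
        # Keep denoiser weights only and strip the prefix, mirroring
        # load_denoiser_from_enhancer_checkpoint; a plain denoiser
        # checkpoint could skip this filtering step.
        tensors = {
            k.replace("denoiser.", "", 1): v.contiguous()
            for k, v in state_dict.items()
            if k.startswith("denoiser.")
        }
        out = Path(out_dir)
        out.mkdir(parents=True, exist_ok=True)
        save_file(tensors, str(out / "model.safetensors"))
        # default=str covers non-JSON values (e.g. Path fields) in HParams.
        with open(out / "config.json", "w") as f:
            json.dump(asdict(hp), f, indent=2, default=str)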
22 changes: 21 additions & 1 deletion resemble_enhance/enhancer/download.py
@@ -11,14 +11,34 @@
 def get_source_url(relpath):
     return f"https://huggingface.co/ResembleAI/resemble-enhance/resolve/main/{RUN_NAME}/{relpath}?download=true"

+def get_safetensors_url(relpath):
+    return f"https://huggingface.co/rsxdalv/resemble-enhance/resolve/main/{relpath}?download=true"
+
 def get_target_path(relpath: str | Path, run_dir: str | Path | None = None):
     if run_dir is None:
         run_dir = Path(__file__).parent.parent / "model_repo" / RUN_NAME
     return Path(run_dir) / relpath


-def download(run_dir: str | Path | None = None):
+def download(run_dir: str | Path | None = None, safetensors: bool = False) -> Path:
+    relpaths_safetensors = [
+        "denoiser/config.json",
+        "denoiser/model.safetensors",
+        "denoiser/model_info.json",
+        "enhancer/config.json",
+        "enhancer/model.safetensors",
+        "enhancer/model_info.json",
+    ]
+    if safetensors:
+        for relpath in relpaths_safetensors:
+            path = get_target_path(relpath, run_dir=run_dir)
+            if path.exists():
+                continue
+            url = get_safetensors_url(relpath)
+            path.parent.mkdir(parents=True, exist_ok=True)
+            torch.hub.download_url_to_file(url, str(path))
+        return get_target_path("", run_dir=run_dir)
+
     relpaths = ["hparams.yaml", "ds/G/latest", "ds/G/default/mp_rank_00_model_states.pt"]
     for relpath in relpaths:
         path = get_target_path(relpath, run_dir=run_dir)
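
A brief usage sketch of the new flag (illustrative; the legacy branch is truncated in this diff):

    from resemble_enhance.enhancer.download import download

    # Fetch the safetensors denoiser/ and enhancer/ directories, skipping
    # files already on disk, and return the model-repo root path.
    root = download(safetensors=True)
    denoiser_dir = root / "denoiser"  # usable with load_denoiser_from_safetensors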