diff --git a/BACKWARDS_COMPATIBILITY_FIXED.md b/BACKWARDS_COMPATIBILITY_FIXED.md
new file mode 100644
index 0000000..e69de29
diff --git a/CONFIG_IMPROVEMENT.md b/CONFIG_IMPROVEMENT.md
index c50ff47..e69de29 100644
--- a/CONFIG_IMPROVEMENT.md
+++ b/CONFIG_IMPROVEMENT.md
@@ -1,176 +0,0 @@
-# MuMDIA Configuration Management Improvement
-
-## The Problem
-The original `run.py` had extremely complex argument parsing and configuration management:
-
-- **~100 lines** of argument parsing code
-- **Complex merging logic** between CLI args and config files  
-- **Difficult to maintain** argument parsing functions
-- **Hard to understand** configuration flow
-- **Manual config validation** and error handling
-
-## The Solution: Simplified Configuration with Dataclasses
-
-### Before (Complex approach in `run.py`):
-
-```python
-def parse_arguments() -> Tuple[argparse.ArgumentParser, argparse.Namespace]:
-    """Parse command line arguments - 50+ lines of argparse setup"""
-    parser = argparse.ArgumentParser()
-    parser.add_argument("--mzml_file", type=str, help="Path to mzML file", default=None)
-    parser.add_argument("--fasta_file", type=str, help="Path to FASTA file", default=None)
-    # ... 30+ more arguments ...
-    args = parser.parse_args()
-    return parser, args
-
-def was_arg_explicitly_provided(parser: argparse.ArgumentParser, arg_name: str) -> bool:
-    """Check if argument was explicitly provided - complex logic"""
-    for action in parser._actions:
-        if arg_name in action.dest:
-            for option in action.option_strings:
-                if option in sys.argv:
-                    return True
-    return False
-
-def modify_config(parser: argparse.ArgumentParser, args: argparse.Namespace, config_path: str) -> Dict[str, Any]:
-    """Load and modify config - 50+ lines of complex merging logic"""
-    # Load base config from JSON
-    # Override with CLI args using complex checking
-    # Save effective config
-    # Return merged config dict
-
-# In main():
-parser, args = parse_arguments()
-config = modify_config(parser, args, args.config_file)
-# Extract all individual values from config dict
-mzml_file = config["mzml_file"]
-fasta_file = config["fasta_file"]
-# ... dozens more extractions ...
-```
-
-### After (Clean dataclass approach in `config_manager_clean.py`):
-
-```python
-@dataclass
-class MuMDIAConfig:
-    """Clean, type-safe configuration with defaults"""
-    mzml_file: str = ""
-    fasta_file: str = ""
-    result_dir: str = "results"
-    n_windows: int = 10
-    training_fdr: float = 0.05
-    final_fdr: float = 0.01
-    model_type: str = "xgboost"
-    no_cache: bool = False
-    clean: bool = False
-    sage_only: bool = False
-    # ... all options clearly defined
-
-    @classmethod
-    def from_json(cls, json_path: str) -> "MuMDIAConfig":
-        """Simple JSON loading with error handling"""
-        
-    @classmethod  
-    def from_args(cls, args=None) -> "MuMDIAConfig":
-        """Simple CLI parsing with config file support"""
-        
-    def validate(self) -> None:
-        """Clean validation logic"""
-
-def get_config() -> MuMDIAConfig:
-    """One-liner to get validated config"""
-    config = MuMDIAConfig.from_args()
-    config.validate()
-    return config
-
-# In main():
-config = get_config()  # That's it! One line replaces 100+ lines!
-# Direct attribute access:
-print(config.mzml_file)
-print(config.n_windows)
-```
-
-## Key Improvements
-
-### 1. **Dramatic Code Reduction**
-- **Before**: ~100 lines of complex parsing logic
-- **After**: 1 line: `config = get_config()`
-- **Reduction**: 99% fewer lines for config management!
-
-### 2. **Type Safety** 
-- **Before**: Untyped dictionary access like `config["mzml_file"]`
-- **After**: Type-safe attribute access like `config.mzml_file`
-- **Benefit**: IDE autocomplete, type checking, fewer runtime errors
-
-### 3. **Clear Defaults**
-- **Before**: Defaults scattered across argparse definitions
-- **After**: All defaults clearly visible in dataclass definition
-- **Benefit**: Easy to see and modify default values
-
-### 4. **Better Error Handling**
-- **Before**: Manual validation scattered throughout code
-- **After**: Centralized validation in `validate()` method
-- **Benefit**: Consistent error messages and validation logic
-
-### 5. **Simpler Usage Patterns**
-
-#### Command line usage:
-```bash
-# Simple usage
-python run_simple.py --mzml_file data.mzML --fasta_file proteins.fasta
-
-# With options
-python run_simple.py --mzml_file data.mzML --fasta_file proteins.fasta --n_windows 5 --verbose --no-cache
-
-# With config file
-python run_simple.py --config_file my_config.json
-
-# Config file with CLI overrides 
-python run_simple.py --config_file my_config.json --clean --result_dir custom_results
-```
-
-#### JSON config files:
-```json
-{
-  "mzml_file": "data.mzML",
-  "fasta_file": "proteins.fasta", 
-  "result_dir": "my_results",
-  "n_windows": 15,
-  "training_fdr": 0.1,
-  "model_type": "nn",
-  "verbose": true
-}
-```
-
-## Implementation Status
-
-✅ **Created**: `config_manager_clean.py` - Complete simplified config system
-✅ **Created**: `run_simple.py` - Demo of clean config usage
-✅ **Created**: `config_demo.py` - Working demonstration
-✅ **Tested**: Both CLI arguments and JSON config files work perfectly
-
-## Migration Path
-
-The new config system is **fully backwards compatible**. You can:
-
-1. **Immediate adoption**: Use `config_manager_clean.py` for new features
-2. **Gradual migration**: Replace complex config logic piece by piece  
-3. **Side-by-side**: Run both systems during transition period
-
-## Developer Experience Impact
-
-**Before**: Developers had to:
-- Navigate 100+ lines of complex argument parsing
-- Understand config merging logic  
-- Manually handle validation
-- Debug dictionary key errors
-- Maintain scattered default values
-
-**After**: Developers can:
-- See all configuration at a glance in the dataclass
-- Get IDE support with autocomplete and type checking
-- Add new config options by just adding a dataclass field
-- Trust that validation is centralized and consistent
-- Focus on business logic instead of configuration plumbing
-
-The new approach makes MuMDIA **much more maintainable and developer-friendly**!
diff --git a/CONFIG_SIMPLIFIED_COMPLETE.md b/CONFIG_SIMPLIFIED_COMPLETE.md
new file mode 100644
index 0000000..e69de29
diff --git a/config.py b/config.py
new file mode 100644
index 0000000..afa2462
--- /dev/null
+++ b/config.py
@@ -0,0 +1,540 @@
+#!/usr/bin/env python3
+"""
+Simplified MuMDIA Configuration System
+
+This module provides a simplified, flat configuration system that replaces the previous
+complex nested configuration. Key features:
+
+1. Single flat parameter structure instead of nested sections
+2. Override mechanism using suffixes (_initial_search, _full_search)  
+3. Automatic default values for all parameters
+4. Backwards compatibility with existing workflow code
+"""
+
+from dataclasses import dataclass, field
+from typing import Dict, Any, List, Optional
+import json
+
+import argparse
+import json
+import os
+from dataclasses import dataclass, field, asdict
+from pathlib import Path
+from typing import Dict, Any, Optional, Union, List
+import sys
+
+
+def convert_legacy_config(legacy_data: Dict[str, Any]) -> Dict[str, Any]:
+    """Convert old nested config format to new flat format."""
+    flat_data = {}
+    
+    # Extract basic parameters from sage_basic section
+    if "sage_basic" in legacy_data:
+        sage_basic = legacy_data["sage_basic"]
+        
+        # Extract file paths
+        if "mzml_paths" in sage_basic and sage_basic["mzml_paths"]:
+            flat_data["mzml_file"] = sage_basic["mzml_paths"][0]
+        
+        # Extract database parameters
+        if "database" in sage_basic:
+            db = sage_basic["database"]
+            if "fasta" in db:
+                flat_data["fasta_file"] = db["fasta"]
+            if "enzyme" in db:
+                enzyme = db["enzyme"]
+                flat_data["missed_cleavages"] = enzyme.get("missed_cleavages", 2)
+                flat_data["cleave_at"] = enzyme.get("cleave_at", "KR")
+            flat_data["max_variable_mods"] = db.get("max_variable_mods", 1)
+        
+        # Extract other sage_basic parameters
+        flat_data["deisotope"] = sage_basic.get("deisotope", False)
+        flat_data["chimera"] = sage_basic.get("chimera", True)
+        flat_data["wide_window"] = sage_basic.get("wide_window", True)
+        flat_data["report_psms"] = sage_basic.get("report_psms", 5)
+    
+    # Extract full search overrides from sage section
+    if "sage" in legacy_data:
+        sage = legacy_data["sage"]
+        
+        # Full search specific parameters
+        flat_data["deisotope_full_search"] = sage.get("deisotope", True)
+        flat_data["report_psms_full_search"] = sage.get("report_psms", 12)
+        
+        if "database" in sage:
+            db = sage["database"]
+            if "enzyme" in db and "cleave_at" in db["enzyme"]:
+                flat_data["cleave_at_initial_search"] = db["enzyme"]["cleave_at"]
+            flat_data["max_variable_mods_full_search"] = db.get("max_variable_mods", 2)
+    
+    # Extract MuMDIA parameters - only include fields that exist in MuMDIAConfig
+    mumdia_field_mapping = {
+        "write_deeplc_pickle": "write_deeplc_pickle",
+        "write_ms2pip_pickle": "write_ms2pip_pickle", 
+        "write_correlation_pickles": "write_correlation_pickles",
+        "write_initial_search_pickle": "write_initial_search_pickle",
+        "write_full_search_pickle": "write_full_search_pickle",
+        "read_deeplc_pickle": "read_deeplc_pickle",
+        "read_ms2pip_pickle": "read_ms2pip_pickle",
+        "read_correlation_pickles": "read_correlation_pickles",
+        "read_full_search_pickles": "read_full_search_pickle",  # Fix plural->singular
+        "read_initial_search_pickle": "read_initial_search_pickle",
+        "remove_intermediate_files": "remove_intermediate_files",
+        "fdr_init_search": "fdr_init_search",
+    }
+    
+    if "mumdia" in legacy_data:
+        mumdia = legacy_data["mumdia"]
+        for old_key, new_key in mumdia_field_mapping.items():
+            if old_key in mumdia:
+                flat_data[new_key] = mumdia[old_key]
+    
+    # Set default result_dir if not present
+    if "result_dir" not in flat_data:
+        flat_data["result_dir"] = "results"
+    
+    return flat_data
+
+
+def load_config_from_json(json_path: str) -> 'MuMDIAConfig':
+    """Load configuration from JSON file, supporting both old and new formats."""
+    with open(json_path, 'r') as f:
+        config_data = json.load(f)
+    
+    # Check if this is the old nested format
+    if "sage_basic" in config_data or "sage" in config_data or "mumdia" in config_data:
+        print(f"🔄 Converting legacy config format to new simplified format...")
+        config_data = convert_legacy_config(config_data)
+    
+    # Filter out comment fields (fields starting with _comment)
+    filtered_data = {k: v for k, v in config_data.items() if not k.startswith('_comment')}
+    
+    return MuMDIAConfig(**filtered_data)
+
+
+@dataclass
+class MuMDIAConfig:
+    """
+    Simplified MuMDIA configuration with smart defaults and override mechanism.
+    
+    Parameters can be overridden for specific search types using suffixes:
+    - parameter_initial_search: Override for initial search only
+    - parameter_full_search: Override for full search only
+    - parameter: Default value used for both if no specific override
+    """
+    
+    # === File paths ===
+    mzml_file: str = ""
+    fasta_file: str = ""
+    mgf_file: str = ""
+    result_dir: str = "results"
+    config_file: str = "configs/config.json"
+    
+    # === Search parameters ===
+    # Database settings
+    bucket_size: int = 1024
+    bucket_size_initial_search: Optional[int] = None
+    bucket_size_full_search: Optional[int] = None
+    
+    # Enzyme settings
+    missed_cleavages: int = 2
+    missed_cleavages_initial_search: Optional[int] = None
+    missed_cleavages_full_search: Optional[int] = None
+    
+    min_len: int = 6
+    max_len: int = 30
+    cleave_at: str = "KR"
+    cleave_at_initial_search: str = "$"  # Different default for initial search
+    cleave_at_full_search: Optional[str] = None
+    
+    restrict: str = "P"
+    c_terminal: bool = True
+    
+    # Mass ranges
+    fragment_min_mz: float = 100.0
+    fragment_max_mz: float = 2500.0
+    peptide_min_mass: float = 300.0
+    peptide_max_mass: float = 5000.0
+    
+    # Ion settings
+    ion_kinds: List[str] = field(default_factory=lambda: ["b", "y"])
+    min_ion_index: int = 2
+    max_fragment_charge: int = 1
+    
+    # Modifications
+    static_mods: Dict[str, float] = field(default_factory=lambda: {"C": 57.0215})
+    variable_mods: Dict[str, List[float]] = field(default_factory=lambda: {"M": [15.9949]})
+    max_variable_mods: int = 1
+    max_variable_mods_initial_search: Optional[int] = None
+    max_variable_mods_full_search: int = 2  # Different default for full search
+    
+    # Decoys
+    decoy_tag: str = "rev_"
+    generate_decoys: bool = True
+    
+    # Tolerances
+    precursor_tol_da_low: float = -40.0
+    precursor_tol_da_high: float = 40.0
+    fragment_tol_ppm_low: float = -13.0
+    fragment_tol_ppm_high: float = 13.0
+    
+    # Charge and isotope settings
+    precursor_charge_min: int = 1
+    precursor_charge_max: int = 4
+    isotope_errors_min: int = -1
+    isotope_errors_max: int = 1
+    
+    # Processing settings
+    deisotope: bool = False
+    deisotope_initial_search: Optional[bool] = None
+    deisotope_full_search: bool = True  # Different default for full search
+    
+    annotate_matches: bool = True
+    chimera: bool = True
+    predict_rt: bool = False
+    wide_window: bool = True
+    
+    # Peak settings
+    min_peaks: int = 0
+    max_peaks: int = 10000
+    min_matched_peaks: int = 5
+    
+    # Reporting
+    report_psms: int = 5
+    report_psms_initial_search: Optional[int] = None
+    report_psms_full_search: int = 12  # Different default for full search
+    
+    # === MuMDIA-specific settings ===
+    # Pickle settings
+    write_deeplc_pickle: bool = True
+    write_ms2pip_pickle: bool = True
+    write_correlation_pickles: bool = True
+    write_initial_search_pickle: bool = True
+    write_full_search_pickle: bool = True
+    read_deeplc_pickle: bool = False
+    read_ms2pip_pickle: bool = False
+    read_correlation_pickles: bool = False
+    read_full_search_pickle: bool = False
+    read_initial_search_pickle: bool = False
+    
+    # Processing settings
+    remove_intermediate_files: bool = False
+    dlc_transfer_learn: bool = False
+    fdr_init_search: float = 0.01
+    
+    # ML settings
+    n_windows: int = 10
+    training_fdr: float = 0.01
+    final_fdr: float = 0.01
+    model_type: str = "xgboost"
+    
+    # Runtime flags
+    no_cache: bool = False
+    clean: bool = False
+    sage_only: bool = False
+    skip_mokapot: bool = False
+    verbose: bool = False
+    
+    # Feature settings
+    rescoring_features: List[str] = field(default_factory=lambda: [
+        "distribution_correlation_matrix_psm_ids",
+        "distribution_correlation_matrix_frag_ids", 
+        "distribution_correlation_individual",
+        "top_correlation_individual",
+        "top_correlation_matrix_frag_ids",
+        "top_correlation_matrix_psm_ids"
+    ])
+    
+    # Column processing settings (simplified from current complex structure)
+    collapse_max_columns: List[str] = field(default_factory=lambda: [
+        "fragment_ppm", "rank", "delta_next", "delta_rt_model",
+        "matched_peaks", "longest_b", "longest_y", "matched_intensity_pct",
+        "fragment_intensity", "poisson", "spectrum_q", "peptide_q", "protein_q",
+        "rt", "rt_predictions", "rt_prediction_error_abs", 
+        "rt_prediction_error_abs_relative", "precursor_ppm", "hyperscore", "delta_best"
+    ])
+    
+    def get_parameter_value(self, param_name: str, search_type: str) -> Any:
+        """
+        Get the effective value for a parameter considering override hierarchy.
+        
+        Args:
+            param_name: Base parameter name (e.g., 'cleave_at')
+            search_type: 'initial_search' or 'full_search'
+            
+        Returns:
+            The effective parameter value
+        """
+        # Check for specific override first
+        specific_override = f"{param_name}_{search_type}"
+        if hasattr(self, specific_override):
+            value = getattr(self, specific_override)
+            if value is not None:
+                return value
+        
+        # Fall back to base parameter
+        return getattr(self, param_name)
+    
+    def get_initial_search_config(self) -> Dict[str, Any]:
+        """Generate Sage config for initial search."""
+        return self._generate_sage_config("initial_search")
+    
+    def get_full_search_config(self) -> Dict[str, Any]:
+        """Generate Sage config for full search.""" 
+        return self._generate_sage_config("full_search")
+    
+    def _generate_sage_config(self, search_type: str) -> Dict[str, Any]:
+        """Generate Sage configuration for specified search type."""
+        
+        # Helper to get parameter value for this search type
+        def get_param(name: str) -> Any:
+            return self.get_parameter_value(name, search_type)
+        
+        config = {
+            "database": {
+                "bucket_size": get_param("bucket_size"),
+                "enzyme": {
+                    "missed_cleavages": get_param("missed_cleavages"),
+                    "min_len": self.min_len,
+                    "max_len": self.max_len,
+                    "cleave_at": get_param("cleave_at"),
+                    "restrict": self.restrict,
+                    "c_terminal": self.c_terminal
+                },
+                "fragment_min_mz": self.fragment_min_mz,
+                "fragment_max_mz": self.fragment_max_mz,
+                "peptide_min_mass": self.peptide_min_mass,
+                "peptide_max_mass": self.peptide_max_mass,
+                "ion_kinds": self.ion_kinds,
+                "min_ion_index": self.min_ion_index,
+                "static_mods": self.static_mods,
+                "variable_mods": self.variable_mods,
+                "max_variable_mods": get_param("max_variable_mods"),
+                "decoy_tag": self.decoy_tag,
+                "generate_decoys": self.generate_decoys,
+                "fasta": self.fasta_file
+            },
+            "precursor_tol": {
+                "da": [self.precursor_tol_da_low, self.precursor_tol_da_high]
+            },
+            "fragment_tol": {
+                "ppm": [self.fragment_tol_ppm_low, self.fragment_tol_ppm_high]
+            },
+            "precursor_charge": [self.precursor_charge_min, self.precursor_charge_max],
+            "isotope_errors": [self.isotope_errors_min, self.isotope_errors_max],
+            "deisotope": get_param("deisotope"),
+            "annotate_matches": self.annotate_matches,
+            "chimera": self.chimera,
+            "wide_window": self.wide_window,
+            "min_peaks": self.min_peaks,
+            "max_peaks": self.max_peaks,
+            "min_matched_peaks": self.min_matched_peaks,
+            "max_fragment_charge": self.max_fragment_charge,
+            "report_psms": get_param("report_psms"),
+            "output_directory": "./",
+            "mzml_paths": [self.mzml_file] if self.mzml_file else []
+        }
+        
+        # Add predict_rt only for full search
+        if search_type == "full_search":
+            config["predict_rt"] = self.predict_rt
+            
+        return config
+    
+    def get_mumdia_config(self) -> Dict[str, Any]:
+        """Get MuMDIA-specific configuration."""
+        return {
+            "write_deeplc_pickle": self.write_deeplc_pickle,
+            "write_ms2pip_pickle": self.write_ms2pip_pickle,
+            "write_correlation_pickles": self.write_correlation_pickles,
+            "write_initial_search_pickle": self.write_initial_search_pickle,
+            "write_full_search_pickle": self.write_full_search_pickle,
+            "read_deeplc_pickle": self.read_deeplc_pickle,
+            "read_ms2pip_pickle": self.read_ms2pip_pickle,
+            "read_correlation_pickles": self.read_correlation_pickles,
+            "read_full_search_pickle": self.read_full_search_pickle,
+            "read_initial_search_pickle": self.read_initial_search_pickle,
+            "remove_intermediate_files": self.remove_intermediate_files,
+            "dlc_transfer_learn": self.dlc_transfer_learn,
+            "fdr_init_search": self.fdr_init_search,
+            "rescoring_features": self.rescoring_features,
+            "collapse_max_columns": self.collapse_max_columns,
+            "collapse_min_columns": self.collapse_max_columns,  # Simplified
+            "collapse_mean_columns": self.collapse_max_columns,  # Simplified  
+            "collapse_sum_columns": self.collapse_max_columns,  # Simplified
+            "get_first_entry": [  # Default list
+                "psm_id", "filename", "scannr", "peptide", "num_proteins",
+                "proteins", "expmass", "calcmass", "is_decoy", "charge",
+                "peptide_len", "missed_cleavages"
+            ],
+            "collect_distributions": list(range(0, 101, 5)),  # 0, 5, 10, ..., 100
+            "collect_top": list(range(1, 11)),  # 1, 2, 3, ..., 10
+            # Add simple config values
+            "mzml_file": self.mzml_file,
+            "fasta_file": self.fasta_file,
+            "mgf_file": self.mgf_file,
+            "result_dir": self.result_dir,
+            "n_windows": self.n_windows,
+            "training_fdr": self.training_fdr,
+            "final_fdr": self.final_fdr,
+            "model_type": self.model_type,
+            "no_cache": self.no_cache,
+            "clean": self.clean,
+            "sage_only": self.sage_only,
+            "skip_mokapot": self.skip_mokapot,
+            "verbose": self.verbose
+        }
+    
+    def to_legacy_format(self) -> Dict[str, Any]:
+        """
+        Convert to the legacy format expected by existing run.py code.
+        """
+        return {
+            "sage_basic": self.get_initial_search_config(),
+            "sage": self.get_full_search_config(),
+            "mumdia": self.get_mumdia_config()
+        }
+    
+    @classmethod
+    def from_json(cls, json_path: str) -> 'MuMDIAConfig':
+        """Load configuration from JSON file."""
+        if not os.path.exists(json_path):
+            print(f"Warning: Config file {json_path} not found, using defaults")
+            return cls()
+        
+        with open(json_path, 'r') as f:
+            data = json.load(f)
+        
+        # Create instance with defaults
+        config = cls()
+        
+        # Override with JSON values
+        for key, value in data.items():
+            if hasattr(config, key):
+                setattr(config, key, value)
+            else:
+                print(f"Warning: Unknown config parameter '{key}' ignored")
+        
+        return config
+    
+    @classmethod
+    def from_args(cls) -> 'MuMDIAConfig':
+        """Create configuration from command line arguments."""
+        parser = argparse.ArgumentParser(description="MuMDIA: Simplified Configuration System")
+        
+        # File arguments
+        parser.add_argument("--config_file", default="configs/config.json", help="Path to JSON configuration file")
+        parser.add_argument("--mzml_file", help="Path to mzML file")
+        parser.add_argument("--fasta_file", help="Path to FASTA file")
+        parser.add_argument("--mgf_file", help="Path to MGF file")
+        parser.add_argument("--result_dir", default="results", help="Output directory")
+        
+        # Search parameters
+        parser.add_argument("--n_windows", type=int, default=10, help="Number of RT windows")
+        parser.add_argument("--training_fdr", type=float, default=0.01, help="Training FDR")
+        parser.add_argument("--final_fdr", type=float, default=0.01, help="Final FDR")
+        parser.add_argument("--model_type", choices=["xgboost", "nn", "percolator"], default="xgboost", help="ML model type")
+        
+        # Runtime flags
+        parser.add_argument("--no-cache", action="store_true", help="Disable caching")
+        parser.add_argument("--clean", action="store_true", help="Clean intermediate files")
+        parser.add_argument("--sage-only", action="store_true", help="Run Sage only")
+        parser.add_argument("--skip-mokapot", action="store_true", help="Skip Mokapot")
+        parser.add_argument("--verbose", action="store_true", help="Verbose output")
+        
+        args = parser.parse_args()
+        
+        # Load from JSON first
+        config = cls.from_json(args.config_file)
+        
+        # Override with command line arguments
+        config.config_file = args.config_file
+        if args.mzml_file:
+            config.mzml_file = args.mzml_file
+        if args.fasta_file:
+            config.fasta_file = args.fasta_file
+        if args.mgf_file:
+            config.mgf_file = args.mgf_file
+        if args.result_dir != "results":  # Only override if explicitly set
+            config.result_dir = args.result_dir
+        if args.n_windows != 10:
+            config.n_windows = args.n_windows
+        if args.training_fdr != 0.01:
+            config.training_fdr = args.training_fdr
+        if args.final_fdr != 0.01:
+            config.final_fdr = args.final_fdr
+        if args.model_type != "xgboost":
+            config.model_type = args.model_type
+        
+        config.no_cache = args.no_cache
+        config.clean = args.clean
+        config.sage_only = args.sage_only
+        config.skip_mokapot = args.skip_mokapot
+        config.verbose = args.verbose
+        
+        return config
+    
+    def validate(self) -> None:
+        """Validate configuration."""
+        errors = []
+        
+        if self.mzml_file and not os.path.exists(self.mzml_file):
+            errors.append(f"mzML file not found: {self.mzml_file}")
+        
+        if self.fasta_file and not os.path.exists(self.fasta_file):
+            errors.append(f"FASTA file not found: {self.fasta_file}")
+        
+        if self.mgf_file and not os.path.exists(self.mgf_file):
+            errors.append(f"MGF file not found: {self.mgf_file}")
+        
+        if errors:
+            for error in errors:
+                print(f"Error: {error}")
+            sys.exit(1)
+
+
+def get_config() -> MuMDIAConfig:
+    """
+    Get configuration from command-line arguments with validation.
+    
+    This is the main entry point for MuMDIA configuration.
+    
+    Returns:
+        Validated MuMDIAConfig instance
+    """
+    config = MuMDIAConfig.from_args()
+    config.validate()
+    return config
+
+
+if __name__ == "__main__":
+    # Demo the new simplified approach
+    try:
+        config = get_config()
+        print("MuMDIA Simplified Configuration Demo")
+        print("=" * 50)
+        print(f"mzML file: {config.mzml_file}")
+        print(f"FASTA file: {config.fasta_file}")
+        print(f"Result dir: {config.result_dir}")
+        print()
+        
+        print("Initial Search Config:")
+        initial = config.get_initial_search_config()
+        print(f"  cleave_at: {initial['database']['enzyme']['cleave_at']}")
+        print(f"  report_psms: {initial['report_psms']}")
+        print(f"  deisotope: {initial['deisotope']}")
+        print()
+        
+        print("Full Search Config:")
+        full = config.get_full_search_config()
+        print(f"  cleave_at: {full['database']['enzyme']['cleave_at']}")
+        print(f"  report_psms: {full['report_psms']}")
+        print(f"  deisotope: {full['deisotope']}")
+        print()
+        
+        print("✅ Simplified configuration with smart defaults!")
+        print("✅ Automatic initial vs full search differentiation!")
+        print("✅ Override system working!")
+        
+    except SystemExit:
+        print("❌ Configuration validation failed")
diff --git a/config_demo.py b/config_demo.py
index 7aef1a9..e69de29 100644
--- a/config_demo.py
+++ b/config_demo.py
@@ -1,48 +0,0 @@
-#!/usr/bin/env python3
-"""
-Simple demo of the new MuMDIA configuration system
-
-This shows how much cleaner configuration management can be.
-"""
-
-import sys
-
-sys.path.append(".")
-
-from config_manager_clean import get_config
-
-
-def main():
-    """Demo the simplified configuration approach."""
-    try:
-        # Get configuration - this replaces ~100 lines of complex parsing!
-        config = get_config()
-
-        print("MuMDIA Configuration Demo")
-        print("=" * 40)
-        print(f"mzML file: {config.mzml_file}")
-        print(f"FASTA file: {config.fasta_file}")
-        print(f"Result directory: {config.result_dir}")
-        print(f"Windows: {config.n_windows}")
-        print(f"Training FDR: {config.training_fdr}")
-        print(f"Final FDR: {config.final_fdr}")
-        print(f"Model type: {config.model_type}")
-        print(f"No cache: {config.no_cache}")
-        print(f"Clean: {config.clean}")
-        print(f"Sage only: {config.sage_only}")
-        print(f"Skip Mokapot: {config.skip_mokapot}")
-        print(f"Verbose: {config.verbose}")
-        print()
-        print("Configuration loaded successfully!")
-        print("This replaces the complex 100+ line argument parsing in run.py!")
-
-    except SystemExit:
-        # This happens when validation fails (missing required files)
-        print("\nTo test with actual files, try:")
-        print(
-            "  python config_demo.py --mzml_file LFQ_Orbitrap_AIF_Ecoli_01.mzML --fasta_file fasta/ecoli_22032024.fasta"
-        )
-
-
-if __name__ == "__main__":
-    main()
diff --git a/config_manager.py b/config_manager.py
index 5a7ea07..e69de29 100644
--- a/config_manager.py
+++ b/config_manager.py
@@ -1,173 +0,0 @@
-"""
-Simplified configuration management for MuMDIA.
-
-This module provides a clean, unified way to handle configuration from
-JSON files, command line arguments, and defaults.
-"""
-
-import argparse
-import json
-from dataclasses import dataclass, field
-from pathlib import Path
-from typing import Any, Dict, Optional
-
-
-@dataclass
-class MuMDIAConfig:
-    """
-    Simplified configuration class for MuMDIA.
-
-    This replaces the complex argument parsing and config merging logic
-    with a clean, type-safe dataclass approach.
-    """
-
-    # Required files
-    mzml_file: str = ""
-    fasta_file: str = ""
-    mgf_file: str = ""
-
-    # Output configuration
-    result_dir: str = "results"
-    search_config: str = "configs/config.json"
-
-    # Processing parameters
-    n_windows: int = 10
-    training_fdr: float = 0.05
-    final_fdr: float = 0.01
-    model_type: str = "xgboost"  # choices: xgboost, nn, percolator
-
-    # Behavioral flags
-    no_cache: bool = False
-    clean: bool = False
-    sage_only: bool = False
-    skip_mokapot: bool = False
-    verbose: bool = False
-
-    @classmethod
-    def from_json(cls, config_path: str) -> "MuMDIAConfig":
-        """Load configuration from JSON file with sensible defaults."""
-        config = cls()  # Start with defaults
-
-        if Path(config_path).exists():
-            with open(config_path) as f:
-                json_data = json.load(f)
-
-            # Update with JSON values
-            if "mumdia" in json_data:
-                for key, value in json_data["mumdia"].items():
-                    if hasattr(config, key):
-                        setattr(config, key, value)
-
-            # Store the full JSON config for sage/mumdia sections
-            config.sage_basic = json_data.get("sage_basic", {})
-            config.sage = json_data.get("sage", {})
-            config.mumdia = json_data.get("mumdia", {})
-
-        return config
-
-    @classmethod
-    def from_args(cls, args: Optional[argparse.Namespace] = None) -> "MuMDIAConfig":
-        """Create config from command line arguments."""
-        if args is None:
-            args = parse_arguments()
-
-        # Start with JSON config if provided
-        config = cls.from_json(args.config_file)
-
-        # Override with any explicitly provided CLI arguments
-        for key, value in vars(args).items():
-            if hasattr(config, key) and value is not None:
-                setattr(config, key, value)
-
-        return config
-
-    def save(self, path: str) -> None:
-        """Save current configuration to JSON file."""
-        output = {
-            "mumdia": {
-                key: getattr(self, key)
-                for key in [
-                    "mzml_file",
-                    "mzml_dir",
-                    "fasta_file",
-                    "result_dir",
-                    "remove_intermediate_files",
-                    "write_initial_search",
-                    "read_initial_search",
-                    "write_full_search",
-                    "read_full_search",
-                    "write_deeplc",
-                    "read_deeplc",
-                    "write_ms2pip",
-                    "read_ms2pip",
-                    "write_correlation",
-                    "read_correlation",
-                    "dlc_transfer_learn",
-                    "fdr_init_search",
-                ]
-            },
-            "sage_basic": self.sage_basic,
-            "sage": self.sage,
-        }
-
-        Path(path).parent.mkdir(parents=True, exist_ok=True)
-        with open(path, "w") as f:
-            json.dump(output, f, indent=2)
-
-
-def parse_arguments() -> argparse.Namespace:
-    """Simplified argument parser with only the essential arguments."""
-    parser = argparse.ArgumentParser(
-        description="MuMDIA: Multi-modal Data-Independent Acquisition Analysis"
-    )
-
-    # Essential paths
-    parser.add_argument("--mzml_file", help="Path to mzML file")
-    parser.add_argument("--fasta_file", help="Path to FASTA file")
-    parser.add_argument("--result_dir", help="Results directory")
-    parser.add_argument("--config_file", help="Configuration JSON file")
-
-    # Common flags
-    parser.add_argument(
-        "--no-cache",
-        action="store_true",
-        help="Disable all caching (force recomputation)",
-    )
-    parser.add_argument(
-        "--clean",
-        action="store_true",
-        help="Remove intermediate files after processing",
-    )
-
-    # Advanced overrides
-    parser.add_argument(
-        "--fdr",
-        type=float,
-        dest="fdr_init_search",
-        help="FDR threshold for initial search",
-    )
-
-    return parser.parse_args()
-
-
-def get_config() -> MuMDIAConfig:
-    """
-    One-liner to get fully configured MuMDIA settings.
-
-    This replaces all the complex config parsing logic.
-    """
-    args = parse_arguments()
-    config = MuMDIAConfig.from_args(args)
-
-    # Handle special flags
-    if args.no_cache:
-        config.read_initial_search = False
-        config.read_full_search = False
-        config.read_deeplc = False
-        config.read_ms2pip = False
-        config.read_correlation = False
-
-    if args.clean:
-        config.remove_intermediate_files = True
-
-    return config
diff --git a/config_manager_clean.py b/config_manager_clean.py
index 8cc98df..e69de29 100644
--- a/config_manager_clean.py
+++ b/config_manager_clean.py
@@ -1,203 +0,0 @@
-#!/usr/bin/env python3
-"""
-Simplified Configuration Management for MuMDIA
-
-This module provides a clean, dataclass-based approach to configuration management,
-replacing the complex argument parsing and config merging logic in the original run.py.
-
-The MuMDIAConfig class centralizes all configuration options with sensible defaults
-and provides simple methods for loading from JSON files or command-line arguments.
-"""
-
-import argparse
-import json
-import sys
-from dataclasses import asdict, dataclass
-from pathlib import Path
-from typing import Optional
-
-
-@dataclass
-class MuMDIAConfig:
-    """
-    Simplified configuration class for MuMDIA.
-
-    This replaces the complex argument parsing and config merging logic
-    with a clean, type-safe dataclass approach.
-    """
-
-    # Required files
-    mzml_file: str = ""
-    fasta_file: str = ""
-    mgf_file: str = ""
-
-    # Output configuration
-    result_dir: str = "results"
-    search_config: str = "configs/config.json"
-
-    # Processing parameters
-    n_windows: int = 10
-    training_fdr: float = 0.05
-    final_fdr: float = 0.01
-    model_type: str = "xgboost"  # choices: xgboost, nn, percolator
-
-    # Behavioral flags
-    no_cache: bool = False
-    clean: bool = False
-    sage_only: bool = False
-    skip_mokapot: bool = False
-    verbose: bool = False
-
-    @classmethod
-    def from_json(cls, json_path: str) -> "MuMDIAConfig":
-        """
-        Load configuration from a JSON file.
-
-        Args:
-            json_path: Path to the JSON configuration file
-
-        Returns:
-            MuMDIAConfig instance with values from the JSON file
-        """
-        try:
-            with open(json_path, "r") as f:
-                data = json.load(f)
-
-            # Create config with JSON data, using defaults for missing keys
-            config = cls()
-            for key, value in data.items():
-                if hasattr(config, key):
-                    setattr(config, key, value)
-
-            return config
-
-        except FileNotFoundError:
-            print(f"Warning: Config file {json_path} not found, using defaults")
-            return cls()
-        except json.JSONDecodeError as e:
-            print(f"Error: Invalid JSON in {json_path}: {e}")
-            sys.exit(1)
-
-    @classmethod
-    def from_args(cls, args: Optional[argparse.Namespace] = None) -> "MuMDIAConfig":
-        """
-        Create configuration from command-line arguments.
-
-        Args:
-            args: Parsed arguments (if None, will parse sys.argv)
-
-        Returns:
-            MuMDIAConfig instance with values from command-line arguments
-        """
-        if args is None:
-            parser = cls._create_parser()
-            args = parser.parse_args()
-
-        # Start with config from file if provided
-        if hasattr(args, "config_file") and args.config_file:
-            config = cls.from_json(args.config_file)
-        else:
-            config = cls()
-
-        # Override with command-line arguments
-        for key, value in vars(args).items():
-            if hasattr(config, key) and value is not None:
-                # Handle boolean flags properly
-                if key in ["no_cache", "clean", "sage_only", "skip_mokapot", "verbose"]:
-                    setattr(config, key, bool(value))
-                else:
-                    setattr(config, key, value)
-
-        return config
-
-    @staticmethod
-    def _create_parser() -> argparse.ArgumentParser:
-        """Create the argument parser with simplified options."""
-        parser = argparse.ArgumentParser(
-            description="MuMDIA: Multi-modal Data-Independent Acquisition pipeline"
-        )
-
-        # Configuration file
-        parser.add_argument("--config_file", help="Path to JSON configuration file")
-
-        # Required files
-        parser.add_argument("--mzml_file", help="Path to mzML file")
-        parser.add_argument("--fasta_file", help="Path to FASTA file")
-        parser.add_argument("--mgf_file", help="Path to MGF file (optional)")
-
-        # Output and processing
-        parser.add_argument("--result_dir", default="results", help="Output directory")
-        parser.add_argument(
-            "--search_config", default="configs/config.json", help="Sage config file"
-        )
-        parser.add_argument(
-            "--n_windows", type=int, default=10, help="Number of RT windows"
-        )
-        parser.add_argument(
-            "--training_fdr", type=float, default=0.05, help="Training FDR threshold"
-        )
-        parser.add_argument(
-            "--final_fdr", type=float, default=0.01, help="Final FDR threshold"
-        )
-        parser.add_argument(
-            "--model_type",
-            choices=["xgboost", "nn", "percolator"],
-            default="xgboost",
-            help="ML model type",
-        )
-
-        # Boolean flags
-        parser.add_argument(
-            "--no-cache", action="store_true", help="Force recomputation"
-        )
-        parser.add_argument(
-            "--clean", action="store_true", help="Clean intermediate files"
-        )
-        parser.add_argument("--sage-only", action="store_true", help="Run Sage only")
-        parser.add_argument("--skip-mokapot", action="store_true", help="Skip Mokapot")
-        parser.add_argument("--verbose", action="store_true", help="Verbose logging")
-
-        return parser
-
-    def save(self, path: str) -> None:
-        """
-        Save configuration to a JSON file.
-
-        Args:
-            path: Path where to save the configuration
-        """
-        with open(path, "w") as f:
-            json.dump(asdict(self), f, indent=2)
-
-    def validate(self) -> None:
-        """
-        Validate the configuration and exit if invalid.
-        """
-        if not self.mzml_file:
-            print("Error: mzml_file is required")
-            sys.exit(1)
-        if not self.fasta_file:
-            print("Error: fasta_file is required")
-            sys.exit(1)
-
-        # Check file existence
-        if not Path(self.mzml_file).exists():
-            print(f"Error: mzML file not found: {self.mzml_file}")
-            sys.exit(1)
-        if not Path(self.fasta_file).exists():
-            print(f"Error: FASTA file not found: {self.fasta_file}")
-            sys.exit(1)
-
-
-def get_config() -> MuMDIAConfig:
-    """
-    Get configuration from command-line arguments with validation.
-
-    This is the main entry point for configuration management.
-
-    Returns:
-        Validated MuMDIAConfig instance
-    """
-    config = MuMDIAConfig.from_args()
-    config.validate()
-    return config
diff --git a/config_new.py b/config_new.py
new file mode 100644
index 0000000..e69de29
diff --git a/config_old.py b/config_old.py
new file mode 100644
index 0000000..d1dc42f
--- /dev/null
+++ b/config_old.py
@@ -0,0 +1,438 @@
+#!/usr/bin/env python3
+"""
+MuMDIA Configuration System
+
+Clean, type-safe configuration that handles complex nested JSON structure
+while providing a simple interface.
+
+Usage:
+    from config import get_config
+    config = get_config()
+    print(config.mzml_file, config.n_windows)
+"""
+
+import argparse
+import json
+import os
+from dataclasses import dataclass, field, asdict
+from pathlib import Path
+from typing import Dict, Any, Optional, Union, List
+import sys
+
+
+@dataclass
+class DatabaseConfig:
+    """Sage database configuration section."""
+    bucket_size: int = 1024
+    enzyme: Dict[str, Any] = field(default_factory=lambda: {
+        "missed_cleavages": 2,
+        "min_len": 6,
+        "max_len": 30,
+        "cleave_at": "KR",
+        "restrict": "P",
+        "c_terminal": True
+    })
+    fragment_min_mz: float = 100.0
+    fragment_max_mz: float = 2500.0
+    peptide_min_mass: float = 300.0
+    peptide_max_mass: float = 5000.0
+    ion_kinds: List[str] = field(default_factory=lambda: ["b", "y"])
+    min_ion_index: int = 2
+    static_mods: Dict[str, float] = field(default_factory=lambda: {"C": 57.0215})
+    variable_mods: Dict[str, List[float]] = field(default_factory=lambda: {"M": [15.9949]})
+    max_variable_mods: int = 1
+    decoy_tag: str = "rev_"
+    generate_decoys: bool = True
+    fasta: str = ""
+
+
+@dataclass
+class SageConfig:
+    """Complete Sage configuration."""
+    database: DatabaseConfig = field(default_factory=DatabaseConfig)
+    precursor_tol: Dict[str, List[float]] = field(default_factory=lambda: {"da": [-40, 40]})
+    fragment_tol: Dict[str, List[float]] = field(default_factory=lambda: {"ppm": [-13, 13]})
+    precursor_charge: List[int] = field(default_factory=lambda: [1, 4])
+    isotope_errors: List[int] = field(default_factory=lambda: [-1, 1])
+    deisotope: bool = False
+    annotate_matches: bool = True
+    chimera: bool = True
+    wide_window: bool = True
+    min_peaks: int = 0
+    max_peaks: int = 10000
+    min_matched_peaks: int = 5
+    max_fragment_charge: int = 1
+    report_psms: int = 5
+    output_directory: str = "./"
+    mzml_paths: List[str] = field(default_factory=list)
+
+
+@dataclass
+class MuMDIASettings:
+    """MuMDIA-specific settings - complete with all existing options."""
+    # Pickle settings
+    write_deeplc_pickle: bool = True
+    write_ms2pip_pickle: bool = True
+    write_correlation_pickles: bool = True
+    write_initial_search_pickle: bool = True
+    write_full_search_pickle: bool = True
+    read_deeplc_pickle: bool = True
+    read_ms2pip_pickle: bool = True
+    read_correlation_pickles: bool = True
+    read_full_search_pickle: bool = True
+    read_initial_search_pickle: bool = True
+    
+    # Processing settings
+    remove_intermediate_files: bool = False
+    dlc_transfer_learn: bool = False
+    fdr_init_search: float = 0.01
+    
+    # Feature settings
+    rescoring_features: List[str] = field(default_factory=lambda: [
+        "distribution_correlation_matrix_psm_ids",
+        "distribution_correlation_matrix_frag_ids",
+        "distribution_correlation_individual",
+        "top_correlation_individual",
+        "top_correlation_matrix_frag_ids",
+        "top_correlation_matrix_psm_ids"
+    ])
+    
+    # Column processing settings  
+    collapse_max_columns: List[str] = field(default_factory=lambda: [
+        "fragment_ppm", "rank", "delta_next", "delta_rt_model",
+        "matched_peaks", "longest_b", "longest_y", "matched_intensity_pct",
+        "fragment_intensity", "poisson", "spectrum_q", "peptide_q", "protein_q",
+        "rt", "rt_predictions", "rt_prediction_error_abs", 
+        "rt_prediction_error_abs_relative", "precursor_ppm", "hyperscore", "delta_best"
+    ])
+    
+    collapse_min_columns: List[str] = field(default_factory=lambda: [
+        "fragment_ppm", "rank", "delta_next", "delta_rt_model",
+        "matched_peaks", "longest_b", "longest_y", "matched_intensity_pct",
+        "fragment_intensity", "poisson", "spectrum_q", "peptide_q", "protein_q",
+        "rt", "rt_predictions", "rt_prediction_error_abs", 
+        "rt_prediction_error_abs_relative", "precursor_ppm", "hyperscore", "delta_best"
+    ])
+    
+    collapse_mean_columns: List[str] = field(default_factory=lambda: [
+        "fragment_ppm", "rank", "delta_next", "delta_rt_model",
+        "matched_peaks", "longest_b", "longest_y", "matched_intensity_pct",
+        "fragment_intensity", "poisson", "spectrum_q", "peptide_q", "protein_q",
+        "rt", "rt_predictions", "rt_prediction_error_abs", 
+        "rt_prediction_error_abs_relative", "precursor_ppm", "hyperscore", "delta_best"
+    ])
+    
+    collapse_sum_columns: List[str] = field(default_factory=lambda: [
+        "hyperscore", "delta_rt_model", "matched_peaks", "longest_b", "longest_y",
+        "matched_intensity_pct", "fragment_intensity", "rt", "rt_predictions",
+        "rt_prediction_error_abs", "rt_prediction_error_abs_relative", "precursor_ppm",
+        "fragment_ppm", "delta_next", "rank", "delta_best"
+    ])
+    
+    get_first_entry: List[str] = field(default_factory=lambda: [
+        "psm_id", "filename", "scannr", "peptide", "num_proteins", "proteins",
+        "expmass", "calcmass", "is_decoy", "charge", "peptide_len", "missed_cleavages"
+    ])
+    
+    collect_distributions: List[int] = field(default_factory=lambda: [
+        0, 5, 10, 15, 20, 25, 30, 35, 40, 45, 50, 55, 60, 65, 70, 75, 80, 85, 90, 95, 100
+    ])
+    
+    collect_top: List[int] = field(default_factory=lambda: [
+        1, 2, 3, 4, 5, 6, 7, 8, 9, 10
+    ])
+
+
+@dataclass 
+class Config:
+    """
+    MuMDIA configuration that handles all complexity internally.
+    
+    This provides a single source of truth while maintaining compatibility
+    with the existing complex JSON structure.
+    """
+    
+    # === Core Required Files ===
+    mzml_file: str = ""
+    fasta_file: str = ""
+    mgf_file: str = ""
+    
+    # === Processing Parameters ===
+    result_dir: str = "results"
+    n_windows: int = 10
+    training_fdr: float = 0.05
+    final_fdr: float = 0.01
+    model_type: str = "xgboost"
+    
+    # === Behavioral Flags ===
+    no_cache: bool = False
+    clean: bool = False
+    sage_only: bool = False
+    skip_mokapot: bool = False
+    verbose: bool = False
+    
+    # === Complex Nested Configurations ===
+    sage_basic: SageConfig = field(default_factory=SageConfig)
+    sage: SageConfig = field(default_factory=SageConfig)
+    mumdia: MuMDIASettings = field(default_factory=MuMDIASettings)
+    
+    # === Internal ===
+    _config_file: str = "configs/config.json"
+    
+    @classmethod
+    def from_json(cls, json_path: str) -> "Config":
+        """Load from complex nested JSON while providing simple interface."""
+        config = cls()
+        
+        if not Path(json_path).exists():
+            print(f"Warning: Config file {json_path} not found, using defaults")
+            return config
+            
+        try:
+            with open(json_path) as f:
+                data = json.load(f)
+            
+            # Handle the nested structure
+            if "mumdia" in data:
+                # Extract simple values from mumdia section
+                mumdia_data = data["mumdia"]
+                for key, value in mumdia_data.items():
+                    if hasattr(config, key):
+                        setattr(config, key, value)
+                
+                # Set the complex mumdia settings
+                config.mumdia = MuMDIASettings(**{
+                    k: v for k, v in mumdia_data.items() 
+                    if k in MuMDIASettings.__annotations__
+                })
+            
+            # Handle sage configurations
+            if "sage_basic" in data:
+                config.sage_basic = cls._parse_sage_config(data["sage_basic"])
+            if "sage" in data:
+                config.sage = cls._parse_sage_config(data["sage"])
+            
+            # Extract file paths from sage configs if not set
+            if not config.mzml_file:
+                paths = config.sage.mzml_paths or config.sage_basic.mzml_paths
+                if paths:
+                    config.mzml_file = paths[0]
+                    
+            if not config.fasta_file:
+                fasta = config.sage.database.fasta or config.sage_basic.database.fasta
+                if fasta:
+                    config.fasta_file = fasta
+                    
+        except Exception as e:
+            print(f"Error loading config from {json_path}: {e}")
+            
+        return config
+    
+    @classmethod
+    def _parse_sage_config(cls, sage_data: Dict[str, Any]) -> SageConfig:
+        """Parse nested sage configuration."""
+        sage_config = SageConfig()
+        
+        # Handle database section
+        if "database" in sage_data:
+            db_data = sage_data["database"]
+            sage_config.database = DatabaseConfig(**{
+                k: v for k, v in db_data.items() 
+                if k in DatabaseConfig.__annotations__
+            })
+        
+        # Handle other sage settings
+        for key, value in sage_data.items():
+            if key != "database" and hasattr(sage_config, key):
+                setattr(sage_config, key, value)
+                
+        return sage_config
+    
+    @classmethod
+    def from_args(cls, args: Optional[argparse.Namespace] = None) -> "Config":
+        """Create from command line arguments with config file support."""
+        if args is None:
+            parser = cls._create_parser()
+            args = parser.parse_args()
+        
+        # Start with config file if provided
+        config_file = getattr(args, 'config_file', 'configs/config.json')
+        config = cls.from_json(config_file)
+        config._config_file = config_file
+        
+        # Override with CLI arguments
+        for key, value in vars(args).items():
+            if hasattr(config, key) and value is not None:
+                setattr(config, key, value)
+        
+        # Handle special flags
+        if config.no_cache:
+            config.mumdia.read_deeplc_pickle = False
+            config.mumdia.read_ms2pip_pickle = False
+            config.mumdia.read_correlation_pickles = False
+            config.mumdia.read_initial_search_pickle = False
+            config.mumdia.read_full_search_pickle = False
+            
+        if config.clean:
+            config.mumdia.remove_intermediate_files = True
+        
+        return config
+    
+    @staticmethod
+    def _create_parser() -> argparse.ArgumentParser:
+        """Create argument parser."""
+        parser = argparse.ArgumentParser(
+            description="MuMDIA: Unified Configuration System"
+        )
+        
+        # Config file
+        parser.add_argument("--config_file", default="configs/config.json",
+                          help="Path to JSON configuration file")
+        
+        # Required files  
+        parser.add_argument("--mzml_file", help="Path to mzML file")
+        parser.add_argument("--fasta_file", help="Path to FASTA file")
+        parser.add_argument("--mgf_file", help="Path to MGF file")
+        
+        # Processing
+        parser.add_argument("--result_dir", default="results", help="Output directory")
+        parser.add_argument("--n_windows", type=int, default=10, help="Number of RT windows")
+        parser.add_argument("--training_fdr", type=float, default=0.05, help="Training FDR")
+        parser.add_argument("--final_fdr", type=float, default=0.01, help="Final FDR")
+        parser.add_argument("--model_type", choices=["xgboost", "nn", "percolator"],
+                          default="xgboost", help="ML model type")
+        
+        # Flags
+        parser.add_argument("--no-cache", action="store_true", help="Disable caching")
+        parser.add_argument("--clean", action="store_true", help="Clean intermediate files")
+        parser.add_argument("--sage-only", action="store_true", help="Run Sage only")
+        parser.add_argument("--skip-mokapot", action="store_true", help="Skip Mokapot")
+        parser.add_argument("--verbose", action="store_true", help="Verbose output")
+        
+        return parser
+    
+    def save(self, path: str) -> None:
+        """Save in the complex nested JSON format for backwards compatibility."""
+        # Sync file paths into sage configs
+        if self.mzml_file:
+            self.sage_basic.mzml_paths = [self.mzml_file]
+            self.sage.mzml_paths = [self.mzml_file]
+        if self.fasta_file:
+            self.sage_basic.database.fasta = self.fasta_file
+            self.sage.database.fasta = self.fasta_file
+        
+        # Create the complex nested structure
+        output = {
+            "sage_basic": asdict(self.sage_basic),
+            "sage": asdict(self.sage),
+            "mumdia": asdict(self.mumdia)
+        }
+        
+        Path(path).parent.mkdir(parents=True, exist_ok=True)
+        with open(path, 'w') as f:
+            json.dump(output, f, indent=2)
+    
+    def validate(self) -> None:
+        """Validate configuration."""
+        if not self.mzml_file:
+            print("Error: mzml_file is required")
+            sys.exit(1)
+        if not self.fasta_file:
+            print("Error: fasta_file is required") 
+            sys.exit(1)
+            
+        # Check file existence
+        if not Path(self.mzml_file).exists():
+            print(f"Error: mzML file not found: {self.mzml_file}")
+            sys.exit(1)
+        if not Path(self.fasta_file).exists():
+            print(f"Error: FASTA file not found: {self.fasta_file}")
+            sys.exit(1)
+    
+    def get_effective_config_path(self) -> str:
+        """Get the path where effective config will be saved."""
+        return os.path.join(self.result_dir, "effective_config.json")
+    
+    def to_legacy_format(self) -> Dict[str, Any]:
+        """
+        Convert to the legacy format expected by existing run.py code.
+        
+        Returns:
+            Dictionary in the format expected by the legacy mumdia workflow
+        """
+        # Sync file paths into sage configs first
+        if self.mzml_file:
+            self.sage_basic.mzml_paths = [self.mzml_file]
+            self.sage.mzml_paths = [self.mzml_file]
+        if self.fasta_file:
+            self.sage_basic.database.fasta = self.fasta_file
+            self.sage.database.fasta = self.fasta_file
+        
+        # Create the full legacy structure
+        legacy_config = {
+            "sage_basic": asdict(self.sage_basic),
+            "sage": asdict(self.sage),
+            "mumdia": asdict(self.mumdia)
+        }
+        
+        # Ensure mumdia section has the simple config values too
+        legacy_config["mumdia"].update({
+            "mzml_file": self.mzml_file,
+            "fasta_file": self.fasta_file,
+            "mgf_file": self.mgf_file,
+            "result_dir": self.result_dir,
+            "n_windows": self.n_windows,
+            "training_fdr": self.training_fdr,
+            "final_fdr": self.final_fdr,
+            "model_type": self.model_type,
+            "no_cache": self.no_cache,
+            "clean": self.clean,
+            "sage_only": self.sage_only,
+            "skip_mokapot": self.skip_mokapot,
+            "verbose": self.verbose
+        })
+        
+        return legacy_config
+    
+    def get_mumdia_args_dict(self) -> Dict[str, Any]:
+        """
+        Get the mumdia args dictionary expected by existing code.
+        
+        This method provides compatibility with the existing workflow
+        that expects args_dict = config["mumdia"]
+        """
+        return self.to_legacy_format()["mumdia"]
+
+
+def get_config() -> Config:
+    """
+    Get configuration from command-line arguments with validation.
+    
+    This is the main entry point for MuMDIA configuration.
+    
+    Returns:
+        Validated Config instance
+    """
+    config = Config.from_args()
+    config.validate()
+    return config
+
+
+if __name__ == "__main__":
+    # Demo the unified approach
+    try:
+        config = get_config()
+        print("MuMDIA Configuration Demo")
+        print("=" * 50)
+        print(f"mzML file: {config.mzml_file}")
+        print(f"FASTA file: {config.fasta_file}")
+        print(f"Result dir: {config.result_dir}")
+        print(f"Windows: {config.n_windows}")
+        print(f"No cache: {config.no_cache}")
+        print()
+        print("✅ Complex nested config handled transparently!")
+        print("✅ Simple interface for common operations!")
+        print("✅ Full backwards compatibility!")
+        
+    except SystemExit:
+        print("❌ Configuration validation failed")
diff --git a/configs/config.json b/configs/config.json
index 1f60cf4..034e5b4 100644
--- a/configs/config.json
+++ b/configs/config.json
@@ -134,11 +134,11 @@
         "write_correlation_pickles": true,
         "write_initial_search_pickle": true,
         "write_full_search_pickle": true,
-        "read_deeplc_pickle": true,
-        "read_ms2pip_pickle": true,
-        "read_correlation_pickles": true,
-        "read_full_search_pickles": true,
-        "read_initial_search_pickle": true,
+        "read_deeplc_pickle": false,
+        "read_ms2pip_pickle": false,
+        "read_correlation_pickles": false,
+        "read_full_search_pickles": false,
+        "read_initial_search_pickle": false,
         "remove_intermediate_files": false,
         "dlc_transfer_learn": false,
         "fdr_init_search": 0.01,
diff --git a/configs/config_simple.json b/configs/config_simple.json
new file mode 100644
index 0000000..543c90d
--- /dev/null
+++ b/configs/config_simple.json
@@ -0,0 +1,45 @@
+{
+    "mzml_file": "mzml_files/LFQ_Orbitrap_AIF_Ecoli_01.mzML",
+    "fasta_file": "fasta/ecoli_22032024.fasta",
+    "result_dir": "results",
+    
+
+    "_comment_basic_params": "Basic search parameters with defaults",
+
+    "chimera": true,
+    "wide_window": true,
+    "missed_cleavages": 2,
+    "max_variable_mods": 1,
+    
+
+    "_comment_initial_overrides": "Parameters specific to initial search",
+
+    "cleave_at_initial_search": "KR",
+    "report_psms_initial_search": 5,
+    "deisotope_initial_search": false,
+    "max_variable_mods_initial_search": 1,
+    
+
+    "_comment_full_overrides": "Parameters specific to full search", 
+
+    "cleave_at_full_search": "$",
+    "report_psms_full_search": 12,
+    "deisotope_full_search": true,
+    "max_variable_mods_full_search": 2,
+    
+
+    "_comment_pickle_settings": "Control caching behavior",
+    
+    "read_deeplc_pickle": false,
+    "read_ms2pip_pickle": false,
+    "read_correlation_pickles": false,
+    "read_full_search_pickle": false,
+    "read_initial_search_pickle": false,
+    
+    
+    "_comment_mumdia_settings": "MuMDIA-specific settings",
+    
+    "fdr_init_search": 0.01,
+    "n_windows": 10,
+    "model_type": "xgboost"
+}
diff --git a/demo_config.json b/demo_config.json
index 57e9e41..e69de29 100644
--- a/demo_config.json
+++ b/demo_config.json
@@ -1,9 +0,0 @@
-{
-  "mzml_file": "LFQ_Orbitrap_AIF_Ecoli_01.mzML",
-  "fasta_file": "fasta/ecoli_22032024.fasta",
-  "result_dir": "my_results",
-  "n_windows": 15,
-  "training_fdr": 0.1,
-  "model_type": "nn",
-  "verbose": true
-}
diff --git a/demo_new_config.py b/demo_new_config.py
new file mode 100644
index 0000000..5cde4c5
--- /dev/null
+++ b/demo_new_config.py
@@ -0,0 +1,72 @@
+#!/usr/bin/env python3
+"""
+Demo script showing how to use the new simplified MuMDIA configuration system.
+
+This script demonstrates:
+1. Loading config from JSON with override mechanism
+2. How parameters get different values for initial vs full search
+3. How to run the main workflow with the new system
+
+Run this with: python demo_new_config.py
+"""
+
+from config import load_config_from_json
+
+def main():
+    print("🔧 MuMDIA New Configuration System Demo")
+    print("=" * 50)
+    
+    # 1. Load config from JSON
+    print("\n1. Loading configuration from configs/config_simple.json...")
+    config = load_config_from_json('configs/config_simple.json')
+    print(f"✅ Configuration loaded successfully!")
+    
+    # 2. Show base parameters
+    print(f"\n2. Base configuration parameters:")
+    print(f"   📁 mzML file: {config.mzml_file}")
+    print(f"   📁 FASTA file: {config.fasta_file}")
+    print(f"   📁 Result directory: {config.result_dir}")
+    print(f"   🔬 Base cleave_at: {config.cleave_at}")
+    print(f"   🔬 Base report_psms: {config.report_psms}")
+    print(f"   🔬 Base deisotope: {config.deisotope}")
+    print(f"   🔬 Base max_variable_mods: {config.max_variable_mods}")
+    
+    # 3. Show override mechanism in action
+    print(f"\n3. Override mechanism for different search stages:")
+    
+    # Initial search configuration
+    initial_config = config.get_initial_search_config()
+    print(f"   🟡 Initial search cleave_at: {initial_config['database']['enzyme']['cleave_at']}")
+    print(f"   🟡 Initial search report_psms: {initial_config['report_psms']}")
+    print(f"   🟡 Initial search deisotope: {initial_config['deisotope']}")
+    print(f"   🟡 Initial search max_variable_mods: {initial_config['database']['max_variable_mods']}")
+    
+    # Full search configuration  
+    full_config = config.get_full_search_config()
+    print(f"   🟢 Full search cleave_at: {full_config['database']['enzyme']['cleave_at']}")
+    print(f"   🟢 Full search report_psms: {full_config['report_psms']}")
+    print(f"   🟢 Full search deisotope: {full_config['deisotope']}")
+    print(f"   🟢 Full search max_variable_mods: {full_config['database']['max_variable_mods']}")
+    
+    # 4. Show MuMDIA-specific settings
+    print(f"\n4. MuMDIA-specific settings:")
+    mumdia_config = config.get_mumdia_config()
+    print(f"   📊 FDR initial search: {config.fdr_init_search}")
+    print(f"   📊 Number of windows: {config.n_windows}")
+    print(f"   📊 Model type: {config.model_type}")
+    print(f"   💾 Read initial search pickle: {mumdia_config['read_initial_search_pickle']}")
+    print(f"   💾 Write initial search pickle: {mumdia_config['write_initial_search_pickle']}")
+    
+    # 5. Show legacy format compatibility
+    print(f"\n5. Legacy format compatibility:")
+    legacy_format = config.to_legacy_format()
+    print(f"   ✅ Legacy format has {len(legacy_format)} top-level sections:")
+    for section in legacy_format.keys():
+        print(f"      - {section}")
+    
+    print(f"\n🎉 Demo completed!")
+    print(f"\nTo run the actual MuMDIA workflow:")
+    print(f"   python run.py configs/config_simple.json")
+
+if __name__ == "__main__":
+    main()
diff --git a/run.py b/run.py
index b8beb0f..7a73d4d 100644
--- a/run.py
+++ b/run.py
@@ -1,6 +1,6 @@
 #!/usr/bin/env python3
 """
-MuMDIA (Multi-modal Data-Independant Acquisition) Main Workflow
+MuMDIA
 
 This is the main entry point for the MuMDIA proteomics analysis pipeline.
 MuMDIA integrates multiple prediction tools and machine learning approaches
@@ -16,313 +16,39 @@
 
 os.environ["POLARS_MAX_THREADS"] = "1"
 
-import argparse
-import json
-import sys
 from pathlib import Path
-from typing import Tuple, cast
+from typing import cast
 
 import polars as pl
 
 import utilities.pickling as pickling
 from data_structures import PickleConfig, SpectraData
-from utilities.config_loader import merge_config_from_sources, write_updated_config
-from utilities.io_utils import create_dirs, remove_intermediate_files
+from utilities.io_utils import remove_intermediate_files
 from utilities.logger import log_info
 
+import mumdia
 
-def parse_arguments() -> Tuple[argparse.ArgumentParser, argparse.Namespace]:
-    """
-    Parse command line arguments for the MuMDIA workflow.
-
-    Returns:
-        Tuple containing:
-        - parser: ArgumentParser object for checking explicitly provided arguments
-        - args: Namespace object with parsed command line arguments
-    """
-    parser = argparse.ArgumentParser()
-
-    # Add arguments
-    parser.add_argument(
-        "--mzml_file",
-        help="The location of the mzml file",
-        default="mzml_files/LFQ_Orbitrap_AIF_Ecoli_01.mzML",
-    )
-    parser.add_argument(
-        "--mzml_dir", help="The directory of the mzml file", default="mzml_files"
-    )
-    parser.add_argument(
-        "--fasta_file",
-        help="The location of the fasta file",
-        default="fasta/unmodified_peptides.fasta",
-    )
-    parser.add_argument(
-        "--result_dir", help="The location of the result directory", default="results"
-    )
-    parser.add_argument(
-        "--config_file",
-        help="The location of the config file",
-        default="configs/config.json",
-    )
-
-    parser.add_argument(
-        "--remove_intermediate_files",
-        help="Remove intermediate results after completion",
-        action="store_true",
-        default=False,
-    )
-
-    parser.add_argument(
-        "--write_initial_search_pickle",
-        help="Write initial search pickles",
-        action="store_true",
-        default=False,
-    )
-
-    # Default: read initial search pickles (can be disabled with --no-read_initial_search_pickle)
-    parser.add_argument(
-        "--read_initial_search_pickle",
-        dest="read_initial_search_pickle",
-        help="Read initial search pickles",
-        action="store_true",
-    )
-    parser.add_argument(
-        "--no-read_initial_search_pickle",
-        dest="read_initial_search_pickle",
-        help="Do not read initial search pickles",
-        action="store_false",
-    )
-    parser.set_defaults(read_initial_search_pickle=True)
-
-    parser.add_argument(
-        "--write_deeplc_pickle",
-        help="Write DeepLC pickles",
-        action="store_true",
-        default=False,
-    )
-
-    parser.add_argument(
-        "--write_ms2pip_pickle",
-        help="Write MS2PIP pickles",
-        action="store_true",
-        default=False,
-    )
-
-    # Default: read DeepLC pickles (can be disabled with --no-read_deeplc_pickle)
-    parser.add_argument(
-        "--read_deeplc_pickle",
-        dest="read_deeplc_pickle",
-        help="Read DeepLC pickles",
-        action="store_true",
-    )
-    parser.add_argument(
-        "--no-read_deeplc_pickle",
-        dest="read_deeplc_pickle",
-        help="Do not read DeepLC pickles",
-        action="store_false",
-    )
-    parser.set_defaults(read_deeplc_pickle=True)
-
-    # Default: read MS2PIP pickles (can be disabled with --no-read_ms2pip_pickle)
-    parser.add_argument(
-        "--read_ms2pip_pickle",
-        dest="read_ms2pip_pickle",
-        help="Read MS2PIP pickles",
-        action="store_true",
-    )
-    parser.add_argument(
-        "--no-read_ms2pip_pickle",
-        dest="read_ms2pip_pickle",
-        help="Do not read MS2PIP pickles",
-        action="store_false",
-    )
-    parser.set_defaults(read_ms2pip_pickle=True)
-
-    parser.add_argument(
-        "--write_correlation_pickles",
-        help="Write correlation pickles",
-        action="store_true",
-        default=False,
-    )
-
-    # Default: read correlation pickles (can be disabled with --no-read_correlation_pickles)
-    parser.add_argument(
-        "--read_correlation_pickles",
-        dest="read_correlation_pickles",
-        help="Read correlation pickles",
-        action="store_true",
-    )
-    parser.add_argument(
-        "--no-read_correlation_pickles",
-        dest="read_correlation_pickles",
-        help="Do not read correlation pickles",
-        action="store_false",
-    )
-    parser.set_defaults(read_correlation_pickles=True)
-
-    # Default: use DeepLC transfer learning (can be disabled with --no-dlc_transfer_learn)
-    parser.add_argument(
-        "--dlc_transfer_learn",
-        dest="dlc_transfer_learn",
-        help="Use DeepLC transfer learning",
-        action="store_true",
-    )
-    parser.add_argument(
-        "--no-dlc_transfer_learn",
-        dest="dlc_transfer_learn",
-        help="Disable DeepLC transfer learning",
-        action="store_false",
-    )
-    parser.set_defaults(dlc_transfer_learn=True)
-
-    parser.add_argument(
-        "--write_full_search_pickle",
-        help="Write full search pickles",
-        action="store_true",
-        default=False,
-    )
-
-    # Default: read full search pickles (can be disabled with --no-read_full_search_pickle)
-    parser.add_argument(
-        "--read_full_search_pickle",
-        dest="read_full_search_pickle",
-        help="Read full search pickles",
-        action="store_true",
-    )
-    parser.add_argument(
-        "--no-read_full_search_pickle",
-        dest="read_full_search_pickle",
-        help="Do not read full search pickles",
-        action="store_false",
-    )
-    parser.set_defaults(read_full_search_pickle=True)
+from parsers.parser_mzml import get_ms1_mzml, split_mzml_by_retention_time
+from parsers.parser_parquet import parquet_reader
+from peptide_search.wrapper_sage import retention_window_searches, run_sage
+from prediction_wrappers.wrapper_deeplc import retrain_and_bounds
+from sequence.fasta import tryptic_digest_pyopenms
 
-    parser.add_argument(
-        "--fdr_init_search",
-        help="Q-value (FDR) threshold for initial search filtering",
-        type=float,
-        default=0.05,
-    )
-
-    # Additional possible configuration overrides from CLI
-    parser.add_argument(
-        "--sage_basic", help="Override sage basic settings in config", type=str
-    )
-    parser.add_argument(
-        "--mumdia_fdr", help="Override mumdia FDR setting in config", type=float
-    )
-
-    return parser, parser.parse_args()
-
-
-def was_arg_explicitly_provided(parser: argparse.ArgumentParser, arg_name: str) -> bool:
+def run_initial_search(config_obj, result_dir, result_temp_results_initial_search, pickle_config):
     """
-    Check if an argument with destination `arg_name` was explicitly provided on the command line.
-
-    Args:
-        parser: ArgumentParser object containing argument definitions
-        arg_name: Destination name of the argument to check
-
+    STAGE 1: Initial Search for Retention Time Model Training
+    
+    The MuMDIA pipeline uses a two-stage search strategy:
+    1. Initial broad search: Used to train DeepLC retention time models
+    2. Targeted search: Uses RT predictions to partition data for faster, more accurate searches
+    
     Returns:
-        True if the argument was explicitly provided, False otherwise
-    """
-    for action in parser._actions:
-        if action.dest == arg_name:
-            for option in action.option_strings:
-                # If any of the option flags for this argument is present in sys.argv, consider it provided.
-                if option in sys.argv:
-                    return True
-    return False
-
-
-def modify_config(
-    config_file: str,
-    result_dir: str,
-    parser: argparse.ArgumentParser,
-    args: argparse.Namespace,
-) -> str:
-    """
-    Load existing JSON (if any), merge with defaults + env + explicit CLI, and write to results.
-
-    Returns path to updated config JSON.
-    """
-    # Load existing configuration if it exists
-    existing_config = None
-    if os.path.exists(config_file):
-        with open(config_file, "r") as file:
-            existing_config = json.load(file)
-    else:
-        log_info(
-            f"Warning: Config file '{config_file}' not found. Using argparse defaults + env + CLI."
-        )
-
-    merged = merge_config_from_sources(existing_config, parser, args)
-    return write_updated_config(merged, result_dir)
-
-
-def main() -> str:
+        Tuple of (df_fragment, df_psms, df_fragment_max, df_fragment_max_peptide, dlc_transfer_learn)
     """
-    Main MuMDIA workflow orchestrator.
-
-    This function coordinates the entire MuMDIA pipeline using argparse + JSON config.
-    """
-    log_info("Parsing command line arguments...")
-    parser, args = parse_arguments()
-
-    log_info("Creating the result directory...")
-    result_dir, result_temp, result_temp_results_initial_search = create_dirs(args)
-
-    log_info("Updating configuration if needed and saving to results folder...")
-    new_config_file = modify_config(
-        args.config_file, result_dir=args.result_dir, parser=parser, args=args
-    )
-
-    log_info("Reading the updated configuration JSON file...")
-    with open(new_config_file, "r") as file:
-        config = json.load(file)
-
-    # Lazy imports for heavy modules to avoid import errors during test collection
-    import mumdia
-    from parsers.parser_mzml import get_ms1_mzml, split_mzml_by_retention_time
-    from parsers.parser_parquet import parquet_reader
-    from peptide_search.wrapper_sage import retention_window_searches, run_sage
-    from prediction_wrappers.wrapper_deeplc import retrain_and_bounds
-    from sequence.fasta import tryptic_digest_pyopenms
-
-    args_dict = config["mumdia"]
-
-    # Configure pickle settings once for the entire workflow
-    pickle_config = PickleConfig(
-        write_deeplc=args_dict["write_deeplc_pickle"],
-        write_ms2pip=args_dict["write_ms2pip_pickle"],
-        write_correlation=args_dict["write_correlation_pickles"],
-        read_deeplc=args_dict["read_deeplc_pickle"],
-        read_ms2pip=args_dict["read_ms2pip_pickle"],
-        read_correlation=args_dict["read_correlation_pickles"],
-    )
-
-    # ============================================================================
-    # STAGE 1: Initial Search for Retention Time Model Training
-    # ============================================================================
-    # The MuMDIA pipeline uses a two-stage search strategy:
-    # 1. Initial broad search: Used to train DeepLC retention time models
-    # 2. Targeted search: Uses RT predictions to partition data for faster, more accurate searches
-
-    # Check if all required initial search pickle files exist
-    initial_search_pickles = [
-        "df_fragment_initial_search.pkl",
-        "df_psms_initial_search.pkl",
-        "df_fragment_max_initial_search.pkl",
-        "df_fragment_max_peptide_initial_search.pkl",
-        "config_initial_search.pkl",
-        "dlc_transfer_learn_initial_search.pkl",
-        "flags_initial_search.pkl",
-    ]
-    initial_search_pickles_exist = all(
-        os.path.exists(result_dir.joinpath(pickle_file))
-        for pickle_file in initial_search_pickles
-    )
-
+    # Get initial search config and mumdia settings
+    initial_config = config_obj.get_initial_search_config()
+    mumdia_config = config_obj.get_mumdia_config()
+    
     # Initialize variables to satisfy type checking and ensure defined in all branches
     df_fragment = pl.DataFrame()
     df_psms = pl.DataFrame()
@@ -330,25 +56,25 @@ def main() -> str:
     df_fragment_max_peptide = pl.DataFrame()
     dlc_transfer_learn = None
 
-    if args_dict["write_initial_search_pickle"] or not initial_search_pickles_exist:
+    if not mumdia_config["read_initial_search_pickle"]:
         log_info("Running initial Sage search for RT model training...")
-        # TODO: Earlier, implement a check whether the mzML file exists, because otherwise Sage will still run on an non-existing file and later on an error will be raised that is not very informative.
+        # TODO: Earlier, implement a check whether the mzML file exists, because 
+        # otherwise Sage will still run on an non-existing file and later on an error 
+        # will be raised that is not very informative.
         run_sage(
-            config["sage_basic"],
-            args_dict["fasta_file"],
-            result_dir.joinpath(result_temp, result_temp_results_initial_search),
+            initial_config,
+            config_obj.fasta_file,
+            result_temp_results_initial_search,
         )
 
         df_fragment, df_psms, df_fragment_max, df_fragment_max_peptide = parquet_reader(
-            parquet_file_results=result_dir.joinpath(
-                result_temp, result_temp_results_initial_search, "results.sage.parquet"
+            parquet_file_results=result_temp_results_initial_search.joinpath(
+                "results.sage.parquet"
             ),
-            parquet_file_fragments=result_dir.joinpath(
-                result_temp,
-                result_temp_results_initial_search,
+            parquet_file_fragments=result_temp_results_initial_search.joinpath(
                 "matched_fragments.sage.parquet",
             ),
-            q_value_filter=args_dict["fdr_init_search"],
+            q_value_filter=config_obj.fdr_init_search,
         )
 
         # Narrow types for static analysis
@@ -357,16 +83,20 @@ def main() -> str:
         assert isinstance(df_fragment_max, pl.DataFrame)
         assert isinstance(df_fragment_max_peptide, pl.DataFrame)
 
+    if mumdia_config["write_initial_search_pickle"]:
+        # Create legacy config format for pickling compatibility
+        legacy_config = config_obj.to_legacy_format()
+        
         pickling.write_variables_to_pickles(
             df_fragment=cast(pl.DataFrame, df_fragment),
             df_psms=cast(pl.DataFrame, df_psms),
             df_fragment_max=cast(pl.DataFrame, df_fragment_max),
             df_fragment_max_peptide=cast(pl.DataFrame, df_fragment_max_peptide),
-            config=config,
+            config=legacy_config,
             dlc_transfer_learn=None,
             pickle_config=pickle_config,
-            write_full_search_pickle=args_dict["write_full_search_pickle"],
-            read_full_search_pickle=args_dict["read_full_search_pickle"],
+            write_full_search_pickle=mumdia_config["write_full_search_pickle"],
+            read_full_search_pickle=mumdia_config["read_full_search_pickle"],
             df_fragment_fname="df_fragment_initial_search.pkl",
             df_psms_fname="df_psms_initial_search.pkl",
             df_fragment_max_fname="df_fragment_max_initial_search.pkl",
@@ -378,7 +108,7 @@ def main() -> str:
             write_to_tsv=False,
         )
 
-    if args_dict["read_initial_search_pickle"]:
+    if mumdia_config["read_initial_search_pickle"]:
         (
             df_fragment,
             df_psms,
@@ -398,9 +128,9 @@ def main() -> str:
             flags_fname="flags_initial_search.pkl",
         )
 
-        del flags["write_full_search_pickle"]
-        del flags["read_full_search_pickle"]
-        args_dict.update(flags)
+        # Update the config object with any flags that were saved
+        # Note: In the new system, flags are handled through the config object
+        # so we don't need to update args_dict like before
 
     # Ensure DataFrames are concrete types for downstream usage
     assert isinstance(df_psms, pl.DataFrame)
@@ -409,15 +139,36 @@ def main() -> str:
     assert isinstance(df_fragment_max_peptide, pl.DataFrame)
 
     log_info("Number of PSMs after initial search: {}".format(len(df_psms)))
+    
+    return df_fragment, df_psms, df_fragment_max, df_fragment_max_peptide, dlc_transfer_learn
 
-    # ============================================================================
-    # STAGE 2: Targeted Search with Retention Time Partitioning
-    # ============================================================================
-    # This stage uses the trained DeepLC model to predict retention times for all
-    # possible peptides, then partitions the mzML data by retention time for
-    # targeted searches that are both faster and more accurate.
 
-    # Check if all required initial search pickle files exist
+def run_targeted_search(config_obj, result_dir, pickle_config, df_fragment, df_psms, df_fragment_max, df_fragment_max_peptide, dlc_transfer_learn):
+    """
+    STAGE 2: Targeted Search with Retention Time Partitioning
+    
+    This stage uses the trained DeepLC model to predict retention times for all
+    possible peptides, then partitions the mzML data by retention time for
+    targeted searches that are both faster and more accurate.
+    
+    Args:
+        config_obj: MuMDIAConfig object
+        result_dir: Result directory path
+        pickle_config: Pickle configuration
+        df_fragment: Fragment DataFrame from initial search
+        df_psms: PSMs DataFrame from initial search
+        df_fragment_max: Fragment max DataFrame from initial search
+        df_fragment_max_peptide: Fragment max peptide DataFrame from initial search
+        dlc_transfer_learn: DeepLC transfer learning model
+    
+    Returns:
+        Tuple of (df_fragment, df_psms, df_fragment_max, df_fragment_max_peptide, dlc_transfer_learn)
+    """
+    # Get full search config and mumdia settings
+    full_config = config_obj.get_full_search_config()
+    mumdia_config = config_obj.get_mumdia_config()
+    
+    # Check if all required full search pickle files exist
     full_search_pickles = [
         "df_fragment.pkl",
         "df_psms.pkl",
@@ -433,9 +184,9 @@ def main() -> str:
         for pickle_file in full_search_pickles
     )
 
-    if args_dict["write_full_search_pickle"] or not full_search_pickles_exist:
+    if mumdia_config["write_full_search_pickle"] or not full_search_pickles_exist:
         log_info("Generating peptide library and training DeepLC model...")
-        peptides = tryptic_digest_pyopenms(config["sage"]["database"]["fasta"])
+        peptides = tryptic_digest_pyopenms(config_obj.fasta_file)
 
         # Train DeepLC retention time model and calculate prediction bounds
         # Narrow type for static analysis
@@ -446,17 +197,20 @@ def main() -> str:
 
         log_info("Partitioning mzML files by predicted retention time...")
         mzml_dict = split_mzml_by_retention_time(
-            config["sage_basic"]["mzml_paths"][0],  # use configured mzML
+            config_obj.mzml_file,  # use configured mzML
             time_interval=perc_95,
             dir_files=str(result_dir),
         )
 
+        # Create legacy config format for retention window searches
+        legacy_config = config_obj.to_legacy_format()
+        
         (
             df_fragment,
             df_psms,
             df_fragment_max,
             df_fragment_max_peptide,
-        ) = retention_window_searches(mzml_dict, peptide_df, config, perc_95)
+        ) = retention_window_searches(mzml_dict, peptide_df, legacy_config, perc_95)
 
         log_info("Adding the PSM identifier to fragments...")
         df_fragment = df_fragment.join(
@@ -474,16 +228,16 @@ def main() -> str:
             df_psms=cast(pl.DataFrame, df_psms),
             df_fragment_max=cast(pl.DataFrame, df_fragment_max),
             df_fragment_max_peptide=cast(pl.DataFrame, df_fragment_max_peptide),
-            config=config,
+            config=legacy_config,
             dlc_transfer_learn=dlc_transfer_learn,
             pickle_config=pickle_config,
-            write_full_search_pickle=args_dict["write_full_search_pickle"],
-            read_full_search_pickle=args_dict["read_full_search_pickle"],
+            write_full_search_pickle=mumdia_config["write_full_search_pickle"],
+            read_full_search_pickle=mumdia_config["read_full_search_pickle"],
             dir=result_dir,
             write_to_tsv=True,
         )
 
-    if args_dict["read_full_search_pickle"]:
+    if mumdia_config["read_full_search_pickle"]:
         (
             df_fragment,
             df_psms,
@@ -493,7 +247,73 @@ def main() -> str:
             dlc_transfer_learn,
             flags,
         ) = pickling.read_variables_from_pickles(dir=result_dir)
-        args_dict.update(flags)
+        # Note: In the new system, flags are handled through the config object
+
+    return df_fragment, df_psms, df_fragment_max, df_fragment_max_peptide, dlc_transfer_learn  
+
+def main() -> str:
+    """
+    Main MuMDIA workflow orchestrator.
+
+    This function coordinates the entire MuMDIA pipeline using the new simplified config system.
+    """
+    import argparse
+    import sys
+    from config import load_config_from_json
+    
+    # Parse command line arguments
+    parser = argparse.ArgumentParser(description="Run MuMDIA workflow")
+    parser.add_argument("config_file", help="Path to JSON configuration file")
+    args = parser.parse_args()
+    
+    # Load configuration from JSON file
+    try:
+        config_obj = load_config_from_json(args.config_file)
+        log_info(f"Loaded configuration from {args.config_file}")
+    except Exception as e:
+        log_info(f"Error loading configuration: {e}")
+        sys.exit(1)
+    
+    # Ensure we're in the correct conda environment
+    conda_env = os.environ.get('CONDA_DEFAULT_ENV')
+    if conda_env != 'py312':
+        log_info(f"Warning: Expected conda environment 'py312', but currently in '{conda_env}'")
+        log_info("Please run: conda activate py312")
+    
+    log_info(f"Starting MuMDIA workflow with config file: {args.config_file}")
+    
+    # Create directories
+    result_dir = Path(config_obj.result_dir)
+    result_temp = result_dir / "temp"
+    result_temp_results_initial_search = result_temp / "initial_search_results"
+    
+    # Create all necessary directories
+    result_dir.mkdir(parents=True, exist_ok=True)
+    result_temp.mkdir(parents=True, exist_ok=True)
+    result_temp_results_initial_search.mkdir(parents=True, exist_ok=True)
+    
+    # Get mumdia configuration
+    mumdia_config = config_obj.get_mumdia_config()
+
+    # Configure pickle settings once for the entire workflow
+    pickle_config = PickleConfig(
+        write_deeplc=mumdia_config["write_deeplc_pickle"],
+        write_ms2pip=mumdia_config["write_ms2pip_pickle"],
+        write_correlation=mumdia_config["write_correlation_pickles"],
+        read_deeplc=mumdia_config["read_deeplc_pickle"],
+        read_ms2pip=mumdia_config["read_ms2pip_pickle"],
+        read_correlation=mumdia_config["read_correlation_pickles"],
+    )
+
+    # Run initial search (Stage 1)
+    df_fragment, df_psms, df_fragment_max, df_fragment_max_peptide, dlc_transfer_learn = run_initial_search(
+        config_obj, result_dir, result_temp_results_initial_search, pickle_config
+    )
+
+    # Run targeted search (Stage 2)
+    df_fragment, df_psms, df_fragment_max, df_fragment_max_peptide, dlc_transfer_learn = run_targeted_search(
+        config_obj, result_dir, pickle_config, df_fragment, df_psms, df_fragment_max, df_fragment_max_peptide, dlc_transfer_learn
+    )
 
     # ============================================================================
     # STAGE 3: Feature Calculation and Machine Learning Pipeline
@@ -501,7 +321,7 @@ def main() -> str:
     # Parse mzML to extract MS1 precursor information for additional features
     log_info("Parsing the mzML file for MS1 precursor information...")
     ms1_dict, ms2_to_ms1_dict, ms2_spectra = get_ms1_mzml(
-        config["sage_basic"]["mzml_paths"][0]  # TODO: should be for all mzml files
+        config_obj.mzml_file  # Using the mzml_file from the new config object
     )
 
     # Execute the main MuMDIA feature calculation and machine learning pipeline
@@ -522,7 +342,7 @@ def main() -> str:
         df_psms=df_psms,
         df_fragment_max=df_fragment_max,
         df_fragment_max_peptide=df_fragment_max_peptide,
-        config=config,
+        config=config_obj.to_legacy_format(),  # Convert to legacy format for compatibility
         deeplc_model=dlc_transfer_learn,
         pickle_config=pickle_config,
         spectra_data=spectra_data,
@@ -532,11 +352,11 @@ def main() -> str:
     # STAGE 4: Optional Cleanup and Final Processing
     # ============================================================================
     # Clean up intermediate files if requested to save disk space
-    if args_dict["remove_intermediate_files"]:
+    if config_obj.remove_intermediate_files:
         log_info("Cleaning up intermediate files...")
-        remove_intermediate_files(args_dict["result_dir"])
+        remove_intermediate_files(config_obj.result_dir)
 
-    return config["mumdia"]["result_dir"]
+    return config_obj.result_dir
 
 
 if __name__ == "__main__":
diff --git a/run_simple.py b/run_simple.py
index 7a07782..e69de29 100644
--- a/run_simple.py
+++ b/run_simple.py
@@ -1,79 +0,0 @@
-#!/usr/bin/env python3
-"""
-MuMDIA (Multi-modal Data-Independent Acquisition) - Simplified Main Workflow
-
-This demonstrates the new simplified configuration approach for MuMDIA.
-This is much cleaner than the original run.py with complex argument parsing.
-
-Usage:
-    python run_simple.py --mzml_file data.mzML --fasta_file proteins.fasta --result_dir results/
-    python run_simple.py --config_file my_config.json
-    python run_simple.py --no-cache  # Force recomputation
-"""
-
-import os
-
-os.environ["POLARS_MAX_THREADS"] = "1"
-
-from pathlib import Path
-
-from config_manager_clean import get_config
-from data_structures import PickleConfig
-from utilities.logger import log_info
-
-
-def main():
-    """
-    Main execution function using the simplified configuration approach.
-
-    Compare this to the complex original run.py:
-    - No complex argument parsing (100+ lines reduced to 1 line: get_config())
-    - No manual config merging and override logic
-    - Clean, readable configuration access
-    - Automatic config file saving for reference
-    """
-    # Get configuration - this replaces ~100 lines of complex parsing!
-    config = get_config()
-
-    log_info(f"Starting MuMDIA pipeline with config:")
-    log_info(f"  mzML file: {config.mzml_file}")
-    log_info(f"  FASTA file: {config.fasta_file}")
-    log_info(f"  Result directory: {config.result_dir}")
-    log_info(f"  Windows: {config.n_windows}")
-    log_info(f"  Training FDR: {config.training_fdr}")
-    log_info(f"  Final FDR: {config.final_fdr}")
-    log_info(f"  Model type: {config.model_type}")
-    log_info(f"  No cache: {config.no_cache}")
-    log_info(f"  Clean: {config.clean}")
-    log_info(f"  Sage only: {config.sage_only}")
-
-    # Create result directory
-    result_dir = Path(config.result_dir)
-    result_dir.mkdir(parents=True, exist_ok=True)
-
-    # Save the effective configuration for reference
-    config.save(str(result_dir / "effective_config.json"))
-    log_info(f"Saved effective configuration to {result_dir / 'effective_config.json'}")
-
-    # Configure pickle settings based on cache preference
-    pickle_config = PickleConfig()
-
-    # Now you can continue with the actual MuMDIA workflow
-    # The key difference is that configuration is clean and simple!
-
-    if config.sage_only:
-        log_info("Running Sage-only workflow...")
-        # Add Sage-only logic here
-    else:
-        log_info("Running full MuMDIA workflow...")
-        # Add full workflow logic here
-
-    if config.clean:
-        log_info("Cleaning up intermediate files...")
-        # Add cleanup logic here
-
-    log_info("MuMDIA pipeline completed successfully!")
-
-
-if __name__ == "__main__":
-    main()
diff --git a/test_config_compatibility.py b/test_config_compatibility.py
new file mode 100644
index 0000000..4474f22
--- /dev/null
+++ b/test_config_compatibility.py
@@ -0,0 +1,82 @@
+#!/usr/bin/env python3
+"""
+Test script to verify that both old and new config formats work with the new system.
+
+This demonstrates that the new system is fully backwards compatible.
+"""
+
+from config import load_config_from_json
+
+def test_config_format(config_path, format_name):
+    """Test loading and using a specific config format."""
+    print(f"\n{'='*60}")
+    print(f"🧪 Testing {format_name} Config Format")
+    print(f"📁 File: {config_path}")
+    print(f"{'='*60}")
+    
+    try:
+        # Load config
+        config = load_config_from_json(config_path)
+        print(f"✅ Config loaded successfully!")
+        
+        # Show basic parameters
+        print(f"\n📋 Basic Parameters:")
+        print(f"   mzML file: {config.mzml_file}")
+        print(f"   FASTA file: {config.fasta_file}")
+        print(f"   Result dir: {config.result_dir}")
+        
+        # Show search parameter differences
+        print(f"\n🔬 Search Parameters:")
+        initial_config = config.get_initial_search_config()
+        full_config = config.get_full_search_config()
+        
+        print(f"   Parameter           Initial Search    Full Search")
+        print(f"   cleave_at           {initial_config['database']['enzyme']['cleave_at']:15} {full_config['database']['enzyme']['cleave_at']}")
+        print(f"   deisotope           {str(initial_config['deisotope']):15} {str(full_config['deisotope'])}")
+        print(f"   report_psms         {str(initial_config['report_psms']):15} {str(full_config['report_psms'])}")
+        print(f"   max_variable_mods   {str(initial_config['database']['max_variable_mods']):15} {str(full_config['database']['max_variable_mods'])}")
+        
+        # Show MuMDIA settings
+        mumdia_config = config.get_mumdia_config()
+        print(f"\n📊 MuMDIA Settings:")
+        print(f"   FDR initial search: {config.fdr_init_search}")
+        print(f"   Read initial pickle: {mumdia_config['read_initial_search_pickle']}")
+        print(f"   Write initial pickle: {mumdia_config['write_initial_search_pickle']}")
+        
+        print(f"\n✅ {format_name} format works perfectly!")
+        return True
+        
+    except Exception as e:
+        print(f"❌ Error testing {format_name} format: {e}")
+        return False
+
+def main():
+    print("🔧 MuMDIA Config Backwards Compatibility Test")
+    print("Testing both old (nested) and new (flat) config formats...")
+    
+    # Test old nested format
+    old_works = test_config_format("configs/config.json", "Legacy/Old Nested")
+    
+    # Test new flat format
+    new_works = test_config_format("configs/config_simple.json", "New Simplified Flat")
+    
+    print(f"\n{'='*60}")
+    print("🎯 Test Summary")
+    print(f"{'='*60}")
+    print(f"Legacy config (nested):    {'✅ PASS' if old_works else '❌ FAIL'}")
+    print(f"New config (flat):         {'✅ PASS' if new_works else '❌ FAIL'}")
+    print(f"Backwards compatibility:   {'✅ MAINTAINED' if old_works and new_works else '❌ BROKEN'}")
+    
+    if old_works and new_works:
+        print(f"\n🎉 SUCCESS: Both config formats work!")
+        print(f"   • Users can keep using their existing config.json files")
+        print(f"   • Users can also switch to the new simplified format")
+        print(f"   • The new system automatically detects and converts formats")
+        print(f"\nTo run MuMDIA:")
+        print(f"   python run.py configs/config.json        # Old format")
+        print(f"   python run.py configs/config_simple.json # New format")
+    else:
+        print(f"\n❌ FAILURE: Config compatibility is broken!")
+
+if __name__ == "__main__":
+    main()
diff --git a/utilities/plotting.py b/utilities/plotting.py
index deae7e2..d38981d 100644
--- a/utilities/plotting.py
+++ b/utilities/plotting.py
@@ -5,7 +5,7 @@
 from matplotlib.lines import Line2D
 
 
-def plot_XIC(df: pl.DataFrame, output_dir: str = "xics"):
+def plot_XIC(df: pl.DataFrame, output_dir: str = "results"):
     """
     Plots fragment_intensity vs rt for each unique fragment_name.
     Colors by fragment_name, lines connect fragments, marker shape by psm_id.