script3r
diff --git a/README.md b/README.md
Lines changed: 20 additions & 4 deletions
diff --git a/crates/cbom-generator/src/algorithm_detector.rs b/crates/cbom-generator/src/algorithm_detector.rs
Lines changed: 49 additions & 39 deletions
diff --git a/crates/cbom-generator/src/certificate_parser.rs b/crates/cbom-generator/src/certificate_parser.rs
Lines changed: 21 additions & 55 deletions
@@ -4,7 +4,7 @@
   <img src="cipherscope.png" alt="CipherScope Logo" width="350" height="350">
 </div>
 
-Fast cryptographic inventory generator. Scans codebases to identify cryptographic algorithms and assess quantum resistance.
+Fast cryptographic inventory generator that creates Minimal Viable Cryptographic Bill of Materials (MV-CBOM) documents. Scans codebases to identify cryptographic algorithms and certificates, and to assess post-quantum cryptography readiness.
 
 ## Quick Start
 
@@ -39,9 +39,25 @@ cargo build --release
 
 ## Options
 
+### Core Options
 - `--patterns PATH` - Custom patterns file (default: `patterns.toml`)
-- `--progress` - Show progress bar
-- `--deterministic` - Reproducible output for testing
+- `--progress` - Show progress bar during scanning
+- `--deterministic` - Reproducible output for testing/ground-truth generation
+- `--output FILE` - Output file for single-project CBOM (default: stdout)
+- `--recursive` - Generate MV-CBOMs for all discovered projects
+- `--output-dir DIR` - Output directory for recursive CBOMs
+
+### Filtering & Performance
+- `--threads N` - Number of processing threads
+- `--max-file-size MB` - Maximum file size to scan (default: 2MB)
+- `--include-glob GLOB` - Include files matching glob pattern(s)
+- `--exclude-glob GLOB` - Exclude files matching glob pattern(s)
+
+### Certificate Scanning
+- `--skip-certificates` - Skip certificate scanning during CBOM generation
+
+### Configuration
+- `--print-config` - Print merged patterns/config and exit
 
 ## Languages Supported
 
@@ -81,4 +97,4 @@ cargo test
 
 ## License
 
-MIT
+MIT
@@ -51,43 +51,40 @@ impl AlgorithmDetector {
         scan_path: &Path,
         findings: &[Finding],
     ) -> Result<Vec<CryptoAsset>> {
+        let registry = match &self.registry {
+            Some(registry) => registry,
+            None => return Ok(Vec::new()),
+        };
+
         let mut algorithms = Vec::new();
         let mut seen_algorithms = HashSet::new();
 
-        if let Some(registry) = &self.registry {
-            // Extract algorithms from findings using registry patterns
-            for finding in findings {
-                if let Some(algorithm_assets) =
-                    self.extract_algorithms_from_finding_with_registry(finding, registry)?
-                {
-                    for asset in algorithm_assets {
-                        let key = self.create_deduplication_key(&asset);
-                        if seen_algorithms.insert(key) {
-                            algorithms.push(asset);
-                        }
-                    }
-                }
-            }
-
-            // Only perform deep static analysis if we have a reasonable number of findings
-            // Skip for large codebases to avoid performance issues
-            if findings.len() < 1000 {
-                let additional_algorithms =
-                    self.perform_deep_static_analysis_with_registry(scan_path, registry)?;
-                for asset in additional_algorithms {
+        // Extract algorithms from findings using registry patterns
+        for finding in findings {
+            if let Some(algorithm_assets) =
+                self.extract_algorithms_from_finding_with_registry(finding, registry)?
+            {
+                for asset in algorithm_assets {
                     let key = self.create_deduplication_key(&asset);
                     if seen_algorithms.insert(key) {
                         algorithms.push(asset);
                     }
                 }
             }
-        } else {
-            // No registry available; skip instead of using static fallbacks.
+        }
+
+        // Always perform deep static analysis regardless of findings count
+        let additional_algorithms =
+            self.perform_deep_static_analysis_with_registry(scan_path, registry)?;
+        for asset in additional_algorithms {
+            let key = self.create_deduplication_key(&asset);
+            if seen_algorithms.insert(key) {
+                algorithms.push(asset);
+            }
         }
 
         // Merge duplicate algorithms with different parameter specificity
-        let merged_algorithms = self.merge_algorithm_assets(algorithms);
-        Ok(merged_algorithms)
+        Ok(self.merge_algorithm_assets(algorithms))
     }
 
     /// Extract algorithms from finding using pattern registry
@@ -119,7 +116,7 @@ impl AlgorithmDetector {
                         parameters,
                         Some(finding.library.clone()),
                         Some(AssetEvidence {
-                            file: finding.file.display().to_string(),
+                            file: finding.file.to_string_lossy().to_string(),
                             detector_id: finding.detector_id.clone(),
                             line: finding.span.line,
                             column: finding.span.column,
@@ -258,20 +255,18 @@ impl AlgorithmDetector {
     ) -> Result<Vec<CryptoAsset>> {
         let mut algorithms = Vec::new();
 
-        // Only analyze a limited number of files to avoid performance issues
-        const MAX_FILES_TO_ANALYZE: usize = 100;
-        let mut files_analyzed = 0;
+        // Analyze files for parameter extraction - removed arbitrary limits for comprehensive scanning
+        let mut _files_analyzed = 0;
 
         // Walk through source files for parameter extraction
         for entry in WalkDir::new(scan_path)
-            .max_depth(5) // Limit depth to avoid deep recursion
+            .max_depth(20) // Support very deep directory structures
             .into_iter()
             .filter_map(|e| e.ok())
             .filter(|e| e.file_type().is_file())
         {
-            if files_analyzed >= MAX_FILES_TO_ANALYZE {
-                break; // Stop after analyzing enough files
-            }
+            // Note: Removed MAX_FILES_TO_ANALYZE limit for comprehensive cryptographic analysis
+            // In large codebases, crypto usage can be deeply nested and limits can miss important findings
 
             let path = entry.path();
 
@@ -285,7 +280,7 @@ impl AlgorithmDetector {
                 ) {
                     if let Ok(mut extracted) = self.analyze_file_with_registry(path, registry) {
                         algorithms.append(&mut extracted);
-                        files_analyzed += 1;
+                        _files_analyzed += 1;
                     }
                 }
             }
@@ -373,18 +368,33 @@ impl AlgorithmDetector {
         Ok(algorithms)
     }
 
-    /// Create a proper deduplication key based on algorithm properties, not bom_ref
+    /// Create a deduplication key based on algorithm properties AND evidence location
+    /// This ensures same algorithms from different files are reported separately
     fn create_deduplication_key(&self, asset: &CryptoAsset) -> String {
         match &asset.asset_properties {
             AssetProperties::Algorithm(props) => {
-                // Deduplicate by algorithm name, primitive, and source library to avoid merging
-                // different libraries' detections of the same algorithm (e.g., OpenSSL vs CommonCrypto).
+                // Include evidence location to allow multiple instances from different files/locations
                 let library = asset.source_library.as_deref().unwrap_or("unknown-library");
+                let params_key = props
+                    .parameter_set
+                    .as_ref()
+                    .map(|p| format!("{:?}", p))
+                    .unwrap_or_else(|| "no-params".to_string());
+
+                // Include file and line information to allow same algorithm from different locations
+                let evidence_key = if let Some(evidence) = &asset.evidence {
+                    format!("{}:{}:{}", evidence.file, evidence.line, evidence.column)
+                } else {
+                    "no-evidence".to_string()
+                };
+
                 format!(
-                    "{}:{}:{}",
+                    "{}:{}:{}:{}:{}",
                     asset.name.as_deref().unwrap_or("unknown"),
                     props.primitive as u8,
-                    library
+                    library,
+                    params_key,
+                    evidence_key
                 )
             }
             _ => format!(
 
@@ -191,7 +191,7 @@ impl CertificateParser {
         }
     }
 
-    /// Map signature algorithm OID to algorithm properties
+    /// Map signature algorithm OID to algorithm properties (for tests)
     #[cfg(test)]
     fn map_signature_algorithm(
         &self,
@@ -202,113 +202,79 @@ impl CertificateParser {
         u8,
         Option<serde_json::Value>,
     ) {
-        match oid {
+        let (name, primitive, level) = match oid {
             // RSA signature algorithms - all vulnerable to quantum attacks
-            "1.2.840.113549.1.1.1" => (
-                "RSA".to_string(),
-                crate::CryptographicPrimitive::Signature,
-                0,
-                None,
-            ),
-            "1.2.840.113549.1.1.4" => (
-                "RSA with MD5".to_string(),
-                crate::CryptographicPrimitive::Signature,
-                0,
-                None,
-            ),
+            "1.2.840.113549.1.1.1" => ("RSA", crate::CryptographicPrimitive::Signature, 0),
+            "1.2.840.113549.1.1.4" => ("RSA with MD5", crate::CryptographicPrimitive::Signature, 0),
             "1.2.840.113549.1.1.5" => (
-                "RSA with SHA-1".to_string(),
+                "RSA with SHA-1",
                 crate::CryptographicPrimitive::Signature,
                 0,
-                None,
             ),
             "1.2.840.113549.1.1.11" => (
-                "RSA with SHA-256".to_string(),
+                "RSA with SHA-256",
                 crate::CryptographicPrimitive::Signature,
                 0,
-                None,
             ),
             "1.2.840.113549.1.1.12" => (
-                "RSA with SHA-384".to_string(),
+                "RSA with SHA-384",
                 crate::CryptographicPrimitive::Signature,
                 0,
-                None,
             ),
             "1.2.840.113549.1.1.13" => (
-                "RSA with SHA-512".to_string(),
+                "RSA with SHA-512",
                 crate::CryptographicPrimitive::Signature,
                 0,
-                None,
             ),
 
             // ECDSA signature algorithms - all vulnerable to quantum attacks
             "1.2.840.10045.4.1" => (
-                "ECDSA with SHA-1".to_string(),
+                "ECDSA with SHA-1",
                 crate::CryptographicPrimitive::Signature,
                 0,
-                None,
             ),
             "1.2.840.10045.4.3.1" => (
-                "ECDSA with SHA-224".to_string(),
+                "ECDSA with SHA-224",
                 crate::CryptographicPrimitive::Signature,
                 0,
-                None,
             ),
             "1.2.840.10045.4.3.2" => (
-                "ECDSA with SHA-256".to_string(),
+                "ECDSA with SHA-256",
                 crate::CryptographicPrimitive::Signature,
                 0,
-                None,
             ),
             "1.2.840.10045.4.3.3" => (
-                "ECDSA with SHA-384".to_string(),
+                "ECDSA with SHA-384",
                 crate::CryptographicPrimitive::Signature,
                 0,
-                None,
             ),
             "1.2.840.10045.4.3.4" => (
-                "ECDSA with SHA-512".to_string(),
+                "ECDSA with SHA-512",
                 crate::CryptographicPrimitive::Signature,
                 0,
-                None,
             ),
 
             // EdDSA - also vulnerable to quantum attacks
-            "1.3.101.112" => (
-                "Ed25519".to_string(),
-                crate::CryptographicPrimitive::Signature,
-                0,
-                None,
-            ),
-            "1.3.101.113" => (
-                "Ed448".to_string(),
-                crate::CryptographicPrimitive::Signature,
-                0,
-                None,
-            ),
+            "1.3.101.112" => ("Ed25519", crate::CryptographicPrimitive::Signature, 0),
+            "1.3.101.113" => ("Ed448", crate::CryptographicPrimitive::Signature, 0),
 
             // DSA - vulnerable to quantum attacks
-            "1.2.840.10040.4.1" => (
-                "DSA".to_string(),
-                crate::CryptographicPrimitive::Signature,
-                0,
-                None,
-            ),
+            "1.2.840.10040.4.1" => ("DSA", crate::CryptographicPrimitive::Signature, 0),
             "1.2.840.10040.4.3" => (
-                "DSA with SHA-1".to_string(),
+                "DSA with SHA-1",
                 crate::CryptographicPrimitive::Signature,
                 0,
-                None,
             ),
 
             // Default case for unknown algorithms
             _ => (
-                format!("Unknown Algorithm (OID: {})", oid),
+                "Unknown Algorithm",
                 crate::CryptographicPrimitive::Signature,
                 0,
-                None,
             ),
-        }
+        };
+
+        (name.to_string(), primitive, level, None)
     }
 
     /// Convert ASN.1 time to Chrono DateTime