ooples
diff --git a/‎src/AiDotNet.csproj‎
Lines changed: 2 additions & 0 deletions b/‎src/AiDotNet.csproj‎
Lines changed: 2 additions & 0 deletions
diff --git a/‎src/Deployment/Configuration/ABTestingConfig.cs‎
Lines changed: 114 additions & 0 deletions b/‎src/Deployment/Configuration/ABTestingConfig.cs‎
Lines changed: 114 additions & 0 deletions
diff --git a/‎src/Deployment/Configuration/CacheConfig.cs‎
Lines changed: 92 additions & 0 deletions b/‎src/Deployment/Configuration/CacheConfig.cs‎
Lines changed: 92 additions & 0 deletions
diff --git a/‎src/Deployment/Configuration/DeploymentConfiguration.cs‎
Lines changed: 60 additions & 0 deletions b/‎src/Deployment/Configuration/DeploymentConfiguration.cs‎
Lines changed: 60 additions & 0 deletions
@@ -48,8 +48,10 @@
 	<ItemGroup>
 	  <PackageReference Include="Azure.Search.Documents" Version="11.7.0" />
 	  <PackageReference Include="Elastic.Clients.Elasticsearch" Version="9.2.1" />
+	  <PackageReference Include="Google.Protobuf" Version="3.28.3" />
 	  <PackageReference Include="Microsoft.CSharp" Version="4.7.0" />
 	  <PackageReference Include="Microsoft.Data.Sqlite" Version="8.0.21" />
+	  <PackageReference Include="Microsoft.ML.OnnxRuntime" Version="1.20.1" />
 	  <PackageReference Include="Newtonsoft.Json" Version="13.0.4" />
 	  <PackageReference Include="Pinecone.Client" Version="4.0.2" />
 	  <PackageReference Include="StackExchange.Redis" Version="2.9.32" />
 
@@ -0,0 +1,114 @@
+using AiDotNet.Enums;
+
+namespace AiDotNet.Deployment.Configuration;
+
+/// <summary>
+/// Configuration for A/B testing - comparing multiple model versions by splitting traffic.
+/// </summary>
+/// <remarks>
+/// <para><b>For Beginners:</b> A/B testing lets you try out a new model version on a small percentage
+/// of users before fully deploying it. This helps you:
+/// - Test new models in production safely
+/// - Compare performance between versions with real users
+/// - Gradually roll out changes to minimize risk
+/// - Make data-driven decisions about which model is better
+///
+/// How it works:
+/// You specify how to split traffic between versions. For example:
+/// - Version 1.0: 80% of traffic (current stable version)
+/// - Version 2.0: 20% of traffic (new experimental version)
+///
+/// Then you monitor metrics like accuracy, latency, and user satisfaction to decide
+/// which version is better.
+///
+/// Example:
+/// <code>
+/// var abConfig = new ABTestingConfig
+/// {
+///     Enabled = true,
+///     TrafficSplit = new Dictionary&lt;string, double&gt;
+///     {
+///         { "1.0.0", 0.9 },
+///         { "2.0.0", 0.1 }
+///     },
+///     ControlVersion = "1.0.0",
+///     AssignmentStrategy = AssignmentStrategy.Sticky
+/// };
+/// </code>
+/// </para>
+/// </remarks>
+public class ABTestingConfig
+{
+    /// <summary>
+    /// Gets or sets whether A/B testing is enabled (default: false).
+    /// </summary>
+    /// <remarks>
+    /// <para><b>For Beginners:</b> Set to true to enable traffic splitting between model versions.
+    /// False means all traffic goes to the default version.
+    /// </para>
+    /// </remarks>
+    public bool Enabled { get; set; } = false;
+
+    /// <summary>
+    /// Gets or sets the traffic split configuration.
+    /// </summary>
+    /// <remarks>
+    /// <para><b>For Beginners:</b> Dictionary mapping version name to traffic percentage (0.0 to 1.0).
+    /// Example: { "1.0": 0.8, "2.0": 0.2 } means 80% on v1.0, 20% on v2.0.
+    /// Percentages must sum to 1.0.
+    /// </para>
+    /// </remarks>
+    public Dictionary<string, double> TrafficSplit { get; set; } = new();
+
+    /// <summary>
+    /// Gets or sets the strategy for assigning users to versions (default: Random).
+    /// </summary>
+    /// <remarks>
+    /// <para><b>For Beginners:</b> How to assign requests to versions:
+    /// - Random: Each request randomly assigned based on traffic split
+    /// - Sticky: Users consistently get the same version (based on user ID hash)
+    /// - Gradual: Gradually shift traffic from old to new version over time
+    /// </para>
+    /// </remarks>
+    public AssignmentStrategy AssignmentStrategy { get; set; } = AssignmentStrategy.Random;
+
+    /// <summary>
+    /// Gets or sets the duration in days for the A/B test (default: 7).
+    /// </summary>
+    /// <remarks>
+    /// <para><b>For Beginners:</b> How long to run the test before analyzing results.
+    /// 7 days is typical for gathering meaningful data. After this, choose a winner.
+    /// </para>
+    /// </remarks>
+    public int TestDurationDays { get; set; } = 7;
+
+    /// <summary>
+    /// Gets or sets whether to track experiment assignment for each request (default: true).
+    /// </summary>
+    /// <remarks>
+    /// <para><b>For Beginners:</b> Records which version was used for each request.
+    /// Useful for analysis but adds slight overhead. Recommended for A/B testing.
+    /// </para>
+    /// </remarks>
+    public bool TrackAssignments { get; set; } = true;
+
+    /// <summary>
+    /// Gets or sets the minimum sample size per version before comparing results (default: 1000).
+    /// </summary>
+    /// <remarks>
+    /// <para><b>For Beginners:</b> Need at least this many samples before results are statistically significant.
+    /// 1000 is a good minimum. Don't make decisions with fewer samples.
+    /// </para>
+    /// </remarks>
+    public int MinSampleSize { get; set; } = 1000;
+
+    /// <summary>
+    /// Gets or sets the control group version (baseline for comparison).
+    /// </summary>
+    /// <remarks>
+    /// <para><b>For Beginners:</b> The current production version to compare against.
+    /// Typically your stable version. New versions are compared to this baseline.
+    /// </para>
+    /// </remarks>
+    public string? ControlVersion { get; set; }
+}
@@ -0,0 +1,92 @@
+using AiDotNet.Enums;
+
+namespace AiDotNet.Deployment.Configuration;
+
+/// <summary>
+/// Configuration for model caching - storing loaded models in memory to avoid repeated loading.
+/// </summary>
+/// <remarks>
+/// <para><b>For Beginners:</b> Loading an AI model from disk takes time. Caching keeps recently-used
+/// models in memory so they can be used again instantly, like keeping your frequently-used apps
+/// open on your phone instead of closing and reopening them.
+///
+/// Benefits:
+/// - Much faster inference (no model loading time)
+/// - Better throughput when serving multiple requests
+/// - Reduces disk I/O
+///
+/// Considerations:
+/// - Uses memory (RAM) to store models
+/// - Limited cache size - old models get evicted when full
+///
+/// Eviction Policies (what to remove when cache is full):
+/// - LRU (Least Recently Used): Removes models you haven't used in a while (recommended)
+/// - LFU (Least Frequently Used): Removes models used least often
+/// - FIFO: Removes oldest models first
+/// - Random: Removes random models (simple but unpredictable)
+///
+/// For most applications, LRU with a moderate max size works well.
+/// </para>
+/// </remarks>
+public class CacheConfig
+{
+    /// <summary>
+    /// Gets or sets whether caching is enabled (default: true).
+    /// </summary>
+    /// <remarks>
+    /// <para><b>For Beginners:</b> Set to true to enable caching, false to disable it entirely.
+    /// Caching is recommended for production systems to improve performance.
+    /// </para>
+    /// </remarks>
+    public bool Enabled { get; set; } = true;
+
+    /// <summary>
+    /// Gets or sets the maximum number of models to cache (default: 10).
+    /// </summary>
+    /// <remarks>
+    /// <para><b>For Beginners:</b> How many models to keep in memory simultaneously.
+    /// Higher values use more memory but reduce cache misses. 10 is a good default for most cases.
+    /// </para>
+    /// </remarks>
+    public int MaxCacheSize { get; set; } = 10;
+
+    /// <summary>
+    /// Gets or sets the cache eviction policy (default: LRU).
+    /// </summary>
+    /// <remarks>
+    /// <para><b>For Beginners:</b> Determines which model to remove when cache is full.
+    /// LRU (Least Recently Used) is recommended - it removes models you haven't used recently.
+    /// </para>
+    /// </remarks>
+    public CacheEvictionPolicy EvictionPolicy { get; set; } = CacheEvictionPolicy.LRU;
+
+    /// <summary>
+    /// Gets or sets the cache entry time-to-live in seconds (default: 3600 = 1 hour).
+    /// </summary>
+    /// <remarks>
+    /// <para><b>For Beginners:</b> How long unused models stay in cache before removal.
+    /// Default is 1 hour. Set to 0 to disable TTL (models only removed when cache is full).
+    /// </para>
+    /// </remarks>
+    public int TimeToLiveSeconds { get; set; } = 3600;
+
+    /// <summary>
+    /// Gets or sets whether to preload models on startup (default: false).
+    /// </summary>
+    /// <remarks>
+    /// <para><b>For Beginners:</b> If true, frequently-used models are loaded into cache at startup.
+    /// This eliminates first-request latency but increases startup time. Use for production servers.
+    /// </para>
+    /// </remarks>
+    public bool PreloadModels { get; set; } = false;
+
+    /// <summary>
+    /// Gets or sets whether to track cache hit/miss statistics (default: true).
+    /// </summary>
+    /// <remarks>
+    /// <para><b>For Beginners:</b> Tracks how often models are found in cache (hits) vs loaded from disk (misses).
+    /// Useful for monitoring and optimization but has tiny performance overhead. Recommended.
+    /// </para>
+    /// </remarks>
+    public bool TrackStatistics { get; set; } = true;
+}
@@ -0,0 +1,60 @@
+namespace AiDotNet.Deployment.Configuration;
+
+/// <summary>
+/// Aggregates all deployment-related configurations.
+/// Used to pass deployment settings from PredictionModelBuilder to PredictionModelResult.
+/// </summary>
+public class DeploymentConfiguration
+{
+    /// <summary>
+    /// Gets or sets the quantization configuration (null = no quantization).
+    /// </summary>
+    public QuantizationConfig? Quantization { get; set; }
+
+    /// <summary>
+    /// Gets or sets the caching configuration (null = use defaults).
+    /// </summary>
+    public CacheConfig? Caching { get; set; }
+
+    /// <summary>
+    /// Gets or sets the versioning configuration (null = use defaults).
+    /// </summary>
+    public VersioningConfig? Versioning { get; set; }
+
+    /// <summary>
+    /// Gets or sets the A/B testing configuration (null = disabled).
+    /// </summary>
+    public ABTestingConfig? ABTesting { get; set; }
+
+    /// <summary>
+    /// Gets or sets the telemetry configuration (null = use defaults).
+    /// </summary>
+    public TelemetryConfig? Telemetry { get; set; }
+
+    /// <summary>
+    /// Gets or sets the export configuration (null = use defaults).
+    /// </summary>
+    public ExportConfig? Export { get; set; }
+
+    /// <summary>
+    /// Creates a deployment configuration from individual config objects.
+    /// </summary>
+    public static DeploymentConfiguration Create(
+        QuantizationConfig? quantization,
+        CacheConfig? caching,
+        VersioningConfig? versioning,
+        ABTestingConfig? abTesting,
+        TelemetryConfig? telemetry,
+        ExportConfig? export)
+    {
+        return new DeploymentConfiguration
+        {
+            Quantization = quantization,
+            Caching = caching,
+            Versioning = versioning,
+            ABTesting = abTesting,
+            Telemetry = telemetry,
+            Export = export
+        };
+    }
+}