Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
158 changes: 158 additions & 0 deletions src/FederatedLearning/Aggregators/FedAvgAggregationStrategy.cs
Original file line number Diff line number Diff line change
@@ -0,0 +1,158 @@
namespace AiDotNet.FederatedLearning.Aggregators;

using AiDotNet.Interfaces;

/// <summary>
/// Implements the Federated Averaging (FedAvg) aggregation strategy.
/// </summary>
/// <remarks>
/// FedAvg is the foundational aggregation algorithm for federated learning, proposed by
/// McMahan et al. in 2017. It performs a weighted average of client model updates based
/// on the number of training samples each client has.
///
/// <b>For Beginners:</b> FedAvg is like calculating a weighted class average where students
/// who solved more practice problems have more influence on the final answer.
///
/// How FedAvg works:
/// 1. Each client trains on their local data and computes model updates
/// 2. Clients send their updated model weights to the server
/// 3. Server computes weighted average: weight = (client_samples / total_samples)
/// 4. New global model = Σ(weight_i × client_model_i)
///
/// For example, with 3 hospitals:
/// - Hospital A: 1000 patients, model accuracy 90%
/// - Hospital B: 500 patients, model accuracy 88%
/// - Hospital C: 1500 patients, model accuracy 92%
///
/// Total patients: 3000
/// Hospital A weight: 1000/3000 = 0.333
/// Hospital B weight: 500/3000 = 0.167
/// Hospital C weight: 1500/3000 = 0.500
///
/// For each model parameter:
/// global_param = 0.333 × A_param + 0.167 × B_param + 0.500 × C_param
///
/// Benefits:
/// - Simple and efficient
/// - Well-studied theoretically
/// - Works well when clients have similar data distributions (IID data)
///
/// Limitations:
/// - Assumes clients are equally reliable
/// - Can struggle with non-IID data (different distributions across clients)
/// - No built-in handling for stragglers (slow clients)
///
/// Reference: McMahan, H. B., et al. (2017). "Communication-Efficient Learning of Deep Networks
/// from Decentralized Data." AISTATS 2017.
/// </remarks>
/// <typeparam name="T">The numeric type for model parameters (e.g., double, float).</typeparam>
public class FedAvgAggregationStrategy<T> : IAggregationStrategy<Dictionary<string, T[]>>
    where T : struct, IComparable<T>, IConvertible
{
    /// <summary>
    /// Aggregates client models using weighted averaging based on the number of samples.
    /// </summary>
    /// <remarks>
    /// This method implements the core FedAvg algorithm:
    ///
    /// Mathematical formulation:
    /// w_global = Σ(n_k / n_total) × w_k
    ///
    /// where:
    /// - w_global: global model weights
    /// - w_k: client k's model weights
    /// - n_k: number of samples at client k
    /// - n_total: total samples across the clients being aggregated
    ///
    /// <b>For Beginners:</b> This combines all client models into one by taking a weighted
    /// average, where clients with more data have more influence.
    ///
    /// Step-by-step process:
    /// 1. Calculate total samples across the clients present in <paramref name="clientModels"/>
    /// 2. For each client, compute weight = client_samples / total_samples
    /// 3. For each model parameter, compute weighted sum
    /// 4. Return the aggregated model
    ///
    /// For example, if we have 2 clients with a simple model (one parameter):
    /// - Client 1: 300 samples, parameter value = 0.8
    /// - Client 2: 700 samples, parameter value = 0.6
    ///
    /// Total samples: 1000
    /// Client 1 weight: 300/1000 = 0.3
    /// Client 2 weight: 700/1000 = 0.7
    /// Aggregated parameter: 0.3 × 0.8 + 0.7 × 0.6 = 0.24 + 0.42 = 0.66
    /// </remarks>
    /// <param name="clientModels">Dictionary mapping client IDs to their model parameters
    /// (layer name → flat parameter array). All clients must share the same layer structure.</param>
    /// <param name="clientWeights">Dictionary mapping client IDs to their sample counts (weights).
    /// Must contain an entry for every client in <paramref name="clientModels"/>; extra entries
    /// for clients not being aggregated are ignored.</param>
    /// <returns>The aggregated global model parameters.</returns>
    /// <exception cref="ArgumentException">
    /// Thrown when either dictionary is null or empty, when a client model has no matching weight,
    /// when a weight is negative or the total weight is not positive, or when clients disagree on
    /// layer names or parameter-array lengths.
    /// </exception>
    public Dictionary<string, T[]> Aggregate(
        Dictionary<int, Dictionary<string, T[]>> clientModels,
        Dictionary<int, double> clientWeights)
    {
        if (clientModels == null || clientModels.Count == 0)
        {
            throw new ArgumentException("Client models cannot be null or empty.", nameof(clientModels));
        }

        if (clientWeights == null || clientWeights.Count == 0)
        {
            throw new ArgumentException("Client weights cannot be null or empty.", nameof(clientWeights));
        }

        // Sum weights over the clients actually being aggregated (not all of clientWeights),
        // so stale entries for absent clients cannot skew the normalization. This also
        // surfaces a missing or invalid weight as a clear ArgumentException instead of a
        // KeyNotFoundException deep inside the aggregation loop.
        double totalWeight = 0.0;
        foreach (var clientId in clientModels.Keys)
        {
            if (!clientWeights.TryGetValue(clientId, out double weight))
            {
                throw new ArgumentException(
                    $"No weight provided for client {clientId}.", nameof(clientWeights));
            }

            if (weight < 0)
            {
                throw new ArgumentException(
                    $"Weight for client {clientId} must be non-negative.", nameof(clientWeights));
            }

            totalWeight += weight;
        }

        if (totalWeight <= 0)
        {
            throw new ArgumentException("Total weight must be positive.", nameof(clientWeights));
        }

        // Use the first client's model to define the expected layer structure, and
        // initialize the accumulator arrays to zero (default(T)).
        var firstClientModel = clientModels.First().Value;
        var aggregatedModel = new Dictionary<string, T[]>(firstClientModel.Count);

        foreach (var (layerName, parameters) in firstClientModel)
        {
            aggregatedModel[layerName] = new T[parameters.Length];
        }

        // Accumulate each client's weighted contribution: aggregated += (w_k / w_total) * w_k_params.
        foreach (var (clientId, clientModel) in clientModels)
        {
            double normalizedWeight = clientWeights[clientId] / totalWeight;

            // Every client must expose exactly the reference layer set; a mismatch would
            // otherwise silently drop layers or corrupt the average.
            if (clientModel.Count != aggregatedModel.Count)
            {
                throw new ArgumentException(
                    $"Client {clientId} has {clientModel.Count} layers but {aggregatedModel.Count} were expected.",
                    nameof(clientModels));
            }

            foreach (var (layerName, clientParams) in clientModel)
            {
                if (!aggregatedModel.TryGetValue(layerName, out var aggregatedParams))
                {
                    throw new ArgumentException(
                        $"Client {clientId} has unexpected layer '{layerName}'.", nameof(clientModels));
                }

                if (clientParams.Length != aggregatedParams.Length)
                {
                    throw new ArgumentException(
                        $"Client {clientId} layer '{layerName}' has {clientParams.Length} parameters but {aggregatedParams.Length} were expected.",
                        nameof(clientModels));
                }

                for (int i = 0; i < clientParams.Length; i++)
                {
                    // Accumulate in double precision, then convert back to T; this keeps the
                    // running sum stable for low-precision T (e.g. float).
                    double currentValue = Convert.ToDouble(aggregatedParams[i]);
                    double clientValue = Convert.ToDouble(clientParams[i]);
                    double weightedValue = currentValue + (normalizedWeight * clientValue);

                    aggregatedParams[i] = (T)Convert.ChangeType(weightedValue, typeof(T));
                }
            }
        }

        return aggregatedModel;
    }

    /// <summary>
    /// Gets the name of the aggregation strategy.
    /// </summary>
    /// <returns>The string "FedAvg".</returns>
    public string GetStrategyName() => "FedAvg";
}
Loading
Loading