"""
    AdaptiveParticleSwarm(n_particles = 3,
                          c1 = 2.0,
                          c2 = 2.0,
                          prob_shift = 0.25,
                          rng = Random.GLOBAL_RNG)

Instantiate an adaptive particle swarm optimization tuning strategy. A swarm is
initialized by sampling hyperparameters from their customizable priors, and new
models are generated by referencing each member's and the swarm's best models so
far.

### Supported Ranges and Discrete Hyperparameter Handling

See [`ParticleSwarm`](@ref) for more information about supported ranges and how
discrete hyperparameters are handled.

### Algorithm

Hyperparameter ranges are sampled and concatenated into position vectors, one
for each swarm particle. Velocities are initialized to zero, and in each
iteration, every particle's position is updated to approach its personal best
and the swarm's global best so far with the equations:

\$vₖ₊₁ = w⋅vₖ + c₁⋅rand()⋅(pbest - xₖ) + c₂⋅rand()⋅(gbest - xₖ)\$

\$xₖ₊₁ = xₖ + vₖ₊₁\$

Coefficients `w`, `c1`, and `c2` are adaptively adjusted at each iteration by
determining the evolutionary phase of the swarm. We calculate the evolutionary
factor by comparing each particle's mean distance to the other members of the
swarm. This factor is then used to classify whether the swarm is in an
exploration, exploitation, convergence, or jumping-out phase, and to calibrate
the tuning hyperparameters accordingly. For more information, refer to
"Adaptive Particle Swarm Optimization" by Zhan, Zhang, Li, and Chung. Note that
we omit the paper's elitist learning strategy.

New models are then generated for evaluation by mutating the fields of a deep
copy of `model`. If the corresponding range has a specified `scale` function,
then the transformation is applied before the hyperparameter is returned. If
`scale` is a symbol (e.g., `:log`), it is ignored.
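
### Example

A minimal sketch of plugging the strategy into MLJ's usual tuning workflow;
`model` and `r` below stand for a model instance and a hyperparameter range and
are assumptions for illustration, not exports of this package:

    tuning = AdaptiveParticleSwarm(n_particles=5)
    tuned_model = TunedModel(model=model, tuning=tuning, range=r, n=25)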
"""
mutable struct AdaptiveParticleSwarm{R<:AbstractRNG} <: AbstractParticleSwarm
    n_particles::Int
    c1::Float64
    c2::Float64
    prob_shift::Float64
    rng::R
end

# Constructor

function AdaptiveParticleSwarm(;
    n_particles=3,
    c1=2.0,
    c2=2.0,
    prob_shift=0.25,
    rng::R=Random.GLOBAL_RNG
) where {R}
    swarm = AdaptiveParticleSwarm{R}(n_particles, c1, c2, prob_shift, rng)
    message = MLJTuning.clean!(swarm)
    isempty(message) || @warn message
    return swarm
end
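
# For instance (illustrative): AdaptiveParticleSwarm(n_particles=1) warns and
# returns a strategy with n_particles reset to 3, via MLJTuning.clean! below.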

# Validate tuning hyperparameters

function MLJTuning.clean!(tuning::AdaptiveParticleSwarm)
    warning = ""
    if tuning.n_particles < 3
        warning *= "AdaptiveParticleSwarm requires at least 3 particles. " *
                   "Resetting n_particles=3. "
        tuning.n_particles = 3
    end
    c1, c2 = tuning.c1, tuning.c2
    if !(1.5 ≤ c1 ≤ 2.5) || !(1.5 ≤ c2 ≤ 2.5) || (c1 + c2 > 4)
        c1, c2 = _clamp_coefficients(c1, c2)
        warning *= "AdaptiveParticleSwarm requires 1.5 ≤ c1 ≤ 2.5, 1.5 ≤ c2 ≤ 2.5, " *
                   "and c1 + c2 ≤ 4. Resetting coefficients c1=$(c1), c2=$(c2). "
        tuning.c1 = c1
        tuning.c2 = c2
    end
    if !(0 ≤ tuning.prob_shift < 1)
        warning *= "AdaptiveParticleSwarm requires 0 ≤ prob_shift < 1. " *
                   "Resetting prob_shift=0.25. "
        tuning.prob_shift = 0.25
    end
    return warning
end

# Helper function to clamp swarm coefficients in the interval [1.5, 2.5] with a
# sum of less than or equal to 4

function _clamp_coefficients(c1, c2)
    c1 = min(max(c1, 1.5), 2.5)
    c2 = min(max(c2, 1.5), 2.5)
    scale = 4.0 / (c1 + c2)
    if scale < 1
        c1 *= scale
        c2 *= scale
    end
    return c1, c2
end
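
# Worked example (illustrative): _clamp_coefficients(2.5, 2.5) first clamps
# each coefficient to [1.5, 2.5] (a no-op here), then rescales both by
# 4 / (2.5 + 2.5) = 0.8, returning (2.0, 2.0).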

# Initial state

function MLJTuning.setup(tuning::AdaptiveParticleSwarm, model, ranges, n, verbosity)
    # state, evolutionary phase, swarm coefficients
    return (initialize(ranges, tuning), nothing, tuning.c1, tuning.c2)
end

# New models

function MLJTuning.models(
    tuning::AdaptiveParticleSwarm,
    model,
    history,
    (state, phase, c1, c2),
    n_remaining,
    verbosity
)
    n_particles = tuning.n_particles
    if !isnothing(history)
        # sign-adjust the latest measurements so that lower is always better
        sig = MLJTuning.signature(history[1].measure[1])
        measurements = similar(state.pbest)
        map(history[end-n_particles+1:end]) do h
            measurements[h.metadata] = sig * h.measurement[1]
        end
        # update personal and global bests, then adapt coefficients and move
        pbest!(state, measurements, tuning)
        gbest!(state)
        f = _evolutionary_factor(state.X, argmin(state.pbest))
        phase = _evolutionary_phase(f, phase)
        w, c1, c2 = _adapt_parameters(tuning.rng, c1, c2, f, phase)
        move!(tuning.rng, state, w, c1, c2)
    end
    retrieve!(state, tuning)
    fields = getproperty.(state.ranges, :field)
    new_models = map(1:n_particles) do i
        clone = deepcopy(model)
        for (field, param) in zip(fields, getindex.(state.parameters, i))
            recursive_setproperty!(clone, field, param)
        end
        (clone, i)
    end
    return new_models, (state, phase, c1, c2)
end
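
# Note that each new model is paired with its particle index as metadata; the
# history entries carry it back as h.metadata, which is how measurements are
# mapped to particles above.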

# Helper functions to calculate the evolutionary factor and phase

function _evolutionary_factor(X, gbest_i)
    n_particles = size(X, 1)
    dists = zeros(n_particles, n_particles)
    for i in 1:n_particles
        for j in i+1:n_particles
            dists[j, i] = dists[i, j] = norm(X[i, :] - X[j, :])
        end
    end
    mean_dists = sum(dists, dims=2) / (n_particles - 1)
    min_dist, max_dist = extrema(mean_dists)
    gbest_dist = mean_dists[gbest_i]
    f = (gbest_dist - min_dist) / max(max_dist - min_dist, sqrt(eps()))
    return f
end
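
# f lies in [0, 1]: values near 0 mean the globally best particle sits inside a
# tight cluster (convergence), while values near 1 mean it is far from the rest
# of a spread-out swarm (exploration or jumping out), per Zhan et al.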

function _evolutionary_phase(f, phase)
    # Classify evolutionary phase
    μs = [μ₁(f), μ₂(f), μ₃(f), μ₄(f)]
    if phase === nothing # first iteration
        phase = argmax(μs)
    else
        next_phase = mod1(phase + 1, 4)
        # switch to the next phase if possible
        if μs[next_phase] > 0
            phase = next_phase
        # stay in the current phase if possible, else pick the most likely phase
        elseif μs[phase] == 0
            phase = argmax(μs)
        end
    end
    return phase
end
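
# For example (illustrative): with phase == 2 (exploitation) and f == 0.65,
# μ₃(0.65) == 0 blocks the switch to convergence and μ₂(0.65) == 0 rules out
# staying put, so argmax(μs) selects phase 1 (exploration), since μ₁(0.65) == 1.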

# Helper functions to calculate probabilities of the four evolutionary states

μ₁(f) = f ≤ 0.4 ? 0.0 :
        f ≤ 0.6 ? 5 * f - 2 :
        f ≤ 0.7 ? 1.0 :
        f ≤ 0.8 ? -10 * f + 8 :
        0.0

μ₂(f) = f ≤ 0.2 ? 0.0 :
        f ≤ 0.3 ? 10 * f - 2 :
        f ≤ 0.4 ? 1.0 :
        f ≤ 0.6 ? -5 * f + 3 :
        0.0

μ₃(f) = f ≤ 0.1 ? 1.0 :
        f ≤ 0.3 ? -5 * f + 1.5 :
        0.0

μ₄(f) = f ≤ 0.7 ? 0.0 :
        f ≤ 0.9 ? 5 * f - 3.5 :
        1.0
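
# For instance (illustrative): at f == 0.45 the memberships are
# μ₁ == 5(0.45) - 2 == 0.25, μ₂ == -5(0.45) + 3 == 0.75, μ₃ == μ₄ == 0, so an
# unconstrained argmax would classify the swarm as exploiting (phase 2).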

# Adaptive control of the swarm's parameters

function _adapt_parameters(rng, c1, c2, f, phase)
    w = 1.0 / (1.0 + 1.5 * exp(-2.6 * f)) # update inertia
    δ = rand(rng) * 0.05 + 0.05 # coefficient acceleration rate
    if phase === 1 # exploration
        c1 += δ
        c2 -= δ
    elseif phase === 2 # exploitation
        δ *= 0.5
        c1 += δ
        c2 -= δ
    elseif phase === 3 # convergence
        δ *= 0.5
        c1 += δ
        c2 += δ
    else # jumping out
        c1 -= δ
        c2 += δ
    end
    c1, c2 = _clamp_coefficients(c1, c2)
    return w, c1, c2
end
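
# The inertia sigmoid maps f ∈ [0, 1] onto w ∈ [0.4, 0.9]: w == 1/(1 + 1.5) == 0.4
# at f == 0 and w ≈ 0.9 at f == 1, so a more spread-out swarm keeps more momentum.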