Skip to content

Commit 202e058

Browse files
authored
Interface with MLJ (#34)
* add interface with MLJ + tests & version bump
1 parent 1e5af70 commit 202e058

21 files changed

+514
-95
lines changed

Project.toml

Lines changed: 10 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -1,22 +1,26 @@
11
name = "MLJLinearModels"
22
uuid = "6ee0df7b-362f-4a72-a706-9e79364fb692"
33
authors = ["Thibaut Lienart <[email protected]>"]
4-
version = "0.1.0"
4+
version = "0.2.0"
55

66
[deps]
77
DocStringExtensions = "ffbed154-4ef7-542d-bbb7-c09d3a79fcae"
88
IterativeSolvers = "42fd0dbc-a981-5370-80f2-aaf504508153"
99
LinearAlgebra = "37e2e46d-f89d-539d-b4ee-838fcccc9c8e"
1010
LinearMaps = "7a12625a-238d-50fd-b39a-03d52299707e"
11+
MLJBase = "a7f614a8-145f-11e9-1d2a-a57a1082229d"
1112
Optim = "429524aa-4258-5aef-a3af-852621145aeb"
1213
Parameters = "d96e819e-fc66-5662-9728-84c9c7592b0a"
14+
Tables = "bd369af6-aec1-5ad0-b16a-f7cc5008161c"
1315

1416
[compat]
15-
DocStringExtensions = ">= 0.7.0"
16-
Optim = ">= 0.19"
17-
IterativeSolvers = ">= 0.8"
18-
Parameters = ">= 0.10"
19-
LinearMaps = ">= 2.5"
17+
DocStringExtensions = "^0.8"
18+
IterativeSolvers = "^0.8"
19+
LinearMaps = "^2.5"
20+
MLJBase = "^0.7"
21+
Optim = "^0.19"
22+
Parameters = "^0.12"
23+
Tables = "^0.2"
2024
julia = "^1.0.0"
2125

2226
[extras]

src/MLJLinearModels.jl

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -6,10 +6,14 @@ import LinearMaps: LinearMap
66
import IterativeSolvers: cg
77
import Optim
88

9+
import MLJBase
10+
911
import Base.+, Base.-, Base.*, Base./, Base.convert
1012

1113
const AVR = AbstractVector{<:Real}
1214

15+
const Option{T} = Union{Nothing,T}
16+
1317
include("scratchspace.jl")
1418

1519
include("utils.jl")
@@ -39,4 +43,7 @@ include("fit/proxgrad.jl")
3943
include("fit/iwls.jl")
4044
# include("fit/admm.jl")
4145

46+
# > Interface <
47+
include("mlj/interface.jl")
48+
4249
end # module

src/glr/constructors.jl

Lines changed: 6 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -58,7 +58,7 @@ end
5858
"""
5959
$SIGNATURES
6060
61-
Objective function: ``|Xθ - y|₂²/2 + λ|θ|₁``
61+
Objective function: ``|Xθ - y|₂²/2 + λ|θ|₁``.
6262
"""
6363
function LassoRegression(λ::Real=1.0; lambda::Real=λ, fit_intercept::Bool=true,
6464
penalize_intercept::Bool=false)
@@ -72,7 +72,7 @@ end
7272
"""
7373
$SIGNATURES
7474
75-
Objective function: ``|Xθ - y|₂²/2 + λ|θ|₂²/2 + γ|θ|₁``
75+
Objective function: ``|Xθ - y|₂²/2 + λ|θ|₂²/2 + γ|θ|₁``.
7676
"""
7777
function ElasticNetRegression(λ::Real=1.0, γ::Real=1.0; lambda::Real=λ, gamma::Real=γ,
7878
fit_intercept::Bool=true, penalize_intercept::Bool=false)
@@ -131,9 +131,7 @@ MultinomialRegression(a...; kwa...) = LogisticRegression(a...; multi_class=true,
131131
"""
132132
$SIGNATURES
133133
134-
Objective function: ``∑ρ(Xθ - y) + λ|θ|₂²`` where ρ is a given function on the residuals and
135-
δ a positive tuning parameter for the function in question (e.g. for Huber it corresponds to the
136-
radius of the ball in which residuals are weighed quadratically).
134+
Objective function: ``∑ρ(Xθ - y) + λ|θ|₂² + γ|θ|₁`` where ρ is a given function on the residuals.
137135
"""
138136
function RobustRegression(ρ::RobustRho=HuberRho(0.1), λ::Real=1.0, γ::Real=0.0;
139137
rho::RobustRho=ρ, lambda::Real=λ, gamma::Real=γ,
@@ -151,7 +149,7 @@ $SIGNATURES
151149
152150
Huber Regression with objective:
153151
154-
``∑ρ(Xθ - y) + λ|θ|₂²/2 + γ|θ|``
152+
``∑ρ(Xθ - y) + λ|θ|₂²/2 + γ|θ|``
155153
156154
Where `ρ` is the Huber function `ρ(r) = r²/2` if `|r|≤δ` and `ρ(r)=δ(|r|-δ/2)` otherwise.
157155
"""
@@ -169,7 +167,7 @@ $SIGNATURES
169167
170168
Quantile Regression with objective:
171169
172-
``∑ρ(Xθ - y) + λ|θ|₂²/2 + γ|θ|``
170+
``∑ρ(Xθ - y) + λ|θ|₂²/2 + γ|θ|``
173171
174172
Where `ρ` is the check function `ρ(r) = r(δ - 1(r < 0))`.
175173
"""
@@ -187,7 +185,7 @@ $SIGNATURES
187185
188186
Least Absolute Deviation regression with objective:
189187
190-
``|Xθ - y|₁ + λ|θ|₂²/2 + γ|θ|``
188+
``|Xθ - y|₁ + λ|θ|₂²/2 + γ|θ|``
191189
192190
This is a specific type of Quantile Regression with `δ=0.5` (median).
193191
"""

src/mlj/classifiers.jl

Lines changed: 39 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,39 @@
1+
#= ===================
2+
LOGISTIC CLASSIFIER
3+
=================== =#
4+
5+
@with_kw_noshow mutable struct LogisticClassifier <: MLJBase.Probabilistic
6+
lambda::Real = 1.0
7+
gamma::Real = 0.0
8+
penalty::Symbol = :l2
9+
fit_intercept::Bool = true
10+
penalize_intercept::Bool = false
11+
solver::Option{Solver} = nothing
12+
multi_class::Bool = false
13+
end
14+
15+
glr(m::LogisticClassifier) = LogisticRegression(m.lambda, m.gamma; penalty=m.penalty,
16+
multi_class=m.multi_class,
17+
fit_intercept=m.fit_intercept,
18+
penalize_intercept=m.penalize_intercept)
19+
20+
descr(::Type{LogisticClassifier}) = "Classifier corresponding to the loss function ``L(y, Xθ) + λ|θ|₂²/2 + γ|θ|₁`` where `L` is the logistic loss."
21+
22+
#= ======================
23+
MULTINOMIAL CLASSIFIER
24+
====================== =#
25+
26+
@with_kw_noshow mutable struct MultinomialClassifier <: MLJBase.Probabilistic
27+
lambda::Real = 1.0
28+
gamma::Real = 0.0
29+
penalty::Symbol = :l2
30+
fit_intercept::Bool = true
31+
penalize_intercept::Bool = false
32+
solver::Option{Solver} = nothing
33+
end
34+
35+
glr(m::MultinomialClassifier) = MultinomialRegression(m.lambda, m.gamma; penalty=m.penalty,
36+
fit_intercept=m.fit_intercept,
37+
penalize_intercept=m.penalize_intercept)
38+
39+
descr(::Type{MultinomialClassifier}) = "Classifier corresponding to the loss function ``L(y, Xθ) + λ|θ|₂²/2 + γ|θ|₁`` where `L` is the multinomial loss."

src/mlj/interface.jl

Lines changed: 118 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,118 @@
1+
export LinearRegressor, RidgeRegressor, LassoRegressor, ElasticNetRegressor,
2+
RobustRegressor, HuberRegressor, QuantileRegressor, LADRegressor,
3+
LogisticClassifier, MultinomialClassifier
4+
5+
include("regressors.jl")
6+
include("classifiers.jl")
7+
8+
const REG_MODELS = (LinearRegressor, RidgeRegressor, LassoRegressor, ElasticNetRegressor,
9+
RobustRegressor, HuberRegressor, QuantileRegressor, LADRegressor)
10+
const CLF_MODELS = (LogisticClassifier, MultinomialClassifier)
11+
const ALL_MODELS = (REG_MODELS..., CLF_MODELS...)
12+
13+
#= ==========
14+
REGRESSORS
15+
========== =#
16+
17+
function MLJBase.fit(m::Union{REG_MODELS...}, verb::Int, X, y)
18+
Xmatrix = MLJBase.matrix(X)
19+
reg = glr(m)
20+
solver = m.solver === nothing ? _solver(reg, size(Xmatrix)) : m.solver
21+
# get the parameters
22+
θ = fit(reg, Xmatrix, y; solver=solver)
23+
# return
24+
return θ, nothing, NamedTuple{}()
25+
end
26+
27+
MLJBase.predict(m::Union{REG_MODELS...}, θ, Xnew) = apply_X(MLJBase.matrix(Xnew), θ)
28+
29+
function MLJBase.fitted_params(m::Union{REG_MODELS...}, θ)
30+
m.fit_intercept && return (coefs = θ[1:end-1], intercept = θ[end])
31+
return (coefs = θ, intercept = nothing)
32+
end
33+
34+
#= ===========
35+
CLASSIFIERS
36+
=========== =#
37+
38+
function MLJBase.fit(m::Union{CLF_MODELS...}, verb::Int, X, y)
39+
Xmatrix = MLJBase.matrix(X)
40+
yplain = convert.(Int, MLJBase.int(y))
41+
classes = MLJBase.classes(y[1])
42+
nclasses = length(classes)
43+
if nclasses == 2
44+
# recode
45+
yplain[yplain .== 1] .= -1
46+
yplain[yplain .== 2] .= 1
47+
c = 1
48+
else
49+
c = nclasses
50+
end
51+
clf = glr(m)
52+
solver = m.solver === nothing ? _solver(clf, size(Xmatrix)) : m.solver
53+
# get the parameters
54+
θ = fit(clf, Xmatrix, yplain, solver=solver)
55+
# return
56+
return (θ, c, classes), nothing, NamedTuple{}()
57+
end
58+
59+
function MLJBase.predict(m::Union{CLF_MODELS...}, (θ, c, classes), Xnew)
60+
Xmatrix = MLJBase.matrix(Xnew)
61+
preds = apply_X(Xmatrix, θ, c)
62+
# binary classification
63+
if c == 1
64+
preds .= sigmoid.(preds)
65+
preds = hcat(1.0 .- preds, preds) # scores for -1 and 1
66+
return [MLJBase.UnivariateFinite(classes, preds[i, :]) for i in 1:size(Xmatrix,1)]
67+
end
68+
# multiclass
69+
preds .= softmax(preds)
70+
return [MLJBase.UnivariateFinite(classes, preds[i, :]) for i in 1:size(Xmatrix,1)]
71+
end
72+
73+
function MLJBase.fitted_params(m::Union{CLF_MODELS...}, (θ, c, classes))
74+
if c > 1
75+
if m.fit_intercept
76+
W = reshape(θ, div(length(θ), c), c)
77+
return (coefs = W, intercept = nothing)
78+
end
79+
W = reshape(θ, p+1, c)
80+
return (coefs = W[1:p, :], intercept = W[end, :])
81+
end
82+
# single class
83+
m.fit_intercept && return (coefs = θ[1:end-1], intercept = θ[end])
84+
return (coefs = θ, intercept = nothing)
85+
end
86+
87+
#= =======================
88+
METADATA FOR ALL MODELS
89+
======================= =#
90+
91+
MLJBase.metadata_pkg.(ALL_MODELS,
92+
name="MLJLinearModels",
93+
uuid="6ee0df7b-362f-4a72-a706-9e79364fb692",
94+
url="https://github.com/alan-turing-institute/MLJLinearModels.jl",
95+
julia=true,
96+
license="MIT",
97+
is_wrapper=false)
98+
99+
descr_(M) = descr(M) *
100+
"\n→ based on [MLJLinearModels](https://github.com/alan-turing-institute/MLJLinearModels.jl)" *
101+
"\n→ do `@load $(MLJBase.name(M)) pkg=\"MLJLinearModels\"` to use the model." *
102+
"\n→ do `?$(MLJBase.name(M))` for documentation."
103+
lp_(M) = "MLJLinearModels.$(MLJBase.name(M))"
104+
105+
for M in REG_MODELS
106+
MLJBase.metadata_model(M,
107+
input=MLJBase.Table(MLJBase.Continuous),
108+
target=AbstractVector{MLJBase.Continuous},
109+
weights=false,
110+
descr=descr_(M), path=lp_(M))
111+
end
112+
for M in CLF_MODELS
113+
MLJBase.metadata_model(M,
114+
input=MLJBase.Table(MLJBase.Continuous),
115+
target=AbstractVector{<:MLJBase.Finite},
116+
weights=false,
117+
descr=descr_(M), path=lp_(M))
118+
end

0 commit comments

Comments
 (0)