Add lrtest (#162)

nalimilan · web-flow · commit a7d153440765 · 2020-07-03T10:13:06.000+02:00
Heavily inspired by `ftest` in GLM. Also introduce an `isnested` function
which can be overloaded by modeling packages to protect users from comparing
non-nested models: a warning is printed if no method has been defined by a model
type; if it's defined, an error is thrown for non-nested models.
diff --git a/Project.toml b/Project.toml
@@ -5,7 +5,9 @@ version = "0.6.11"
 [deps]
 DataAPI = "9a962f9c-6df0-11e9-0e5d-c546b8b5ee8a"
 DataStructures = "864edb3b-99cc-5e75-8d2d-829cb0a9cfe8"
+Distributions = "31c24e10-a181-5473-b8eb-7969acd0382f"
 LinearAlgebra = "37e2e46d-f89d-539d-b4ee-838fcccc9c8e"
+Printf = "de0858da-6303-5e67-8744-51eddeeeb8d7"
 ShiftedArrays = "1277b4bf-5013-50f5-be3d-901d8477a67a"
 SparseArrays = "2f01184e-e22b-5df5-ae63-d93ebab69eaf"
 StatsBase = "2913bbd2-ae8a-5f71-8c99-4fb6c76f3a91"
@@ -16,6 +18,7 @@ CategoricalArrays = "0.7"
 DataAPI = "1.1"
 DataFrames = "0.20, 0.21"
 DataStructures = "0.17.0"
+Distributions = "0.16, 0.17, 0.18, 0.19, 0.20, 0.21, 0.22, 0.23"
 ShiftedArrays = "1.0.0"
 StatsBase = "0.22, 0.23, 0.24, 0.25, 0.26, 0.27, 0.28, 0.29, 0.30, 0.31, 0.32, 0.33"
 Tables = "0.2, 1"
diff --git a/src/StatsModels.jl b/src/StatsModels.jl
@@ -6,6 +6,8 @@ using ShiftedArrays
 using ShiftedArrays: lag, lead
 using DataStructures
 using DataAPI: levels
+using Printf: @sprintf
+using Distributions: Chisq, ccdf
 
 using SparseArrays
 using LinearAlgebra
@@ -56,7 +58,9 @@ export
     width,
     modelcols,
     modelmatrix,
-    response
+    response,
+
+    lrtest
 
 include("traits.jl")
 include("contrasts.jl")
@@ -66,5 +70,6 @@ include("temporal_terms.jl")
 include("formula.jl")
 include("modelframe.jl")
 include("statsmodel.jl")
+include("lrtest.jl")
 
 end # module StatsModels
diff --git a/src/lrtest.jl b/src/lrtest.jl
@@ -0,0 +1,166 @@
+struct LRTestResult{N}  # outcome of `lrtest` for a sequence of N models
+    nobs::Int  # number of observations, taken from the first model
+    deviance::NTuple{N, Float64}  # deviance of each model, in the order given
+    dof::NTuple{N, Int}  # degrees of freedom of each model, in the order given
+    pval::NTuple{N, Float64}  # p-value vs. the preceding model; NaN for the first
+end
+
+_diff(t::NTuple{N}) where {N} = map(-, Base.tail(t), Base.front(t))  # t[i+1] - t[i]
+
+"""
+    isnested(m1::StatisticalModel, m2::StatisticalModel; atol::Real=0.0)
+
+Indicate whether model `m1` is nested in model `m2`, i.e. whether `m1` can be obtained by
+constraining some parameters in `m2`. Both models must have been fitted on the same data.
+Keyword argument `atol` sets the numerical tolerance used when checking for nestedness.
+"""
+function isnested end
+
+"""
+    lrtest(mods::StatisticalModel...; atol::Real=0.0)
+
+For each sequential pair of statistical models in `mods...`, perform a likelihood ratio
+test to determine if the first one fits significantly better than the next.
+
+A table is returned containing degrees of freedom (DOF),
+difference in DOF from the preceding model, deviance, difference in deviance
+from the preceding model, and likelihood ratio and p-value for the comparison
+between the two models.
+
+Optional keyword argument `atol` controls the numerical tolerance when testing whether
+the models are nested.
+
+# Examples
+
+Suppose we want to compare the effects of two or more treatments on some result.
+Our null hypothesis is that `Result ~ 1` fits the data as well as
+`Result ~ 1 + Treatment`.
+
+```jldoctest
+julia> using DataFrames, GLM
+
+julia> dat = DataFrame(Result=[1, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1],
+                       Treatment=[1, 1, 1, 2, 2, 2, 1, 1, 1, 2, 2, 2],
+                       Other=categorical([1, 1, 2, 1, 2, 1, 3, 1, 1, 2, 2, 1]));
+
+julia> nullmodel = glm(@formula(Result ~ 1), dat, Binomial(), LogitLink());
+
+julia> model = glm(@formula(Result ~ 1 + Treatment), dat, Binomial(), LogitLink());
+
+julia> bigmodel = glm(@formula(Result ~ 1 + Treatment + Other), dat, Binomial(), LogitLink());
+
+julia> lrtest(nullmodel, model, bigmodel)
+Likelihood-ratio test: 3 models fitted on 12 observations
+──────────────────────────────────────────────
+     DOF  ΔDOF  Deviance  ΔDeviance  p(>Chisq)
+──────────────────────────────────────────────
+[1]    1         16.3006                      
+[2]    2     1   15.9559    -0.3447     0.5571
+[3]    4     2   14.0571    -1.8988     0.3870
+──────────────────────────────────────────────
+
+julia> lrtest(bigmodel, model, nullmodel)
+Likelihood-ratio test: 3 models fitted on 12 observations
+──────────────────────────────────────────────
+     DOF  ΔDOF  Deviance  ΔDeviance  p(>Chisq)
+──────────────────────────────────────────────
+[1]    4         14.0571                      
+[2]    2    -2   15.9559     1.8988     0.3870
+[3]    1    -1   16.3006     0.3447     0.5571
+──────────────────────────────────────────────
+```
+"""
+function lrtest(mods::StatisticalModel...; atol::Real=0.0)
+    if length(mods) < 2
+        throw(ArgumentError("At least two models are needed to perform LR test"))
+    end
+    T = typeof(mods[1])
+    df = dof.(mods)
+    # The first pair fixes the direction: increasing DOF (forward) or decreasing
+    forward = df[1] <= df[2]
+    if !all(m -> typeof(m) == T, mods)
+        throw(ArgumentError("LR test is only valid for models of the same type"))
+    end
+    if !all(==(nobs(mods[1])), nobs.(mods))
+        throw(ArgumentError("LR test is only valid for models fitted on the same data, " *
+                            "but number of observations differ"))
+    end
+    checknested = hasmethod(isnested, Tuple{T, T})
+    if forward
+        for i in 2:length(mods)
+            if df[i-1] >= df[i] ||
+                (checknested && !isnested(mods[i-1], mods[i], atol=atol))
+                throw(ArgumentError("LR test is only valid for nested models"))
+            end
+        end
+    else
+        for i in 2:length(mods)
+            if df[i] >= df[i-1] ||
+                (checknested && !isnested(mods[i], mods[i-1], atol=atol))
+                throw(ArgumentError("LR test is only valid for nested models"))
+            end
+        end
+    end
+    if !checknested
+        @warn "Could not check whether models are nested as model type " *
+            "$(nameof(T)) does not implement isnested: results may not be meaningful"
+    end
+
+    dev = deviance.(mods)
+    Δdev = _diff(dev)
+    Δdf = _diff(df)
+
+    # Deviance may not move against DOF: more parameters must not give a worse fit
+    if (forward && any(x -> x > 0, Δdev)) || (!forward && any(x -> x < 0, Δdev))
+        throw(ArgumentError("Residual deviance must be strictly lower " *
+                            "in models with more degrees of freedom"))
+    end
+    # The first model has no predecessor to be tested against, hence the leading NaN
+    pval = (NaN, ccdf.(Chisq.(abs.(Δdf)), abs.(Δdev))...)
+    return LRTestResult(Int(nobs(mods[1])), dev, df, pval)
+end
+
+function Base.show(io::IO, lrr::LRTestResult{N}) where N
+    dofsteps = _diff(lrr.dof)
+    devsteps = _diff(lrr.deviance)
+
+    # Text grid: one header row plus one row per model, six columns
+    ncols = 6
+    cells = Matrix{String}(undef, N+1, ncols)
+
+    cells[1, :] = ["", "DOF", "ΔDOF", "Deviance", "ΔDeviance", "p(>Chisq)"]
+
+    # The first model has no predecessor, so its difference and p-value cells are blank
+    cells[2, :] = ["[1]", @sprintf("%.0d", lrr.dof[1]), " ",
+                   @sprintf("%.4f", lrr.deviance[1]), " ", " "]
+
+    for k in 2:N
+        cells[k+1, :] = ["[$k]",
+                         @sprintf("%.0d", lrr.dof[k]),
+                         @sprintf("%.0d", dofsteps[k-1]),
+                         @sprintf("%.4f", lrr.deviance[k]),
+                         @sprintf("%.4f", devsteps[k-1]),
+                         string(StatsBase.PValue(lrr.pval[k]))]
+    end
+
+    # Every column is as wide as its longest cell; columns are joined by two spaces
+    widths = [maximum(length, view(cells, :, c)) for c in 1:ncols]
+    rule = '─'^(sum(widths) + 2*(ncols-1))
+
+    println(io, "Likelihood-ratio test: $N models fitted on $(lrr.nobs) observations")
+    println(io, rule)
+
+    for r in 1:N+1
+        for c in 1:ncols
+            cell = cells[r, c]
+            # Right-align the cell within its column
+            pad = " "^(widths[c] - length(cell))
+            print(io, c > 1 ? "  " * pad : pad, cell)
+        end
+        println(io)
+        # Separate the header row from the body
+        r == 1 && println(io, rule)
+    end
+    # Closing rule, written without a trailing newline
+    print(io, rule)
+end
diff --git a/test/statsmodel.jl b/test/statsmodel.jl
@@ -40,6 +40,13 @@ function StatsBase.predict(mod::DummyMod, newX::Matrix;
         throw(ArgumentError("value not allowed for interval"))
     end
 end
+StatsBase.dof(mod::DummyMod) = length(mod.beta)
+StatsBase.dof_residual(mod::DummyMod) = length(mod.y) - length(mod.beta)
+StatsBase.nobs(mod::DummyMod) = length(mod.y)
+StatsBase.deviance(mod::DummyMod) = sum((response(mod) .- predict(mod)).^2)
+# Incorrect but simple definition: looks at DOF only, not at the actual model terms
+StatsModels.isnested(mod1::DummyMod, mod2::DummyMod; atol::Real=0.0) =
+    dof(mod1) <= dof(mod2)
 
 # A dummy RegressionModel type that does not support intercept
 struct DummyModNoIntercept <: RegressionModel
@@ -83,6 +90,11 @@ function StatsBase.predict(mod::DummyModNoIntercept, newX::Matrix;
         throw(ArgumentError("value not allowed for interval"))
     end
 end
+StatsBase.dof(mod::DummyModNoIntercept) = length(mod.beta)
+StatsBase.dof_residual(mod::DummyModNoIntercept) = length(mod.y) - length(mod.beta)
+StatsBase.nobs(mod::DummyModNoIntercept) = length(mod.y)
+StatsBase.deviance(mod::DummyModNoIntercept) = sum((response(mod) .- predict(mod)).^2)
+# isnested is deliberately not implemented, so that lrtest's warning fallback is tested
 
 ## Another dummy model type to test fall-through show method
 struct DummyModTwo <: RegressionModel
@@ -212,3 +224,65 @@ Base.show(io::IO, m::DummyModTwo) = println(io, m.msg)
     show(io, m2)
 
 end
+
+@testset "lrtest" begin
+
+    y = collect(1:4)
+    x1 = 2:5
+    x2 = [1, 5, 3, 1]
+
+    m0 = DummyMod([1], ones(4, 1), y)
+    m1 = DummyMod([1, 0.3], [ones(4, 1) x1], y)
+    m2 = DummyMod([1, 0.25, 0.05, 0.04], [ones(4, 1) x1 x2 x1.*x2], y)
+
+    @test_throws ArgumentError lrtest(m0)  # fewer than two models
+    @test_throws ArgumentError lrtest(m0, m0)  # equal DOF
+    @test_throws ArgumentError lrtest(m0, m2, m1)  # DOF goes up, then down
+    @test_throws ArgumentError lrtest(m1, m0, m2)  # DOF goes down, then up
+    @test_throws ArgumentError lrtest(m2, m0, m1)  # DOF goes down, then up
+
+    m1b = DummyMod([1, 0.3], [ones(3, 1) x1[2:end]], y[2:end])
+    @test_throws ArgumentError lrtest(m0, m1b)  # number of observations differs
+
+    lr1 = lrtest(m0, m1)
+    @test isnan(lr1.pval[1])
+    @test lr1.pval[2] ≈ 0.0010484433450981662
+    @test sprint(show, lr1) == """
+        Likelihood-ratio test: 2 models fitted on 4 observations
+        ──────────────────────────────────────────────
+             DOF  ΔDOF  Deviance  ΔDeviance  p(>Chisq)
+        ──────────────────────────────────────────────
+        [1]    1         14.0000                      
+        [2]    2     1    3.2600   -10.7400     0.0010
+        ──────────────────────────────────────────────"""
+
+    m0 = DummyModNoIntercept(Float64[], ones(4, 0), y)
+    m1 = DummyModNoIntercept([0.3], reshape(x1, :, 1), y)
+    m2 = DummyModNoIntercept([0.25, 0.05, 0.04], [x1 x2 x1.*x2], y)
+
+    @test_throws ArgumentError lrtest(m0)  # fewer than two models
+    @test_throws ArgumentError lrtest(m0, m0)  # equal DOF
+    @test_throws ArgumentError lrtest(m0, m2, m1)  # DOF goes up, then down
+    @test_throws ArgumentError lrtest(m1, m0, m2)  # DOF goes down, then up
+    @test_throws ArgumentError lrtest(m2, m0, m1)  # DOF goes down, then up
+
+    m1b = DummyModNoIntercept([0.3], reshape(x1[2:end], :, 1), y[2:end])
+    @test_throws ArgumentError lrtest(m0, m1b)  # number of observations differs
+
+    # Incorrect, but check that it doesn't throw an error
+    lr2 = @test_logs((:warn, "Could not check whether models are nested " *
+                     "as model type DummyModNoIntercept does not implement isnested: " *
+                     "results may not be meaningful"),
+                     lrtest(m0, m1))
+    @test isnan(lr2.pval[1])
+    @test lr2.pval[2] ≈ 1.2147224767092312e-5
+    @test sprint(show, lr2) == """
+        Likelihood-ratio test: 2 models fitted on 4 observations
+        ──────────────────────────────────────────────
+             DOF  ΔDOF  Deviance  ΔDeviance  p(>Chisq)
+        ──────────────────────────────────────────────
+        [1]    0         30.0000                      
+        [2]    1     1   10.8600   -19.1400      <1e-4
+        ──────────────────────────────────────────────"""
+
+end