add CI computation for emmeans and empairs (#72)

palday · ararslan · web-flow · commit b802417a963a · 2025-12-17T11:24:33.000-06:00
Co-authored-by: Alex Arslan <alex.arslan@beacon.bio>
diff --git a/Project.toml b/Project.toml
@@ -1,6 +1,6 @@
 name = "Effects"
 uuid = "8f03c58b-bd97-4933-a826-f71b64d2cca2"
-version = "1.6.0"
+version = "1.7.0"
 authors = ["Beacon Biosignals, Inc."]
 
 [deps]
diff --git a/src/emmeans.jl b/src/emmeans.jl
@@ -14,13 +14,28 @@ of the underlying standard deviations.
 """
 pooled_sem(sems...) = sqrt(sum(abs2, sems))
 
+"""
+    _ci!(df::AbstractDataFrame, level; eff_col, err_col, lower_col, upper_col)
+
+Add confidence-interval bounds to `df` in place and return `df`.
+
+For each row, the bounds are `eff ∓ q * err`, where `eff` and `err` are read from
+`eff_col` and `err_col` and `q` is the `(1 + level) / 2` quantile of a `TDist` whose
+degrees of freedom are read from the row's `"dof"` column. The caller must
+therefore make sure that a `"dof"` column exists before calling this function.
+The lower and upper bounds are written to `lower_col` and `upper_col`.
+
+`level` is the coverage expressed as a proportion (e.g. `0.95`, not `95`).
+An `ArgumentError` is thrown if it lies outside `[0, 1]`.
+"""
+function _ci!(df::AbstractDataFrame, level;
+              eff_col::AbstractString, err_col::AbstractString,
+              lower_col::AbstractString,
+              upper_col::AbstractString)
+    # Fail early: a negative level can silently swap the bounds, and a level
+    # above 1 (e.g. a percentage) asks for a quantile at a probability above one.
+    0 <= level <= 1 ||
+        throw(ArgumentError("`ci_level` must be between 0 and 1, got $level"))
+    # the probability is the same for every row, so compute it only once
+    prob = (1 + level) / 2
+    transform!(df,
+               [eff_col, err_col, "dof"] => ByRow() do eff, err, ν
+                   scale = quantile(TDist(ν), prob)
+                   lower = eff - scale * err
+                   upper = eff + scale * err
+                   return (lower, upper)
+               end => [lower_col, upper_col])
+    return df
+end
+
 # similar to effects (and the underlying math is the same) but
 # the establishment of the reference grid is different
 # we don't allow specifying the "typifier" here -- if you want that,
 # then choose a less full service function
 """
     emmeans(model::RegressionModel; eff_col=nothing, err_col=:err,
-            invlink=identity, levels=Dict(), dof=nothing)
+            invlink=identity, levels=Dict(), dof=nothing,
+            ci_level=nothing, lower_col=:lower, upper_col=:upper)
 
 Compute estimated marginal means, a.k.a. least-square (LS) means for a model.
 
@@ -39,6 +54,13 @@ a large number of observations, `dof=Inf` may be appropriate.
 
 `invlink`, `eff_col` and `err_col` work exactly as in [`effects!`](@ref).
 
+If `ci_level` is provided, then `ci_level` confidence intervals are computed using
+the Wald approximation based on the standard errors and quantiles of the ``t``-distribution.
+If `dof` is not provided, then the degrees of freedom are assumed to be infinite,
+which is equivalent to using the normal distribution.
+The corresponding lower and upper edges of the interval are placed in `lower_col`
+and `upper_col`, respectively.
+
 Estimated marginal means are closely related to effects and are also known as
 least-square means. The functionality here is a convenience
 wrapper for [`effects`](@ref) and maps onto the concept of least-square means
@@ -49,7 +71,8 @@ not currently supported. The documentation for the [R package emmeans](https://c
 explains [the background in more depth](https://cran.r-project.org/web/packages/emmeans/vignettes/basics.html).
 """
 function emmeans(model::RegressionModel; eff_col=nothing, err_col=:err,
-                 invlink=identity, levels=Dict(), dof=nothing)
+                 invlink=identity, levels=Dict(), dof=nothing, ci_level=nothing,
+                 lower_col=:lower, upper_col=:upper)
     form = formula(model)
     typical = mean
     defaults = Dict{Symbol,Vector}()
@@ -68,18 +91,30 @@ function emmeans(model::RegressionModel; eff_col=nothing, err_col=:err,
     grid = expand_grid(levels)
     eff_col = string(something(eff_col, _responsename(model)))
     err_col = string(err_col)
+    lower_col = string(lower_col)
+    upper_col = string(upper_col)
 
     result = effects!(grid, model; eff_col, err_col, typical, invlink)
     if !isnothing(dof)
         result[!, :dof] .= _dof(dof, model)
     end
+    if !isnothing(ci_level)
+        # we keep this separate so that we don't add a DoF column
+        # if there is no CI
+        if isnothing(dof)
+            result[!, :dof] .= Inf
+        end
+        _ci!(result, ci_level; eff_col, err_col, lower_col, upper_col)
+    end
     return result
 end
 
 """
     empairs(model::RegressionModel; eff_col=nothing, err_col=:err,
-            invlink=identity, levels=Dict(), dof=nothing, padjust=identity)
-    empairs(df::AbstractDataFrame; eff_col, err_col=:err, padjust=identity)
+            invlink=identity, levels=Dict(), dof=nothing, padjust=identity,
+            ci_level=nothing, lower_col=:lower, upper_col=:upper)
+    empairs(df::AbstractDataFrame; eff_col, err_col=:err, padjust=identity,
+            ci_level=nothing, lower_col=:lower, upper_col=:upper)
 
 Compute pairwise differences of estimated marginal means.
 
 If `padjust` is provided, then it is used to adjust the p-values for
 multiple comparisons. [`MultipleTesting.jl`](https://juliangehring.github.io/MultipleTesting.jl/stable/)
 provides a number of useful possibilities for this.
 
+If `ci_level` is provided, then `ci_level` confidence intervals are computed using
+the Wald approximation based on the standard errors and quantiles of the ``t``-distribution.
+If `dof` is not provided, then the degrees of freedom are assumed to be infinite,
+which is equivalent to using the normal distribution.
+The corresponding lower and upper edges of the interval are placed in `lower_col`
+and `upper_col`, respectively.
+
 !!! note
     `padjust` is silently ignored if `dof` is not provided.
 
+!!! note
+    Confidence intervals are **not** adjusted for multiple comparisons.
+
 !!! warning
     This feature is experimental and the precise column names and presentation of
     contrasts/differences may change without being considered breaking.
@@ -122,18 +167,22 @@ provides a number of useful possibilities for this.
     discussed in [the documentation for the R package `emmeans`](https://cran.r-project.org/web/packages/emmeans/vignettes/transformations.html).
 """
 function empairs(model::RegressionModel; eff_col=nothing, err_col=:err,
-                 invlink=identity, levels=Dict(), dof=nothing, padjust=identity)
+                 invlink=identity, levels=Dict(), dof=nothing, padjust=identity,
+                 ci_level=nothing, lower_col=:lower, upper_col=:upper)
     # use `_responsename(model)` as the column name when `eff_col` is `nothing`
     eff_col = something(eff_col, _responsename(model))
     # The CI keywords are not passed to `emmeans` here; they go to the
     # `AbstractDataFrame` method, which calls `_ci!` on the table of pairs.
     em = emmeans(model; eff_col, err_col, invlink, levels, dof)
-    return empairs(em; eff_col, err_col, padjust)
+    return empairs(em; eff_col, err_col, padjust, ci_level, lower_col, upper_col)
 end
 
-function empairs(df::AbstractDataFrame; eff_col, err_col=:err, padjust=identity)
+function empairs(df::AbstractDataFrame; eff_col, err_col=:err, padjust=identity,
+                 ci_level=nothing, lower_col=:lower, upper_col=:upper)
     # need to enforce that we're all the same type
     # (mixing string and symbol is an issue with Not
     #  and a few other things below)
     eff_col = string(eff_col)
     err_col = string(err_col)
+    lower_col = string(lower_col)
+    upper_col = string(upper_col)
     stats_cols = [eff_col, err_col]
     "dof" in names(df) && push!(stats_cols, "dof")
 
@@ -170,5 +219,11 @@ function empairs(df::AbstractDataFrame; eff_col, err_col=:err, padjust=identity)
                    end => "Pr(>|t|)")
         transform!(result_df, "Pr(>|t|)" => padjust => "Pr(>|t|)")
     end
+    if !isnothing(ci_level)
+        if "dof" ∉ stats_cols
+            result_df[!, :dof] .= Inf
+        end
+        _ci!(result_df, ci_level; eff_col, err_col, lower_col, upper_col)
+    end
     return result_df
 end
diff --git a/test/emmeans.jl b/test/emmeans.jl
@@ -53,6 +53,20 @@ model_scaled = lm(@formula(weight ~ 1 + sex * age), growthdata;
     end
     em = emmeans(m; levels=Dict(:age => 23))
     @test all(em.age .== 23)
+
+    @testset "confint" begin
+        # no `dof` given: the interval uses infinite degrees of freedom
+        em_inf = emmeans(m; ci_level=0.68)
+        @test all(em_inf.dof .== Inf)
+        # a 68% interval spans roughly one standard error on either side
+        @test isapprox(em_inf.weight .+ em_inf.err, em_inf.upper; rtol=1e-3)
+        @test isapprox(em_inf.weight .- em_inf.err, em_inf.lower; rtol=1e-3)
+
+        # `dof` given: the residual degrees of freedom of the model are used
+        em_fin = emmeans(m; ci_level=0.68, dof=dof_residual)
+        @test all(em_fin.dof .== 10)
+        # a 68% interval spans roughly one standard error on either side
+        @test isapprox(em_fin.weight .+ em_fin.err, em_fin.upper; rtol=1e-3)
+        @test isapprox(em_fin.weight .- em_fin.err, em_fin.lower; rtol=1e-3)
+    end
 end
 
 # R> pairs(em)
@@ -101,6 +115,20 @@ bonferroni(pvals) = adjust(PValues(pvals), Bonferroni())
                             rtol=0.001))
     end
 
+    @testset "confint" begin
+        em = empairs(m; ci_level=0.68)
+        @test all(==(Inf), em[!, :dof])
+        # 68% CI is approximately one standard error
+        @test em[!, :weight] + em[!, :err] ≈ em[!, :upper] rtol = 1e-3
+        @test em[!, :weight] - em[!, :err] ≈ em[!, :lower] rtol = 1e-3
+
+        # exercise `empairs` (not `emmeans`) with finite degrees of freedom as well
+        em = empairs(m; ci_level=0.68, dof=dof_residual)
+        @test all(==(10), em[!, :dof])
+        # With 10 degrees of freedom the t quantile is roughly 5% larger than the
+        # normal one, so compare the half-widths with a matching tolerance; comparing
+        # the bounds themselves would depend on the size of the differences.
+        @test em[!, :upper] - em[!, :weight] ≈ em[!, :err] rtol = 0.06
+        @test em[!, :weight] - em[!, :lower] ≈ em[!, :err] rtol = 0.06
+    end
+
     @testset "AbstractString crossing" begin
         # this model is utter nonsense, but it creates a particular pattern
         # with InlineStrings that fails if our type restriction is too tight