src/ols.jl

"""
    olsranef(model::LinearMixedModel, method=:simultaneous)

Compute the group-level estimates using ordinary least squares.

This is somewhat similar to the conditional modes / BLUPs computed without
shrinkage.

There is no shrinkage of the group-level estimates with this approach, which
means singular estimates can be avoided. However, this also means the random
effects design matrix must not be singular.

The following methods are provided:
1. (default) OLS estimates computed for all strata (blocking variables)
   simultaneously with `method=:simultaneous`. This pools the variance
   across estimates but does not shrink the estimates. Note that this method
   internal reparameterizes the random effects matrix `Z` to use effects coding
   and only use a single intercept shared across all grouping variables.
2. OLS estimates computed within each stratum with `method=:stratum`. This
   method is equivalent for example to computing each subject-level and each
   item-level regression separately.
3. Pseudo-OLS estimated computed by applying extremely mild shrinkage to achieve
   essentially unpenalized conditional (i.e. within group) means with
   `method=:inflated_identity`. This method
   is also used in MixedModelsMakie for generating shrinkage plots


For fully balanced designs with a single blocking variable, these methods will
give the same results.

!!! warning
    If the design matrix for the random effects is rank deficient (e.g., through
    the use of `MixedModels.fulldummy` or missing cells in the data), then the
    methods `:simultaneous` and `:stratum` will fail because no
    shrinkage/regularization is applied.
"""
function olsranef(model::LinearMixedModel{T}, method=:simultaneous; kwargs...) where {T}
    fixef_res = copy(response(model))
    # what's not explained by the fixed effects has to be explained by the RE
    X = model.X
    β = model.β # (X'X) \ (X'fixef_res)
    mul!(fixef_res, X, β, -one(T), one(T))

    return olsranef(model, fixef_res, Val(method); kwargs...)
end

function olsranef(model::LinearMixedModel{T}, fixef_res, ::Val{:stratum}) where {T}
    blups = Vector{Matrix{T}}()
    for trm in model.reterms
        re = []

        z = trm.z
        refs = unique(trm.refs)
        ngrps = length(refs)
        npreds = length(trm.cnames)

        j = 1
        for r in refs
            i = trm.refs .== r
            X = trm[i, j:(j + npreds - 1)]
            b = (X'X) \ (X'fixef_res[i])
            push!(re, b)
            j += npreds
        end

        push!(blups, hcat(re...))
    end

    return blups
end

function olsranef(model::LinearMixedModel{T}, fixef_res, ::Val{:simultaneous}) where {T}
    n_reterms = size(model.reterms)[1]

    code = Vector{Matrix{T}}(undef, n_reterms) # new contrast matrices
    mat = Vector{Matrix{T}}(undef, n_reterms) # new Z model matrices

    ### create new Z matrices with orthogonal contrasts
    for (i, trm) in enumerate(model.reterms)
        dim = size(trm.z)[1]
        cd = StatsModels.ContrastsMatrix(EffectsCoding(), trm.levels).matrix
        cd = kron(cd, I(dim))
        code[i] = cd
        mat[i] = trm * cd
    end

    # add in intercept
    # note that we pass two dims to ones to create a matrix
    pushfirst!(mat, ones(sum(first ∘ size, mat), 1))
    Z = hcat(mat...)
    # compute the BLUPs
    flatblups = Z'Z \ Z'fixef_res
    # get back to original coding
    flatblups = BlockDiagonal(code) * @view flatblups[2:end, :]

    blups = Vector{Matrix{T}}()
    offset = 1
    for trm in model.reterms
        chunksize = size(trm, 2)
        ngrps = length(trm.levels)
        npreds = length(trm.cnames)
        re = Matrix{T}(reshape(view(flatblups, offset:(offset + chunksize - 1)),
                               npreds, ngrps))
        offset += chunksize
        push!(blups, re)
    end
    return blups
end

function olsranef(model::LinearMixedModel{T}, fixef_res, ::Val{:inflated_identity};
                  θref=1000 .* model.optsum.initial) where {T}
    blups = try
        ranef(updateL!(setθ!(model, θref)))
    catch e
        @error "Failed to compute unshrunken values with the following exception:"
        rethrow(e)
    finally
        updateL!(setθ!(model, model.optsum.final)) # restore parameter estimates
    end

    return blups
end

"""
    MixedModels.residuals(model::LinearMixedModel, blups)

Compute the residuals of a mixed model, **ignoring blups**.

This a convenience function to allow [`nonparametricboostrap`](@ref) and
[`permutation`](@ref) to always assume that the keyword argument
`residual_method` is a two-argument method.

!!! warning
    This method is currently being pirated from MixedModels.jl and will
    probably be renamed or removed in a future release.
"""
MixedModels.residuals(model::LinearMixedModel, blups::Vector) = residuals(model)
# XXX This is kinda type piracy, if it weren't developed by one of the MixedModels.jl devs....

"""

    residuals_from_blups(model::LinearMixedModel{T}, blups::Vector{<:AbstractMatrix{T}})

Compute the residuals of a mixed model using the specified group-level BLUPs/predictors.

This is useful for, e.g., comparing the residuals from a mixed-effects model with shrunken
group-level predictors against a non-shrunken classical OLS model fit within each group.
"""
function residuals_from_blups(model::LinearMixedModel{T},
                              blups::Vector{<:AbstractMatrix{T}}) where {T}
    y = response(model) # we are now modifying the model

    ŷ = zeros(T, length(y))

    for (re, trm) in zip(blups, model.reterms)
        mul!(ŷ, trm, re, one(T), one(T))
    end

    mul!(ŷ, model.X, model.β, one(T), one(T))

    # TODO: do this inplace to avoid an allocation
    return y .- ŷ
end