fastglmm
Massively scalable generalized linear mixed models
Loading...
Searching...
No Matches
linearRegression.h
Go to the documentation of this file.
1/***************************************************************
2 * @file linearRegression.h
3 * @author Gabriel Hoffman
4 * @email gabriel.hoffman@mssm.edu
5 * @brief Evaluate linear regression with Armadillo library
6 * Copyright (C) 2024 Gabriel Hoffman
7 **************************************************************/
8
9
10#ifndef LINEAR_REGRESSION_H_
11#define LINEAR_REGRESSION_H_
12
13#include <tuple>
14#include <type_traits>
15
16// if -D USE_R, use RcppArmadillo library
17#ifdef USE_R
// [[Rcpp::depends(RcppArmadillo)]]
// [[Rcpp::depends(RcppParallel)]]
20#include <RcppArmadillo.h>
21#include <RcppParallel.h>
22#else
23#include <armadillo>
24#endif
25
26#include "misc.h"
27#include "CleanData.h"
28#include "ModelFit.h"
29
30using namespace arma;
31using namespace std;
32
33namespace fastglmmLib {
34
37struct LMWork {
38 mat Q, R, V;
40 LMWork() {}
41};
42
56static ModelFit lm(
57 const arma::mat& X,
58 const arma::colvec& y,
59 const ModelDetail md = LOW,
60 const double &lambda = 0,
61 const double &rdf_offset = 0,
62 LMWork *work = nullptr,
63 const bool estimateDispersion = true,
64 const bool scaleByDispersion = true) {
65
66 int n = X.n_rows, k = X.n_cols;
67
68 // allocate work, if not already alloc'd
69 bool alloc_local = false;
70 if( work == nullptr ){
71 alloc_local = true;
72 work = new LMWork();
73 }
74
75 // QR decomp
76 // success0 indicates QR was successful and R is valid
77 bool success0 = qr_econ(work->Q, work->R, X);
78
79 // test if X is full rank
80 double minDiagR = abs(diagvec(work->R)).min();
81 double tol = 1e-12;
82 if( success0 && (minDiagR < tol)){
83 success0 = false;
84 }
85
86 vec beta;
87 bool success1 = false;
88
89 // cross product for ridge and vcov
90 mat A = work->R.t() * work->R;
91
92 // if QR succeed, compute beta
93 if( success0 ){
94 if( lambda == 0.0 ){
95 // OLS
96 success1 = solve(beta, work->R, trans(work->Q) * y, solve_opts::no_approx);
97 }else{
98 // Ridge penalty,
99 // A.diag() += lambda;
100 // but not on intercept
101 for( uword i=1; i<A.n_rows; ++i){
102 A(i,i) += lambda;
103 }
104
105 success1 = solve(beta, A, work->R.t() * work->Q.t() * y, arma::solve_opts::fast + arma::solve_opts::likely_sympd);
106 }
107 }
108
109 // if system is singular,
110 // set beta to NaN
111 if( ! success0 || ! success1){
112 beta = vec(work->R.n_cols);
113 beta.fill(datum::nan);
114 }
115
116 // if md != LEAST, compute residuals
117 vec stderr;
118 double rdf = n - k - rdf_offset;
119 double dispersion = 1.0;
120 bool success2 = true;
121 if( md != LEAST ){
122
123 if( success1 ){
124 // only compute inverse if solve() above succeeded
125 // V = solve(t(R)*R)
126 success2 = inv_sympd(work->V, A);
127 }else{
128 success2 = false;
129 }
130
131 // residuals
132 work->residuals = y - X*beta;
133
134 // for linear regression
135 if( estimateDispersion ){
136 // std.errors of coefficients
137 dispersion = dot(work->residuals, work->residuals) / rdf;
138 }else{
139 // for GLM, don't scale by residual variance
140 dispersion = 1.0;
141 }
142
143 if( success0 && success1 && success2 ){
144 stderr = sqrt(dispersion * diagvec(work->V));
145 }else{
146 stderr = vec(k, fill::value(datum::nan));
147 beta.fill(datum::nan);
148 }
149 }
150
151 bool success = success0 && success1 && success2;
152
153 // return results with specified level of detail
154 ModelFit fit;
155 switch( md ){
156 case LEAST:
157 fit = ModelFit( success, beta );
158 break;
159
160 case LOW:
161 fit = ModelFit( success, beta, stderr, dispersion, rdf);
162 break;
163
164 case MEDIUM:
165 fit = ModelFit( success, beta, stderr, dispersion, rdf, work->V * dispersion);
166 break;
167
168 case HIGH:
169 fit = ModelFit( success, beta, stderr, dispersion, rdf, work->V * dispersion, work->residuals);
170 break;
171
172 case MOST:
173 case MAX:
174 vec hatvalues = diagvec(work->Q * trans(work->Q));
175 fit = ModelFit( success, beta, stderr, dispersion, rdf, work->V * dispersion, work->residuals, hatvalues);
176 fit.setFittedValues( X*beta );
177 break;
178 }
179
180 // free work if allocated in this function
181 if( alloc_local) delete work;
182
183 return fit;
184}
185
194template <typename T>
195static tuple<vec, T> preprojection(
196 const vec &y,
197 const mat &X_design,
198 const T &X_features,
199 const vec &weights = {}){
200
201 // naive calculation
202 // vec y_proj = y - X_design * inv(trans(X_design) * X_design) * trans(X_design) * y;
203 // mat X_proj = X_features - X_design * inv(trans(X_design) * X_design) * trans(X_design) * X_features;
204
205 // if weights is empty, set w to ones
206 vec w;
207 if( ! weights.is_empty() ){
208 w = weights;
209 }else{
210 w = vec(y.n_elem).ones();
211 }
212 arma::colvec wsqrt = sqrt(w / mean(w));
213
214 // apply weights in computation to y, X_design, and X_features
215 mat X_design_wsqrt = X_design.each_col() % wsqrt;
216 vec y_wsqrt = y % wsqrt;
217 T X_features_wsqrt = scaleEachCol(X_features, wsqrt);
218
219 // Use QR decomp of X_design, and recycle pre-computed values
220 mat Q, R;
221 qr_econ(Q, R, X_design_wsqrt);
222
223 // back solve
224 vec beta = solve(R, trans(Q) * y_wsqrt);
225 vec y_proj = y_wsqrt - X_design_wsqrt * beta;
226
227 // back solve
228 // use constructor T() to subtract matricies of the same type
229 mat gamma = solve(R, trans(Q) * X_features_wsqrt);
230 T X_proj;
231
232 // cast X_design_wsqrt * gamma to type T if needed
233 if( is_same_v<decltype(X_features_wsqrt), decltype(X_design_wsqrt)> ){
234 X_proj = X_features_wsqrt - X_design_wsqrt * gamma;
235 }else{
236 X_proj = X_features_wsqrt - T(X_design_wsqrt * gamma);
237 }
238
239 return {y_proj, X_proj};
240}
241
242
250template <typename T>
251static tuple<vec, T> preprojection(
252 const vec &y,
253 const sp_mat &X_design,
254 const T &X_features,
255 const vec &weights = {}){
256
257 // naive calculation
258 // vec y_proj = y - X_design * inv(trans(X_design) * X_design) * trans(X_design) * y;
259 // mat X_proj = X_features - X_design * inv(trans(X_design) * X_design) * trans(X_design) * X_features;
260
261 // if weights is empty, set w to ones
262 vec w;
263 if( ! weights.is_empty() ){
264 w = weights;
265 }else{
266 w = vec(y.n_elem).ones();
267 }
268 arma::colvec wsqrt = sqrt(w / mean(w));
269
270 // apply weights in computation to y, X_design, and X_features
271 sp_mat X_design_wsqrt = scaleEachCol(X_design, wsqrt);
272 vec y_wsqrt = y % wsqrt;
273 T X_features_wsqrt = scaleEachCol(X_features, wsqrt);
274
275 // recycle sparse crossprod
276 // spsolve uses lapack after converting V to dense matrix
277 // minimal penalty practical V dimensions
278 bool success;
279 vec beta;
280 mat gamma;
281
282 sp_mat V = trans(X_design_wsqrt) * X_design_wsqrt;
283 success = spsolve(beta, V, vec(trans(X_design_wsqrt) * y_wsqrt), "lapack");
284 if( ! success ) beta.fill(datum::nan);
285 vec y_proj = y_wsqrt - X_design_wsqrt * beta;
286
287 success = spsolve(gamma, V, mat(trans(X_design_wsqrt) * X_features_wsqrt), "lapack");
288 if( ! success ) gamma.fill(datum::nan);
289
290 T X_proj;
291 // cast X_design_wsqrt * gamma to type T if needed
292 if( is_same_v<decltype(X_features_wsqrt), decltype(X_design_wsqrt)> ){
293 X_proj = X_features_wsqrt - X_design_wsqrt * gamma;
294 }else{
295 X_proj = X_features_wsqrt - T(X_design_wsqrt * gamma);
296 }
297
298 return {y_proj, X_proj};
299}
300
301
302
314static ModelFit wlm(
315 const arma::mat& X,
316 const arma::colvec& y,
317 const arma::colvec& w = {},
318 const ModelDetail md = LOW,
319 const double &lambda = 0,
320 const double &rdf_offset = 0,
321 LMWork *work = nullptr) {
322
323 ModelFit fit;
324
325 if( w.is_empty() ){
326 fit = lm( X, y, md, lambda, rdf_offset, work);
327 }else{
328 arma::colvec wsqrt = sqrt(w / mean(w));
329 fit = lm( X.each_col() % wsqrt, y % wsqrt, md, lambda, rdf_offset, work);
330
331 if( md >= HIGH){
332 // Rescale residuals by weights afterward
333 // since input X and y are scaled before lm()
334 fit.residuals /= wsqrt;
335 }
336 }
337
338 return fit;
339}
340
352static vector<ModelFit> lmFitFeatures_standard(
353 const arma::vec &y,
354 const arma::mat &X_design,
355 const arma::mat &X_features,
356 const vector<string> &ids,
357 const arma::vec &weights = {},
358 const ModelDetail md = LOW,
359 const double &lambda = 0,
360 const int &nthreads = 1){
361
362 int n_covs = X_design.n_cols;
363
364 if( X_features.n_cols == 0){
365 throw invalid_argument("X_features has 0 columns");
366 }
367
368 vector<ModelFit> fitList(X_features.n_cols, ModelFit());
369
370 // Parallel part using Thread Building Blocks
371 tbb::task_arena limited_arena(nthreads);
372 limited_arena.execute([&] {
373 tbb::parallel_for(
374 tbb::blocked_range<int>(0, X_features.n_cols, 100),
375 [&](const tbb::blocked_range<int>& r){
376 // create design matrix with jth feature in the last column
377 // X = cbind(X_design, X_features[,0])
378 arma::mat X(X_design);
379 X.insert_cols(n_covs, X_features.col(0));
380
381 LMWork *work = new LMWork();
382
383 // iterate through responses
384 for (int j = r.begin(); j != r.end(); ++j) {
385
386 // Create design matrix with intercept as first column
387 X.col(n_covs) = X_features.col(j);
388
389 // linear regression
390 ModelFit fit = wlm(X, y, weights, md, lambda, 0, work);
391 fit.ID = ids[j];
392
393 // save result to list
394 fitList.at(j) = fit;
395 }
396 delete work;
397 }); });
398
399 return fitList;
400}
401
402
403
415template <typename T1, typename T2>
416static ModelFitList lmFitFeatures_preproj(
417 const arma::vec &y,
418 const T1 &X_design,
419 const T2 &X_features,
420 const vector<string> &ids,
421 const arma::vec &weights = {},
422 const ModelDetail md = LOW,
423 const double &lambda = 0,
424 const int &nthreads = 1){
425
426 if( X_features.n_cols == 0){
427 throw invalid_argument("X_features has 0 columns");
428 }
429
430 ModelFitList fitList(X_features.n_cols, ModelFit());
431
432 // pre-projection to regress out the covariates first
433 // set rdf_offset to the number of covariates projected out
434 // auto [y_proj, X_proj] = preprojection(y, X_design, X_features, weights);
435 vec y_proj;
436 mat X_proj;
437 tie(y_proj, X_proj) = preprojection(y, X_design, X_features, weights);
438 double rdf_offset = X_design.n_cols;
439
440 vec wsqrt = sqrt(weights);
441
442 // Parallel part using Thread Building Blocks
443 tbb::task_arena limited_arena(nthreads);
444 limited_arena.execute([&] {
445 tbb::parallel_for(
446 tbb::blocked_range<int>(0, X_proj.n_cols, 100),
447 [&](const tbb::blocked_range<int>& r){
448
449 disable_parallel_blas();
450
451 LMWork *work = new LMWork();
452
453 for (int j = r.begin(); j != r.end(); ++j) {
454
455 // linear regression
456 ModelFit fit = lm(X_proj.col(j), y_proj, md, lambda, rdf_offset, work );
457
458 fit.ID = ids[j];
459
460 if( md >= HIGH){
461 // Rescale residuals by weights afterward
462 // since input X and y are scaled before lm()
463 fit.residuals /= wsqrt;
464 }
465
466 // save result to list
467 fitList.at(j) = fit;
468 }
469 delete work;
470 }); });
471
472 return fitList;
473}
474
487template <typename T1, typename T2>
488static ModelFitList lmFitFeatures(
489 const arma::vec &y,
490 const T1 &X_design,
491 const T2 &X_features,
492 const vector<string> &ids,
493 const arma::vec &weights = {},
494 const ModelDetail md = LOW,
495 const double &lambda = 0,
496 const bool &preprojection = true,
497 const int &nthreads = 1){
498
499 ModelFitList fitList;
500
501 if( preprojection ){
502 // supports mat and sp_mat
503 fitList = lmFitFeatures_preproj(y, X_design, X_features, ids, weights, md, lambda, nthreads);
504 }else{
505 // only supports mat
506 fitList = lmFitFeatures_standard(y, mat(X_design), mat(X_features), ids, weights, md, lambda, nthreads);
507 }
508
509 return fitList;
510}
511
512
513
514
515
516
/**
 * @brief Fit a separate weighted linear regression of each response
 * (each column of Y) against the shared design matrix X.
 *
 * @param Y response matrix; one model is fit per column
 * @param X design matrix shared by all responses
 * @param ids identifier assigned to each fitted model
 * @param Weights observation weights, one column per response
 * @param md level of detail retained in each ModelFit
 * @param lambda ridge penalty passed through to lm()
 * @param nthreads number of TBB threads
 * @return one ModelFit per column of Y, in column order
 */
static ModelFitList lmFitResponses(
	const arma::mat &Y,
	const arma::mat &X,
	const vector<string> &ids,
	const arma::mat &Weights,
	const ModelDetail md = LOW,
	const double &lambda = 0,
	const int &nthreads = 1){

	ModelFitList fitList(Y.n_cols, ModelFit());

	// NOTE(review): CleanData presumably sanitizes Y/X/Weights
	// (e.g. handling missing entries) — its contract is defined in
	// CleanData.h, not visible here; confirm before relying on it
	CleanData data(Y, X, Weights);

	mat X_clean = data.get_X();
	// element-wise sqrt of the weight matrix; columns align with Y
	mat Wsqrt = sqrt(data.get_W());
	// responses pre-scaled by sqrt-weights for the weighted fit
	mat Yw = data.get_Y() % Wsqrt;

	// Parallel part using Thread Building Blocks
	tbb::task_arena limited_arena(nthreads);
	limited_arena.execute([&] {
		tbb::parallel_for(
			tbb::blocked_range<int>(0, Y.n_cols, 10),
			[&](const tbb::blocked_range<int>& r){

				disable_parallel_blas();

				for (int j = r.begin(); j != r.end(); ++j) {

					// Reduce residual degrees of freedom by the number of
					// entries with zero weights
					int rdf_offset = accu(Wsqrt.col(j) == 0.0);

					// weighted regression: scale X and the (already scaled)
					// response column by this response's sqrt-weights
					// ModelFit fit = wlm(X, Y.col(j), Weights.col(j));
					ModelFit fit = lm(X_clean.each_col() % Wsqrt.col(j),
						Yw.col(j), md, lambda, rdf_offset);

					fit.ID = ids[j];

					if( md >= HIGH){
						// Rescale residuals by weights afterward
						// since input X and y are scaled before lm()
						// NOTE(review): entries with zero weight divide by 0
						// here (inf/nan residuals) — confirm this is intended
						fit.residuals /= Wsqrt.col(j);
						// NOTE(review): lm() appears to set fitted values only
						// at MOST/MAX; fit.mu may be unset at HIGH — verify
						fit.mu /= Wsqrt.col(j);
					}

					// save result to list
					fitList.at(j) = fit;
				}
			}); });

	return fitList;
}
581
582}
583
584
585
586#endif
Definition ModelFit.h:37
mat scaleEachCol(const mat &X, const vec &w)
Definition misc.h:16
Definition CleanData.h:17
ModelDetail
Definition ModelFit.h:26
@ MOST
Definition ModelFit.h:31
@ MEDIUM
Definition ModelFit.h:29
@ LEAST
Definition ModelFit.h:27
@ HIGH
Definition ModelFit.h:30
@ MAX
Definition ModelFit.h:32
@ LOW
Definition ModelFit.h:28
vector< ModelFit > ModelFitList
Definition ModelFit.h:393
Definition linearRegression.h:37
mat R
Definition linearRegression.h:38
vec residuals
Definition linearRegression.h:39
mat V
Definition linearRegression.h:38
LMWork()
Definition linearRegression.h:40
mat Q
Definition linearRegression.h:38