diff --git a/DESCRIPTION b/DESCRIPTION
index 48dcd8c5..3f0b5efd 100644
--- a/DESCRIPTION
+++ b/DESCRIPTION
@@ -1,8 +1,8 @@
 Package: ranger
 Type: Package
 Title: A Fast Implementation of Random Forests
-Version: 0.15.4
-Date: 2023-11-07
+Version: 0.16.1
+Date: 2023-11-20
 Author: Marvin N. Wright [aut, cre], Stefan Wager [ctb], Philipp Probst [ctb]
 Maintainer: Marvin N. Wright <cran@wrig.de>
 Description: A fast implementation of Random Forests, particularly suited for high
@@ -13,7 +13,7 @@ Description: A fast implementation of Random Forests, particularly suited for hi
     can be directly analyzed.
 License: GPL-3
 Imports: Rcpp (>= 0.11.2), Matrix
-LinkingTo: Rcpp, RcppEigen
+LinkingTo: Rcpp, RcppArmadillo
 Depends: R (>= 3.1)
 Suggests:
     survival,
diff --git a/NEWS.md b/NEWS.md
index 5d62851c..06475661 100644
--- a/NEWS.md
+++ b/NEWS.md
@@ -1,4 +1,10 @@
+# ranger 0.16.1
+* Add linear model residual splitting
+
+# ranger 0.16.0
+* New CRAN version
+
 # ranger 0.15.4
 * Add node.stats option to save node statistics of all nodes
 * Add time.interest option to restrict unique survival times (faster and saves memory)
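The NEWS entry is terse, so a sketch of what "linear model residual splitting" means may help before reading the C++ changes below: before a node is split, the response is regressed on the confounders within that node, and the split search then operates on the residuals of that fit rather than on the raw response. A minimal R illustration of the per-node computation, using invented data and plain `lm.fit` (the patch itself does this in C++ with `arma::solve`):

```r
## Hypothetical node: confounder design matrix (with intercept) and response
set.seed(1)
n <- 100
C <- cbind(1, age = rnorm(n), sex = rbinom(n, 1, 0.5))
y <- 2 * C[, "age"] + rnorm(n)

## Within-node least-squares fit, analogous to DataRcpp::lm() below
fit <- lm.fit(x = C, y = y)
fit$coefficients  # stored per terminal node as glm.coefs
fit$residuals     # what get_yy() hands to the split search instead of raw y
```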
diff --git a/R/RcppExports.R b/R/RcppExports.R
index ddca1b3f..fad9127e 100644
--- a/R/RcppExports.R
+++ b/R/RcppExports.R
@@ -1,8 +1,8 @@
 # Generated by using Rcpp::compileAttributes() -> do not edit by hand
 # Generator token: 10BE3573-1514-4C36-9D1C-5A225CD40393
 
-rangerCpp <- function(treetype, input_x, input_y, variable_names, mtry, num_trees, verbose, seed, num_threads, write_forest, importance_mode_r, min_node_size, min_bucket, split_select_weights, use_split_select_weights, always_split_variable_names, use_always_split_variable_names, prediction_mode, loaded_forest, snp_data, sample_with_replacement, probability, unordered_variable_names, use_unordered_variable_names, save_memory, splitrule_r, case_weights, use_case_weights, class_weights, predict_all, keep_inbag, sample_fraction, alpha, minprop, holdout, prediction_type_r, num_random_splits, sparse_x, use_sparse_data, order_snps, oob_error, max_depth, inbag, use_inbag, regularization_factor, use_regularization_factor, regularization_usedepth, node_stats, time_interest, use_time_interest) {
-    .Call(`_ranger_rangerCpp`, treetype, input_x, input_y, variable_names, mtry, num_trees, verbose, seed, num_threads, write_forest, importance_mode_r, min_node_size, min_bucket, split_select_weights, use_split_select_weights, always_split_variable_names, use_always_split_variable_names, prediction_mode, loaded_forest, snp_data, sample_with_replacement, probability, unordered_variable_names, use_unordered_variable_names, save_memory, splitrule_r, case_weights, use_case_weights, class_weights, predict_all, keep_inbag, sample_fraction, alpha, minprop, holdout, prediction_type_r, num_random_splits, sparse_x, use_sparse_data, order_snps, oob_error, max_depth, inbag, use_inbag, regularization_factor, use_regularization_factor, regularization_usedepth, node_stats, time_interest, use_time_interest)
+rangerCpp <- function(treetype, input_x, input_y, variable_names, mtry, num_trees, verbose, seed, num_threads, write_forest, importance_mode_r, min_node_size, min_bucket, split_select_weights, use_split_select_weights, always_split_variable_names, use_always_split_variable_names, prediction_mode, loaded_forest, snp_data, sample_with_replacement, probability, unordered_variable_names, use_unordered_variable_names, save_memory, splitrule_r, case_weights, use_case_weights, class_weights, predict_all, keep_inbag, sample_fraction, alpha, minprop, holdout, prediction_type_r, num_random_splits, sparse_x, use_sparse_data, order_snps, oob_error, max_depth, inbag, use_inbag, regularization_factor, use_regularization_factor, regularization_usedepth, node_stats, time_interest, use_time_interest, confounders, use_confounders) {
+    .Call(`_ranger_rangerCpp`, treetype, input_x, input_y, variable_names, mtry, num_trees, verbose, seed, num_threads, write_forest, importance_mode_r, min_node_size, min_bucket, split_select_weights, use_split_select_weights, always_split_variable_names, use_always_split_variable_names, prediction_mode, loaded_forest, snp_data, sample_with_replacement, probability, unordered_variable_names, use_unordered_variable_names, save_memory, splitrule_r, case_weights, use_case_weights, class_weights, predict_all, keep_inbag, sample_fraction, alpha, minprop, holdout, prediction_type_r, num_random_splits, sparse_x, use_sparse_data, order_snps, oob_error, max_depth, inbag, use_inbag, regularization_factor, use_regularization_factor, regularization_usedepth, node_stats, time_interest, use_time_interest, confounders, use_confounders)
 }
 
 numSmaller <- function(values, reference) {
diff --git a/R/predict.R b/R/predict.R
index 82599ab0..bd0d2c23 100644
--- a/R/predict.R
+++ b/R/predict.R
@@ -73,7 +73,8 @@ predict.ranger.forest <- function(object, data, predict.all = FALSE,
                                   num.trees = object$num.trees,
                                   type = "response", se.method = "infjack",
                                   seed = NULL, num.threads = NULL,
-                                  verbose = TRUE, inbag.counts = NULL, ...) {
+                                  verbose = TRUE, inbag.counts = NULL,
+                                  confounders = NULL, ...) {
   
   ## GenABEL GWA data
   if (inherits(data, "gwaa.data")) {
@@ -122,6 +123,31 @@ predict.ranger.forest <- function(object, data, predict.all = FALSE,
     stop("Error: Invalid value for 'type'. Use 'response', 'se', 'terminalNodes', or 'quantiles'.")
   }
   
+  if (!is.null(confounders)) {
+    if (is.null(forest$glm.coefs) || length(unlist(forest$glm.coefs)) == 0) {
+      stop("For glm prediction, fit a regression RF with the confounders argument.")
+    }
+    if (is.data.frame(confounders)) {
+      confounders <- model.matrix( ~ ., confounders)
+    } else if (is.matrix(confounders)) {
+      confounders <- cbind(1, confounders)
+    } else {
+      stop("Error: confounders argument has to be matrix or data.frame.")
+    }
+    nodes <- predict(object = object, data = data, predict.all = predict.all,
+                     num.trees = num.trees, type = "terminalNodes", se.method = se.method,
+                     seed = seed, num.threads = num.threads,
+                     verbose = verbose, inbag.counts = inbag.counts, ...)$predictions
+    
+    pred <- sapply(1:num.trees, function(i) {
+      tree_coefs <- forest$glm.coefs[[i]][nodes[, i] + 1]
+      sapply(1:length(tree_coefs), function(j) {
+        confounders[j, ] %*% tree_coefs[[j]]
+      })
+    })
+    return(pred)
+  }
+  
   ## Type "se" only for certain tree types
   if (type == "se" && se.method == "jack" && forest$treetype != "Regression") {
     stop("Error: Jackknife standard error prediction currently only available for regression.")
@@ -250,6 +276,8 @@ predict.ranger.forest <- function(object, data, predict.all = FALSE,
   regularization.factor <- c(0, 0)
   use.regularization.factor <- FALSE
   regularization.usedepth <- FALSE
+  confounders <- matrix(c(0, 0))
+  use.confounders <- FALSE
   node.stats <- FALSE
   time.interest <- c(0, 0)
   use.time.interest <- FALSE
@@ -277,7 +305,7 @@ predict.ranger.forest <- function(object, data, predict.all = FALSE,
                       prediction.type, num.random.splits, sparse.x, use.sparse.data,
                       order.snps, oob.error, max.depth, inbag, use.inbag,
                       regularization.factor, use.regularization.factor, regularization.usedepth,
-                      node.stats, time.interest, use.time.interest)
+                      node.stats, time.interest, use.time.interest, confounders, use.confounders)
   
   if (length(result) == 0) {
     stop("User interrupt or internal error.")
diff --git a/R/ranger.R b/R/ranger.R
index 660c82d5..2f6a41c2 100644
--- a/R/ranger.R
+++ b/R/ranger.R
@@ -122,6 +122,7 @@
 ##' @param minprop For "maxstat" splitrule: Lower quantile of covariate distribution to be considered for splitting.
 ##' @param split.select.weights Numeric vector with weights between 0 and 1, used to calculate the probability to select variables for splitting. Alternatively, a list of size num.trees, containing split select weight vectors for each tree can be used.
 ##' @param always.split.variables Character vector with variable names to be always selected in addition to the \code{mtry} variables tried for splitting.
+##' @param confounders Confounders data.frame to adjust for in regression RF.
 ##' @param respect.unordered.factors Handling of unordered factor covariates. One of 'ignore', 'order' and 'partition'. For the "extratrees" splitrule the default is "partition" for all other splitrules 'ignore'. Alternatively TRUE (='order') or FALSE (='ignore') can be used. See below for details.
 ##' @param scale.permutation.importance Scale permutation importance by standard error as in (Breiman 2001). Only applicable if permutation variable importance mode selected.
 ##' @param regularization.factor Regularization factor (gain penalization), either a vector of length p or one value for all variables.
@@ -238,6 +239,7 @@ ranger <- function(formula = NULL, data = NULL, num.trees = 500, mtry = NULL,
                    case.weights = NULL, class.weights = NULL, splitrule = NULL,
                    num.random.splits = 1, alpha = 0.5, minprop = 0.1,
                    split.select.weights = NULL, always.split.variables = NULL,
+                   confounders = NULL,
                    respect.unordered.factors = NULL,
                    scale.permutation.importance = FALSE,
                    local.importance = FALSE,
@@ -850,6 +852,20 @@ ranger <- function(formula = NULL, data = NULL, num.trees = 500, mtry = NULL,
     }
   }
   
+  ## Confounders
+  if (is.null(confounders)) {
+    confounders <- matrix(c(0, 0))
+    use.confounders <- FALSE
+  } else if (is.data.frame(confounders)) {
+    confounders <- model.matrix( ~ ., confounders)
+    use.confounders <- TRUE
+  } else if (is.matrix(confounders)) {
+    confounders <- cbind(1, confounders)
+    use.confounders <- TRUE
+  } else {
+    stop("Error: confounders argument has to be matrix or data.frame.")
+  }
+  
   ## Time of interest
   if (is.null(time.interest)) {
     time.interest <- c(0, 0)
@@ -928,7 +944,7 @@ ranger <- function(formula = NULL, data = NULL, num.trees = 500, mtry = NULL,
                       num.random.splits, sparse.x, use.sparse.data, order.snps, oob.error, max.depth,
                       inbag, use.inbag, regularization.factor, use.regularization.factor, regularization.usedepth,
-                      node.stats, time.interest, use.time.interest)
+                      node.stats, time.interest, use.time.interest, confounders, use.confounders)
   
   if (length(result) == 0) {
     stop("User interrupt or internal error.")
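For orientation, a hedged usage sketch of the new argument (toy data and variable names invented; the patch itself ships no example). Fitting passes `confounders` through to the C++ side; prediction via `predict.ranger.forest` then returns one prediction per tree from each terminal node's fitted linear model:

```r
library(ranger)

## Toy data: y depends nonlinearly on x1 and linearly on a confounder
n <- 500
dat <- data.frame(x1 = rnorm(n), x2 = rnorm(n), age = rnorm(n))
dat$y <- dat$x1^2 + 0.5 * dat$age + rnorm(n)
conf <- dat[, "age", drop = FALSE]

## Regression forest with confounder-adjusted (residual) splitting
rf <- ranger(y ~ x1 + x2, data = dat, confounders = conf)

## glm prediction from the terminal-node coefficients: an n x num.trees
## matrix, so averaging over trees gives one value per observation
pred_trees <- predict(rf$forest, data = dat[, c("x1", "x2")], confounders = conf)
pred <- rowMeans(pred_trees)
```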
diff --git a/man/predict.ranger.forest.Rd b/man/predict.ranger.forest.Rd
index ba018b0e..0a99def0 100644
--- a/man/predict.ranger.forest.Rd
+++ b/man/predict.ranger.forest.Rd
@@ -15,6 +15,7 @@
   num.threads = NULL,
   verbose = TRUE,
   inbag.counts = NULL,
+  confounders = NULL,
   ...
 )
 }
diff --git a/man/ranger.Rd b/man/ranger.Rd
index 61c6e5df..75098c95 100644
--- a/man/ranger.Rd
+++ b/man/ranger.Rd
@@ -25,6 +25,7 @@ ranger(
   minprop = 0.1,
   split.select.weights = NULL,
   always.split.variables = NULL,
+  confounders = NULL,
   respect.unordered.factors = NULL,
   scale.permutation.importance = FALSE,
   local.importance = FALSE,
@@ -90,6 +91,8 @@ ranger(
 \item{always.split.variables}{Character vector with variable names to be always selected in addition to the \code{mtry} variables tried for splitting.}
 
+\item{confounders}{Confounders data.frame to adjust for in regression RF.}
+
 \item{respect.unordered.factors}{Handling of unordered factor covariates. One of 'ignore', 'order' and 'partition'. For the "extratrees" splitrule the default is "partition" for all other splitrules 'ignore'. Alternatively TRUE (='order') or FALSE (='ignore') can be used. See below for details.}
 
 \item{scale.permutation.importance}{Scale permutation importance by standard error as in (Breiman 2001). Only applicable if permutation variable importance mode selected.}
diff --git a/src/Data.h b/src/Data.h
index c58e5ec6..7ca83c1e 100644
--- a/src/Data.h
+++ b/src/Data.h
@@ -33,7 +33,7 @@ class Data {
 
   virtual double get_x(size_t row, size_t col) const = 0;
   virtual double get_y(size_t row, size_t col) const = 0;
-  
+
   size_t getVariableID(const std::string& variable_name) const;
 
   virtual void reserveMemory(size_t y_cols) = 0;
@@ -196,6 +196,24 @@ class Data {
     order_snps = true;
   } // #nocov end
+
+  virtual void lm(std::vector<size_t>& sampleIDs, size_t start, size_t end) {
+    // Empty on purpose
+  }
+
+  virtual std::vector<double> lm_coefs(std::vector<size_t>& sampleIDs, size_t start, size_t end) {
+    // Empty on purpose
+    return std::vector<double>();
+  }
+
+  virtual double predict(size_t row, std::vector<double> coefs) {
+    // Empty on purpose
+    return 0;
+  }
+
+  virtual double get_yy(size_t row, size_t col) const {
+    return get_y(row, col);
+  }
 
 protected:
   std::vector<std::string> variable_names;
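The four virtual hooks added to `Data` above are deliberate no-ops in the base class: data backends without confounders keep the old behavior because `get_yy()` falls back to `get_y()`, while `DataRcpp` (next file) overrides all four. A hypothetical R analogue of that dispatch, for intuition only:

```r
## R analogue of the Data/DataRcpp contract (hypothetical, for intuition only)
get_yy <- function(node) {
  if (is.null(node$resid)) {
    node$y       # base Data: no confounder fit, raw response
  } else {
    node$resid   # DataRcpp after lm(): residuals of y on the confounders
  }
}
get_yy(list(y = c(1, 2, 3), resid = NULL))              # raw y
get_yy(list(y = c(1, 2, 3), resid = c(-0.1, 0.2, -0.1)))  # residuals
```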
diff --git a/src/DataRcpp.h b/src/DataRcpp.h
index ca21561c..cf79b29d 100644
--- a/src/DataRcpp.h
+++ b/src/DataRcpp.h
@@ -27,9 +27,10 @@ Ratzeburger Allee 160
 #ifndef DATARCPP_H_
 #define DATARCPP_H_
-
+
 #include <Rcpp.h>
-
+#include <RcppArmadillo.h>
+
 #include "globals.h"
 #include "utility.h"
 #include "Data.h"
@@ -39,13 +40,16 @@ namespace ranger {
 class DataRcpp: public Data {
 public:
   DataRcpp() = default;
-  DataRcpp(Rcpp::NumericMatrix& x, Rcpp::NumericMatrix& y, std::vector<std::string> variable_names, size_t num_rows, size_t num_cols) {
+  DataRcpp(Rcpp::NumericMatrix& x, Rcpp::NumericMatrix& y, std::vector<std::string> variable_names, size_t num_rows, size_t num_cols,
+      Rcpp::NumericMatrix& confounders) {
     this->x = x;
     this->y = y;
     this->variable_names = variable_names;
     this->num_rows = num_rows;
     this->num_cols = num_cols;
     this->num_cols_no_snp = num_cols;
+    this->confounders = confounders;
+    this->resid = arma::colvec(y(Rcpp::_, 0));
   }
   
   DataRcpp(const DataRcpp&) = delete;
@@ -86,9 +90,54 @@ class DataRcpp: public Data {
   } // #nocov end
 
+  void lm(std::vector<size_t>& sampleIDs, size_t start, size_t end) override {
+    if (confounders.size() > 0) {
+      std::vector<size_t> idx;
+      idx.assign(sampleIDs.begin() + start, sampleIDs.begin() + end);
+
+      arma::uvec ia = arma::conv_to<arma::uvec>::from(idx);
+
+      arma::mat ca = arma::mat(confounders.begin(), confounders.nrow(),
+          confounders.ncol(), false);
+      arma::colvec ya = arma::colvec(y(Rcpp::_, 0));
+
+      arma::colvec coef = arma::solve(ca.rows(ia), ya(ia));
+      resid(ia) = ya(ia) - ca.rows(ia)*coef;
+    }
+  }
+
+  std::vector<double> lm_coefs(std::vector<size_t>& sampleIDs, size_t start, size_t end) override {
+    if (confounders.size() > 0) {
+      std::vector<size_t> idx;
+      idx.assign(sampleIDs.begin() + start, sampleIDs.begin() + end);
+
+      arma::uvec ia = arma::conv_to<arma::uvec>::from(idx);
+
+      arma::mat ca = arma::mat(confounders.begin(), confounders.nrow(),
+          confounders.ncol(), false);
+      arma::colvec ya = arma::colvec(y(Rcpp::_, 0));
+
+      arma::colvec coef = arma::solve(ca.rows(ia), ya(ia));
+
+      return arma::conv_to<std::vector<double>>::from(coef);
+    } else {
+      return std::vector<double>();
+    }
+  }
+
+  double predict(size_t row, std::vector<double> coefs) override {
+    return arma::dot(arma::vec(confounders(row, Rcpp::_)), arma::vec(coefs));
+  }
+
+  double get_yy(size_t row, size_t col) const override {
+    return resid(row);
+  }
+
 private:
   Rcpp::NumericMatrix x;
   Rcpp::NumericMatrix y;
+  arma::colvec resid;
+  Rcpp::NumericMatrix confounders;
 };
 } // namespace ranger
diff --git a/src/DataSparse.cpp b/src/DataSparse.cpp
index 779a54d6..59e599ea 100644
--- a/src/DataSparse.cpp
+++ b/src/DataSparse.cpp
@@ -30,10 +30,10 @@
 
 namespace ranger {
 
-DataSparse::DataSparse(Eigen::SparseMatrix<double>& x, Rcpp::NumericMatrix& y, std::vector<std::string> variable_names, size_t num_rows,
+DataSparse::DataSparse(arma::sp_mat& x, Rcpp::NumericMatrix& y, std::vector<std::string> variable_names, size_t num_rows,
     size_t num_cols) :
     x { } {
-  this->x.swap(x);
+  this->x = x;
   this->y = y;
   this->variable_names = variable_names;
   this->num_rows = num_rows;
diff --git a/src/DataSparse.h b/src/DataSparse.h
index 3cd90433..de302b5c 100644
--- a/src/DataSparse.h
+++ b/src/DataSparse.h
@@ -28,7 +28,7 @@
 #ifndef DATASPARSE_H_
 #define DATASPARSE_H_
 
-#include <RcppEigen.h>
+#include <RcppArmadillo.h>
 
 #include "globals.h"
 #include "utility.h"
@@ -40,7 +40,7 @@ class DataSparse: public Data {
 public:
   DataSparse() = default;
 
-  DataSparse(Eigen::SparseMatrix<double>& x, Rcpp::NumericMatrix& y, std::vector<std::string> variable_names, size_t num_rows,
+  DataSparse(arma::sp_mat& x, Rcpp::NumericMatrix& y, std::vector<std::string> variable_names, size_t num_rows,
       size_t num_cols);
 
   DataSparse(const DataSparse&) = delete;
@@ -54,7 +54,7 @@ class DataSparse: public Data {
       col = getUnpermutedVarID(col);
       row = getPermutedSampleID(row);
     }
-    return x.coeff(row, col);
+    return x(row, col);
   }
 
   double get_y(size_t row, size_t col) const override {
@@ -67,7 +67,7 @@ class DataSparse: public Data {
   }
 
   void set_x(size_t col, size_t row, double value, bool& error) override {
-    x.coeffRef(row, col) = value;
+    x(row, col) = value;
   }
 
   void set_y(size_t col, size_t row, double value, bool& error) override {
@@ -76,7 +76,7 @@ class DataSparse: public Data {
   // #nocov end
 
 private:
-  Eigen::SparseMatrix<double> x;
+  arma::sp_mat x;
   Rcpp::NumericMatrix y;
 };
diff --git a/src/ForestRegression.cpp b/src/ForestRegression.cpp
index 7c1bb326..37bb1df9 100644
--- a/src/ForestRegression.cpp
+++ b/src/ForestRegression.cpp
@@ -39,6 +39,16 @@ void ForestRegression::loadForest(size_t num_trees,
   equalSplit(thread_ranges, 0, num_trees - 1, num_threads);
 }
 
+std::vector<std::vector<std::vector<double>>> ForestRegression::getGlmCoefs() const {
+  std::vector<std::vector<std::vector<double>>> result;
+  result.reserve(num_trees);
+  for (const auto& tree : trees) {
+    const auto& temp = dynamic_cast<const TreeRegression&>(*tree);
+    result.push_back(temp.getGlmCoefs());
+  }
+  return result;
+}
+
 void ForestRegression::initInternal() {
 
   // If mtry not set, use floored square root of number of independent variables
diff --git a/src/ForestRegression.h b/src/ForestRegression.h
index 62689d38..313b631f 100644
--- a/src/ForestRegression.h
+++ b/src/ForestRegression.h
@@ -32,6 +32,8 @@ class ForestRegression: public Forest {
   void loadForest(size_t num_trees, std::vector<std::vector<std::vector<size_t>>>& forest_child_nodeIDs,
       std::vector<std::vector<size_t>>& forest_split_varIDs, std::vector<std::vector<double>>& forest_split_values,
       std::vector<bool>& is_ordered_variable);
+
+  std::vector<std::vector<std::vector<double>>> getGlmCoefs() const;
 
 private:
   void initInternal() override;
diff --git a/src/Makevars b/src/Makevars
index a77f2396..41c83d0d 100644
--- a/src/Makevars
+++ b/src/Makevars
@@ -1,2 +1,3 @@
-PKG_CPPFLAGS = -DR_BUILD
+PKG_CPPFLAGS = -DR_BUILD $(SHLIB_OPENMP_CXXFLAGS)
+PKG_LIBS = $(SHLIB_OPENMP_CXXFLAGS) $(LAPACK_LIBS) $(BLAS_LIBS) $(FLIBS)
diff --git a/src/Makevars.win b/src/Makevars.win
index a6af4dd1..4ba80722 100644
--- a/src/Makevars.win
+++ b/src/Makevars.win
@@ -1,2 +1,4 @@
-PKG_CPPFLAGS = -DR_BUILD -DWIN_R_BUILD
+PKG_CPPFLAGS = -DR_BUILD -DWIN_R_BUILD $(SHLIB_OPENMP_CXXFLAGS)
+PKG_LIBS = $(SHLIB_OPENMP_CXXFLAGS) $(LAPACK_LIBS) $(BLAS_LIBS) $(FLIBS)
+
diff --git a/src/RcppExports.cpp b/src/RcppExports.cpp
index a47c2234..26f2b345 100644
--- a/src/RcppExports.cpp
+++ b/src/RcppExports.cpp
@@ -2,7 +2,7 @@
 // Generator token: 10BE3573-1514-4C36-9D1C-5A225CD40393
 
 #include "../inst/include/ranger.h"
-#include <RcppEigen.h>
+#include <RcppArmadillo.h>
 #include <Rcpp.h>
 
 using namespace Rcpp;
@@ -13,8 +13,8 @@ Rcpp::Rostream<false>& Rcpp::Rcerr = Rcpp::Rcpp_cerr_get();
 #endif
 
 // rangerCpp
-Rcpp::List rangerCpp(uint treetype, Rcpp::NumericMatrix& input_x, Rcpp::NumericMatrix& input_y, std::vector<std::string> variable_names, uint mtry, uint num_trees, bool verbose, uint seed, uint num_threads, bool write_forest, uint importance_mode_r, uint min_node_size, uint min_bucket, std::vector<std::vector<double>>& split_select_weights, bool use_split_select_weights, std::vector<std::string>& always_split_variable_names, bool use_always_split_variable_names, bool prediction_mode, Rcpp::List loaded_forest, Rcpp::RawMatrix snp_data, bool sample_with_replacement, bool probability, std::vector<std::string>& unordered_variable_names, bool use_unordered_variable_names, bool save_memory, uint splitrule_r, std::vector<double>& case_weights, bool use_case_weights, std::vector<double>& class_weights, bool predict_all, bool keep_inbag, std::vector<double>& sample_fraction, double alpha, double minprop, bool holdout, uint prediction_type_r, uint num_random_splits, Eigen::SparseMatrix<double>& sparse_x, bool use_sparse_data, bool order_snps, bool oob_error, uint max_depth, std::vector<std::vector<size_t>>& inbag, bool use_inbag, std::vector<double>& regularization_factor, bool use_regularization_factor, bool regularization_usedepth, bool node_stats, std::vector<double>& time_interest, bool use_time_interest);
-RcppExport SEXP _ranger_rangerCpp(SEXP treetypeSEXP, SEXP input_xSEXP, SEXP input_ySEXP, SEXP variable_namesSEXP, SEXP mtrySEXP, SEXP num_treesSEXP, SEXP verboseSEXP, SEXP seedSEXP, SEXP num_threadsSEXP, SEXP write_forestSEXP, SEXP importance_mode_rSEXP, SEXP min_node_sizeSEXP, SEXP min_bucketSEXP, SEXP split_select_weightsSEXP, SEXP use_split_select_weightsSEXP, SEXP always_split_variable_namesSEXP, SEXP use_always_split_variable_namesSEXP, SEXP prediction_modeSEXP, SEXP loaded_forestSEXP, SEXP snp_dataSEXP, SEXP sample_with_replacementSEXP, SEXP probabilitySEXP, SEXP unordered_variable_namesSEXP, SEXP use_unordered_variable_namesSEXP, SEXP save_memorySEXP, SEXP splitrule_rSEXP, SEXP case_weightsSEXP, SEXP use_case_weightsSEXP, SEXP class_weightsSEXP, SEXP predict_allSEXP, SEXP keep_inbagSEXP, SEXP sample_fractionSEXP, SEXP alphaSEXP, SEXP minpropSEXP, SEXP holdoutSEXP, SEXP prediction_type_rSEXP, SEXP num_random_splitsSEXP, SEXP sparse_xSEXP, SEXP use_sparse_dataSEXP, SEXP order_snpsSEXP, SEXP oob_errorSEXP, SEXP max_depthSEXP, SEXP inbagSEXP, SEXP use_inbagSEXP, SEXP regularization_factorSEXP, SEXP use_regularization_factorSEXP, SEXP regularization_usedepthSEXP, SEXP node_statsSEXP, SEXP time_interestSEXP, SEXP use_time_interestSEXP) {
+Rcpp::List rangerCpp(uint treetype, Rcpp::NumericMatrix& input_x, Rcpp::NumericMatrix& input_y, std::vector<std::string> variable_names, uint mtry, uint num_trees, bool verbose, uint seed, uint num_threads, bool write_forest, uint importance_mode_r, uint min_node_size, uint min_bucket, std::vector<std::vector<double>>& split_select_weights, bool use_split_select_weights, std::vector<std::string>& always_split_variable_names, bool use_always_split_variable_names, bool prediction_mode, Rcpp::List loaded_forest, Rcpp::RawMatrix snp_data, bool sample_with_replacement, bool probability, std::vector<std::string>& unordered_variable_names, bool use_unordered_variable_names, bool save_memory, uint splitrule_r, std::vector<double>& case_weights, bool use_case_weights, std::vector<double>& class_weights, bool predict_all, bool keep_inbag, std::vector<double>& sample_fraction, double alpha, double minprop, bool holdout, uint prediction_type_r, uint num_random_splits, arma::sp_mat& sparse_x, bool use_sparse_data, bool order_snps, bool oob_error, uint max_depth, std::vector<std::vector<size_t>>& inbag, bool use_inbag, std::vector<double>& regularization_factor, bool use_regularization_factor, bool regularization_usedepth, bool node_stats, std::vector<double>& time_interest, bool use_time_interest, Rcpp::NumericMatrix confounders, bool use_confounders);
+RcppExport SEXP _ranger_rangerCpp(SEXP treetypeSEXP, SEXP input_xSEXP, SEXP input_ySEXP, SEXP variable_namesSEXP, SEXP mtrySEXP, SEXP num_treesSEXP, SEXP verboseSEXP, SEXP seedSEXP, SEXP num_threadsSEXP, SEXP write_forestSEXP, SEXP importance_mode_rSEXP, SEXP min_node_sizeSEXP, SEXP min_bucketSEXP, SEXP split_select_weightsSEXP, SEXP use_split_select_weightsSEXP, SEXP always_split_variable_namesSEXP, SEXP use_always_split_variable_namesSEXP, SEXP prediction_modeSEXP, SEXP loaded_forestSEXP, SEXP snp_dataSEXP, SEXP sample_with_replacementSEXP, SEXP probabilitySEXP, SEXP unordered_variable_namesSEXP, SEXP use_unordered_variable_namesSEXP, SEXP save_memorySEXP, SEXP splitrule_rSEXP, SEXP case_weightsSEXP, SEXP use_case_weightsSEXP, SEXP class_weightsSEXP, SEXP predict_allSEXP, SEXP keep_inbagSEXP, SEXP sample_fractionSEXP, SEXP alphaSEXP, SEXP minpropSEXP, SEXP holdoutSEXP, SEXP prediction_type_rSEXP, SEXP num_random_splitsSEXP, SEXP sparse_xSEXP, SEXP use_sparse_dataSEXP, SEXP order_snpsSEXP, SEXP oob_errorSEXP, SEXP max_depthSEXP, SEXP inbagSEXP, SEXP use_inbagSEXP, SEXP regularization_factorSEXP, SEXP use_regularization_factorSEXP, SEXP regularization_usedepthSEXP, SEXP node_statsSEXP, SEXP time_interestSEXP, SEXP use_time_interestSEXP, SEXP confoundersSEXP, SEXP use_confoundersSEXP) {
 BEGIN_RCPP
     Rcpp::RObject rcpp_result_gen;
     Rcpp::RNGScope rcpp_rngScope_gen;
@@ -55,7 +55,7 @@ BEGIN_RCPP
     Rcpp::traits::input_parameter< bool >::type holdout(holdoutSEXP);
     Rcpp::traits::input_parameter< uint >::type prediction_type_r(prediction_type_rSEXP);
     Rcpp::traits::input_parameter< uint >::type num_random_splits(num_random_splitsSEXP);
-    Rcpp::traits::input_parameter< Eigen::SparseMatrix<double>& >::type sparse_x(sparse_xSEXP);
+    Rcpp::traits::input_parameter< arma::sp_mat& >::type sparse_x(sparse_xSEXP);
    Rcpp::traits::input_parameter< bool >::type use_sparse_data(use_sparse_dataSEXP);
    Rcpp::traits::input_parameter< bool >::type order_snps(order_snpsSEXP);
    Rcpp::traits::input_parameter< bool >::type oob_error(oob_errorSEXP);
@@ -68,7 +68,9 @@ BEGIN_RCPP
    Rcpp::traits::input_parameter< bool >::type node_stats(node_statsSEXP);
    Rcpp::traits::input_parameter< std::vector<double>& >::type time_interest(time_interestSEXP);
    Rcpp::traits::input_parameter< bool >::type use_time_interest(use_time_interestSEXP);
-    rcpp_result_gen = Rcpp::wrap(rangerCpp(treetype, input_x, input_y, variable_names, mtry, num_trees, verbose, seed, num_threads, write_forest, importance_mode_r, min_node_size, min_bucket, split_select_weights, use_split_select_weights, always_split_variable_names, use_always_split_variable_names, prediction_mode, loaded_forest, snp_data, sample_with_replacement, probability, unordered_variable_names, use_unordered_variable_names, save_memory, splitrule_r, case_weights, use_case_weights, class_weights, predict_all, keep_inbag, sample_fraction, alpha, minprop, holdout, prediction_type_r, num_random_splits, sparse_x, use_sparse_data, order_snps, oob_error, max_depth, inbag, use_inbag, regularization_factor, use_regularization_factor, regularization_usedepth, node_stats, time_interest, use_time_interest));
+    Rcpp::traits::input_parameter< Rcpp::NumericMatrix >::type confounders(confoundersSEXP);
+    Rcpp::traits::input_parameter< bool >::type use_confounders(use_confoundersSEXP);
+    rcpp_result_gen = Rcpp::wrap(rangerCpp(treetype, input_x, input_y, variable_names, mtry, num_trees, verbose, seed, num_threads, write_forest, importance_mode_r, min_node_size, min_bucket, split_select_weights, use_split_select_weights, always_split_variable_names, use_always_split_variable_names, prediction_mode, loaded_forest, snp_data, sample_with_replacement, probability, unordered_variable_names, use_unordered_variable_names, save_memory, splitrule_r, case_weights, use_case_weights, class_weights, predict_all, keep_inbag, sample_fraction, alpha, minprop, holdout, prediction_type_r, num_random_splits, sparse_x, use_sparse_data, order_snps, oob_error, max_depth, inbag, use_inbag, regularization_factor, use_regularization_factor, regularization_usedepth, node_stats, time_interest, use_time_interest, confounders, use_confounders));
     return rcpp_result_gen;
 END_RCPP
 }
@@ -99,7 +101,7 @@ END_RCPP
 }
 
 static const R_CallMethodDef CallEntries[] = {
-    {"_ranger_rangerCpp", (DL_FUNC) &_ranger_rangerCpp, 50},
+    {"_ranger_rangerCpp", (DL_FUNC) &_ranger_rangerCpp, 52},
     {"_ranger_numSmaller", (DL_FUNC) &_ranger_numSmaller, 2},
     {"_ranger_randomObsNode", (DL_FUNC) &_ranger_randomObsNode, 3},
     {NULL, NULL, 0}
diff --git a/src/Tree.cpp b/src/Tree.cpp
index 57d3dfbd..2be40186 100644
--- a/src/Tree.cpp
+++ b/src/Tree.cpp
@@ -38,7 +38,7 @@ Tree::Tree(std::vector<std::vector<size_t>>& child_nodeIDs, std::vector<size_t>& split_varIDs,
     0) {
 }
 
-void Tree::init(const Data* data, uint mtry, size_t num_samples, uint seed, std::vector<size_t>* deterministic_varIDs,
+void Tree::init(Data* data, uint mtry, size_t num_samples, uint seed, std::vector<size_t>* deterministic_varIDs,
     std::vector<double>* split_select_weights, ImportanceMode importance_mode, uint min_node_size, uint min_bucket,
     bool sample_with_replacement, bool memory_saving_splitting, SplitRule splitrule, std::vector<double>* case_weights,
     std::vector<size_t>* manual_inbag, bool keep_inbag, std::vector<double>* sample_fraction, double alpha,
diff --git a/src/Tree.h b/src/Tree.h
index 101c300d..665ffb92 100644
--- a/src/Tree.h
+++ b/src/Tree.h
@@ -35,7 +35,7 @@ class Tree {
   Tree(const Tree&) = delete;
   Tree& operator=(const Tree&) = delete;
 
-  void init(const Data* data, uint mtry, size_t num_samples, uint seed, std::vector<size_t>* deterministic_varIDs,
+  void init(Data* data, uint mtry, size_t num_samples, uint seed, std::vector<size_t>* deterministic_varIDs,
      std::vector<double>* split_select_weights, ImportanceMode importance_mode, uint min_node_size, uint min_bucket,
      bool sample_with_replacement, bool memory_saving_splitting, SplitRule splitrule,
      std::vector<double>* case_weights, std::vector<size_t>* manual_inbag, bool keep_inbag,
@@ -219,7 +219,7 @@ class Tree {
   std::mt19937_64 random_number_generator;
 
   // Pointer to original data
-  const Data* data;
+  Data* data;
 
   // Regularization
   bool regularization;
diff --git a/src/TreeRegression.cpp b/src/TreeRegression.cpp
index c272695b..937a04bf 100644
--- a/src/TreeRegression.cpp
+++ b/src/TreeRegression.cpp
@@ -42,6 +42,8 @@ void TreeRegression::allocateMemory() {
 }
 
 double TreeRegression::estimate(size_t nodeID) {
+
+  glm_coefs[nodeID] = data->lm_coefs(sampleIDs, start_pos[nodeID], end_pos[nodeID]);
 
   // Mean of responses of samples in node
   double sum_responses_in_node = 0;
@@ -87,8 +89,12 @@ bool TreeRegression::splitNodeInternal(size_t nodeID, std::vector<size_t>& possible_split_varIDs) {
   }
   if (pure) {
     split_values[nodeID] = pure_value;
+    glm_coefs[nodeID] = data->lm_coefs(sampleIDs, start_pos[nodeID], end_pos[nodeID]);
     return true;
   }
+
+  // Fit linear model and save residuals
+  data->lm(sampleIDs, start_pos[nodeID], end_pos[nodeID]);
 
   // Find best split, stop if no decrease of impurity
   bool stop;
@@ -114,6 +120,7 @@ void TreeRegression::createEmptyNodeInternal() {
   if (save_node_stats) {
     node_predictions.push_back(0);
   }
+  glm_coefs.push_back(std::vector<double>());
 }
 
 double TreeRegression::computePredictionAccuracyInternal(std::vector<double>* prediction_error_casewise) {
@@ -122,7 +129,15 @@ double TreeRegression::computePredictionAccuracyInternal(std::vector<double>* prediction_error_casewise) {
   double sum_of_squares = 0;
   for (size_t i = 0; i < num_predictions; ++i) {
     size_t terminal_nodeID = prediction_terminal_nodeIDs[i];
-    double predicted_value = split_values[terminal_nodeID];
+
+    double predicted_value;
+    if (glm_coefs[terminal_nodeID].size() > 0) {
+      // Get predicted value from glm in terminal node
+      predicted_value = data->predict(oob_sampleIDs[i], glm_coefs[terminal_nodeID]);
+    } else {
+      predicted_value = split_values[terminal_nodeID];
+    }
+
     double real_value = data->get_y(oob_sampleIDs[i], 0);
     if (predicted_value != real_value) {
       double diff = (predicted_value - real_value) * (predicted_value - real_value);
@@ -146,7 +161,7 @@ bool TreeRegression::findBestSplit(size_t nodeID, std::vector<size_t>& possible_split_varIDs) {
   double sum_node = 0;
   for (size_t pos = start_pos[nodeID]; pos < end_pos[nodeID]; ++pos) {
     size_t sampleID = sampleIDs[pos];
-    sum_node += data->get_y(sampleID, 0);
+    sum_node += data->get_yy(sampleID, 0);
   }
 
   // Stop early if no split posssible
@@ -236,7 +251,7 @@ void TreeRegression::findBestSplitValueSmallQ(size_t nodeID, size_t varID, double sum_node, size_t num_samples_node,
     size_t idx = std::lower_bound(possible_split_values.begin(), possible_split_values.end(),
         data->get_x(sampleID, varID)) - possible_split_values.begin();
 
-    sums[idx] += data->get_y(sampleID, 0);
+    sums[idx] += data->get_yy(sampleID, 0);
     ++counter[idx];
   }
@@ -298,7 +313,7 @@ void TreeRegression::findBestSplitValueLargeQ(size_t nodeID, size_t varID, double sum_node, size_t num_samples_node,
     size_t sampleID = sampleIDs[pos];
     size_t index = data->getIndex(sampleID, varID);
 
-    sums[index] += data->get_y(sampleID, 0);
+    sums[index] += data->get_yy(sampleID, 0);
     ++counter[index];
   }
@@ -391,7 +406,7 @@ void TreeRegression::findBestSplitValueUnordered(size_t nodeID, size_t varID, double sum_node, size_t num_samples_node,
   // Sum in right child
   for (size_t pos = start_pos[nodeID]; pos < end_pos[nodeID]; ++pos) {
     size_t sampleID = sampleIDs[pos];
-    double response = data->get_y(sampleID, 0);
+    double response = data->get_yy(sampleID, 0);
     double value = data->get_x(sampleID, varID);
     size_t factorID = floor(value) - 1;
@@ -434,7 +449,7 @@ bool TreeRegression::findBestSplitMaxstat(size_t nodeID, std::vector<size_t>& possible_split_varIDs) {
   response.reserve(num_samples_node);
   for (size_t pos = start_pos[nodeID]; pos < end_pos[nodeID]; ++pos) {
     size_t sampleID = sampleIDs[pos];
-    response.push_back(data->get_y(sampleID, 0));
+    response.push_back(data->get_yy(sampleID, 0));
   }
 
   std::vector<double> ranks = rank(response);
@@ -544,7 +559,7 @@ bool TreeRegression::findBestSplitExtraTrees(size_t nodeID, std::vector<size_t>& possible_split_varIDs) {
   double sum_node = 0;
   for (size_t pos = start_pos[nodeID]; pos < end_pos[nodeID]; ++pos) {
     size_t sampleID = sampleIDs[pos];
-    sum_node += data->get_y(sampleID, 0);
+    sum_node += data->get_yy(sampleID, 0);
   }
 
   // Stop early if no split posssible
@@ -635,7 +650,7 @@ void TreeRegression::findBestSplitValueExtraTrees(size_t nodeID, size_t varID, double sum_node, size_t num_samples_node,
   for (size_t pos = start_pos[nodeID]; pos < end_pos[nodeID]; ++pos) {
     size_t sampleID = sampleIDs[pos];
     double value = data->get_x(sampleID, varID);
-    double response = data->get_y(sampleID, 0);
+    double response = data->get_yy(sampleID, 0);
 
     // Count samples until split_value reached
     for (size_t i = 0; i < num_splits; ++i) {
@@ -744,7 +759,7 @@ void TreeRegression::findBestSplitValueExtraTreesUnordered(size_t nodeID, size_t varID, double sum_node,
   // Sum in right child
   for (size_t pos = start_pos[nodeID]; pos < end_pos[nodeID]; ++pos) {
     size_t sampleID = sampleIDs[pos];
-    double response = data->get_y(sampleID, 0);
+    double response = data->get_yy(sampleID, 0);
     double value = data->get_x(sampleID, varID);
     size_t factorID = floor(value) - 1;
@@ -789,7 +804,7 @@ bool TreeRegression::findBestSplitBeta(size_t nodeID, std::vector<size_t>& possible_split_varIDs) {
   double sum_node = 0;
   for (size_t pos = start_pos[nodeID]; pos < end_pos[nodeID]; ++pos) {
     size_t sampleID = sampleIDs[pos];
-    sum_node += data->get_y(sampleID, 0);
+    sum_node += data->get_yy(sampleID, 0);
   }
 
   // Stop early if no split posssible
@@ -863,7 +878,7 @@ void TreeRegression::findBestSplitValueBeta(size_t nodeID, size_t varID, double sum_node, size_t num_samples_node,
   for (size_t pos = start_pos[nodeID]; pos < end_pos[nodeID]; ++pos) {
     size_t sampleID = sampleIDs[pos];
     double value = data->get_x(sampleID, varID);
-    double response = data->get_y(sampleID, 0);
+    double response = data->get_yy(sampleID, 0);
 
     // Count samples until split_value reached
     for (size_t i = 0; i < num_splits; ++i) {
@@ -902,7 +917,7 @@ void TreeRegression::findBestSplitValueBeta(size_t nodeID, size_t varID, double sum_node, size_t num_samples_node,
     for (size_t pos = start_pos[nodeID]; pos < end_pos[nodeID]; ++pos) {
       size_t sampleID = sampleIDs[pos];
       double value = data->get_x(sampleID, varID);
-      double response = data->get_y(sampleID, 0);
+      double response = data->get_yy(sampleID, 0);
 
       if (value > possible_split_values[i]) {
         var_right += (response - mean_right) * (response - mean_right);
@@ -928,7 +943,7 @@ void TreeRegression::findBestSplitValueBeta(size_t nodeID, size_t varID, double sum_node, size_t num_samples_node,
     for (size_t pos = start_pos[nodeID]; pos < end_pos[nodeID]; ++pos) {
       size_t sampleID = sampleIDs[pos];
      double value = data->get_x(sampleID, varID);
-      double response = data->get_y(sampleID, 0);
+      double response = data->get_yy(sampleID, 0);
 
       if (value > possible_split_values[i]) {
         beta_loglik_right += betaLogLik(response, mean_right, phi_right);
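The systematic `get_y` to `get_yy` substitution above means every split criterion is now evaluated on the (possibly residualized) response. For the default variance splitting, the decrease of impurity is `sum_left^2 / n_left + sum_right^2 / n_right`, as accumulated via `sums` and `counter` in the `findBestSplitValue*` functions. A hedged R rendering of that criterion on residuals (toy helper, not package code):

```r
## Variance-reduction split criterion on residualized responses; `yy` plays the
## role of get_yy(): raw y without confounders, lm residuals with them
best_split <- function(x, yy) {
  cutpoints <- sort(unique(x))[-1]  # candidate cut points
  decrease <- vapply(cutpoints, function(s) {
    left <- yy[x < s]
    right <- yy[x >= s]
    sum(left)^2 / length(left) + sum(right)^2 / length(right)
  }, numeric(1))
  cutpoints[which.max(decrease)]
}

set.seed(2)
x <- rnorm(50)
yy <- ifelse(x > 0, 1, -1) + rnorm(50, sd = 0.1)  # residual structure in x
best_split(x, yy)  # cut point near 0
```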
diff --git a/src/TreeRegression.h b/src/TreeRegression.h
index 84c224f6..7a05e378 100644
--- a/src/TreeRegression.h
+++ b/src/TreeRegression.h
@@ -46,6 +46,10 @@ class TreeRegression: public Tree {
   size_t getPredictionTerminalNodeID(size_t sampleID) const {
     return prediction_terminal_nodeIDs[sampleID];
   }
+
+  const std::vector<std::vector<double>>& getGlmCoefs() const {
+    return glm_coefs;
+  }
 
 private:
   bool splitNodeInternal(size_t nodeID, std::vector<size_t>& possible_split_varIDs) override;
@@ -93,6 +97,9 @@ class TreeRegression: public Tree {
     sums.clear();
     sums.shrink_to_fit();
   }
+
+  // GLM coefficients in terminal nodes. Empty for non-terminal nodes (except if save_node_stats).
+  std::vector<std::vector<double>> glm_coefs;
 
   std::vector<size_t> counter;
   std::vector<double> sums;
diff --git a/src/rangerCpp.cpp b/src/rangerCpp.cpp
index c8c4fed2..d2215a4e 100644
--- a/src/rangerCpp.cpp
+++ b/src/rangerCpp.cpp
@@ -25,7 +25,9 @@ http://www.imbs-luebeck.de
 #-------------------------------------------------------------------------------*/
 
-#include <RcppEigen.h>
+#define ARMA_WARN_LEVEL 1
+
+#include <RcppArmadillo.h>
 #include <vector>
 #include <sstream>
 #include <memory>
@@ -46,7 +48,7 @@
 
 using namespace ranger;
 
-// [[Rcpp::depends(RcppEigen)]]
+// [[Rcpp::depends(RcppArmadillo)]]
 // [[Rcpp::export]]
 Rcpp::List rangerCpp(uint treetype, Rcpp::NumericMatrix& input_x, Rcpp::NumericMatrix& input_y,
     std::vector<std::string> variable_names, uint mtry, uint num_trees, bool verbose, uint seed, uint num_threads,
@@ -58,11 +60,12 @@ Rcpp::List rangerCpp(uint treetype, Rcpp::NumericMatrix& input_x, Rcpp::NumericMatrix& input_y,
     bool use_unordered_variable_names, bool save_memory, uint splitrule_r,
     std::vector<double>& case_weights, bool use_case_weights, std::vector<double>& class_weights,
     bool predict_all, bool keep_inbag, std::vector<double>& sample_fraction, double alpha, double minprop, bool holdout, uint prediction_type_r,
-    uint num_random_splits, Eigen::SparseMatrix<double>& sparse_x,
+    uint num_random_splits, arma::sp_mat& sparse_x,
     bool use_sparse_data, bool order_snps, bool oob_error, uint max_depth,
     std::vector<std::vector<size_t>>& inbag, bool use_inbag,
     std::vector<double>& regularization_factor, bool use_regularization_factor, bool regularization_usedepth,
-    bool node_stats, std::vector<double>& time_interest, bool use_time_interest) {
+    bool node_stats, std::vector<double>& time_interest, bool use_time_interest,
+    Rcpp::NumericMatrix confounders, bool use_confounders) {
 
   Rcpp::List result;
 
@@ -89,6 +92,9 @@ Rcpp::List rangerCpp(uint treetype, Rcpp::NumericMatrix& input_x, Rcpp::NumericMatrix& input_y,
     if (!use_regularization_factor) {
       regularization_factor.clear();
     }
+    if (!use_confounders) {
+      confounders = Rcpp::NumericMatrix();
+    }
     if (!use_time_interest) {
       time_interest.clear();
     }
@@ -103,8 +109,8 @@ Rcpp::List rangerCpp(uint treetype, Rcpp::NumericMatrix& input_x, Rcpp::NumericMatrix& input_y,
     size_t num_rows;
     size_t num_cols;
     if (use_sparse_data) {
-      num_rows = sparse_x.rows();
-      num_cols = sparse_x.cols();
+      num_rows = sparse_x.n_rows;
+      num_cols = sparse_x.n_cols;
     } else {
       num_rows = input_x.nrow();
       num_cols = input_x.ncol();
@@ -114,7 +120,7 @@ Rcpp::List rangerCpp(uint treetype, Rcpp::NumericMatrix& input_x, Rcpp::NumericMatrix& input_y,
     if (use_sparse_data) {
       data = std::make_unique<DataSparse>(sparse_x, input_y, variable_names, num_rows, num_cols);
     } else {
-      data = std::make_unique<DataRcpp>(input_x, input_y, variable_names, num_rows, num_cols);
+      data = std::make_unique<DataRcpp>(input_x, input_y, variable_names, num_rows, num_cols, confounders);
     }
 
     // If there is snp data, add it
@@ -279,6 +285,8 @@ Rcpp::List rangerCpp(uint treetype, Rcpp::NumericMatrix& input_x, Rcpp::NumericMatrix& input_y,
       if (node_stats) {
        forest_object.push_back(forest->getNodePredictions(), "node.predictions");
       }
+      auto& temp = dynamic_cast<ForestRegression&>(*forest);
+      forest_object.push_back(temp.getGlmCoefs(), "glm.coefs");
     } else if (treetype == TREE_PROBABILITY) {
       auto& temp = dynamic_cast<ForestProbability&>(*forest);
       forest_object.push_back(temp.getClassValues(), "class.values");
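Continuing the usage sketch from the R/ranger.R section above: the fitted forest now carries `glm.coefs`, a list (one per tree) of lists (one per node) of coefficient vectors, which `predict.ranger.forest` combines with the terminal-node assignments. A manual per-tree prediction mirroring that `sapply` loop (indices hypothetical; reuses `rf`, `dat`, and `conf` from the earlier sketch):

```r
## glm.coefs structure: rf$forest$glm.coefs[[tree]][[node]] is a numeric
## coefficient vector, empty for non-terminal nodes
str(rf$forest$glm.coefs[[1]][1:3])

## Manual prediction for observation j from tree i: look up its terminal node
## (0-based in the C++ forest, hence + 1), then take the inner product with
## the observation's confounder design row
nodes <- predict(rf$forest, data = dat[, c("x1", "x2")],
                 type = "terminalNodes")$predictions
cmat <- model.matrix(~ ., conf)
i <- 1; j <- 1
coef_ij <- rf$forest$glm.coefs[[i]][[nodes[j, i] + 1]]
drop(cmat[j, ] %*% coef_ij)
```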