From 5e92a2a26b779f8c7d238261a9a4e77f861d73dc Mon Sep 17 00:00:00 2001 From: Drew Herren Date: Sat, 3 Aug 2024 00:45:55 -0500 Subject: [PATCH 01/41] Added functions to convert BCF model to JSON string --- NAMESPACE | 3 + R/bcf.R | 290 ++++++++++++++++++++++++++++ R/cpp11.R | 16 +- R/serialization.R | 32 ++- _pkgdown.yml | 2 + man/CppJson.Rd | 35 ++++ man/createBCFModelFromJson.Rd | 66 +++++++ man/createBCFModelFromJsonString.Rd | 80 ++++++++ man/createCppJsonString.Rd | 17 ++ man/saveBCFModelToJsonString.Rd | 77 ++++++++ src/cpp11.cpp | 33 +++- src/serialization.cpp | 14 +- 12 files changed, 649 insertions(+), 16 deletions(-) create mode 100644 man/createBCFModelFromJsonString.Rd create mode 100644 man/createCppJsonString.Rd create mode 100644 man/saveBCFModelToJsonString.Rd diff --git a/NAMESPACE b/NAMESPACE index ab87b7b9..03e83f44 100644 --- a/NAMESPACE +++ b/NAMESPACE @@ -11,8 +11,10 @@ export(computeForestLeafIndices) export(convertBCFModelToJson) export(createBCFModelFromJson) export(createBCFModelFromJsonFile) +export(createBCFModelFromJsonString) export(createCppJson) export(createCppJsonFile) +export(createCppJsonString) export(createForestContainer) export(createForestCovariates) export(createForestCovariatesFromMetadata) @@ -43,6 +45,7 @@ export(preprocessTrainMatrix) export(sample_sigma2_one_iteration) export(sample_tau_one_iteration) export(saveBCFModelToJsonFile) +export(saveBCFModelToJsonString) importFrom(R6,R6Class) importFrom(stats,lm) importFrom(stats,model.matrix) diff --git a/R/bcf.R b/R/bcf.R index 8e2287e2..1d554429 100644 --- a/R/bcf.R +++ b/R/bcf.R @@ -1322,6 +1322,79 @@ saveBCFModelToJsonFile <- function(object, filename){ jsonobj$save_file(filename) } +#' Convert the persistent aspects of a BCF model to (in-memory) JSON string +#' +#' @param object Object of type `bcf` containing draws of a Bayesian causal forest model and associated sampling outputs. 
+#' @return JSON string +#' @export +#' +#' @examples +#' n <- 500 +#' x1 <- rnorm(n) +#' x2 <- rnorm(n) +#' x3 <- rnorm(n) +#' x4 <- as.numeric(rbinom(n,1,0.5)) +#' x5 <- as.numeric(sample(1:3,n,replace=TRUE)) +#' X <- cbind(x1,x2,x3,x4,x5) +#' p <- ncol(X) +#' g <- function(x) {ifelse(x[,5]==1,2,ifelse(x[,5]==2,-1,4))} +#' mu1 <- function(x) {1+g(x)+x[,1]*x[,3]} +#' mu2 <- function(x) {1+g(x)+6*abs(x[,3]-1)} +#' tau1 <- function(x) {rep(3,nrow(x))} +#' tau2 <- function(x) {1+2*x[,2]*x[,4]} +#' mu_x <- mu1(X) +#' tau_x <- tau2(X) +#' pi_x <- 0.8*pnorm((3*mu_x/sd(mu_x)) - 0.5*X[,1]) + 0.05 + runif(n)/10 +#' Z <- rbinom(n,1,pi_x) +#' E_XZ <- mu_x + Z*tau_x +#' snr <- 3 +#' group_ids <- rep(c(1,2), n %/% 2) +#' rfx_coefs <- matrix(c(-1, -1, 1, 1), nrow=2, byrow=TRUE) +#' rfx_basis <- cbind(1, runif(n, -1, 1)) +#' rfx_term <- rowSums(rfx_coefs[group_ids,] * rfx_basis) +#' y <- E_XZ + rfx_term + rnorm(n, 0, 1)*(sd(E_XZ)/snr) +#' X <- as.data.frame(X) +#' X$x4 <- factor(X$x4, ordered = TRUE) +#' X$x5 <- factor(X$x5, ordered = TRUE) +#' test_set_pct <- 0.2 +#' n_test <- round(test_set_pct*n) +#' n_train <- n - n_test +#' test_inds <- sort(sample(1:n, n_test, replace = FALSE)) +#' train_inds <- (1:n)[!((1:n) %in% test_inds)] +#' X_test <- X[test_inds,] +#' X_train <- X[train_inds,] +#' pi_test <- pi_x[test_inds] +#' pi_train <- pi_x[train_inds] +#' Z_test <- Z[test_inds] +#' Z_train <- Z[train_inds] +#' y_test <- y[test_inds] +#' y_train <- y[train_inds] +#' mu_test <- mu_x[test_inds] +#' mu_train <- mu_x[train_inds] +#' tau_test <- tau_x[test_inds] +#' tau_train <- tau_x[train_inds] +#' group_ids_test <- group_ids[test_inds] +#' group_ids_train <- group_ids[train_inds] +#' rfx_basis_test <- rfx_basis[test_inds,] +#' rfx_basis_train <- rfx_basis[train_inds,] +#' rfx_term_test <- rfx_term[test_inds] +#' rfx_term_train <- rfx_term[train_inds] +#' bcf_model <- bcf(X_train = X_train, Z_train = Z_train, y_train = y_train, +#' pi_train = pi_train, group_ids_train = group_ids_train, +#' rfx_basis_train = rfx_basis_train, X_test = X_test, +#' Z_test = Z_test, pi_test = pi_test, group_ids_test = group_ids_test, +#' rfx_basis_test = rfx_basis_test, +#' num_gfr = 100, num_burnin = 0, num_mcmc = 100, +#' sample_sigma_leaf_mu = TRUE, sample_sigma_leaf_tau = FALSE) +#' # saveBCFModelToJsonString(bcf_model) +saveBCFModelToJsonString <- function(object){ + # Convert to Json + jsonobj <- convertBCFModelToJson(object) + + # Dump to string + return(jsonobj$return_json_string()) +} + #' Convert an (in-memory) JSON representation of a BCF model to a BCF model object #' which can be used for prediction, etc... #' @@ -1538,3 +1611,220 @@ createBCFModelFromJsonFile <- function(json_filename){ return(bcf_object) } + +#' Convert a JSON string containing sample information on a trained BCF model +#' to a BCF model object which can be used for prediction, etc... 
+#' +#' @param json_string JSON string dump +#' +#' @return Object of type `bcf` +#' @export +#' +#' @examples +#' n <- 500 +#' x1 <- rnorm(n) +#' x2 <- rnorm(n) +#' x3 <- rnorm(n) +#' x4 <- as.numeric(rbinom(n,1,0.5)) +#' x5 <- as.numeric(sample(1:3,n,replace=TRUE)) +#' X <- cbind(x1,x2,x3,x4,x5) +#' p <- ncol(X) +#' g <- function(x) {ifelse(x[,5]==1,2,ifelse(x[,5]==2,-1,4))} +#' mu1 <- function(x) {1+g(x)+x[,1]*x[,3]} +#' mu2 <- function(x) {1+g(x)+6*abs(x[,3]-1)} +#' tau1 <- function(x) {rep(3,nrow(x))} +#' tau2 <- function(x) {1+2*x[,2]*x[,4]} +#' mu_x <- mu1(X) +#' tau_x <- tau2(X) +#' pi_x <- 0.8*pnorm((3*mu_x/sd(mu_x)) - 0.5*X[,1]) + 0.05 + runif(n)/10 +#' Z <- rbinom(n,1,pi_x) +#' E_XZ <- mu_x + Z*tau_x +#' snr <- 3 +#' group_ids <- rep(c(1,2), n %/% 2) +#' rfx_coefs <- matrix(c(-1, -1, 1, 1), nrow=2, byrow=TRUE) +#' rfx_basis <- cbind(1, runif(n, -1, 1)) +#' rfx_term <- rowSums(rfx_coefs[group_ids,] * rfx_basis) +#' y <- E_XZ + rfx_term + rnorm(n, 0, 1)*(sd(E_XZ)/snr) +#' X <- as.data.frame(X) +#' X$x4 <- factor(X$x4, ordered = TRUE) +#' X$x5 <- factor(X$x5, ordered = TRUE) +#' test_set_pct <- 0.2 +#' n_test <- round(test_set_pct*n) +#' n_train <- n - n_test +#' test_inds <- sort(sample(1:n, n_test, replace = FALSE)) +#' train_inds <- (1:n)[!((1:n) %in% test_inds)] +#' X_test <- X[test_inds,] +#' X_train <- X[train_inds,] +#' pi_test <- pi_x[test_inds] +#' pi_train <- pi_x[train_inds] +#' Z_test <- Z[test_inds] +#' Z_train <- Z[train_inds] +#' y_test <- y[test_inds] +#' y_train <- y[train_inds] +#' mu_test <- mu_x[test_inds] +#' mu_train <- mu_x[train_inds] +#' tau_test <- tau_x[test_inds] +#' tau_train <- tau_x[train_inds] +#' group_ids_test <- group_ids[test_inds] +#' group_ids_train <- group_ids[train_inds] +#' rfx_basis_test <- rfx_basis[test_inds,] +#' rfx_basis_train <- rfx_basis[train_inds,] +#' rfx_term_test <- rfx_term[test_inds] +#' rfx_term_train <- rfx_term[train_inds] +#' bcf_model <- bcf(X_train = X_train, Z_train = Z_train, y_train = y_train, +#' pi_train = pi_train, group_ids_train = group_ids_train, +#' rfx_basis_train = rfx_basis_train, X_test = X_test, +#' Z_test = Z_test, pi_test = pi_test, group_ids_test = group_ids_test, +#' rfx_basis_test = rfx_basis_test, +#' num_gfr = 100, num_burnin = 0, num_mcmc = 100, +#' sample_sigma_leaf_mu = TRUE, sample_sigma_leaf_tau = FALSE) +#' # bcf_json <- saveBCFModelToJsonString(bcf_model) +#' # bcf_model_roundtrip <- createBCFModelFromJsonString(bcf_json) +createBCFModelFromJsonString <- function(json_string){ + # Load a `CppJson` object from string + bcf_json <- createCppJsonString(json_string) + + # Create and return the BCF object + bcf_object <- createBCFModelFromJson(bcf_json) + + return(bcf_object) +} + +#' Convert an (in-memory) JSON representation of a BCF model to a BCF model object +#' which can be used for prediction, etc... 
+#' +#' @param json_object Object of type `CppJson` containing Json representation of a BCF model +#' +#' @return Object of type `bcf` +#' @export +#' +#' @examples +#' n <- 500 +#' x1 <- rnorm(n) +#' x2 <- rnorm(n) +#' x3 <- rnorm(n) +#' x4 <- as.numeric(rbinom(n,1,0.5)) +#' x5 <- as.numeric(sample(1:3,n,replace=TRUE)) +#' X <- cbind(x1,x2,x3,x4,x5) +#' p <- ncol(X) +#' g <- function(x) {ifelse(x[,5]==1,2,ifelse(x[,5]==2,-1,4))} +#' mu1 <- function(x) {1+g(x)+x[,1]*x[,3]} +#' mu2 <- function(x) {1+g(x)+6*abs(x[,3]-1)} +#' tau1 <- function(x) {rep(3,nrow(x))} +#' tau2 <- function(x) {1+2*x[,2]*x[,4]} +#' mu_x <- mu1(X) +#' tau_x <- tau2(X) +#' pi_x <- 0.8*pnorm((3*mu_x/sd(mu_x)) - 0.5*X[,1]) + 0.05 + runif(n)/10 +#' Z <- rbinom(n,1,pi_x) +#' E_XZ <- mu_x + Z*tau_x +#' snr <- 3 +#' group_ids <- rep(c(1,2), n %/% 2) +#' rfx_coefs <- matrix(c(-1, -1, 1, 1), nrow=2, byrow=TRUE) +#' rfx_basis <- cbind(1, runif(n, -1, 1)) +#' rfx_term <- rowSums(rfx_coefs[group_ids,] * rfx_basis) +#' y <- E_XZ + rfx_term + rnorm(n, 0, 1)*(sd(E_XZ)/snr) +#' X <- as.data.frame(X) +#' X$x4 <- factor(X$x4, ordered = TRUE) +#' X$x5 <- factor(X$x5, ordered = TRUE) +#' test_set_pct <- 0.2 +#' n_test <- round(test_set_pct*n) +#' n_train <- n - n_test +#' test_inds <- sort(sample(1:n, n_test, replace = FALSE)) +#' train_inds <- (1:n)[!((1:n) %in% test_inds)] +#' X_test <- X[test_inds,] +#' X_train <- X[train_inds,] +#' pi_test <- pi_x[test_inds] +#' pi_train <- pi_x[train_inds] +#' Z_test <- Z[test_inds] +#' Z_train <- Z[train_inds] +#' y_test <- y[test_inds] +#' y_train <- y[train_inds] +#' mu_test <- mu_x[test_inds] +#' mu_train <- mu_x[train_inds] +#' tau_test <- tau_x[test_inds] +#' tau_train <- tau_x[train_inds] +#' group_ids_test <- group_ids[test_inds] +#' group_ids_train <- group_ids[train_inds] +#' rfx_basis_test <- rfx_basis[test_inds,] +#' rfx_basis_train <- rfx_basis[train_inds,] +#' rfx_term_test <- rfx_term[test_inds] +#' rfx_term_train <- rfx_term[train_inds] +#' bcf_model <- bcf(X_train = X_train, Z_train = Z_train, y_train = y_train, +#' pi_train = pi_train, group_ids_train = group_ids_train, +#' rfx_basis_train = rfx_basis_train, X_test = X_test, +#' Z_test = Z_test, pi_test = pi_test, group_ids_test = group_ids_test, +#' rfx_basis_test = rfx_basis_test, +#' num_gfr = 100, num_burnin = 0, num_mcmc = 100, +#' sample_sigma_leaf_mu = TRUE, sample_sigma_leaf_tau = FALSE) +#' # bcf_json <- convertBCFModelToJson(bcf_model) +#' # bcf_model_roundtrip <- createBCFModelFromJson(bcf_json) +createBCFModelFromJson <- function(json_object){ + # Initialize the BCF model + output <- list() + + # Unpack the forests + output[["forests_mu"]] <- loadForestContainerJson(json_object, "forest_0") + output[["forests_tau"]] <- loadForestContainerJson(json_object, "forest_1") + + # Unpack metadata + train_set_metadata = list() + train_set_metadata[["num_numeric_vars"]] <- json_object$get_scalar("num_numeric_vars") + train_set_metadata[["num_ordered_cat_vars"]] <- json_object$get_scalar("num_ordered_cat_vars") + train_set_metadata[["num_unordered_cat_vars"]] <- json_object$get_scalar("num_unordered_cat_vars") + if (train_set_metadata[["num_numeric_vars"]] > 0) { + train_set_metadata[["numeric_vars"]] <- json_object$get_string_vector("numeric_vars") + } + if (train_set_metadata[["num_ordered_cat_vars"]] > 0) { + train_set_metadata[["ordered_cat_vars"]] <- json_object$get_string_vector("ordered_cat_vars") + train_set_metadata[["ordered_unique_levels"]] <- json_object$get_string_list("ordered_unique_levels", 
train_set_metadata[["ordered_cat_vars"]]) + } + if (train_set_metadata[["num_unordered_cat_vars"]] > 0) { + train_set_metadata[["unordered_cat_vars"]] <- json_object$get_string_vector("unordered_cat_vars") + train_set_metadata[["unordered_unique_levels"]] <- json_object$get_string_list("unordered_unique_levels", train_set_metadata[["unordered_cat_vars"]]) + } + output[["train_set_metadata"]] <- train_set_metadata + output[["keep_indices"]] <- json_object$get_vector("keep_indices") + + # Unpack model params + model_params = list() + model_params[["outcome_scale"]] <- json_object$get_scalar("outcome_scale") + model_params[["outcome_mean"]] <- json_object$get_scalar("outcome_mean") + model_params[["sample_sigma_global"]] <- json_object$get_boolean("sample_sigma_global") + model_params[["sample_sigma_leaf_mu"]] <- json_object$get_boolean("sample_sigma_leaf_mu") + model_params[["sample_sigma_leaf_tau"]] <- json_object$get_boolean("sample_sigma_leaf_tau") + model_params[["propensity_covariate"]] <- json_object$get_string("propensity_covariate") + model_params[["has_rfx"]] <- json_object$get_boolean("has_rfx") + model_params[["has_rfx_basis"]] <- json_object$get_boolean("has_rfx_basis") + model_params[["num_rfx_basis"]] <- json_object$get_scalar("num_rfx_basis") + model_params[["adaptive_coding"]] <- json_object$get_boolean("adaptive_coding") + model_params[["num_gfr"]] <- json_object$get_scalar("num_gfr") + model_params[["num_burnin"]] <- json_object$get_scalar("num_burnin") + model_params[["num_mcmc"]] <- json_object$get_scalar("num_mcmc") + model_params[["num_samples"]] <- json_object$get_scalar("num_samples") + model_params[["num_covariates"]] <- json_object$get_scalar("num_covariates") + output[["model_params"]] <- model_params + + # Unpack sampled parameters + if (model_params[["sample_sigma_global"]]) { + output[["sigma2_samples"]] <- json_object$get_vector("sigma2_samples", "parameters") + } + if (model_params[["sample_sigma_leaf_mu"]]) { + output[["sigma_leaf_mu_samples"]] <- json_object$get_vector("sigma_leaf_mu_samples", "parameters") + } + if (model_params[["sample_sigma_leaf_tau"]]) { + output[["sigma_leaf_tau_samples"]] <- json_object$get_vector("sigma_leaf_tau_samples", "parameters") + } + if (model_params[["adaptive_coding"]]) { + output[["b_1_samples"]] <- json_object$get_vector("b_1_samples", "parameters") + output[["b_0_samples"]] <- json_object$get_vector("b_0_samples", "parameters") + } + + # Unpack random effects + if (model_params[["has_rfx"]]) { + output[["rfx_unique_group_ids"]] <- json_object$get_string_vector("rfx_unique_group_ids") + output[["rfx_samples"]] <- loadRandomEffectSamplesJson(json_object, 0) + } + + class(output) <- "bcf" + return(output) +} diff --git a/R/cpp11.R b/R/cpp11.R index 16d8b449..b9e710b7 100644 --- a/R/cpp11.R +++ b/R/cpp11.R @@ -464,10 +464,18 @@ json_add_rfx_groupids_cpp <- function(json_ptr, groupids) { .Call(`_stochtree_json_add_rfx_groupids_cpp`, json_ptr, groupids) } -json_save_cpp <- function(json_ptr, filename) { - invisible(.Call(`_stochtree_json_save_cpp`, json_ptr, filename)) +get_json_string_cpp <- function(json_ptr) { + .Call(`_stochtree_get_json_string_cpp`, json_ptr) } -json_load_cpp <- function(json_ptr, filename) { - invisible(.Call(`_stochtree_json_load_cpp`, json_ptr, filename)) +json_save_file_cpp <- function(json_ptr, filename) { + invisible(.Call(`_stochtree_json_save_file_cpp`, json_ptr, filename)) +} + +json_load_file_cpp <- function(json_ptr, filename) { + invisible(.Call(`_stochtree_json_load_file_cpp`, json_ptr, 
filename))
+}
+
+json_load_string_cpp <- function(json_ptr, json_string) {
+  invisible(.Call(`_stochtree_json_load_string_cpp`, json_ptr, json_string))
+}
diff --git a/R/serialization.R b/R/serialization.R
index eda655f5..525f5abf 100644
--- a/R/serialization.R
+++ b/R/serialization.R
@@ -276,12 +276,19 @@
     return(output)
   },
 
+  #' @description
+  #' Convert a JSON object to in-memory string
+  #' @return JSON string
+  return_json_string = function() {
+    return(get_json_string_cpp(self$json_ptr))
+  },
+
   #' @description
   #' Save a json object to file
   #' @param filename String of filepath, must end in ".json"
   #' @return NULL
   save_file = function(filename) {
-    json_save_cpp(self$json_ptr, filename)
+    json_save_file_cpp(self$json_ptr, filename)
   },
 
   #' @description
@@ -289,7 +296,15 @@
   #' @param filename String of filepath, must end in ".json"
   #' @return NULL
   load_from_file = function(filename) {
-    json_load_cpp(self$json_ptr, filename)
+    json_load_file_cpp(self$json_ptr, filename)
+  },
+
+  #' @description
+  #' Load a json object from string
+  #' @param json_string JSON string dump
+  #' @return NULL
+  load_from_string = function(json_string) {
+    json_load_string_cpp(self$json_ptr, json_string)
   }
 )
)
@@ -379,3 +394,16 @@ createCppJsonFile <- function(json_filename) {
   output$load_from_file(json_filename)
   return(output)
 }
+
+#' Create a C++ Json object from a Json string
+#'
+#' @param json_string JSON string dump
+#' @return `CppJson` object
+#' @export
+createCppJsonString <- function(json_string) {
+  invisible((
+    output <- CppJson$new()
+  ))
+  output$load_from_string(json_string)
+  return(output)
+}
diff --git a/_pkgdown.yml b/_pkgdown.yml
index bffe900a..8292609e 100644
--- a/_pkgdown.yml
+++ b/_pkgdown.yml
@@ -18,6 +18,7 @@ reference:
   - predict.bcf
   - saveBCFModelToJsonFile
   - createBCFModelFromJsonFile
+  - createBCFModelFromJsonString
   - convertBCFModelToJson
   - createBCFModelFromJson
 
@@ -34,6 +35,7 @@
   - loadVectorJson
   - loadScalarJson
   - createCppJsonFile
+  - createCppJsonString
 
 - subtitle: Data
   desc: >
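Taken together, the R/serialization.R additions above give `CppJson` a full in-memory round trip alongside the existing file-based one. A minimal sketch of how the new pieces compose, assuming nothing beyond the methods shown in this patch (the field name "example_scalar" and its value are arbitrary placeholders, not fields the package itself writes):

    json_a <- createCppJson()
    json_a$add_scalar("example_scalar", 1.5)   # any persisted field works here
    json_str <- json_a$return_json_string()    # serialize to an R character string
    json_b <- createCppJsonString(json_str)    # rebuild a CppJson from that string
    json_b$get_scalar("example_scalar")        # recovers 1.5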
diff --git a/man/CppJson.Rd b/man/CppJson.Rd
index fa484513..a7f7e448 100644
--- a/man/CppJson.Rd
+++ b/man/CppJson.Rd
@@ -45,8 +45,10 @@ Wrapper around a C++ container of tree ensembles
 \item \href{#method-CppJson-get_string_vector}{\code{CppJson$get_string_vector()}}
 \item \href{#method-CppJson-get_numeric_list}{\code{CppJson$get_numeric_list()}}
 \item \href{#method-CppJson-get_string_list}{\code{CppJson$get_string_list()}}
+\item \href{#method-CppJson-return_json_string}{\code{CppJson$return_json_string()}}
 \item \href{#method-CppJson-save_file}{\code{CppJson$save_file()}}
 \item \href{#method-CppJson-load_from_file}{\code{CppJson$load_from_file()}}
+\item \href{#method-CppJson-load_from_string}{\code{CppJson$load_from_string()}}
 }
 }
 \if{html}{\out{<hr>}}
@@ -421,6 +423,19 @@
 NULL
 }
 }
 \if{html}{\out{<hr>}}
+\if{html}{\out{<a id="method-CppJson-return_json_string"></a>}}
+\if{latex}{\out{\hypertarget{method-CppJson-return_json_string}{}}}
+\subsection{Method \code{return_json_string()}}{
+Convert a JSON object to in-memory string
+\subsection{Usage}{
+\if{html}{\out{<div class="r">}}\preformatted{CppJson$return_json_string()}\if{html}{\out{</div>}}
+}
+
+\subsection{Returns}{
+JSON string
+}
+}
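As a quick aside for readers of the generated docs: `return_json_string()` pairs with the `load_from_string()` method documented further down, so an existing object can be overwritten in place rather than constructed fresh. A sketch under those assumptions (`json_a` is any populated `CppJson`):

    json_b <- createCppJson()
    json_b$load_from_string(json_a$return_json_string())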
+\if{html}{\out{<hr>}}
 \if{html}{\out{<a id="method-CppJson-save_file"></a>}}
 \if{latex}{\out{\hypertarget{method-CppJson-save_file}{}}}
 \subsection{Method \code{save_file()}}{
@@ -460,4 +475,24 @@
 Load a json object from file
 NULL
 }
 }
+\if{html}{\out{<hr>}}
+\if{html}{\out{<a id="method-CppJson-load_from_string"></a>}}
+\if{latex}{\out{\hypertarget{method-CppJson-load_from_string}{}}}
+\subsection{Method \code{load_from_string()}}{
+Load a json object from string
+\subsection{Usage}{
+\if{html}{\out{<div class="r">}}\preformatted{CppJson$load_from_string(json_string)}\if{html}{\out{</div>}}
+}
+
+\subsection{Arguments}{
+\if{html}{\out{<div class="arguments">}}
+\describe{
+\item{\code{json_string}}{JSON string dump}
+}
+\if{html}{\out{</div>}}
+}
+\subsection{Returns}{
+NULL
+}
+}
+}
diff --git a/man/createBCFModelFromJson.Rd b/man/createBCFModelFromJson.Rd
index 76c3ebcb..28b21ef0 100644
--- a/man/createBCFModelFromJson.Rd
+++ b/man/createBCFModelFromJson.Rd
@@ -5,15 +5,22 @@
 \title{Convert an (in-memory) JSON representation of a BCF model to a BCF model object
which can be used for prediction, etc...}
 \usage{
+createBCFModelFromJson(json_object)
+
 createBCFModelFromJson(json_object)
 }
 \arguments{
 \item{json_object}{Object of type \code{CppJson} containing Json representation of a BCF model}
 }
 \value{
+Object of type \code{bcf}
+
 Object of type \code{bcf}
 }
 \description{
+Convert an (in-memory) JSON representation of a BCF model to a BCF model object
+which can be used for prediction, etc...
+
 Convert an (in-memory) JSON representation of a BCF model to a BCF model object
which can be used for prediction, etc...
 }
@@ -77,4 +84,63 @@ bcf_model <- bcf(X_train = X_train, Z_train = Z_train, y_train = y_train,
                  sample_sigma_leaf_mu = TRUE, sample_sigma_leaf_tau = FALSE)
 # bcf_json <- convertBCFModelToJson(bcf_model)
 # bcf_model_roundtrip <- createBCFModelFromJson(bcf_json)
+n <- 500
+x1 <- rnorm(n)
+x2 <- rnorm(n)
+x3 <- rnorm(n)
+x4 <- as.numeric(rbinom(n,1,0.5))
+x5 <- as.numeric(sample(1:3,n,replace=TRUE))
+X <- cbind(x1,x2,x3,x4,x5)
+p <- ncol(X)
+g <- function(x) {ifelse(x[,5]==1,2,ifelse(x[,5]==2,-1,4))}
+mu1 <- function(x) {1+g(x)+x[,1]*x[,3]}
+mu2 <- function(x) {1+g(x)+6*abs(x[,3]-1)}
+tau1 <- function(x) {rep(3,nrow(x))}
+tau2 <- function(x) {1+2*x[,2]*x[,4]}
+mu_x <- mu1(X)
+tau_x <- tau2(X)
+pi_x <- 0.8*pnorm((3*mu_x/sd(mu_x)) - 0.5*X[,1]) + 0.05 + runif(n)/10
+Z <- rbinom(n,1,pi_x)
+E_XZ <- mu_x + Z*tau_x
+snr <- 3
+group_ids <- rep(c(1,2), n \%/\% 2)
+rfx_coefs <- matrix(c(-1, -1, 1, 1), nrow=2, byrow=TRUE)
+rfx_basis <- cbind(1, runif(n, -1, 1))
+rfx_term <- rowSums(rfx_coefs[group_ids,] * rfx_basis)
+y <- E_XZ + rfx_term + rnorm(n, 0, 1)*(sd(E_XZ)/snr)
+X <- as.data.frame(X)
+X$x4 <- factor(X$x4, ordered = TRUE)
+X$x5 <- factor(X$x5, ordered = TRUE)
+test_set_pct <- 0.2
+n_test <- round(test_set_pct*n)
+n_train <- n - n_test
+test_inds <- sort(sample(1:n, n_test, replace = FALSE))
+train_inds <- (1:n)[!((1:n) \%in\% test_inds)]
+X_test <- X[test_inds,]
+X_train <- X[train_inds,]
+pi_test <- pi_x[test_inds]
+pi_train <- pi_x[train_inds]
+Z_test <- Z[test_inds]
+Z_train <- Z[train_inds]
+y_test <- y[test_inds]
+y_train <- y[train_inds]
+mu_test <- mu_x[test_inds]
+mu_train <- mu_x[train_inds]
+tau_test <- tau_x[test_inds]
+tau_train <- tau_x[train_inds]
+group_ids_test <- group_ids[test_inds]
+group_ids_train <- group_ids[train_inds]
+rfx_basis_test <- rfx_basis[test_inds,]
+rfx_basis_train <- rfx_basis[train_inds,]
+rfx_term_test <- rfx_term[test_inds]
+rfx_term_train <- rfx_term[train_inds]
+bcf_model <- bcf(X_train = X_train, Z_train = Z_train, y_train = y_train,
+                 pi_train = pi_train, group_ids_train = group_ids_train,
+                 rfx_basis_train = rfx_basis_train, X_test = X_test,
+                 Z_test = Z_test, pi_test = pi_test, group_ids_test = group_ids_test,
+                 rfx_basis_test = rfx_basis_test,
+                 num_gfr = 100, num_burnin = 0, num_mcmc = 100,
+                 sample_sigma_leaf_mu = TRUE, sample_sigma_leaf_tau = FALSE)
+# bcf_json <- convertBCFModelToJson(bcf_model)
+# bcf_model_roundtrip <- createBCFModelFromJson(bcf_json)
 }
diff --git a/man/createBCFModelFromJsonString.Rd b/man/createBCFModelFromJsonString.Rd
new file mode 100644
index 00000000..b25557ab
--- /dev/null
+++ b/man/createBCFModelFromJsonString.Rd
@@ -0,0 +1,80 @@
+% Generated by 
roxygen2: do not edit by hand +% Please edit documentation in R/bcf.R +\name{createBCFModelFromJsonString} +\alias{createBCFModelFromJsonString} +\title{Convert a JSON string containing sample information on a trained BCF model +to a BCF model object which can be used for prediction, etc...} +\usage{ +createBCFModelFromJsonString(json_string) +} +\arguments{ +\item{json_string}{JSON string dump} +} +\value{ +Object of type \code{bcf} +} +\description{ +Convert a JSON string containing sample information on a trained BCF model +to a BCF model object which can be used for prediction, etc... +} +\examples{ +n <- 500 +x1 <- rnorm(n) +x2 <- rnorm(n) +x3 <- rnorm(n) +x4 <- as.numeric(rbinom(n,1,0.5)) +x5 <- as.numeric(sample(1:3,n,replace=TRUE)) +X <- cbind(x1,x2,x3,x4,x5) +p <- ncol(X) +g <- function(x) {ifelse(x[,5]==1,2,ifelse(x[,5]==2,-1,4))} +mu1 <- function(x) {1+g(x)+x[,1]*x[,3]} +mu2 <- function(x) {1+g(x)+6*abs(x[,3]-1)} +tau1 <- function(x) {rep(3,nrow(x))} +tau2 <- function(x) {1+2*x[,2]*x[,4]} +mu_x <- mu1(X) +tau_x <- tau2(X) +pi_x <- 0.8*pnorm((3*mu_x/sd(mu_x)) - 0.5*X[,1]) + 0.05 + runif(n)/10 +Z <- rbinom(n,1,pi_x) +E_XZ <- mu_x + Z*tau_x +snr <- 3 +group_ids <- rep(c(1,2), n \%/\% 2) +rfx_coefs <- matrix(c(-1, -1, 1, 1), nrow=2, byrow=TRUE) +rfx_basis <- cbind(1, runif(n, -1, 1)) +rfx_term <- rowSums(rfx_coefs[group_ids,] * rfx_basis) +y <- E_XZ + rfx_term + rnorm(n, 0, 1)*(sd(E_XZ)/snr) +X <- as.data.frame(X) +X$x4 <- factor(X$x4, ordered = TRUE) +X$x5 <- factor(X$x5, ordered = TRUE) +test_set_pct <- 0.2 +n_test <- round(test_set_pct*n) +n_train <- n - n_test +test_inds <- sort(sample(1:n, n_test, replace = FALSE)) +train_inds <- (1:n)[!((1:n) \%in\% test_inds)] +X_test <- X[test_inds,] +X_train <- X[train_inds,] +pi_test <- pi_x[test_inds] +pi_train <- pi_x[train_inds] +Z_test <- Z[test_inds] +Z_train <- Z[train_inds] +y_test <- y[test_inds] +y_train <- y[train_inds] +mu_test <- mu_x[test_inds] +mu_train <- mu_x[train_inds] +tau_test <- tau_x[test_inds] +tau_train <- tau_x[train_inds] +group_ids_test <- group_ids[test_inds] +group_ids_train <- group_ids[train_inds] +rfx_basis_test <- rfx_basis[test_inds,] +rfx_basis_train <- rfx_basis[train_inds,] +rfx_term_test <- rfx_term[test_inds] +rfx_term_train <- rfx_term[train_inds] +bcf_model <- bcf(X_train = X_train, Z_train = Z_train, y_train = y_train, + pi_train = pi_train, group_ids_train = group_ids_train, + rfx_basis_train = rfx_basis_train, X_test = X_test, + Z_test = Z_test, pi_test = pi_test, group_ids_test = group_ids_test, + rfx_basis_test = rfx_basis_test, + num_gfr = 100, num_burnin = 0, num_mcmc = 100, + sample_sigma_leaf_mu = TRUE, sample_sigma_leaf_tau = FALSE) +# bcf_json <- saveBCFModelToJsonString(bcf_model) +# bcf_model_roundtrip <- createBCFModelFromJsonString(bcf_json) +} diff --git a/man/createCppJsonString.Rd b/man/createCppJsonString.Rd new file mode 100644 index 00000000..a8215cc6 --- /dev/null +++ b/man/createCppJsonString.Rd @@ -0,0 +1,17 @@ +% Generated by roxygen2: do not edit by hand +% Please edit documentation in R/serialization.R +\name{createCppJsonString} +\alias{createCppJsonString} +\title{Create a C++ Json object from a Json string} +\usage{ +createCppJsonString(json_string) +} +\arguments{ +\item{json_string}{JSON string dump} +} +\value{ +\code{CppJson} object +} +\description{ +Create a C++ Json object from a Json string +} diff --git a/man/saveBCFModelToJsonString.Rd b/man/saveBCFModelToJsonString.Rd new file mode 100644 index 00000000..7dd31418 --- /dev/null +++ 
b/man/saveBCFModelToJsonString.Rd
@@ -0,0 +1,77 @@
+% Generated by roxygen2: do not edit by hand
+% Please edit documentation in R/bcf.R
+\name{saveBCFModelToJsonString}
+\alias{saveBCFModelToJsonString}
+\title{Convert the persistent aspects of a BCF model to (in-memory) JSON string}
+\usage{
+saveBCFModelToJsonString(object)
+}
+\arguments{
+\item{object}{Object of type \code{bcf} containing draws of a Bayesian causal forest model and associated sampling outputs.}
+}
+\value{
+JSON string
+}
+\description{
+Convert the persistent aspects of a BCF model to (in-memory) JSON string
+}
+\examples{
+n <- 500
+x1 <- rnorm(n)
+x2 <- rnorm(n)
+x3 <- rnorm(n)
+x4 <- as.numeric(rbinom(n,1,0.5))
+x5 <- as.numeric(sample(1:3,n,replace=TRUE))
+X <- cbind(x1,x2,x3,x4,x5)
+p <- ncol(X)
+g <- function(x) {ifelse(x[,5]==1,2,ifelse(x[,5]==2,-1,4))}
+mu1 <- function(x) {1+g(x)+x[,1]*x[,3]}
+mu2 <- function(x) {1+g(x)+6*abs(x[,3]-1)}
+tau1 <- function(x) {rep(3,nrow(x))}
+tau2 <- function(x) {1+2*x[,2]*x[,4]}
+mu_x <- mu1(X)
+tau_x <- tau2(X)
+pi_x <- 0.8*pnorm((3*mu_x/sd(mu_x)) - 0.5*X[,1]) + 0.05 + runif(n)/10
+Z <- rbinom(n,1,pi_x)
+E_XZ <- mu_x + Z*tau_x
+snr <- 3
+group_ids <- rep(c(1,2), n \%/\% 2)
+rfx_coefs <- matrix(c(-1, -1, 1, 1), nrow=2, byrow=TRUE)
+rfx_basis <- cbind(1, runif(n, -1, 1))
+rfx_term <- rowSums(rfx_coefs[group_ids,] * rfx_basis)
+y <- E_XZ + rfx_term + rnorm(n, 0, 1)*(sd(E_XZ)/snr)
+X <- as.data.frame(X)
+X$x4 <- factor(X$x4, ordered = TRUE)
+X$x5 <- factor(X$x5, ordered = TRUE)
+test_set_pct <- 0.2
+n_test <- round(test_set_pct*n)
+n_train <- n - n_test
+test_inds <- sort(sample(1:n, n_test, replace = FALSE))
+train_inds <- (1:n)[!((1:n) \%in\% test_inds)]
+X_test <- X[test_inds,]
+X_train <- X[train_inds,]
+pi_test <- pi_x[test_inds]
+pi_train <- pi_x[train_inds]
+Z_test <- Z[test_inds]
+Z_train <- Z[train_inds]
+y_test <- y[test_inds]
+y_train <- y[train_inds]
+mu_test <- mu_x[test_inds]
+mu_train <- mu_x[train_inds]
+tau_test <- tau_x[test_inds]
+tau_train <- tau_x[train_inds]
+group_ids_test <- group_ids[test_inds]
+group_ids_train <- group_ids[train_inds]
+rfx_basis_test <- rfx_basis[test_inds,]
+rfx_basis_train <- rfx_basis[train_inds,]
+rfx_term_test <- rfx_term[test_inds]
+rfx_term_train <- rfx_term[train_inds]
+bcf_model <- bcf(X_train = X_train, Z_train = Z_train, y_train = y_train,
+                 pi_train = pi_train, group_ids_train = group_ids_train,
+                 rfx_basis_train = rfx_basis_train, X_test = X_test,
+                 Z_test = Z_test, pi_test = pi_test, group_ids_test = group_ids_test,
+                 rfx_basis_test = rfx_basis_test,
+                 num_gfr = 100, num_burnin = 0, num_mcmc = 100,
+                 sample_sigma_leaf_mu = TRUE, sample_sigma_leaf_tau = FALSE)
+# saveBCFModelToJsonString(bcf_model)
+}
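The commented-out example line above stops at producing the string; the intended full cycle, assuming a fitted bcf_model as constructed in the example (object names here are illustrative, not part of the package):

    bcf_json_string <- saveBCFModelToJsonString(bcf_model)
    bcf_model_restored <- createBCFModelFromJsonString(bcf_json_string)
    # the restored object carries the same sampling metadata
    bcf_model_restored$model_params$num_samples == bcf_model$model_params$num_samples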
diff --git a/src/cpp11.cpp b/src/cpp11.cpp
index 53423c30..6a5b883f 100644
--- a/src/cpp11.cpp
+++ b/src/cpp11.cpp
@@ -858,18 +858,33 @@ extern "C" SEXP _stochtree_json_add_rfx_groupids_cpp(SEXP json_ptr, SEXP groupid
   END_CPP11
 }
 // serialization.cpp
-void json_save_cpp(cpp11::external_pointer<nlohmann::json> json_ptr, std::string filename);
-extern "C" SEXP _stochtree_json_save_cpp(SEXP json_ptr, SEXP filename) {
+std::string get_json_string_cpp(cpp11::external_pointer<nlohmann::json> json_ptr);
+extern "C" SEXP _stochtree_get_json_string_cpp(SEXP json_ptr) {
   BEGIN_CPP11
-    json_save_cpp(cpp11::as_cpp<cpp11::external_pointer<nlohmann::json>>(json_ptr), cpp11::as_cpp<std::string>(filename));
+    return cpp11::as_sexp(get_json_string_cpp(cpp11::as_cpp<cpp11::external_pointer<nlohmann::json>>(json_ptr)));
+  END_CPP11
+}
+// serialization.cpp
+void json_save_file_cpp(cpp11::external_pointer<nlohmann::json> json_ptr, std::string filename);
+extern "C" SEXP _stochtree_json_save_file_cpp(SEXP json_ptr, SEXP filename) {
+  BEGIN_CPP11
+    json_save_file_cpp(cpp11::as_cpp<cpp11::external_pointer<nlohmann::json>>(json_ptr), cpp11::as_cpp<std::string>(filename));
+    return R_NilValue;
+  END_CPP11
+}
+// serialization.cpp
+void json_load_file_cpp(cpp11::external_pointer<nlohmann::json> json_ptr, std::string filename);
+extern "C" SEXP _stochtree_json_load_file_cpp(SEXP json_ptr, SEXP filename) {
+  BEGIN_CPP11
+    json_load_file_cpp(cpp11::as_cpp<cpp11::external_pointer<nlohmann::json>>(json_ptr), cpp11::as_cpp<std::string>(filename));
     return R_NilValue;
   END_CPP11
 }
 // serialization.cpp
-void json_load_cpp(cpp11::external_pointer<nlohmann::json> json_ptr, std::string filename);
-extern "C" SEXP _stochtree_json_load_cpp(SEXP json_ptr, SEXP filename) {
+void json_load_string_cpp(cpp11::external_pointer<nlohmann::json> json_ptr, std::string json_string);
+extern "C" SEXP _stochtree_json_load_string_cpp(SEXP json_ptr, SEXP json_string) {
   BEGIN_CPP11
-    json_load_cpp(cpp11::as_cpp<cpp11::external_pointer<nlohmann::json>>(json_ptr), cpp11::as_cpp<std::string>(filename));
+    json_load_string_cpp(cpp11::as_cpp<cpp11::external_pointer<nlohmann::json>>(json_ptr), cpp11::as_cpp<std::string>(json_string));
     return R_NilValue;
   END_CPP11
 }
@@ -910,6 +925,7 @@ static const R_CallMethodDef CallEntries[] = {
     {"_stochtree_forest_tracker_cpp", (DL_FUNC) &_stochtree_forest_tracker_cpp, 4},
     {"_stochtree_get_forest_split_counts_forest_container_cpp", (DL_FUNC) &_stochtree_get_forest_split_counts_forest_container_cpp, 3},
     {"_stochtree_get_granular_split_count_array_forest_container_cpp", (DL_FUNC) &_stochtree_get_granular_split_count_array_forest_container_cpp, 2},
+    {"_stochtree_get_json_string_cpp", (DL_FUNC) &_stochtree_get_json_string_cpp, 1},
     {"_stochtree_get_overall_split_counts_forest_container_cpp", (DL_FUNC) &_stochtree_get_overall_split_counts_forest_container_cpp, 2},
     {"_stochtree_get_residual_cpp", (DL_FUNC) &_stochtree_get_residual_cpp, 1},
     {"_stochtree_get_tree_leaves_forest_container_cpp", (DL_FUNC) &_stochtree_get_tree_leaves_forest_container_cpp, 3},
@@ -943,9 +959,10 @@
     {"_stochtree_json_extract_vector_cpp", (DL_FUNC) &_stochtree_json_extract_vector_cpp, 2},
     {"_stochtree_json_extract_vector_subfolder_cpp", (DL_FUNC) &_stochtree_json_extract_vector_subfolder_cpp, 3},
     {"_stochtree_json_increment_rfx_count_cpp", (DL_FUNC) &_stochtree_json_increment_rfx_count_cpp, 1},
-    {"_stochtree_json_load_cpp", (DL_FUNC) &_stochtree_json_load_cpp, 2},
+    {"_stochtree_json_load_file_cpp", (DL_FUNC) &_stochtree_json_load_file_cpp, 2},
     {"_stochtree_json_load_forest_container_cpp", (DL_FUNC) &_stochtree_json_load_forest_container_cpp, 2},
-    {"_stochtree_json_save_cpp", (DL_FUNC) &_stochtree_json_save_cpp, 2},
+    {"_stochtree_json_load_string_cpp", (DL_FUNC) &_stochtree_json_load_string_cpp, 2},
+    {"_stochtree_json_save_file_cpp", (DL_FUNC) &_stochtree_json_save_file_cpp, 2},
     {"_stochtree_json_save_forest_container_cpp", (DL_FUNC) &_stochtree_json_save_forest_container_cpp, 2},
     {"_stochtree_num_samples_forest_container_cpp", (DL_FUNC) &_stochtree_num_samples_forest_container_cpp, 1},
     {"_stochtree_num_trees_forest_container_cpp", (DL_FUNC) &_stochtree_num_trees_forest_container_cpp, 1},
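The registrations above are generated glue; the R6 method `return_json_string()` shown earlier reduces to a single call through this table. A sketch using the internal (non-exported) wrapper purely for illustration, not as supported API:

    json <- createCppJson()
    # equivalent to json$return_json_string(), via the registered C++ entry point
    stochtree:::get_json_string_cpp(json$json_ptr)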
diff --git a/src/serialization.cpp b/src/serialization.cpp
index ba734757..3593f1a5 100644
--- a/src/serialization.cpp
+++ b/src/serialization.cpp
@@ -305,15 +305,25 @@ std::string json_add_rfx_groupids_cpp(cpp11::external_pointer<nlohmann::json> js
 }
 
 [[cpp11::register]]
-void json_save_cpp(cpp11::external_pointer<nlohmann::json> json_ptr, std::string filename) {
+std::string get_json_string_cpp(cpp11::external_pointer<nlohmann::json> json_ptr) {
+  return json_ptr->dump();
+}
+
+[[cpp11::register]]
+void json_save_file_cpp(cpp11::external_pointer<nlohmann::json> json_ptr, std::string filename) {
   std::ofstream output_file(filename);
   output_file << *json_ptr << std::endl;
 }
 
 [[cpp11::register]]
-void json_load_cpp(cpp11::external_pointer<nlohmann::json> json_ptr, std::string filename) {
+void json_load_file_cpp(cpp11::external_pointer<nlohmann::json> json_ptr, std::string filename) {
   std::ifstream f(filename);
   // nlohmann::json file_json = nlohmann::json::parse(f);
   *json_ptr = nlohmann::json::parse(f);
   // json_ptr.reset(&file_json);
 }
+
+[[cpp11::register]]
+void json_load_string_cpp(cpp11::external_pointer<nlohmann::json> json_ptr, std::string json_string) {
+  *json_ptr = nlohmann::json::parse(json_string);
+}

From bd060616ff6ebfc4efc25d1190dbc7801185d10f Mon Sep 17 00:00:00 2001
From: Drew Herren 
Date: Sun, 4 Aug 2024 08:50:01 -0500
Subject: [PATCH 02/41] Allow BART json serialization in R

---
 NAMESPACE                            |   6 +
 R/bart.R                             | 344 +++++++++++++++++++++++++++
 R/bcf.R                              | 139 -----------
 man/convertBARTModelToJson.Rd        |  41 ++++
 man/createBARTModelFromJson.Rd       |  44 ++++
 man/createBARTModelFromJsonFile.Rd   |  44 ++++
 man/createBARTModelFromJsonString.Rd |  46 ++++
 man/createBCFModelFromJson.Rd        |  66 -----
 man/saveBARTModelToJsonFile.Rd       |  40 ++++
 man/saveBARTModelToJsonString.Rd     |  41 ++++
 10 files changed, 606 insertions(+), 205 deletions(-)
 create mode 100644 man/convertBARTModelToJson.Rd
 create mode 100644 man/createBARTModelFromJson.Rd
 create mode 100644 man/createBARTModelFromJsonFile.Rd
 create mode 100644 man/createBARTModelFromJsonString.Rd
 create mode 100644 man/saveBARTModelToJsonFile.Rd
 create mode 100644 man/saveBARTModelToJsonString.Rd

diff --git a/NAMESPACE b/NAMESPACE
index 03e83f44..5c8c8869 100644
--- a/NAMESPACE
+++ b/NAMESPACE
@@ -8,7 +8,11 @@ export(bart)
 export(bcf)
 export(computeForestKernels)
 export(computeForestLeafIndices)
+export(convertBARTModelToJson)
 export(convertBCFModelToJson)
+export(createBARTModelFromJson)
+export(createBARTModelFromJsonFile)
+export(createBARTModelFromJsonString)
 export(createBCFModelFromJson)
 export(createBCFModelFromJsonFile)
 export(createBCFModelFromJsonString)
@@ -44,6 +48,8 @@ export(preprocessTrainDataFrame)
 export(preprocessTrainMatrix)
 export(sample_sigma2_one_iteration)
 export(sample_tau_one_iteration)
+export(saveBARTModelToJsonFile)
+export(saveBARTModelToJsonString)
 export(saveBCFModelToJsonFile)
 export(saveBCFModelToJsonString)
 importFrom(R6,R6Class)
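With these exports in place, BART models get the same string-based workflow that patch 01 added for BCF. Assuming a fitted bart_model as in the examples that follow, the end-to-end usage is:

    bart_json <- saveBARTModelToJsonString(bart_model)
    bart_model_restored <- createBARTModelFromJsonString(bart_json)
    # predictions from the restored model, as in the roundtrip example below
    y_hat_restored <- rowMeans(predict(bart_model_restored, X_train)$y_hat)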
diff --git a/R/bart.R b/R/bart.R
index 08f79549..9eaeb47c 100644
--- a/R/bart.R
+++ b/R/bart.R
@@ -688,3 +688,347 @@ getRandomEffectSamples.bartmodel <- function(object, ...){
     return(result)
 }
+
+#' Convert the persistent aspects of a BART model to (in-memory) JSON
+#'
+#' @param object Object of type `bartmodel` containing draws of a BART model and associated sampling outputs.
+#'
+#' @return Object of type `CppJson`
+#' @export
+#'
+#' @examples
+#' n <- 100
+#' p <- 5
+#' X <- matrix(runif(n*p), ncol = p)
+#' f_XW <- (
+#'     ((0 <= X[,1]) & (0.25 > X[,1])) * (-7.5) +
+#'     ((0.25 <= X[,1]) & (0.5 > X[,1])) * (-2.5) +
+#'     ((0.5 <= X[,1]) & (0.75 > X[,1])) * (2.5) +
+#'     ((0.75 <= X[,1]) & (1 > X[,1])) * (7.5)
+#' )
+#' noise_sd <- 1
+#' y <- f_XW + rnorm(n, 0, noise_sd)
+#' test_set_pct <- 0.2
+#' n_test <- round(test_set_pct*n)
+#' n_train <- n - n_test
+#' test_inds <- sort(sample(1:n, n_test, replace = FALSE))
+#' train_inds <- (1:n)[!((1:n) %in% test_inds)]
+#' X_test <- X[test_inds,]
+#' X_train <- X[train_inds,]
+#' y_test <- y[test_inds]
+#' y_train <- y[train_inds]
+#' bart_model <- bart(X_train = X_train, y_train = y_train)
+#' # bart_json <- convertBARTModelToJson(bart_model)
+convertBARTModelToJson <- function(object){
+    jsonobj <- createCppJson()
+    
+    if (is.null(object$model_params)) {
+        stop("This BART model has not yet been sampled")
+    }
+    
+    # Add the forests
+    jsonobj$add_forest(object$forests)
+    
+    # Add metadata
+    jsonobj$add_scalar("num_numeric_vars", object$train_set_metadata$num_numeric_vars)
+    jsonobj$add_scalar("num_ordered_cat_vars", object$train_set_metadata$num_ordered_cat_vars)
+    jsonobj$add_scalar("num_unordered_cat_vars", object$train_set_metadata$num_unordered_cat_vars)
+    if (object$train_set_metadata$num_numeric_vars > 0) {
+        jsonobj$add_string_vector("numeric_vars", object$train_set_metadata$numeric_vars)
+    }
+    if (object$train_set_metadata$num_ordered_cat_vars > 0) {
+        jsonobj$add_string_vector("ordered_cat_vars", object$train_set_metadata$ordered_cat_vars)
+        jsonobj$add_string_list("ordered_unique_levels", object$train_set_metadata$ordered_unique_levels)
+    }
+    if (object$train_set_metadata$num_unordered_cat_vars > 0) {
+        jsonobj$add_string_vector("unordered_cat_vars", object$train_set_metadata$unordered_cat_vars)
+        jsonobj$add_string_list("unordered_unique_levels", object$train_set_metadata$unordered_unique_levels)
+    }
+    
+    # Add global parameters
+    jsonobj$add_scalar("outcome_scale", object$model_params$outcome_scale)
+    jsonobj$add_scalar("outcome_mean", object$model_params$outcome_mean)
+    jsonobj$add_boolean("sample_sigma", object$model_params$sample_sigma)
+    jsonobj$add_boolean("sample_tau", object$model_params$sample_tau)
+    jsonobj$add_boolean("has_rfx", object$model_params$has_rfx)
+    jsonobj$add_boolean("has_rfx_basis", object$model_params$has_rfx_basis)
+    jsonobj$add_scalar("num_rfx_basis", object$model_params$num_rfx_basis)
+    jsonobj$add_scalar("num_gfr", object$model_params$num_gfr)
+    jsonobj$add_scalar("num_burnin", object$model_params$num_burnin)
+    jsonobj$add_scalar("num_mcmc", object$model_params$num_mcmc)
+    jsonobj$add_scalar("num_samples", object$model_params$num_samples)
+    jsonobj$add_scalar("num_covariates", object$model_params$num_covariates)
+    jsonobj$add_scalar("num_basis", object$model_params$num_basis)
+    jsonobj$add_boolean("requires_basis", object$model_params$requires_basis)
+    jsonobj$add_vector("keep_indices", object$keep_indices)
+    if (object$model_params$sample_sigma) {
+        jsonobj$add_vector("sigma2_samples", object$sigma2_samples, "parameters")
+    }
+    if (object$model_params$sample_tau) {
+        jsonobj$add_vector("tau_samples", object$tau_samples, "parameters")
+    }
+    
+    # Add random effects (if present)
+    if (object$model_params$has_rfx) {
+        jsonobj$add_random_effects(object$rfx_samples)
+        jsonobj$add_string_vector("rfx_unique_group_ids", object$rfx_unique_group_ids)
+    }
+    
+    return(jsonobj)
+}
+
+#' Convert the 
persistent aspects of a BART model to (in-memory) JSON and save to a file +#' +#' @param object Object of type `bartmodel` containing draws of a BART model and associated sampling outputs. +#' @param filename String of filepath, must end in ".json" +#' +#' @return NULL +#' @export +#' +#' @examples +#' n <- 100 +#' p <- 5 +#' X <- matrix(runif(n*p), ncol = p) +#' f_XW <- ( +#' ((0 <= X[,1]) & (0.25 > X[,1])) * (-7.5) + +#' ((0.25 <= X[,1]) & (0.5 > X[,1])) * (-2.5) + +#' ((0.5 <= X[,1]) & (0.75 > X[,1])) * (2.5) + +#' ((0.75 <= X[,1]) & (1 > X[,1])) * (7.5) +#' ) +#' noise_sd <- 1 +#' y <- f_XW + rnorm(n, 0, noise_sd) +#' test_set_pct <- 0.2 +#' n_test <- round(test_set_pct*n) +#' n_train <- n - n_test +#' test_inds <- sort(sample(1:n, n_test, replace = FALSE)) +#' train_inds <- (1:n)[!((1:n) %in% test_inds)] +#' X_test <- X[test_inds,] +#' X_train <- X[train_inds,] +#' y_test <- y[test_inds] +#' y_train <- y[train_inds] +#' bart_model <- bart(X_train = X_train, y_train = y_train) +#' # saveBARTModelToJsonFile(bart_model, "test.json") +saveBARTModelToJsonFile <- function(object, filename){ + # Convert to Json + jsonobj <- convertBARTModelToJson(object) + + # Save to file + jsonobj$save_file(filename) +} + +#' Convert the persistent aspects of a BART model to (in-memory) JSON string +#' +#' @param object Object of type `bartmodel` containing draws of a BART model and associated sampling outputs. +#' @return JSON string +#' @export +#' +#' @examples +#' n <- 100 +#' p <- 5 +#' X <- matrix(runif(n*p), ncol = p) +#' f_XW <- ( +#' ((0 <= X[,1]) & (0.25 > X[,1])) * (-7.5) + +#' ((0.25 <= X[,1]) & (0.5 > X[,1])) * (-2.5) + +#' ((0.5 <= X[,1]) & (0.75 > X[,1])) * (2.5) + +#' ((0.75 <= X[,1]) & (1 > X[,1])) * (7.5) +#' ) +#' noise_sd <- 1 +#' y <- f_XW + rnorm(n, 0, noise_sd) +#' test_set_pct <- 0.2 +#' n_test <- round(test_set_pct*n) +#' n_train <- n - n_test +#' test_inds <- sort(sample(1:n, n_test, replace = FALSE)) +#' train_inds <- (1:n)[!((1:n) %in% test_inds)] +#' X_test <- X[test_inds,] +#' X_train <- X[train_inds,] +#' y_test <- y[test_inds] +#' y_train <- y[train_inds] +#' bart_model <- bart(X_train = X_train, y_train = y_train) +#' # saveBARTModelToJsonString(bart_model) +saveBARTModelToJsonString <- function(object){ + # Convert to Json + jsonobj <- convertBARTModelToJson(object) + + # Dump to string + return(jsonobj$return_json_string()) +} + +#' Convert an (in-memory) JSON representation of a BART model to a BART model object +#' which can be used for prediction, etc... 
+#'
+#' @param json_object Object of type `CppJson` containing Json representation of a BART model
+#'
+#' @return Object of type `bartmodel`
+#' @export
+#'
+#' @examples
+#' n <- 100
+#' p <- 5
+#' X <- matrix(runif(n*p), ncol = p)
+#' f_XW <- (
+#'     ((0 <= X[,1]) & (0.25 > X[,1])) * (-7.5) +
+#'     ((0.25 <= X[,1]) & (0.5 > X[,1])) * (-2.5) +
+#'     ((0.5 <= X[,1]) & (0.75 > X[,1])) * (2.5) +
+#'     ((0.75 <= X[,1]) & (1 > X[,1])) * (7.5)
+#' )
+#' noise_sd <- 1
+#' y <- f_XW + rnorm(n, 0, noise_sd)
+#' test_set_pct <- 0.2
+#' n_test <- round(test_set_pct*n)
+#' n_train <- n - n_test
+#' test_inds <- sort(sample(1:n, n_test, replace = FALSE))
+#' train_inds <- (1:n)[!((1:n) %in% test_inds)]
+#' X_test <- X[test_inds,]
+#' X_train <- X[train_inds,]
+#' y_test <- y[test_inds]
+#' y_train <- y[train_inds]
+#' bart_model <- bart(X_train = X_train, y_train = y_train)
+#' # bart_json <- convertBARTModelToJson(bart_model)
+#' # bart_model_roundtrip <- createBARTModelFromJson(bart_json)
+createBARTModelFromJson <- function(json_object){
+    # Initialize the BART model
+    output <- list()
+    
+    # Unpack the forests
+    output[["forests"]] <- loadForestContainerJson(json_object, "forest_0")
+    
+    # Unpack metadata
+    train_set_metadata = list()
+    train_set_metadata[["num_numeric_vars"]] <- json_object$get_scalar("num_numeric_vars")
+    train_set_metadata[["num_ordered_cat_vars"]] <- json_object$get_scalar("num_ordered_cat_vars")
+    train_set_metadata[["num_unordered_cat_vars"]] <- json_object$get_scalar("num_unordered_cat_vars")
+    if (train_set_metadata[["num_numeric_vars"]] > 0) {
+        train_set_metadata[["numeric_vars"]] <- json_object$get_string_vector("numeric_vars")
+    }
+    if (train_set_metadata[["num_ordered_cat_vars"]] > 0) {
+        train_set_metadata[["ordered_cat_vars"]] <- json_object$get_string_vector("ordered_cat_vars")
+        train_set_metadata[["ordered_unique_levels"]] <- json_object$get_string_list("ordered_unique_levels", train_set_metadata[["ordered_cat_vars"]])
+    }
+    if (train_set_metadata[["num_unordered_cat_vars"]] > 0) {
+        train_set_metadata[["unordered_cat_vars"]] <- json_object$get_string_vector("unordered_cat_vars")
+        train_set_metadata[["unordered_unique_levels"]] <- json_object$get_string_list("unordered_unique_levels", train_set_metadata[["unordered_cat_vars"]])
+    }
+    output[["train_set_metadata"]] <- train_set_metadata
+    output[["keep_indices"]] <- json_object$get_vector("keep_indices")
+    
+    # Unpack model params
+    model_params = list()
+    model_params[["outcome_scale"]] <- json_object$get_scalar("outcome_scale")
+    model_params[["outcome_mean"]] <- json_object$get_scalar("outcome_mean")
+    model_params[["sample_sigma"]] <- json_object$get_boolean("sample_sigma")
+    model_params[["sample_tau"]] <- json_object$get_boolean("sample_tau")
+    model_params[["has_rfx"]] <- json_object$get_boolean("has_rfx")
+    model_params[["has_rfx_basis"]] <- json_object$get_boolean("has_rfx_basis")
+    model_params[["num_rfx_basis"]] <- json_object$get_scalar("num_rfx_basis")
+    model_params[["num_gfr"]] <- json_object$get_scalar("num_gfr")
+    model_params[["num_burnin"]] <- json_object$get_scalar("num_burnin")
+    model_params[["num_mcmc"]] <- json_object$get_scalar("num_mcmc")
+    model_params[["num_samples"]] <- json_object$get_scalar("num_samples")
+    model_params[["num_covariates"]] <- json_object$get_scalar("num_covariates")
+    model_params[["num_basis"]] <- json_object$get_scalar("num_basis")
+    model_params[["requires_basis"]] <- json_object$get_boolean("requires_basis")
+    output[["model_params"]] <- model_params
+    
+    # Unpack sampled parameters
+    if (model_params[["sample_sigma"]]) {
+        output[["sigma2_samples"]] <- json_object$get_vector("sigma2_samples", "parameters")
+    }
+    if (model_params[["sample_tau"]]) {
+        output[["tau_samples"]] <- json_object$get_vector("tau_samples", "parameters")
+    }
+    
+    # Unpack random effects
+    if (model_params[["has_rfx"]]) {
+        output[["rfx_unique_group_ids"]] <- json_object$get_string_vector("rfx_unique_group_ids")
+        output[["rfx_samples"]] <- loadRandomEffectSamplesJson(json_object, 0)
+    }
+    
+    class(output) <- "bartmodel"
+    return(output)
+}
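Since the list built above mirrors the structure returned by bart(), the restored object can be inspected the same way as a freshly sampled one. A brief sketch (assumes a fitted bart_model; field names are exactly those unpacked above):

    bart_json_obj <- convertBARTModelToJson(bart_model)
    bart_model2 <- createBARTModelFromJson(bart_json_obj)
    bart_model2$model_params$num_samples            # scalar restored from JSON
    bart_model2$train_set_metadata$num_numeric_vars # metadata restored from JSON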
+
+#' Convert a JSON file containing sample information on a trained BART model
+#' to a BART model object which can be used for prediction, etc...
+#'
+#' @param json_filename String of filepath, must end in ".json"
+#'
+#' @return Object of type `bartmodel`
+#' @export
+#'
+#' @examples
+#' n <- 100
+#' p <- 5
+#' X <- matrix(runif(n*p), ncol = p)
+#' f_XW <- (
+#'     ((0 <= X[,1]) & (0.25 > X[,1])) * (-7.5) +
+#'     ((0.25 <= X[,1]) & (0.5 > X[,1])) * (-2.5) +
+#'     ((0.5 <= X[,1]) & (0.75 > X[,1])) * (2.5) +
+#'     ((0.75 <= X[,1]) & (1 > X[,1])) * (7.5)
+#' )
+#' noise_sd <- 1
+#' y <- f_XW + rnorm(n, 0, noise_sd)
+#' test_set_pct <- 0.2
+#' n_test <- round(test_set_pct*n)
+#' n_train <- n - n_test
+#' test_inds <- sort(sample(1:n, n_test, replace = FALSE))
+#' train_inds <- (1:n)[!((1:n) %in% test_inds)]
+#' X_test <- X[test_inds,]
+#' X_train <- X[train_inds,]
+#' y_test <- y[test_inds]
+#' y_train <- y[train_inds]
+#' bart_model <- bart(X_train = X_train, y_train = y_train)
+#' # saveBARTModelToJsonFile(bart_model, "test.json")
+#' # bart_model_roundtrip <- createBARTModelFromJsonFile("test.json")
+createBARTModelFromJsonFile <- function(json_filename){
+    # Load a `CppJson` object from file
+    bart_json <- createCppJsonFile(json_filename)
+    
+    # Create and return the BART object
+    bart_object <- createBARTModelFromJson(bart_json)
+    
+    return(bart_object)
+}
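For a self-contained test of the file-based path, a temporary file avoids leaving "test.json" behind, unlike the commented example above (sketch; assumes a fitted bart_model):

    tmp_json <- tempfile(fileext = ".json")
    saveBARTModelToJsonFile(bart_model, tmp_json)
    bart_model_from_file <- createBARTModelFromJsonFile(tmp_json)
    unlink(tmp_json)  # clean up the temporary file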
+
+#' Convert a JSON string containing sample information on a trained BART model
+#' to a BART model object which can be used for prediction, etc...
+#'
+#' @param json_string JSON string dump
+#'
+#' @return Object of type `bartmodel`
+#' @export
+#'
+#' @examples
+#' n <- 100
+#' p <- 5
+#' X <- matrix(runif(n*p), ncol = p)
+#' f_XW <- (
+#'     ((0 <= X[,1]) & (0.25 > X[,1])) * (-7.5) +
+#'     ((0.25 <= X[,1]) & (0.5 > X[,1])) * (-2.5) +
+#'     ((0.5 <= X[,1]) & (0.75 > X[,1])) * (2.5) +
+#'     ((0.75 <= X[,1]) & (1 > X[,1])) * (7.5)
+#' )
+#' noise_sd <- 1
+#' y <- f_XW + rnorm(n, 0, noise_sd)
+#' test_set_pct <- 0.2
+#' n_test <- round(test_set_pct*n)
+#' n_train <- n - n_test
+#' test_inds <- sort(sample(1:n, n_test, replace = FALSE))
+#' train_inds <- (1:n)[!((1:n) %in% test_inds)]
+#' X_test <- X[test_inds,]
+#' X_train <- X[train_inds,]
+#' y_test <- y[test_inds]
+#' y_train <- y[train_inds]
+#' bart_model <- bart(X_train = X_train, y_train = y_train)
+#' # bart_json <- saveBARTModelToJsonString(bart_model)
+#' # bart_model_roundtrip <- createBARTModelFromJsonString(bart_json)
+#' # y_hat_mean_roundtrip <- rowMeans(predict(bart_model_roundtrip, X_train)$y_hat)
+#' # plot(rowMeans(bart_model$y_hat_train), y_hat_mean_roundtrip)
+createBARTModelFromJsonString <- function(json_string){
+    # Load a `CppJson` object from string
+    bart_json <- createCppJsonString(json_string)
+    
+    # Create and return the BART object
+    bart_object <- createBARTModelFromJson(bart_json)
+    
+    return(bart_object)
+}
diff --git a/R/bcf.R b/R/bcf.R
index 1d554429..b959ef2d 100644
--- a/R/bcf.R
+++ b/R/bcf.R
@@ -1689,142 +1689,3 @@ createBCFModelFromJsonString <- function(json_string){
 
   return(bcf_object)
 }
-
-#' Convert an (in-memory) JSON representation of a BCF model to a BCF model object
-#' which can be used for prediction, etc...
-#'
-#' @param json_object Object of type `CppJson` containing Json representation of a BCF model
-#'
-#' @return Object of type `bcf`
-#' @export
-#'
-#' @examples
-#' n <- 500
-#' x1 <- rnorm(n)
-#' x2 <- rnorm(n)
-#' x3 <- rnorm(n)
-#' x4 <- as.numeric(rbinom(n,1,0.5))
-#' x5 <- as.numeric(sample(1:3,n,replace=TRUE))
-#' X <- cbind(x1,x2,x3,x4,x5)
-#' p <- ncol(X)
-#' g <- function(x) {ifelse(x[,5]==1,2,ifelse(x[,5]==2,-1,4))}
-#' mu1 <- function(x) {1+g(x)+x[,1]*x[,3]}
-#' mu2 <- function(x) {1+g(x)+6*abs(x[,3]-1)}
-#' tau1 <- function(x) {rep(3,nrow(x))}
-#' tau2 <- function(x) {1+2*x[,2]*x[,4]}
-#' mu_x <- mu1(X)
-#' tau_x <- tau2(X)
-#' pi_x <- 0.8*pnorm((3*mu_x/sd(mu_x)) - 0.5*X[,1]) + 0.05 + runif(n)/10
-#' Z <- rbinom(n,1,pi_x)
-#' E_XZ <- mu_x + Z*tau_x
-#' snr <- 3
-#' group_ids <- rep(c(1,2), n %/% 2)
-#' rfx_coefs <- matrix(c(-1, -1, 1, 1), nrow=2, byrow=TRUE)
-#' rfx_basis <- cbind(1, runif(n, -1, 1))
-#' rfx_term <- rowSums(rfx_coefs[group_ids,] * rfx_basis)
-#' y <- E_XZ + rfx_term + rnorm(n, 0, 1)*(sd(E_XZ)/snr)
-#' X <- as.data.frame(X)
-#' X$x4 <- factor(X$x4, ordered = TRUE)
-#' X$x5 <- factor(X$x5, ordered = TRUE)
-#' test_set_pct <- 0.2
-#' n_test <- round(test_set_pct*n)
-#' n_train <- n - n_test
-#' test_inds <- sort(sample(1:n, n_test, replace = FALSE))
-#' train_inds <- (1:n)[!((1:n) %in% test_inds)]
-#' X_test <- X[test_inds,]
-#' X_train <- X[train_inds,]
-#' pi_test <- pi_x[test_inds]
-#' pi_train <- pi_x[train_inds]
-#' Z_test <- Z[test_inds]
-#' Z_train <- Z[train_inds]
-#' y_test <- y[test_inds]
-#' y_train <- y[train_inds]
-#' mu_test <- mu_x[test_inds]
-#' mu_train <- mu_x[train_inds]
-#' tau_test <- tau_x[test_inds]
-#' tau_train <- tau_x[train_inds]
-#' group_ids_test <- group_ids[test_inds]
-#' group_ids_train <- group_ids[train_inds]
-#' rfx_basis_test <- rfx_basis[test_inds,]
-#' rfx_basis_train <- 
rfx_basis[train_inds,] -#' rfx_term_test <- rfx_term[test_inds] -#' rfx_term_train <- rfx_term[train_inds] -#' bcf_model <- bcf(X_train = X_train, Z_train = Z_train, y_train = y_train, -#' pi_train = pi_train, group_ids_train = group_ids_train, -#' rfx_basis_train = rfx_basis_train, X_test = X_test, -#' Z_test = Z_test, pi_test = pi_test, group_ids_test = group_ids_test, -#' rfx_basis_test = rfx_basis_test, -#' num_gfr = 100, num_burnin = 0, num_mcmc = 100, -#' sample_sigma_leaf_mu = TRUE, sample_sigma_leaf_tau = FALSE) -#' # bcf_json <- convertBCFModelToJson(bcf_model) -#' # bcf_model_roundtrip <- createBCFModelFromJson(bcf_json) -createBCFModelFromJson <- function(json_object){ - # Initialize the BCF model - output <- list() - - # Unpack the forests - output[["forests_mu"]] <- loadForestContainerJson(json_object, "forest_0") - output[["forests_tau"]] <- loadForestContainerJson(json_object, "forest_1") - - # Unpack metadata - train_set_metadata = list() - train_set_metadata[["num_numeric_vars"]] <- json_object$get_scalar("num_numeric_vars") - train_set_metadata[["num_ordered_cat_vars"]] <- json_object$get_scalar("num_ordered_cat_vars") - train_set_metadata[["num_unordered_cat_vars"]] <- json_object$get_scalar("num_unordered_cat_vars") - if (train_set_metadata[["num_numeric_vars"]] > 0) { - train_set_metadata[["numeric_vars"]] <- json_object$get_string_vector("numeric_vars") - } - if (train_set_metadata[["num_ordered_cat_vars"]] > 0) { - train_set_metadata[["ordered_cat_vars"]] <- json_object$get_string_vector("ordered_cat_vars") - train_set_metadata[["ordered_unique_levels"]] <- json_object$get_string_list("ordered_unique_levels", train_set_metadata[["ordered_cat_vars"]]) - } - if (train_set_metadata[["num_unordered_cat_vars"]] > 0) { - train_set_metadata[["unordered_cat_vars"]] <- json_object$get_string_vector("unordered_cat_vars") - train_set_metadata[["unordered_unique_levels"]] <- json_object$get_string_list("unordered_unique_levels", train_set_metadata[["unordered_cat_vars"]]) - } - output[["train_set_metadata"]] <- train_set_metadata - output[["keep_indices"]] <- json_object$get_vector("keep_indices") - - # Unpack model params - model_params = list() - model_params[["outcome_scale"]] <- json_object$get_scalar("outcome_scale") - model_params[["outcome_mean"]] <- json_object$get_scalar("outcome_mean") - model_params[["sample_sigma_global"]] <- json_object$get_boolean("sample_sigma_global") - model_params[["sample_sigma_leaf_mu"]] <- json_object$get_boolean("sample_sigma_leaf_mu") - model_params[["sample_sigma_leaf_tau"]] <- json_object$get_boolean("sample_sigma_leaf_tau") - model_params[["propensity_covariate"]] <- json_object$get_string("propensity_covariate") - model_params[["has_rfx"]] <- json_object$get_boolean("has_rfx") - model_params[["has_rfx_basis"]] <- json_object$get_boolean("has_rfx_basis") - model_params[["num_rfx_basis"]] <- json_object$get_scalar("num_rfx_basis") - model_params[["adaptive_coding"]] <- json_object$get_boolean("adaptive_coding") - model_params[["num_gfr"]] <- json_object$get_scalar("num_gfr") - model_params[["num_burnin"]] <- json_object$get_scalar("num_burnin") - model_params[["num_mcmc"]] <- json_object$get_scalar("num_mcmc") - model_params[["num_samples"]] <- json_object$get_scalar("num_samples") - model_params[["num_covariates"]] <- json_object$get_scalar("num_covariates") - output[["model_params"]] <- model_params - - # Unpack sampled parameters - if (model_params[["sample_sigma_global"]]) { - output[["sigma2_samples"]] <- 
json_object$get_vector("sigma2_samples", "parameters") - } - if (model_params[["sample_sigma_leaf_mu"]]) { - output[["sigma_leaf_mu_samples"]] <- json_object$get_vector("sigma_leaf_mu_samples", "parameters") - } - if (model_params[["sample_sigma_leaf_tau"]]) { - output[["sigma_leaf_tau_samples"]] <- json_object$get_vector("sigma_leaf_tau_samples", "parameters") - } - if (model_params[["adaptive_coding"]]) { - output[["b_1_samples"]] <- json_object$get_vector("b_1_samples", "parameters") - output[["b_0_samples"]] <- json_object$get_vector("b_0_samples", "parameters") - } - - # Unpack random effects - if (model_params[["has_rfx"]]) { - output[["rfx_unique_group_ids"]] <- json_object$get_string_vector("rfx_unique_group_ids") - output[["rfx_samples"]] <- loadRandomEffectSamplesJson(json_object, 0) - } - - class(output) <- "bcf" - return(output) -} diff --git a/man/convertBARTModelToJson.Rd b/man/convertBARTModelToJson.Rd new file mode 100644 index 00000000..de28613a --- /dev/null +++ b/man/convertBARTModelToJson.Rd @@ -0,0 +1,41 @@ +% Generated by roxygen2: do not edit by hand +% Please edit documentation in R/bart.R +\name{convertBARTModelToJson} +\alias{convertBARTModelToJson} +\title{Convert the persistent aspects of a BART model to (in-memory) JSON} +\usage{ +convertBARTModelToJson(object) +} +\arguments{ +\item{object}{Object of type \code{bartmodel} containing draws of a BART model and associated sampling outputs.} +} +\value{ +Object of type \code{CppJson} +} +\description{ +Convert the persistent aspects of a BART model to (in-memory) JSON +} +\examples{ +n <- 100 +p <- 5 +X <- matrix(runif(n*p), ncol = p) +f_XW <- ( + ((0 <= X[,1]) & (0.25 > X[,1])) * (-7.5) + + ((0.25 <= X[,1]) & (0.5 > X[,1])) * (-2.5) + + ((0.5 <= X[,1]) & (0.75 > X[,1])) * (2.5) + + ((0.75 <= X[,1]) & (1 > X[,1])) * (7.5) +) +noise_sd <- 1 +y <- f_XW + rnorm(n, 0, noise_sd) +test_set_pct <- 0.2 +n_test <- round(test_set_pct*n) +n_train <- n - n_test +test_inds <- sort(sample(1:n, n_test, replace = FALSE)) +train_inds <- (1:n)[!((1:n) \%in\% test_inds)] +X_test <- X[test_inds,] +X_train <- X[train_inds,] +y_test <- y[test_inds] +y_train <- y[train_inds] +bart_model <- bart(X_train = X_train, y_train = y_train) +# bart_json <- convertBARTModelToJson(bart_model) +} diff --git a/man/createBARTModelFromJson.Rd b/man/createBARTModelFromJson.Rd new file mode 100644 index 00000000..0ebea7ee --- /dev/null +++ b/man/createBARTModelFromJson.Rd @@ -0,0 +1,44 @@ +% Generated by roxygen2: do not edit by hand +% Please edit documentation in R/bart.R +\name{createBARTModelFromJson} +\alias{createBARTModelFromJson} +\title{Convert an (in-memory) JSON representation of a BART model to a BART model object +which can be used for prediction, etc...} +\usage{ +createBARTModelFromJson(json_object) +} +\arguments{ +\item{json_object}{Object of type \code{CppJson} containing Json representation of a BART model} +} +\value{ +Object of type \code{bartmodel} +} +\description{ +Convert an (in-memory) JSON representation of a BART model to a BART model object +which can be used for prediction, etc... 
+} +\examples{ +n <- 100 +p <- 5 +X <- matrix(runif(n*p), ncol = p) +f_XW <- ( + ((0 <= X[,1]) & (0.25 > X[,1])) * (-7.5) + + ((0.25 <= X[,1]) & (0.5 > X[,1])) * (-2.5) + + ((0.5 <= X[,1]) & (0.75 > X[,1])) * (2.5) + + ((0.75 <= X[,1]) & (1 > X[,1])) * (7.5) +) +noise_sd <- 1 +y <- f_XW + rnorm(n, 0, noise_sd) +test_set_pct <- 0.2 +n_test <- round(test_set_pct*n) +n_train <- n - n_test +test_inds <- sort(sample(1:n, n_test, replace = FALSE)) +train_inds <- (1:n)[!((1:n) \%in\% test_inds)] +X_test <- X[test_inds,] +X_train <- X[train_inds,] +y_test <- y[test_inds] +y_train <- y[train_inds] +bart_model <- bart(X_train = X_train, y_train = y_train) +# bart_json <- convertBARTModelToJson(bart_model) +# bart_model_roundtrip <- createBARTModelFromJson(bart_json) +} diff --git a/man/createBARTModelFromJsonFile.Rd b/man/createBARTModelFromJsonFile.Rd new file mode 100644 index 00000000..e776bb6f --- /dev/null +++ b/man/createBARTModelFromJsonFile.Rd @@ -0,0 +1,44 @@ +% Generated by roxygen2: do not edit by hand +% Please edit documentation in R/bart.R +\name{createBARTModelFromJsonFile} +\alias{createBARTModelFromJsonFile} +\title{Convert a JSON file containing sample information on a trained BART model +to a BART model object which can be used for prediction, etc...} +\usage{ +createBARTModelFromJsonFile(json_filename) +} +\arguments{ +\item{json_filename}{String of filepath, must end in ".json"} +} +\value{ +Object of type \code{bartmodel} +} +\description{ +Convert a JSON file containing sample information on a trained BART model +to a BART model object which can be used for prediction, etc... +} +\examples{ +n <- 100 +p <- 5 +X <- matrix(runif(n*p), ncol = p) +f_XW <- ( + ((0 <= X[,1]) & (0.25 > X[,1])) * (-7.5) + + ((0.25 <= X[,1]) & (0.5 > X[,1])) * (-2.5) + + ((0.5 <= X[,1]) & (0.75 > X[,1])) * (2.5) + + ((0.75 <= X[,1]) & (1 > X[,1])) * (7.5) +) +noise_sd <- 1 +y <- f_XW + rnorm(n, 0, noise_sd) +test_set_pct <- 0.2 +n_test <- round(test_set_pct*n) +n_train <- n - n_test +test_inds <- sort(sample(1:n, n_test, replace = FALSE)) +train_inds <- (1:n)[!((1:n) \%in\% test_inds)] +X_test <- X[test_inds,] +X_train <- X[train_inds,] +y_test <- y[test_inds] +y_train <- y[train_inds] +bart_model <- bart(X_train = X_train, y_train = y_train) +# saveBARTModelToJsonFile(bart_model, "test.json") +# bart_model_roundtrip <- createBARTModelFromJsonFile("test.json") +} diff --git a/man/createBARTModelFromJsonString.Rd b/man/createBARTModelFromJsonString.Rd new file mode 100644 index 00000000..f26b9089 --- /dev/null +++ b/man/createBARTModelFromJsonString.Rd @@ -0,0 +1,46 @@ +% Generated by roxygen2: do not edit by hand +% Please edit documentation in R/bart.R +\name{createBARTModelFromJsonString} +\alias{createBARTModelFromJsonString} +\title{Convert a JSON string containing sample information on a trained BART model +to a BART model object which can be used for prediction, etc...} +\usage{ +createBARTModelFromJsonString(json_string) +} +\arguments{ +\item{json_string}{JSON string dump} +} +\value{ +Object of type \code{bartmodel} +} +\description{ +Convert a JSON string containing sample information on a trained BART model +to a BART model object which can be used for prediction, etc... 
+} +\examples{ +n <- 100 +p <- 5 +X <- matrix(runif(n*p), ncol = p) +f_XW <- ( + ((0 <= X[,1]) & (0.25 > X[,1])) * (-7.5) + + ((0.25 <= X[,1]) & (0.5 > X[,1])) * (-2.5) + + ((0.5 <= X[,1]) & (0.75 > X[,1])) * (2.5) + + ((0.75 <= X[,1]) & (1 > X[,1])) * (7.5) +) +noise_sd <- 1 +y <- f_XW + rnorm(n, 0, noise_sd) +test_set_pct <- 0.2 +n_test <- round(test_set_pct*n) +n_train <- n - n_test +test_inds <- sort(sample(1:n, n_test, replace = FALSE)) +train_inds <- (1:n)[!((1:n) \%in\% test_inds)] +X_test <- X[test_inds,] +X_train <- X[train_inds,] +y_test <- y[test_inds] +y_train <- y[train_inds] +bart_model <- bart(X_train = X_train, y_train = y_train) +# bart_json <- saveBARTModelToJsonString(bart_model) +# bart_model_roundtrip <- createBARTModelFromJsonString(bart_json) +# y_hat_mean_roundtrip <- rowMeans(predict(bart_model_roundtrip, X_train)$y_hat) +# plot(rowMeans(bart_model$y_hat_train), y_hat_mean_roundtrip) +} diff --git a/man/createBCFModelFromJson.Rd b/man/createBCFModelFromJson.Rd index 28b21ef0..76c3ebcb 100644 --- a/man/createBCFModelFromJson.Rd +++ b/man/createBCFModelFromJson.Rd @@ -5,22 +5,15 @@ \title{Convert an (in-memory) JSON representation of a BCF model to a BCF model object which can be used for prediction, etc...} \usage{ -createBCFModelFromJson(json_object) - createBCFModelFromJson(json_object) } \arguments{ \item{json_object}{Object of type \code{CppJson} containing Json representation of a BCF model} } \value{ -Object of type \code{bcf} - Object of type \code{bcf} } \description{ -Convert an (in-memory) JSON representation of a BCF model to a BCF model object -which can be used for prediction, etc... - Convert an (in-memory) JSON representation of a BCF model to a BCF model object which can be used for prediction, etc... } @@ -84,63 +77,4 @@ bcf_model <- bcf(X_train = X_train, Z_train = Z_train, y_train = y_train, sample_sigma_leaf_mu = TRUE, sample_sigma_leaf_tau = FALSE) # bcf_json <- convertBCFModelToJson(bcf_model) # bcf_model_roundtrip <- createBCFModelFromJson(bcf_json) -n <- 500 -x1 <- rnorm(n) -x2 <- rnorm(n) -x3 <- rnorm(n) -x4 <- as.numeric(rbinom(n,1,0.5)) -x5 <- as.numeric(sample(1:3,n,replace=TRUE)) -X <- cbind(x1,x2,x3,x4,x5) -p <- ncol(X) -g <- function(x) {ifelse(x[,5]==1,2,ifelse(x[,5]==2,-1,4))} -mu1 <- function(x) {1+g(x)+x[,1]*x[,3]} -mu2 <- function(x) {1+g(x)+6*abs(x[,3]-1)} -tau1 <- function(x) {rep(3,nrow(x))} -tau2 <- function(x) {1+2*x[,2]*x[,4]} -mu_x <- mu1(X) -tau_x <- tau2(X) -pi_x <- 0.8*pnorm((3*mu_x/sd(mu_x)) - 0.5*X[,1]) + 0.05 + runif(n)/10 -Z <- rbinom(n,1,pi_x) -E_XZ <- mu_x + Z*tau_x -snr <- 3 -group_ids <- rep(c(1,2), n \%/\% 2) -rfx_coefs <- matrix(c(-1, -1, 1, 1), nrow=2, byrow=TRUE) -rfx_basis <- cbind(1, runif(n, -1, 1)) -rfx_term <- rowSums(rfx_coefs[group_ids,] * rfx_basis) -y <- E_XZ + rfx_term + rnorm(n, 0, 1)*(sd(E_XZ)/snr) -X <- as.data.frame(X) -X$x4 <- factor(X$x4, ordered = TRUE) -X$x5 <- factor(X$x5, ordered = TRUE) -test_set_pct <- 0.2 -n_test <- round(test_set_pct*n) -n_train <- n - n_test -test_inds <- sort(sample(1:n, n_test, replace = FALSE)) -train_inds <- (1:n)[!((1:n) \%in\% test_inds)] -X_test <- X[test_inds,] -X_train <- X[train_inds,] -pi_test <- pi_x[test_inds] -pi_train <- pi_x[train_inds] -Z_test <- Z[test_inds] -Z_train <- Z[train_inds] -y_test <- y[test_inds] -y_train <- y[train_inds] -mu_test <- mu_x[test_inds] -mu_train <- mu_x[train_inds] -tau_test <- tau_x[test_inds] -tau_train <- tau_x[train_inds] -group_ids_test <- group_ids[test_inds] -group_ids_train <- group_ids[train_inds] -rfx_basis_test <- 
rfx_basis[test_inds,] -rfx_basis_train <- rfx_basis[train_inds,] -rfx_term_test <- rfx_term[test_inds] -rfx_term_train <- rfx_term[train_inds] -bcf_model <- bcf(X_train = X_train, Z_train = Z_train, y_train = y_train, - pi_train = pi_train, group_ids_train = group_ids_train, - rfx_basis_train = rfx_basis_train, X_test = X_test, - Z_test = Z_test, pi_test = pi_test, group_ids_test = group_ids_test, - rfx_basis_test = rfx_basis_test, - num_gfr = 100, num_burnin = 0, num_mcmc = 100, - sample_sigma_leaf_mu = TRUE, sample_sigma_leaf_tau = FALSE) -# bcf_json <- convertBCFModelToJson(bcf_model) -# bcf_model_roundtrip <- createBCFModelFromJson(bcf_json) } diff --git a/man/saveBARTModelToJsonFile.Rd b/man/saveBARTModelToJsonFile.Rd new file mode 100644 index 00000000..29763e81 --- /dev/null +++ b/man/saveBARTModelToJsonFile.Rd @@ -0,0 +1,40 @@ +% Generated by roxygen2: do not edit by hand +% Please edit documentation in R/bart.R +\name{saveBARTModelToJsonFile} +\alias{saveBARTModelToJsonFile} +\title{Convert the persistent aspects of a BART model to (in-memory) JSON and save to a file} +\usage{ +saveBARTModelToJsonFile(object, filename) +} +\arguments{ +\item{object}{Object of type \code{bartmodel} containing draws of a BART model and associated sampling outputs.} + +\item{filename}{String of filepath, must end in ".json"} +} +\description{ +Convert the persistent aspects of a BART model to (in-memory) JSON and save to a file +} +\examples{ +n <- 100 +p <- 5 +X <- matrix(runif(n*p), ncol = p) +f_XW <- ( + ((0 <= X[,1]) & (0.25 > X[,1])) * (-7.5) + + ((0.25 <= X[,1]) & (0.5 > X[,1])) * (-2.5) + + ((0.5 <= X[,1]) & (0.75 > X[,1])) * (2.5) + + ((0.75 <= X[,1]) & (1 > X[,1])) * (7.5) +) +noise_sd <- 1 +y <- f_XW + rnorm(n, 0, noise_sd) +test_set_pct <- 0.2 +n_test <- round(test_set_pct*n) +n_train <- n - n_test +test_inds <- sort(sample(1:n, n_test, replace = FALSE)) +train_inds <- (1:n)[!((1:n) \%in\% test_inds)] +X_test <- X[test_inds,] +X_train <- X[train_inds,] +y_test <- y[test_inds] +y_train <- y[train_inds] +bart_model <- bart(X_train = X_train, y_train = y_train) +# saveBARTModelToJsonFile(bart_model, "test.json") +} diff --git a/man/saveBARTModelToJsonString.Rd b/man/saveBARTModelToJsonString.Rd new file mode 100644 index 00000000..031b6d1e --- /dev/null +++ b/man/saveBARTModelToJsonString.Rd @@ -0,0 +1,41 @@ +% Generated by roxygen2: do not edit by hand +% Please edit documentation in R/bart.R +\name{saveBARTModelToJsonString} +\alias{saveBARTModelToJsonString} +\title{Convert the persistent aspects of a BART model to (in-memory) JSON string} +\usage{ +saveBARTModelToJsonString(object) +} +\arguments{ +\item{object}{Object of type \code{bartmodel} containing draws of a BART model and associated sampling outputs.} +} +\value{ +JSON string +} +\description{ +Convert the persistent aspects of a BART model to (in-memory) JSON string +} +\examples{ +n <- 100 +p <- 5 +X <- matrix(runif(n*p), ncol = p) +f_XW <- ( + ((0 <= X[,1]) & (0.25 > X[,1])) * (-7.5) + + ((0.25 <= X[,1]) & (0.5 > X[,1])) * (-2.5) + + ((0.5 <= X[,1]) & (0.75 > X[,1])) * (2.5) + + ((0.75 <= X[,1]) & (1 > X[,1])) * (7.5) +) +noise_sd <- 1 +y <- f_XW + rnorm(n, 0, noise_sd) +test_set_pct <- 0.2 +n_test <- round(test_set_pct*n) +n_train <- n - n_test +test_inds <- sort(sample(1:n, n_test, replace = FALSE)) +train_inds <- (1:n)[!((1:n) \%in\% test_inds)] +X_test <- X[test_inds,] +X_train <- X[train_inds,] +y_test <- y[test_inds] +y_train <- y[train_inds] +bart_model <- bart(X_train = X_train, y_train = y_train) +# 
saveBARTModelToJsonString(bart_model) +} From 5db1257b43e765b13634361a90c1993d2d925b76 Mon Sep 17 00:00:00 2001 From: Drew Herren Date: Sun, 4 Aug 2024 09:04:40 -0500 Subject: [PATCH 03/41] Updated example code --- R/bart.R | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/R/bart.R b/R/bart.R index 9eaeb47c..30dd0e70 100644 --- a/R/bart.R +++ b/R/bart.R @@ -1022,7 +1022,8 @@ createBARTModelFromJsonFile <- function(json_filename){ #' # bart_json <- saveBARTModelToJsonString(bart_model) #' # bart_model_roundtrip <- createBARTModelFromJsonString(bart_json) #' # y_hat_mean_roundtrip <- rowMeans(predict(bart_model_roundtrip, X_train)$y_hat) -#' # plot(rowMeans(bart_model$y_hat_train), y_hat_mean_roundtrip) +#' # plot(rowMeans(bart_model$y_hat_train), y_hat_mean_roundtrip, +#' # xlab = "original", ylab = "roundtrip") createBARTModelFromJsonString <- function(json_string){ # Load a `CppJson` object from string bart_json <- createCppJsonString(json_string) From 8bd7948016f74bd398c54b4414ebd7b7e8878db0 Mon Sep 17 00:00:00 2001 From: Drew Herren Date: Thu, 8 Aug 2024 12:36:55 -0700 Subject: [PATCH 04/41] Added code to combine multiple forests --- NAMESPACE | 2 + R/cpp11.R | 12 ++ R/forest.R | 29 +++- R/serialization.R | 40 ++++++ _pkgdown.yml | 7 +- include/stochtree/container.h | 2 + man/ForestSamples.Rd | 71 +++++++++- man/createBARTModelFromJsonString.Rd | 3 +- man/loadForestContainerCombinedJson.Rd | 19 +++ man/loadForestContainerCombinedJsonString.Rd | 19 +++ src/container.cpp | 22 +++ src/cpp11.cpp | 26 ++++ src/forest.cpp | 40 ++++++ tools/debug/multichain_seq.R | 47 +++++++ vignettes/MultiChain.Rmd | 140 +++++++++++++++++++ 15 files changed, 474 insertions(+), 5 deletions(-) create mode 100644 man/loadForestContainerCombinedJson.Rd create mode 100644 man/loadForestContainerCombinedJsonString.Rd create mode 100644 tools/debug/multichain_seq.R create mode 100644 vignettes/MultiChain.Rmd diff --git a/NAMESPACE b/NAMESPACE index 5c8c8869..ecefca33 100644 --- a/NAMESPACE +++ b/NAMESPACE @@ -32,6 +32,8 @@ export(createRandomEffectsDataset) export(createRandomEffectsModel) export(createRandomEffectsTracker) export(getRandomEffectSamples) +export(loadForestContainerCombinedJson) +export(loadForestContainerCombinedJsonString) export(loadForestContainerJson) export(loadRandomEffectSamplesJson) export(loadScalarJson) diff --git a/R/cpp11.R b/R/cpp11.R index b9e710b7..4debd218 100644 --- a/R/cpp11.R +++ b/R/cpp11.R @@ -188,6 +188,18 @@ forest_container_from_json_cpp <- function(json_ptr, forest_label) { .Call(`_stochtree_forest_container_from_json_cpp`, json_ptr, forest_label) } +forest_container_append_from_json_cpp <- function(forest_sample_ptr, json_ptr, forest_label) { + invisible(.Call(`_stochtree_forest_container_append_from_json_cpp`, forest_sample_ptr, json_ptr, forest_label)) +} + +forest_container_from_json_string_cpp <- function(json_string, forest_label) { + .Call(`_stochtree_forest_container_from_json_string_cpp`, json_string, forest_label) +} + +forest_container_append_from_json_string_cpp <- function(forest_sample_ptr, json_string, forest_label) { + invisible(.Call(`_stochtree_forest_container_append_from_json_string_cpp`, forest_sample_ptr, json_string, forest_label)) +} + num_samples_forest_container_cpp <- function(forest_samples) { .Call(`_stochtree_num_samples_forest_container_cpp`, forest_samples) } diff --git a/R/forest.R b/R/forest.R index 953aa585..2feec6af 100644 --- a/R/forest.R +++ b/R/forest.R @@ -22,7 +22,7 @@ ForestSamples <- R6::R6Class( }, #' 
@description - #' Create a new ForestContainer object from a json object + #' Create a new `ForestContainer` object from a json object #' @param json_object Object of class `CppJson` #' @param json_forest_label Label referring to a particular forest (i.e. "forest_0") in the overall json hierarchy #' @return A new `ForestContainer` object. @@ -30,6 +30,33 @@ ForestSamples <- R6::R6Class( self$forest_container_ptr <- forest_container_from_json_cpp(json_object$json_ptr, json_forest_label) }, + #' @description + #' Append to a `ForestContainer` object from a json object + #' @param json_object Object of class `CppJson` + #' @param json_forest_label Label referring to a particular forest (i.e. "forest_0") in the overall json hierarchy + #' @return NULL + append_from_json = function(json_object, json_forest_label) { + forest_container_append_from_json_cpp(self$forest_container_ptr, json_object$json_ptr, json_forest_label) + }, + + #' @description + #' Create a new `ForestContainer` object from a json object + #' @param json_string JSON string which parses into object of class `CppJson` + #' @param json_forest_label Label referring to a particular forest (i.e. "forest_0") in the overall json hierarchy + #' @return A new `ForestContainer` object. + load_from_json_string = function(json_string, json_forest_label) { + self$forest_container_ptr <- forest_container_from_json_string_cpp(json_string, json_forest_label) + }, + + #' @description + #' Append to a `ForestContainer` object from a json object + #' @param json_string JSON string which parses into object of class `CppJson` + #' @param json_forest_label Label referring to a particular forest (i.e. "forest_0") in the overall json hierarchy + #' @return NULL + append_from_json_string = function(json_string, json_forest_label) { + forest_container_append_from_json_string_cpp(self$forest_container_ptr, json_string, json_forest_label) + }, + #' @description #' Predict every tree ensemble on every sample in `forest_dataset` #' @param forest_dataset `ForestDataset` R class diff --git a/R/serialization.R b/R/serialization.R index 525f5abf..cf0ba267 100644 --- a/R/serialization.R +++ b/R/serialization.R @@ -322,6 +322,46 @@ loadForestContainerJson <- function(json_object, json_forest_label) { return(output) } +#' Combine multiple JSON model objects containing forests (with the same hierarchy / schema) into a single forest_container +#' +#' @param json_object_list List of objects of class `CppJson` +#' @param json_forest_label Label referring to a particular forest (i.e. "forest_0") in the overall json hierarchy (must exist in every json object in the list) +#' +#' @return `ForestSamples` object +#' @export +loadForestContainerCombinedJson <- function(json_object_list, json_forest_label) { + invisible(output <- ForestSamples$new(0,1,T)) + for (i in 1:length(json_object_list)) { + json_object <- json_object_list[i] + if (i == 1) { + output$load_from_json(json_object, json_forest_label) + } else { + output$append_from_json(json_object, json_forest_label) + } + } + return(output) +} + +#' Combine multiple JSON strings representing model objects containing forests (with the same hierarchy / schema) into a single forest_container +#' +#' @param json_string_list List of strings that parse into objects of type `CppJson` +#' @param json_forest_label Label referring to a particular forest (i.e. 
"forest_0") in the overall json hierarchy (must exist in every json object in the list) +#' +#' @return `ForestSamples` object +#' @export +loadForestContainerCombinedJsonString <- function(json_string_list, json_forest_label) { + invisible(output <- ForestSamples$new(0,1,T)) + for (i in 1:length(json_string_list)) { + json_string <- json_string_list[[i]] + if (i == 1) { + output$load_from_json_string(json_string, json_forest_label) + } else { + output$append_from_json_string(json_string, json_forest_label) + } + } + return(output) +} + #' Load a container of random effect samples from json #' #' @param json_object Object of class `CppJson` diff --git a/_pkgdown.yml b/_pkgdown.yml index 8292609e..f919a864 100644 --- a/_pkgdown.yml +++ b/_pkgdown.yml @@ -30,12 +30,14 @@ reference: contents: - CppJson - createCppJson + - createCppJsonFile + - createCppJsonString - loadForestContainerJson + - loadForestContainerCombinedJson + - loadForestContainerCombinedJsonString - loadRandomEffectSamplesJson - loadVectorJson - loadScalarJson - - createCppJsonFile - - createCppJsonString - subtitle: Data desc: > @@ -104,6 +106,7 @@ articles: contents: - BayesianSupervisedLearning - CausalInference + - MultiChain - ModelSerialization - title: Prototype Interface diff --git a/include/stochtree/container.h b/include/stochtree/container.h index 78139bb3..e189957a 100644 --- a/include/stochtree/container.h +++ b/include/stochtree/container.h @@ -90,6 +90,8 @@ class ForestContainer { nlohmann::json to_json(); /*! \brief Load from JSON */ void from_json(const nlohmann::json& forest_container_json); + /*! \brief Append to a forest container from JSON, requires that the ensemble already contains a nonzero number of forests */ + void append_from_json(const nlohmann::json& forest_container_json); private: std::vector> forests_; diff --git a/man/ForestSamples.Rd b/man/ForestSamples.Rd index b629ca1a..4b945926 100644 --- a/man/ForestSamples.Rd +++ b/man/ForestSamples.Rd @@ -18,6 +18,9 @@ Wrapper around a C++ container of tree ensembles \itemize{ \item \href{#method-ForestSamples-new}{\code{ForestSamples$new()}} \item \href{#method-ForestSamples-load_from_json}{\code{ForestSamples$load_from_json()}} +\item \href{#method-ForestSamples-append_from_json}{\code{ForestSamples$append_from_json()}} +\item \href{#method-ForestSamples-load_from_json_string}{\code{ForestSamples$load_from_json_string()}} +\item \href{#method-ForestSamples-append_from_json_string}{\code{ForestSamples$append_from_json_string()}} \item \href{#method-ForestSamples-predict}{\code{ForestSamples$predict()}} \item \href{#method-ForestSamples-predict_raw}{\code{ForestSamples$predict_raw()}} \item \href{#method-ForestSamples-predict_raw_single_forest}{\code{ForestSamples$predict_raw_single_forest()}} @@ -69,7 +72,7 @@ A new \code{ForestContainer} object. \if{html}{\out{}} \if{latex}{\out{\hypertarget{method-ForestSamples-load_from_json}{}}} \subsection{Method \code{load_from_json()}}{ -Create a new ForestContainer object from a json object +Create a new \code{ForestContainer} object from a json object \subsection{Usage}{ \if{html}{\out{
}}\preformatted{ForestSamples$load_from_json(json_object, json_forest_label)}\if{html}{\out{
}} } @@ -88,6 +91,72 @@ A new \code{ForestContainer} object. } } \if{html}{\out{
}} +\if{html}{\out{}} +\if{latex}{\out{\hypertarget{method-ForestSamples-append_from_json}{}}} +\subsection{Method \code{append_from_json()}}{ +Append to a \code{ForestContainer} object from a json object +\subsection{Usage}{ +\if{html}{\out{
}}\preformatted{ForestSamples$append_from_json(json_object, json_forest_label)}\if{html}{\out{
}} +} + +\subsection{Arguments}{ +\if{html}{\out{
}} +\describe{ +\item{\code{json_object}}{Object of class \code{CppJson}} + +\item{\code{json_forest_label}}{Label referring to a particular forest (i.e. "forest_0") in the overall json hierarchy} +} +\if{html}{\out{
}} +} +\subsection{Returns}{ +NULL +} +} +\if{html}{\out{
}} +\if{html}{\out{}} +\if{latex}{\out{\hypertarget{method-ForestSamples-load_from_json_string}{}}} +\subsection{Method \code{load_from_json_string()}}{ +Create a new \code{ForestContainer} object from a json object +\subsection{Usage}{ +\if{html}{\out{
}}\preformatted{ForestSamples$load_from_json_string(json_string, json_forest_label)}\if{html}{\out{
}} +} + +\subsection{Arguments}{ +\if{html}{\out{
}} +\describe{ +\item{\code{json_string}}{JSON string which parses into object of class \code{CppJson}} + +\item{\code{json_forest_label}}{Label referring to a particular forest (i.e. "forest_0") in the overall json hierarchy} +} +\if{html}{\out{
}} +} +\subsection{Returns}{ +A new \code{ForestContainer} object. +} +} +\if{html}{\out{
}} +\if{html}{\out{}} +\if{latex}{\out{\hypertarget{method-ForestSamples-append_from_json_string}{}}} +\subsection{Method \code{append_from_json_string()}}{ +Append to a \code{ForestContainer} object from a json object +\subsection{Usage}{ +\if{html}{\out{
}}\preformatted{ForestSamples$append_from_json_string(json_string, json_forest_label)}\if{html}{\out{
}} +} + +\subsection{Arguments}{ +\if{html}{\out{
}} +\describe{ +\item{\code{json_string}}{JSON string which parses into object of class \code{CppJson}} + +\item{\code{json_forest_label}}{Label referring to a particular forest (i.e. "forest_0") in the overall json hierarchy} +} +\if{html}{\out{
}} +} +\subsection{Returns}{ +NULL +} +} +\if{html}{\out{
}} \if{html}{\out{}} \if{latex}{\out{\hypertarget{method-ForestSamples-predict}{}}} \subsection{Method \code{predict()}}{ diff --git a/man/createBARTModelFromJsonString.Rd b/man/createBARTModelFromJsonString.Rd index f26b9089..735fb48f 100644 --- a/man/createBARTModelFromJsonString.Rd +++ b/man/createBARTModelFromJsonString.Rd @@ -42,5 +42,6 @@ bart_model <- bart(X_train = X_train, y_train = y_train) # bart_json <- saveBARTModelToJsonString(bart_model) # bart_model_roundtrip <- createBARTModelFromJsonString(bart_json) # y_hat_mean_roundtrip <- rowMeans(predict(bart_model_roundtrip, X_train)$y_hat) -# plot(rowMeans(bart_model$y_hat_train), y_hat_mean_roundtrip) +# plot(rowMeans(bart_model$y_hat_train), y_hat_mean_roundtrip, +# xlab = "original", ylab = "roundtrip") } diff --git a/man/loadForestContainerCombinedJson.Rd b/man/loadForestContainerCombinedJson.Rd new file mode 100644 index 00000000..90d4e051 --- /dev/null +++ b/man/loadForestContainerCombinedJson.Rd @@ -0,0 +1,19 @@ +% Generated by roxygen2: do not edit by hand +% Please edit documentation in R/serialization.R +\name{loadForestContainerCombinedJson} +\alias{loadForestContainerCombinedJson} +\title{Combine multiple JSON model objects containing forests (with the same hierarchy / schema) into a single forest_container} +\usage{ +loadForestContainerCombinedJson(json_object_list, json_forest_label) +} +\arguments{ +\item{json_object_list}{List of objects of class \code{CppJson}} + +\item{json_forest_label}{Label referring to a particular forest (i.e. "forest_0") in the overall json hierarchy (must exist in every json object in the list)} +} +\value{ +\code{ForestSamples} object +} +\description{ +Combine multiple JSON model objects containing forests (with the same hierarchy / schema) into a single forest_container +} diff --git a/man/loadForestContainerCombinedJsonString.Rd b/man/loadForestContainerCombinedJsonString.Rd new file mode 100644 index 00000000..7b9a4d82 --- /dev/null +++ b/man/loadForestContainerCombinedJsonString.Rd @@ -0,0 +1,19 @@ +% Generated by roxygen2: do not edit by hand +% Please edit documentation in R/serialization.R +\name{loadForestContainerCombinedJsonString} +\alias{loadForestContainerCombinedJsonString} +\title{Combine multiple JSON strings representing model objects containing forests (with the same hierarchy / schema) into a single forest_container} +\usage{ +loadForestContainerCombinedJsonString(json_string_list, json_forest_label) +} +\arguments{ +\item{json_string_list}{List of strings that parse into objects of type \code{CppJson}} + +\item{json_forest_label}{Label referring to a particular forest (i.e. "forest_0") in the overall json hierarchy (must exist in every json object in the list)} +} +\value{ +\code{ForestSamples} object +} +\description{ +Combine multiple JSON strings representing model objects containing forests (with the same hierarchy / schema) into a single forest_container +} diff --git a/src/container.cpp b/src/container.cpp index 79e940d6..fac4a0ed 100644 --- a/src/container.cpp +++ b/src/container.cpp @@ -157,4 +157,26 @@ void ForestContainer::from_json(const json& forest_container_json) { } } +/*! 
\brief Append forests to a container from a JSON forest specification */ +void ForestContainer::append_from_json(const json& forest_container_json) { + CHECK_GT(this->num_samples_, 0); + CHECK_EQ(this->num_trees_, forest_container_json.at("num_trees")); + CHECK_EQ(this->output_dimension_, forest_container_json.at("output_dimension")); + CHECK_EQ(this->is_leaf_constant_, forest_container_json.at("is_leaf_constant")); + CHECK_EQ(this->initialized_, forest_container_json.at("initialized")); + int new_num_samples = forest_container_json.at("num_samples"); + + std::string forest_label; + // forests_.resize(this->num_samples_); + int forest_ind; + for (int i = 0; i < forest_container_json.at("num_samples"); i++) { + forest_ind = this->num_samples_ + i; + forest_label = "forest_" + std::to_string(i); + // forests_[forest_ind] = std::make_unique(this->num_trees_, this->output_dimension_, this->is_leaf_constant_); + forests_.push_back(std::make_unique(this->num_trees_, this->output_dimension_, this->is_leaf_constant_)); + forests_[forest_ind]->from_json(forest_container_json.at(forest_label)); + } + this->num_samples_ += new_num_samples; +} + } // namespace StochTree \ No newline at end of file diff --git a/src/cpp11.cpp b/src/cpp11.cpp index 6a5b883f..ca2f168e 100644 --- a/src/cpp11.cpp +++ b/src/cpp11.cpp @@ -349,6 +349,29 @@ extern "C" SEXP _stochtree_forest_container_from_json_cpp(SEXP json_ptr, SEXP fo END_CPP11 } // forest.cpp +void forest_container_append_from_json_cpp(cpp11::external_pointer forest_sample_ptr, cpp11::external_pointer json_ptr, std::string forest_label); +extern "C" SEXP _stochtree_forest_container_append_from_json_cpp(SEXP forest_sample_ptr, SEXP json_ptr, SEXP forest_label) { + BEGIN_CPP11 + forest_container_append_from_json_cpp(cpp11::as_cpp>>(forest_sample_ptr), cpp11::as_cpp>>(json_ptr), cpp11::as_cpp>(forest_label)); + return R_NilValue; + END_CPP11 +} +// forest.cpp +cpp11::external_pointer forest_container_from_json_string_cpp(std::string json_string, std::string forest_label); +extern "C" SEXP _stochtree_forest_container_from_json_string_cpp(SEXP json_string, SEXP forest_label) { + BEGIN_CPP11 + return cpp11::as_sexp(forest_container_from_json_string_cpp(cpp11::as_cpp>(json_string), cpp11::as_cpp>(forest_label))); + END_CPP11 +} +// forest.cpp +void forest_container_append_from_json_string_cpp(cpp11::external_pointer forest_sample_ptr, std::string json_string, std::string forest_label); +extern "C" SEXP _stochtree_forest_container_append_from_json_string_cpp(SEXP forest_sample_ptr, SEXP json_string, SEXP forest_label) { + BEGIN_CPP11 + forest_container_append_from_json_string_cpp(cpp11::as_cpp>>(forest_sample_ptr), cpp11::as_cpp>(json_string), cpp11::as_cpp>(forest_label)); + return R_NilValue; + END_CPP11 +} +// forest.cpp int num_samples_forest_container_cpp(cpp11::external_pointer forest_samples); extern "C" SEXP _stochtree_num_samples_forest_container_cpp(SEXP forest_samples) { BEGIN_CPP11 @@ -909,8 +932,11 @@ static const R_CallMethodDef CallEntries[] = { {"_stochtree_dataset_num_rows_cpp", (DL_FUNC) &_stochtree_dataset_num_rows_cpp, 1}, {"_stochtree_ensemble_average_max_depth_forest_container_cpp", (DL_FUNC) &_stochtree_ensemble_average_max_depth_forest_container_cpp, 2}, {"_stochtree_ensemble_tree_max_depth_forest_container_cpp", (DL_FUNC) &_stochtree_ensemble_tree_max_depth_forest_container_cpp, 3}, + {"_stochtree_forest_container_append_from_json_cpp", (DL_FUNC) &_stochtree_forest_container_append_from_json_cpp, 3}, + 
{"_stochtree_forest_container_append_from_json_string_cpp", (DL_FUNC) &_stochtree_forest_container_append_from_json_string_cpp, 3}, {"_stochtree_forest_container_cpp", (DL_FUNC) &_stochtree_forest_container_cpp, 3}, {"_stochtree_forest_container_from_json_cpp", (DL_FUNC) &_stochtree_forest_container_from_json_cpp, 2}, + {"_stochtree_forest_container_from_json_string_cpp", (DL_FUNC) &_stochtree_forest_container_from_json_string_cpp, 2}, {"_stochtree_forest_dataset_add_basis_cpp", (DL_FUNC) &_stochtree_forest_dataset_add_basis_cpp, 2}, {"_stochtree_forest_dataset_add_covariates_cpp", (DL_FUNC) &_stochtree_forest_dataset_add_covariates_cpp, 2}, {"_stochtree_forest_dataset_add_weights_cpp", (DL_FUNC) &_stochtree_forest_dataset_add_weights_cpp, 2}, diff --git a/src/forest.cpp b/src/forest.cpp index c1f22c4e..fc2dd574 100644 --- a/src/forest.cpp +++ b/src/forest.cpp @@ -36,6 +36,46 @@ cpp11::external_pointer forest_container_from_json_c return cpp11::external_pointer(forest_sample_ptr_.release()); } +[[cpp11::register]] +void forest_container_append_from_json_cpp(cpp11::external_pointer forest_sample_ptr, cpp11::external_pointer json_ptr, std::string forest_label) { + // Extract the forest's json + nlohmann::json forest_json = json_ptr->at("forests").at(forest_label); + + // Append to the forest sample container using the json + forest_sample_ptr->append_from_json(forest_json); +} + +[[cpp11::register]] +cpp11::external_pointer forest_container_from_json_string_cpp(std::string json_string, std::string forest_label) { + // Create smart pointer to newly allocated object + std::unique_ptr forest_sample_ptr_ = std::make_unique(0, 1, true); + + // Create a nlohmann::json object from the string + nlohmann::json json_object = nlohmann::json::parse(json_string); + + // Extract the forest's json + nlohmann::json forest_json = json_object.at("forests").at(forest_label); + + // Reset the forest sample container using the json + forest_sample_ptr_->Reset(); + forest_sample_ptr_->from_json(forest_json); + + // Release management of the pointer to R session + return cpp11::external_pointer(forest_sample_ptr_.release()); +} + +[[cpp11::register]] +void forest_container_append_from_json_string_cpp(cpp11::external_pointer forest_sample_ptr, std::string json_string, std::string forest_label) { + // Create a nlohmann::json object from the string + nlohmann::json json_object = nlohmann::json::parse(json_string); + + // Extract the forest's json + nlohmann::json forest_json = json_object.at("forests").at(forest_label); + + // Append to the forest sample container using the json + forest_sample_ptr->append_from_json(forest_json); +} + [[cpp11::register]] int num_samples_forest_container_cpp(cpp11::external_pointer forest_samples) { return forest_samples->NumSamples(); diff --git a/tools/debug/multichain_seq.R b/tools/debug/multichain_seq.R new file mode 100644 index 00000000..49b159c8 --- /dev/null +++ b/tools/debug/multichain_seq.R @@ -0,0 +1,47 @@ +library(stochtree) +n <- 500 +p_x <- 10 +p_w <- 1 +snr <- 3 +X <- matrix(runif(n*p_x), ncol = p_x) +W <- matrix(runif(n*p_w), ncol = p_w) +f_XW <- ( + ((0 <= X[,1]) & (0.25 > X[,1])) * (-7.5*W[,1]) + + ((0.25 <= X[,1]) & (0.5 > X[,1])) * (-2.5*W[,1]) + + ((0.5 <= X[,1]) & (0.75 > X[,1])) * (2.5*W[,1]) + + ((0.75 <= X[,1]) & (1 > X[,1])) * (7.5*W[,1]) +) +noise_sd <- sd(f_XW) / snr +y <- f_XW + rnorm(n, 0, 1)*noise_sd +test_set_pct <- 0.2 +n_test <- round(test_set_pct*n) +n_train <- n - n_test +test_inds <- sort(sample(1:n, n_test, replace = FALSE)) +train_inds <- 
(1:n)[!((1:n) %in% test_inds)]
+X_test <- as.data.frame(X[test_inds,])
+X_train <- as.data.frame(X[train_inds,])
+W_test <- W[test_inds,]
+W_train <- W[train_inds,]
+y_test <- y[test_inds]
+y_train <- y[train_inds]
+num_chains <- 4
+num_gfr <- 10
+num_burnin <- 0
+num_mcmc <- 100
+num_trees <- 100
+bart_models <- list()
+for (i in 1:num_chains) {
+    bart_models[[i]] <- stochtree::bart(
+        X_train = X_train, W_train = W_train, y_train = y_train, 
+        X_test = X_test, W_test = W_test, num_trees = num_trees, 
+        num_gfr = num_gfr, num_burnin = num_burnin, 
+        num_mcmc = num_mcmc, sample_sigma = T, sample_tau = T
+    )
+}
+json_string_list <- list()
+for (i in 1:num_chains) {
+    json_string_list[[i]] <- saveBARTModelToJsonString(bart_models[[i]])
+}
+combined_forests <- loadForestContainerCombinedJsonString(json_string_list, "forest_0")
+test_dataset <- createForestDataset(as.matrix(X_test), W_test)
+yhat_combined <- combined_forests$predict(test_dataset)
\ No newline at end of file
diff --git a/vignettes/MultiChain.Rmd b/vignettes/MultiChain.Rmd
new file mode 100644
index 00000000..4c09a49b
--- /dev/null
+++ b/vignettes/MultiChain.Rmd
@@ -0,0 +1,140 @@
+---
+title: "Running Multiple Chains (Sequentially or in Parallel) in StochTree"
+output: rmarkdown::html_vignette
+vignette: >
+  %\VignetteIndexEntry{Running Multiple Chains (Sequentially or in Parallel) in StochTree}
+  %\VignetteEncoding{UTF-8}
+  %\VignetteEngine{knitr::rmarkdown}
+bibliography: vignettes.bib
+editor_options: 
+  markdown: 
+    wrap: 72
+---
+
+```{r, include = FALSE}
+knitr::opts_chunk$set(
+  collapse = TRUE,
+  comment = "#>"
+)
+```
+
+# Motivation
+
+Mixing of an MCMC sampler is a perennial concern for complex Bayesian models, 
+and BART is no exception. One common way to address such concerns is to run 
+multiple independent "chains" of an MCMC sampler, so that if each chain gets 
+stuck in a different region of the posterior, their combined samples attain 
+better coverage of the full posterior.
+
+This idea works with the classic "from-root" MCMC sampler of @chipman2010bart, 
+but a key insight of @he2023stochastic is that the XBART algorithm may be used 
+to initialize ("warm-start") multiple chains of the BART MCMC sampler.
+
+Operationally, the above two approaches have the same implementation (setting 
+`num_gfr` > 0 if warm-start initialization is desired), so this vignette will 
+demonstrate how to run a multi-chain sampler sequentially or in parallel. 
+
+To begin, load the `stochtree` package
+
+```{r setup}
+library(stochtree)
+```
+
+# Demo 1: Supervised Learning, Sequential Multi Chain Sampler
+
+## Simulation
+
+Simulate a simple partitioned linear model
+
+```{r}
+# Generate the data
+n <- 500
+p_x <- 10
+p_w <- 1
+snr <- 3
+X <- matrix(runif(n*p_x), ncol = p_x)
+W <- matrix(runif(n*p_w), ncol = p_w)
+f_XW <- (
+    ((0 <= X[,1]) & (0.25 > X[,1])) * (-7.5*W[,1]) + 
+    ((0.25 <= X[,1]) & (0.5 > X[,1])) * (-2.5*W[,1]) + 
+    ((0.5 <= X[,1]) & (0.75 > X[,1])) * (2.5*W[,1]) + 
+    ((0.75 <= X[,1]) & (1 > X[,1])) * (7.5*W[,1])
+)
+noise_sd <- sd(f_XW) / snr
+y <- f_XW + rnorm(n, 0, 1)*noise_sd
+
+# Split data into test and train sets
+test_set_pct <- 0.2
+n_test <- round(test_set_pct*n)
+n_train <- n - n_test
+test_inds <- sort(sample(1:n, n_test, replace = FALSE))
+train_inds <- (1:n)[!((1:n) %in% test_inds)]
+X_test <- as.data.frame(X[test_inds,])
+X_train <- as.data.frame(X[train_inds,])
+W_test <- W[test_inds,]
+W_train <- W[train_inds,]
+y_test <- y[test_inds]
+y_train <- y[train_inds]
+```
+
+## Sampling
+
+Define some high-level parameters, including number of chains to run and number of 
+samples per chain. Here we run 4 independent chains with 10 warm-start iterations 
+and 100 MCMC iterations each.
+
+```{r}
+num_chains <- 4
+num_gfr <- 10
+num_burnin <- 0
+num_mcmc <- 100
+num_trees <- 100
+```
+
+Run the sampler, storing the resulting BART objects in a list
+
+```{r}
+bart_models <- list()
+for (i in 1:num_chains) {
+    bart_models[[i]] <- stochtree::bart(
+        X_train = X_train, W_train = W_train, y_train = y_train, 
+        X_test = X_test, W_test = W_test, num_trees = num_trees, 
+        num_gfr = num_gfr, num_burnin = num_burnin, 
+        num_mcmc = num_mcmc, sample_sigma = T, sample_tau = T
+    )
+}
+```
+
+Now, if we want to combine the forests from each of these BART models into a 
+single forest, we can do so as follows
+
+```{r}
+json_string_list <- list()
+for (i in 1:num_chains) {
+    json_string_list[[i]] <- saveBARTModelToJsonString(bart_models[[i]])
+}
+combined_forests <- loadForestContainerCombinedJsonString(json_string_list, "forest_0")
+```
+
+We can predict from this combined forest as follows
+
+```{r}
+test_dataset <- createForestDataset(as.matrix(X_test), W_test)
+yhat_combined <- combined_forests$predict(test_dataset)
+```
+
+Compare to the original $\hat{y}$ values
+
+```{r}
+num_samples <- num_gfr+num_burnin+num_mcmc
+for (i in 1:num_chains) {
+    offset <- (i-1)*num_samples
+    inds_start <- offset + 1 + num_burnin + num_gfr
+    inds_end <- offset + num_samples
+    plot(rowMeans(bart_models[[i]]$y_hat_test), 
+         rowMeans(yhat_combined[,inds_start:inds_end]))
+}
+```
+
+
+# References

From 1ab2828e9dac19bab80346d6657d7875a79e9d0c Mon Sep 17 00:00:00 2001
From: Drew Herren
Date: Thu, 8 Aug 2024 18:01:59 -0700
Subject: [PATCH 05/41] Updated multichain vignette

---
 vignettes/MultiChain.Rmd | 83 ++++++++++++++++++++++++++++++++++++++--
 1 file changed, 79 insertions(+), 4 deletions(-)

diff --git a/vignettes/MultiChain.Rmd b/vignettes/MultiChain.Rmd
index 4c09a49b..13275117 100644
--- a/vignettes/MultiChain.Rmd
+++ b/vignettes/MultiChain.Rmd
@@ -34,15 +34,17 @@ Operationally, the above two approaches have the same implementation (setting
 `num_gfr` > 0 if warm-start initialization is desired), so this vignette will 
 demonstrate how to run a multi-chain sampler sequentially or in parallel. 
 
-To begin, load the `stochtree` package
+To begin, load `stochtree` and other necessary packages
 
 ```{r setup}
 library(stochtree)
+library(foreach)
+library(doParallel)
 ```
 
-# Demo 1: Supervised Learning, Sequential Multi Chain Sampler
+# Demo 1: Supervised Learning
 
-## Simulation
+## Data Simulation
 
 Simulate a simple partitioned linear model
 
@@ -77,7 +79,7 @@ y_test <- y[test_inds]
 y_train <- y[train_inds]
 ```
 
-## Sampling
+## Sampling Multiple Chains Sequentially
 
 Define some high-level parameters, including number of chains to run and number of 
 samples per chain. Here we run 4 independent chains with 10 warm-start iterations 
@@ -136,5 +138,78 @@ for (i in 1:num_chains) {
 }
 ```
 
+## Sampling Multiple Chains in Parallel
+
+We use the same high-level parameters as in the sequential demo.
+
+```{r}
+num_chains <- 4
+num_gfr <- 10
+num_burnin <- 0
+num_mcmc <- 100
+num_trees <- 100
+```
+
+In order to run this sampler in parallel, a parallel backend must be registered in your R environment. 
+The code below will register a parallel backend with access to as many cores as are available on your machine. 
+Note that we do not **evaluate** the code snippet below in order to interact nicely with CRAN / GitHub Actions environments.
+
+```{r, eval=FALSE}
+ncores <- parallel::detectCores()
+cl <- makeCluster(ncores)
+registerDoParallel(cl)
+```
+
+Run the sampler, storing the resulting BART objects in a list
+
+```{r}
+bart_models <- foreach (i = 1:num_chains) %dopar% {
+    random_seed <- i
+    stochtree::bart(
+        X_train = X_train, W_train = W_train, y_train = y_train, 
+        X_test = X_test, W_test = W_test, num_trees = num_trees, 
+        num_gfr = num_gfr, num_burnin = num_burnin, 
+        num_mcmc = num_mcmc, sample_sigma = T, sample_tau = T, 
+        random_seed = random_seed
+    )
+}
+```
+
+Close the parallel cluster (not evaluated here, as explained above). 
+ +```{r, eval=FALSE} +stopCluster(cl) +``` + +Now, if we want to combine the forests from each of these BART models into a +single forest, we can do so as follows + +```{r} +json_string_list <- list() +for (i in 1:num_chains) { + json_string_list[[i]] <- saveBARTModelToJsonString(bart_models[[i]]) +} +combined_forests <- loadForestContainerCombinedJsonString(json_string_list, "forest_0") +``` + +We can predict from this combined forest as follows + +```{r} +test_dataset <- createForestDataset(as.matrix(X_test), W_test) +yhat_combined <- combined_forests$predict(test_dataset) +``` + +Compare to the original $\hat{y}$ values + +```{r} +num_samples <- num_gfr+num_burnin+num_mcmc +for (i in 1:num_chains) { + offset <- (i-1)*num_samples + inds_start <- offset + 1 + num_burnin + num_gfr + inds_end <- offset + num_samples + plot(rowMeans(bart_models[[i]]$y_hat_test), + rowMeans(yhat_combined[,inds_start:inds_end])) +} +``` # References From 35be06771d09ae4ce6717fa2da4fb8bec85c7dac Mon Sep 17 00:00:00 2001 From: Drew Herren Date: Thu, 8 Aug 2024 18:02:22 -0700 Subject: [PATCH 06/41] Added functions to combine random effects samples from multiple JSON strings / objects --- NAMESPACE | 1 + R/cpp11.R | 20 +++++ R/random_effects.R | 35 ++++++++ R/serialization.R | 48 ++++++++++- include/stochtree/random_effects.h | 1 + man/RandomEffectSamples.Rd | 96 ++++++++++++++++++++++ man/loadRandomEffectSamplesCombinedJson.Rd | 27 ++++++ src/R_random_effects.cpp | 79 ++++++++++++++++++ src/cpp11.cpp | 42 ++++++++++ src/random_effects.cpp | 23 ++++++ 10 files changed, 371 insertions(+), 1 deletion(-) create mode 100644 man/loadRandomEffectSamplesCombinedJson.Rd diff --git a/NAMESPACE b/NAMESPACE index ecefca33..4029e17c 100644 --- a/NAMESPACE +++ b/NAMESPACE @@ -35,6 +35,7 @@ export(getRandomEffectSamples) export(loadForestContainerCombinedJson) export(loadForestContainerCombinedJsonString) export(loadForestContainerJson) +export(loadRandomEffectSamplesCombinedJson) export(loadRandomEffectSamplesJson) export(loadScalarJson) export(loadVectorJson) diff --git a/R/cpp11.R b/R/cpp11.R index 4debd218..a6d060fd 100644 --- a/R/cpp11.R +++ b/R/cpp11.R @@ -96,6 +96,26 @@ rfx_group_ids_from_json_cpp <- function(json_ptr, rfx_label) { .Call(`_stochtree_rfx_group_ids_from_json_cpp`, json_ptr, rfx_label) } +rfx_container_append_from_json_cpp <- function(rfx_container_ptr, json_ptr, rfx_label) { + invisible(.Call(`_stochtree_rfx_container_append_from_json_cpp`, rfx_container_ptr, json_ptr, rfx_label)) +} + +rfx_container_from_json_string_cpp <- function(json_string, rfx_label) { + .Call(`_stochtree_rfx_container_from_json_string_cpp`, json_string, rfx_label) +} + +rfx_label_mapper_from_json_string_cpp <- function(json_string, rfx_label) { + .Call(`_stochtree_rfx_label_mapper_from_json_string_cpp`, json_string, rfx_label) +} + +rfx_group_ids_from_json_string_cpp <- function(json_string, rfx_label) { + .Call(`_stochtree_rfx_group_ids_from_json_string_cpp`, json_string, rfx_label) +} + +rfx_container_append_from_json_string_cpp <- function(rfx_container_ptr, json_string, rfx_label) { + invisible(.Call(`_stochtree_rfx_container_append_from_json_string_cpp`, rfx_container_ptr, json_string, rfx_label)) +} + rfx_model_cpp <- function(num_components, num_groups) { .Call(`_stochtree_rfx_model_cpp`, num_components, num_groups) } diff --git a/R/random_effects.R b/R/random_effects.R index dbcdbbb4..f9d0eaf9 100644 --- a/R/random_effects.R +++ b/R/random_effects.R @@ -53,6 +53,41 @@ RandomEffectSamples <- R6::R6Class( 
self$training_group_ids <- rfx_group_ids_from_json_cpp(json_object$json_ptr, json_rfx_groupids_label)
     },
+    
+    #' @description
+    #' Append random effect draws to `RandomEffectSamples` object from a json object
+    #' @param json_object Object of class `CppJson`
+    #' @param json_rfx_container_label Label referring to a particular rfx sample container (i.e. "random_effect_container_0") in the overall json hierarchy
+    #' @param json_rfx_mapper_label Label referring to a particular rfx label mapper (i.e. "random_effect_label_mapper_0") in the overall json hierarchy
+    #' @param json_rfx_groupids_label Label referring to a particular set of rfx group IDs (i.e. "random_effect_groupids_0") in the overall json hierarchy
+    #' @return NULL (updates object in-place)
+    append_from_json = function(json_object, json_rfx_container_label, json_rfx_mapper_label, json_rfx_groupids_label) {
+        rfx_container_append_from_json_cpp(self$rfx_container_ptr, json_object$json_ptr, json_rfx_container_label)
+    },
+    
+    #' @description
+    #' Construct RandomEffectSamples object from a json object
+    #' @param json_string JSON string which parses into object of class `CppJson`
+    #' @param json_rfx_container_label Label referring to a particular rfx sample container (i.e. "random_effect_container_0") in the overall json hierarchy
+    #' @param json_rfx_mapper_label Label referring to a particular rfx label mapper (i.e. "random_effect_label_mapper_0") in the overall json hierarchy
+    #' @param json_rfx_groupids_label Label referring to a particular set of rfx group IDs (i.e. "random_effect_groupids_0") in the overall json hierarchy
+    #' @return A new `RandomEffectSamples` object.
+    load_from_json_string = function(json_string, json_rfx_container_label, json_rfx_mapper_label, json_rfx_groupids_label) {
+        self$rfx_container_ptr <- rfx_container_from_json_string_cpp(json_string, json_rfx_container_label)
+        self$label_mapper_ptr <- rfx_label_mapper_from_json_string_cpp(json_string, json_rfx_mapper_label)
+        self$training_group_ids <- rfx_group_ids_from_json_string_cpp(json_string, json_rfx_groupids_label)
+    },
+    
+    #' @description
+    #' Append random effect draws to `RandomEffectSamples` object from a json object
+    #' @param json_string JSON string which parses into object of class `CppJson`
+    #' @param json_rfx_container_label Label referring to a particular rfx sample container (i.e. "random_effect_container_0") in the overall json hierarchy
+    #' @param json_rfx_mapper_label Label referring to a particular rfx label mapper (i.e. "random_effect_label_mapper_0") in the overall json hierarchy
+    #' @param json_rfx_groupids_label Label referring to a particular set of rfx group IDs (i.e. "random_effect_groupids_0") in the overall json hierarchy
+    #' @return NULL (updates object in-place)
+    append_from_json_string = function(json_string, json_rfx_container_label, json_rfx_mapper_label, json_rfx_groupids_label) {
+        rfx_container_append_from_json_string_cpp(self$rfx_container_ptr, json_string, json_rfx_container_label)
+    },
+    
     #' @description
     #' Predict random effects for each observation implied by `rfx_group_ids` and `rfx_basis`.
     #' If a random effects model is "intercept-only" the `rfx_basis` will be a vector of ones of size `length(rfx_group_ids)`. 
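
As a quick orientation for the additions above: the following is a minimal sketch of the intended workflow, mirroring the forest-combining pattern from the multi-chain vignette. Here `bcf_models`, `rfx_group_ids`, and `rfx_basis` are hypothetical user-supplied objects (a list of BCF fits with random effects sharing one JSON schema, plus group IDs and a basis for prediction); `loadRandomEffectSamplesCombinedJsonString` is the string-based loader added in the R/serialization.R diff that follows.

```r
# Assumption: bcf_models is a list of fitted BCF models with random effects
# Serialize each fitted model to an in-memory JSON string
json_string_list <- lapply(bcf_models, saveBCFModelToJsonString)

# Combine the first random effects term ("random_effect_*_0") across models
combined_rfx <- loadRandomEffectSamplesCombinedJsonString(json_string_list, 0)

# Predict combined random effect draws for (assumed) group IDs and basis
rfx_preds <- combined_rfx$predict(rfx_group_ids, rfx_basis)
```
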
diff --git a/R/serialization.R b/R/serialization.R
index cf0ba267..6d25e802 100644
--- a/R/serialization.R
+++ b/R/serialization.R
@@ -332,7 +332,7 @@ loadForestContainerJson <- function(json_object, json_forest_label) {
 loadForestContainerCombinedJson <- function(json_object_list, json_forest_label) {
     invisible(output <- ForestSamples$new(0,1,T))
     for (i in 1:length(json_object_list)) {
-        json_object <- json_object_list[i]
+        json_object <- json_object_list[[i]]
         if (i == 1) {
             output$load_from_json(json_object, json_forest_label)
         } else {
@@ -378,6 +378,52 @@ loadRandomEffectSamplesJson <- function(json_object, json_rfx_num) {
     return(output)
 }
 
+#' Combine multiple JSON model objects containing random effects (with the same hierarchy / schema) into a single container
+#'
+#' @param json_object_list List of objects of class `CppJson`
+#' @param json_rfx_num Integer index indicating the position of the random effects term to be unpacked
+#'
+#' @return `RandomEffectSamples` object
+#' @export
+loadRandomEffectSamplesCombinedJson <- function(json_object_list, json_rfx_num) {
+    json_rfx_container_label <- paste0("random_effect_container_", json_rfx_num)
+    json_rfx_mapper_label <- paste0("random_effect_label_mapper_", json_rfx_num)
+    json_rfx_groupids_label <- paste0("random_effect_groupids_", json_rfx_num)
+    invisible(output <- RandomEffectSamples$new())
+    for (i in 1:length(json_object_list)) {
+        json_object <- json_object_list[[i]]
+        if (i == 1) {
+            output$load_from_json(json_object, json_rfx_container_label, json_rfx_mapper_label, json_rfx_groupids_label)
+        } else {
+            output$append_from_json(json_object, json_rfx_container_label, json_rfx_mapper_label, json_rfx_groupids_label)
+        }
+    }
+    return(output)
+}
+
+#' Combine multiple JSON strings representing model objects containing random effects (with the same hierarchy / schema) into a single container
+#'
+#' @param json_string_list List of strings that parse into objects of type `CppJson`
+#' @param json_rfx_num Integer index indicating the position of the random effects term to be unpacked
+#'
+#' @return `RandomEffectSamples` object
+#' @export
+loadRandomEffectSamplesCombinedJsonString <- function(json_string_list, json_rfx_num) {
+    json_rfx_container_label <- paste0("random_effect_container_", json_rfx_num)
+    json_rfx_mapper_label <- paste0("random_effect_label_mapper_", json_rfx_num)
+    json_rfx_groupids_label <- paste0("random_effect_groupids_", json_rfx_num)
+    invisible(output <- RandomEffectSamples$new())
+    for (i in 1:length(json_string_list)) {
+        json_string <- json_string_list[[i]]
+        if (i == 1) {
+            output$load_from_json_string(json_string, json_rfx_container_label, json_rfx_mapper_label, json_rfx_groupids_label)
+        } else {
+            output$append_from_json_string(json_string, json_rfx_container_label, json_rfx_mapper_label, json_rfx_groupids_label)
+        }
+    }
+    return(output)
+}
+
 #' Load a vector from json
 #'
 #' @param json_object Object of class `CppJson`
diff --git a/include/stochtree/random_effects.h b/include/stochtree/random_effects.h
index 7d7a65c0..623a1103 100644
--- a/include/stochtree/random_effects.h
+++ b/include/stochtree/random_effects.h
@@ -279,6 +279,7 @@ class RandomEffectsContainer {
   std::vector<double>& GetSigma() {return sigma_xi_;}
   nlohmann::json to_json();
   void from_json(const nlohmann::json& rfx_container_json);
+  void append_from_json(const nlohmann::json& rfx_container_json);
  private:
   int num_samples_;
   int num_components_;
diff --git a/man/RandomEffectSamples.Rd b/man/RandomEffectSamples.Rd
index 55887c03..90981546 100644
--- a/man/RandomEffectSamples.Rd
+++ 
b/man/RandomEffectSamples.Rd @@ -28,6 +28,9 @@ needed for prediction / serialization \item \href{#method-RandomEffectSamples-new}{\code{RandomEffectSamples$new()}} \item \href{#method-RandomEffectSamples-load_in_session}{\code{RandomEffectSamples$load_in_session()}} \item \href{#method-RandomEffectSamples-load_from_json}{\code{RandomEffectSamples$load_from_json()}} +\item \href{#method-RandomEffectSamples-append_from_json}{\code{RandomEffectSamples$append_from_json()}} +\item \href{#method-RandomEffectSamples-load_from_json_string}{\code{RandomEffectSamples$load_from_json_string()}} +\item \href{#method-RandomEffectSamples-append_from_json_string}{\code{RandomEffectSamples$append_from_json_string()}} \item \href{#method-RandomEffectSamples-predict}{\code{RandomEffectSamples$predict()}} \item \href{#method-RandomEffectSamples-extract_parameter_samples}{\code{RandomEffectSamples$extract_parameter_samples()}} \item \href{#method-RandomEffectSamples-extract_label_mapping}{\code{RandomEffectSamples$extract_label_mapping()}} @@ -106,6 +109,99 @@ A new \code{RandomEffectSamples} object. } } \if{html}{\out{
}} +\if{html}{\out{}} +\if{latex}{\out{\hypertarget{method-RandomEffectSamples-append_from_json}{}}} +\subsection{Method \code{append_from_json()}}{ +Append random effect draws to \code{RandomEffectSamples} object from a json object +\subsection{Usage}{ +\if{html}{\out{
}}\preformatted{RandomEffectSamples$append_from_json( + json_object, + json_rfx_container_label, + json_rfx_mapper_label, + json_rfx_groupids_label +)}\if{html}{\out{
}} +} + +\subsection{Arguments}{ +\if{html}{\out{
}} +\describe{ +\item{\code{json_object}}{Object of class \code{CppJson}} + +\item{\code{json_rfx_container_label}}{Label referring to a particular rfx sample container (i.e. "random_effect_container_0") in the overall json hierarchy} + +\item{\code{json_rfx_mapper_label}}{Label referring to a particular rfx label mapper (i.e. "random_effect_label_mapper_0") in the overall json hierarchy} + +\item{\code{json_rfx_groupids_label}}{Label referring to a particular set of rfx group IDs (i.e. "random_effect_groupids_0") in the overall json hierarchy} +} +\if{html}{\out{
}} +} +\subsection{Returns}{ +NULL (updates object in-place) +} +} +\if{html}{\out{
}} +\if{html}{\out{}} +\if{latex}{\out{\hypertarget{method-RandomEffectSamples-load_from_json_string}{}}} +\subsection{Method \code{load_from_json_string()}}{ +Construct RandomEffectSamples object from a json object +\subsection{Usage}{ +\if{html}{\out{
}}\preformatted{RandomEffectSamples$load_from_json_string( + json_string, + json_rfx_container_label, + json_rfx_mapper_label, + json_rfx_groupids_label +)}\if{html}{\out{
}} +} + +\subsection{Arguments}{ +\if{html}{\out{
}} +\describe{ +\item{\code{json_string}}{JSON string which parses into object of class \code{CppJson}} + +\item{\code{json_rfx_container_label}}{Label referring to a particular rfx sample container (i.e. "random_effect_container_0") in the overall json hierarchy} + +\item{\code{json_rfx_mapper_label}}{Label referring to a particular rfx label mapper (i.e. "random_effect_label_mapper_0") in the overall json hierarchy} + +\item{\code{json_rfx_groupids_label}}{Label referring to a particular set of rfx group IDs (i.e. "random_effect_groupids_0") in the overall json hierarchy} +} +\if{html}{\out{
}} +} +\subsection{Returns}{ +A new \code{RandomEffectSamples} object. +} +} +\if{html}{\out{
}} +\if{html}{\out{}} +\if{latex}{\out{\hypertarget{method-RandomEffectSamples-append_from_json_string}{}}} +\subsection{Method \code{append_from_json_string()}}{ +Append random effect draws to \code{RandomEffectSamples} object from a json object +\subsection{Usage}{ +\if{html}{\out{
}}\preformatted{RandomEffectSamples$append_from_json_string( + json_string, + json_rfx_container_label, + json_rfx_mapper_label, + json_rfx_groupids_label +)}\if{html}{\out{
}} +} + +\subsection{Arguments}{ +\if{html}{\out{
}} +\describe{ +\item{\code{json_string}}{JSON string which parses into object of class \code{CppJson}} + +\item{\code{json_rfx_container_label}}{Label referring to a particular rfx sample container (i.e. "random_effect_container_0") in the overall json hierarchy} + +\item{\code{json_rfx_mapper_label}}{Label referring to a particular rfx label mapper (i.e. "random_effect_label_mapper_0") in the overall json hierarchy} + +\item{\code{json_rfx_groupids_label}}{Label referring to a particular set of rfx group IDs (i.e. "random_effect_groupids_0") in the overall json hierarchy} +} +\if{html}{\out{
}} +} +\subsection{Returns}{ +NULL (updates object in-place) +} +} +\if{html}{\out{
}} \if{html}{\out{}} \if{latex}{\out{\hypertarget{method-RandomEffectSamples-predict}{}}} \subsection{Method \code{predict()}}{ diff --git a/man/loadRandomEffectSamplesCombinedJson.Rd b/man/loadRandomEffectSamplesCombinedJson.Rd new file mode 100644 index 00000000..ac4c1723 --- /dev/null +++ b/man/loadRandomEffectSamplesCombinedJson.Rd @@ -0,0 +1,27 @@ +% Generated by roxygen2: do not edit by hand +% Please edit documentation in R/serialization.R +\name{loadRandomEffectSamplesCombinedJson} +\alias{loadRandomEffectSamplesCombinedJson} +\title{Combine multiple JSON model objects containing random effects (with the same hierarchy / schema) into a single container} +\usage{ +loadRandomEffectSamplesCombinedJson(json_string_list, json_rfx_num) + +loadRandomEffectSamplesCombinedJson(json_string_list, json_rfx_num) +} +\arguments{ +\item{json_string_list}{List of objects of class \code{CppJson}} + +\item{json_rfx_num}{Integer index indicating the position of the random effects term to be unpacked} + +\item{json_object_list}{List of objects of class \code{CppJson}} +} +\value{ +\code{RandomEffectSamples} object + +\code{RandomEffectSamples} object +} +\description{ +Combine multiple JSON model objects containing random effects (with the same hierarchy / schema) into a single container + +Combine multiple JSON strings representing model objects containing random effects (with the same hierarchy / schema) into a single container +} diff --git a/src/R_random_effects.cpp b/src/R_random_effects.cpp index 463b8e97..ccb3aa98 100644 --- a/src/R_random_effects.cpp +++ b/src/R_random_effects.cpp @@ -69,6 +69,85 @@ cpp11::writable::integers rfx_group_ids_from_json_cpp(cpp11::external_pointer rfx_container_ptr, cpp11::external_pointer json_ptr, std::string rfx_label) { + // Extract the random effect container's json + nlohmann::json rfx_json = json_ptr->at("random_effects").at(rfx_label); + + // Reset the forest sample container using the json + rfx_container_ptr->append_from_json(rfx_json); +} + +[[cpp11::register]] +cpp11::external_pointer rfx_container_from_json_string_cpp(std::string json_string, std::string rfx_label) { + // Create smart pointer to newly allocated object + std::unique_ptr rfx_container_ptr_ = std::make_unique(); + + // Create a nlohmann::json object from the string + nlohmann::json json_object = nlohmann::json::parse(json_string); + + // Extract the random effect container's json + nlohmann::json rfx_json = json_object.at("random_effects").at(rfx_label); + + // Reset the forest sample container using the json + rfx_container_ptr_->Reset(); + rfx_container_ptr_->from_json(rfx_json); + + // Release management of the pointer to R session + return cpp11::external_pointer(rfx_container_ptr_.release()); +} + +[[cpp11::register]] +cpp11::external_pointer rfx_label_mapper_from_json_string_cpp(std::string json_string, std::string rfx_label) { + // Create smart pointer to newly allocated object + std::unique_ptr label_mapper_ptr_ = std::make_unique(); + + // Create a nlohmann::json object from the string + nlohmann::json json_object = nlohmann::json::parse(json_string); + + // Extract the label mapper's json + nlohmann::json rfx_json = json_object.at("random_effects").at(rfx_label); + + // Reset the label mapper using the json + label_mapper_ptr_->Reset(); + label_mapper_ptr_->from_json(rfx_json); + + // Release management of the pointer to R session + return cpp11::external_pointer(label_mapper_ptr_.release()); +} + +[[cpp11::register]] +cpp11::writable::integers 
rfx_group_ids_from_json_string_cpp(std::string json_string, std::string rfx_label) { + // Create smart pointer to newly allocated object + cpp11::writable::integers output; + + // Create a nlohmann::json object from the string + nlohmann::json json_object = nlohmann::json::parse(json_string); + + // Extract the groupids' json + nlohmann::json rfx_json = json_object.at("random_effects").at(rfx_label); + + // Reset the forest sample container using the json + int num_groups = rfx_json.size(); + for (int i = 0; i < num_groups; i++) { + output.push_back(rfx_json.at(i)); + } + + return output; +} + +[[cpp11::register]] +void rfx_container_append_from_json_string_cpp(cpp11::external_pointer rfx_container_ptr, std::string json_string, std::string rfx_label) { + // Create a nlohmann::json object from the string + nlohmann::json json_object = nlohmann::json::parse(json_string); + + // Extract the random effect container's json + nlohmann::json rfx_json = json_object.at("random_effects").at(rfx_label); + + // Reset the forest sample container using the json + rfx_container_ptr->append_from_json(rfx_json); +} + [[cpp11::register]] cpp11::external_pointer rfx_model_cpp(int num_components, int num_groups) { // Create smart pointer to newly allocated object diff --git a/src/cpp11.cpp b/src/cpp11.cpp index ca2f168e..b4293c7c 100644 --- a/src/cpp11.cpp +++ b/src/cpp11.cpp @@ -181,6 +181,43 @@ extern "C" SEXP _stochtree_rfx_group_ids_from_json_cpp(SEXP json_ptr, SEXP rfx_l END_CPP11 } // R_random_effects.cpp +void rfx_container_append_from_json_cpp(cpp11::external_pointer rfx_container_ptr, cpp11::external_pointer json_ptr, std::string rfx_label); +extern "C" SEXP _stochtree_rfx_container_append_from_json_cpp(SEXP rfx_container_ptr, SEXP json_ptr, SEXP rfx_label) { + BEGIN_CPP11 + rfx_container_append_from_json_cpp(cpp11::as_cpp>>(rfx_container_ptr), cpp11::as_cpp>>(json_ptr), cpp11::as_cpp>(rfx_label)); + return R_NilValue; + END_CPP11 +} +// R_random_effects.cpp +cpp11::external_pointer rfx_container_from_json_string_cpp(std::string json_string, std::string rfx_label); +extern "C" SEXP _stochtree_rfx_container_from_json_string_cpp(SEXP json_string, SEXP rfx_label) { + BEGIN_CPP11 + return cpp11::as_sexp(rfx_container_from_json_string_cpp(cpp11::as_cpp>(json_string), cpp11::as_cpp>(rfx_label))); + END_CPP11 +} +// R_random_effects.cpp +cpp11::external_pointer rfx_label_mapper_from_json_string_cpp(std::string json_string, std::string rfx_label); +extern "C" SEXP _stochtree_rfx_label_mapper_from_json_string_cpp(SEXP json_string, SEXP rfx_label) { + BEGIN_CPP11 + return cpp11::as_sexp(rfx_label_mapper_from_json_string_cpp(cpp11::as_cpp>(json_string), cpp11::as_cpp>(rfx_label))); + END_CPP11 +} +// R_random_effects.cpp +cpp11::writable::integers rfx_group_ids_from_json_string_cpp(std::string json_string, std::string rfx_label); +extern "C" SEXP _stochtree_rfx_group_ids_from_json_string_cpp(SEXP json_string, SEXP rfx_label) { + BEGIN_CPP11 + return cpp11::as_sexp(rfx_group_ids_from_json_string_cpp(cpp11::as_cpp>(json_string), cpp11::as_cpp>(rfx_label))); + END_CPP11 +} +// R_random_effects.cpp +void rfx_container_append_from_json_string_cpp(cpp11::external_pointer rfx_container_ptr, std::string json_string, std::string rfx_label); +extern "C" SEXP _stochtree_rfx_container_append_from_json_string_cpp(SEXP rfx_container_ptr, SEXP json_string, SEXP rfx_label) { + BEGIN_CPP11 + rfx_container_append_from_json_string_cpp(cpp11::as_cpp>>(rfx_container_ptr), cpp11::as_cpp>(json_string), cpp11::as_cpp>(rfx_label)); + 
return R_NilValue; + END_CPP11 +} +// R_random_effects.cpp cpp11::external_pointer rfx_model_cpp(int num_components, int num_groups); extern "C" SEXP _stochtree_rfx_model_cpp(SEXP num_components, SEXP num_groups) { BEGIN_CPP11 @@ -996,8 +1033,11 @@ static const R_CallMethodDef CallEntries[] = { {"_stochtree_predict_forest_cpp", (DL_FUNC) &_stochtree_predict_forest_cpp, 2}, {"_stochtree_predict_forest_raw_cpp", (DL_FUNC) &_stochtree_predict_forest_raw_cpp, 2}, {"_stochtree_predict_forest_raw_single_forest_cpp", (DL_FUNC) &_stochtree_predict_forest_raw_single_forest_cpp, 3}, + {"_stochtree_rfx_container_append_from_json_cpp", (DL_FUNC) &_stochtree_rfx_container_append_from_json_cpp, 3}, + {"_stochtree_rfx_container_append_from_json_string_cpp", (DL_FUNC) &_stochtree_rfx_container_append_from_json_string_cpp, 3}, {"_stochtree_rfx_container_cpp", (DL_FUNC) &_stochtree_rfx_container_cpp, 2}, {"_stochtree_rfx_container_from_json_cpp", (DL_FUNC) &_stochtree_rfx_container_from_json_cpp, 2}, + {"_stochtree_rfx_container_from_json_string_cpp", (DL_FUNC) &_stochtree_rfx_container_from_json_string_cpp, 2}, {"_stochtree_rfx_container_get_alpha_cpp", (DL_FUNC) &_stochtree_rfx_container_get_alpha_cpp, 1}, {"_stochtree_rfx_container_get_beta_cpp", (DL_FUNC) &_stochtree_rfx_container_get_beta_cpp, 1}, {"_stochtree_rfx_container_get_sigma_cpp", (DL_FUNC) &_stochtree_rfx_container_get_sigma_cpp, 1}, @@ -1014,8 +1054,10 @@ static const R_CallMethodDef CallEntries[] = { {"_stochtree_rfx_dataset_has_variance_weights_cpp", (DL_FUNC) &_stochtree_rfx_dataset_has_variance_weights_cpp, 1}, {"_stochtree_rfx_dataset_num_rows_cpp", (DL_FUNC) &_stochtree_rfx_dataset_num_rows_cpp, 1}, {"_stochtree_rfx_group_ids_from_json_cpp", (DL_FUNC) &_stochtree_rfx_group_ids_from_json_cpp, 2}, + {"_stochtree_rfx_group_ids_from_json_string_cpp", (DL_FUNC) &_stochtree_rfx_group_ids_from_json_string_cpp, 2}, {"_stochtree_rfx_label_mapper_cpp", (DL_FUNC) &_stochtree_rfx_label_mapper_cpp, 1}, {"_stochtree_rfx_label_mapper_from_json_cpp", (DL_FUNC) &_stochtree_rfx_label_mapper_from_json_cpp, 2}, + {"_stochtree_rfx_label_mapper_from_json_string_cpp", (DL_FUNC) &_stochtree_rfx_label_mapper_from_json_string_cpp, 2}, {"_stochtree_rfx_label_mapper_to_list_cpp", (DL_FUNC) &_stochtree_rfx_label_mapper_to_list_cpp, 1}, {"_stochtree_rfx_model_cpp", (DL_FUNC) &_stochtree_rfx_model_cpp, 2}, {"_stochtree_rfx_model_predict_cpp", (DL_FUNC) &_stochtree_rfx_model_predict_cpp, 3}, diff --git a/src/random_effects.cpp b/src/random_effects.cpp index bc746e81..efb141cf 100644 --- a/src/random_effects.cpp +++ b/src/random_effects.cpp @@ -294,4 +294,27 @@ void RandomEffectsContainer::from_json(const nlohmann::json& rfx_container_json) } } +void RandomEffectsContainer::append_from_json(const nlohmann::json& rfx_container_json) { + CHECK_EQ(this->num_components_, rfx_container_json.at("num_components")); + CHECK_EQ(this->num_groups_, rfx_container_json.at("num_groups")); + + // Update internal sample count and extract size of parameter vectors + int new_num_samples = rfx_container_json.at("num_samples"); + this->num_samples_ += new_num_samples; + int beta_size = rfx_container_json.at("beta_size"); + int alpha_size = rfx_container_json.at("alpha_size"); + + // Unpack beta and xi + for (int i = 0; i < beta_size; i++) { + beta_.push_back(rfx_container_json.at("beta").at(i)); + xi_.push_back(rfx_container_json.at("xi").at(i)); + } + + // Unpack alpha and sigma_xi + for (int i = 0; i < alpha_size; i++) { + alpha_.push_back(rfx_container_json.at("alpha").at(i)); + 
sigma_xi_.push_back(rfx_container_json.at("sigma_xi").at(i)); + } +} + } // namespace StochTree From be80a1c32a12558a0ae5755da6087afc2e0f1dd0 Mon Sep 17 00:00:00 2001 From: Drew Herren Date: Fri, 9 Aug 2024 01:18:09 -0500 Subject: [PATCH 07/41] Updated multichain code and demos --- NAMESPACE | 3 + R/bart.R | 268 ++++++++++++++++++ R/serialization.R | 6 +- _pkgdown.yml | 11 + man/createBARTModelFromCombinedJson.Rd | 44 +++ man/createBARTModelFromCombinedJsonString.Rd | 44 +++ man/loadRandomEffectSamplesCombinedJson.Rd | 12 +- ...adRandomEffectSamplesCombinedJsonString.Rd | 19 ++ vignettes/MultiChain.Rmd | 63 ++-- 9 files changed, 432 insertions(+), 38 deletions(-) create mode 100644 man/createBARTModelFromCombinedJson.Rd create mode 100644 man/createBARTModelFromCombinedJsonString.Rd create mode 100644 man/loadRandomEffectSamplesCombinedJsonString.Rd diff --git a/NAMESPACE b/NAMESPACE index 4029e17c..eb7284d2 100644 --- a/NAMESPACE +++ b/NAMESPACE @@ -10,6 +10,8 @@ export(computeForestKernels) export(computeForestLeafIndices) export(convertBARTModelToJson) export(convertBCFModelToJson) +export(createBARTModelFromCombinedJson) +export(createBARTModelFromCombinedJsonString) export(createBARTModelFromJson) export(createBARTModelFromJsonFile) export(createBARTModelFromJsonString) @@ -36,6 +38,7 @@ export(loadForestContainerCombinedJson) export(loadForestContainerCombinedJsonString) export(loadForestContainerJson) export(loadRandomEffectSamplesCombinedJson) +export(loadRandomEffectSamplesCombinedJsonString) export(loadRandomEffectSamplesJson) export(loadScalarJson) export(loadVectorJson) diff --git a/R/bart.R b/R/bart.R index 30dd0e70..39ec45f6 100644 --- a/R/bart.R +++ b/R/bart.R @@ -1033,3 +1033,271 @@ createBARTModelFromJsonString <- function(json_string){ return(bart_object) } + +#' Convert a list of (in-memory) JSON representations of a BART model to a single combined BART model object +#' which can be used for prediction, etc... 
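+#'
+#' Sample-independent metadata (covariate preprocessing information and
+#' model settings) is taken from the first model in the list; all models
+#' supplied are therefore assumed to have been sampled with the same data
+#' preprocessing and model configuration.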
+#' +#' @param json_object_list List of objects of type `CppJson` containing Json representation of a BART model +#' +#' @return Object of type `bartmodel` +#' @export +#' +#' @examples +#' n <- 100 +#' p <- 5 +#' X <- matrix(runif(n*p), ncol = p) +#' f_XW <- ( +#' ((0 <= X[,1]) & (0.25 > X[,1])) * (-7.5) + +#' ((0.25 <= X[,1]) & (0.5 > X[,1])) * (-2.5) + +#' ((0.5 <= X[,1]) & (0.75 > X[,1])) * (2.5) + +#' ((0.75 <= X[,1]) & (1 > X[,1])) * (7.5) +#' ) +#' noise_sd <- 1 +#' y <- f_XW + rnorm(n, 0, noise_sd) +#' test_set_pct <- 0.2 +#' n_test <- round(test_set_pct*n) +#' n_train <- n - n_test +#' test_inds <- sort(sample(1:n, n_test, replace = FALSE)) +#' train_inds <- (1:n)[!((1:n) %in% test_inds)] +#' X_test <- X[test_inds,] +#' X_train <- X[train_inds,] +#' y_test <- y[test_inds] +#' y_train <- y[train_inds] +#' bart_model <- bart(X_train = X_train, y_train = y_train) +#' # bart_json <- list(convertBARTModelToJson(bart_model)) +#' # bart_model_roundtrip <- createBARTModelFromCombinedJson(bart_json) +createBARTModelFromCombinedJson <- function(json_object_list){ + # Initialize the BCF model + output <- list() + + # Unpack the forests + output[["forests"]] <- loadForestContainerCombinedJson(json_object_list, "forest_0") + + # For scalar / preprocessing details which aren't sample-dependent, + # defer to the first json + json_object_default <- json_object_list[[1]] + + # Unpack metadata + train_set_metadata = list() + train_set_metadata[["num_numeric_vars"]] <- json_object_default$get_scalar("num_numeric_vars") + train_set_metadata[["num_ordered_cat_vars"]] <- json_object_default$get_scalar("num_ordered_cat_vars") + train_set_metadata[["num_unordered_cat_vars"]] <- json_object_default$get_scalar("num_unordered_cat_vars") + if (train_set_metadata[["num_numeric_vars"]] > 0) { + train_set_metadata[["numeric_vars"]] <- json_object_default$get_string_vector("numeric_vars") + } + if (train_set_metadata[["num_ordered_cat_vars"]] > 0) { + train_set_metadata[["ordered_cat_vars"]] <- json_object_default$get_string_vector("ordered_cat_vars") + train_set_metadata[["ordered_unique_levels"]] <- json_object_default$get_string_list("ordered_unique_levels", train_set_metadata[["ordered_cat_vars"]]) + } + if (train_set_metadata[["num_unordered_cat_vars"]] > 0) { + train_set_metadata[["unordered_cat_vars"]] <- json_object_default$get_string_vector("unordered_cat_vars") + train_set_metadata[["unordered_unique_levels"]] <- json_object_default$get_string_list("unordered_unique_levels", train_set_metadata[["unordered_cat_vars"]]) + } + output[["train_set_metadata"]] <- train_set_metadata + + # Unpack model params + model_params = list() + model_params[["outcome_scale"]] <- json_object_default$get_scalar("outcome_scale") + model_params[["outcome_mean"]] <- json_object_default$get_scalar("outcome_mean") + model_params[["sample_sigma"]] <- json_object_default$get_boolean("sample_sigma") + model_params[["sample_tau"]] <- json_object_default$get_boolean("sample_tau") + model_params[["has_rfx"]] <- json_object_default$get_boolean("has_rfx") + model_params[["has_rfx_basis"]] <- json_object_default$get_boolean("has_rfx_basis") + model_params[["num_rfx_basis"]] <- json_object_default$get_scalar("num_rfx_basis") + model_params[["num_covariates"]] <- json_object_default$get_scalar("num_covariates") + model_params[["num_basis"]] <- json_object_default$get_scalar("num_basis") + model_params[["requires_basis"]] <- json_object_default$get_boolean("requires_basis") + + # Combine values that are sample-specific + keep_index_offset 
<- 0 + keep_indices <- c() + for (i in 1:length(json_object_list)) { + json_object <- json_object_list[[i]] + if (i == 1) { + model_params[["num_gfr"]] <- json_object$get_scalar("num_gfr") + model_params[["num_burnin"]] <- json_object$get_scalar("num_burnin") + model_params[["num_mcmc"]] <- json_object$get_scalar("num_mcmc") + model_params[["num_samples"]] <- json_object$get_scalar("num_samples") + keep_indices <- c(keep_indices, keep_index_offset + json_object$get_vector("keep_indices")) + } else { + prev_json <- json_object_list[[i-1]] + model_params[["num_gfr"]] <- model_params[["num_gfr"]] + json_object$get_scalar("num_gfr") + model_params[["num_burnin"]] <- model_params[["num_burnin"]] + json_object$get_scalar("num_burnin") + model_params[["num_mcmc"]] <- model_params[["num_mcmc"]] + json_object$get_scalar("num_mcmc") + model_params[["num_samples"]] <- model_params[["num_samples"]] + json_object$get_scalar("num_samples") + keep_index_offset <- keep_index_offset + prev_json$get_scalar("num_samples") + keep_indices <- c(keep_indices, keep_index_offset + json_object$get_vector("keep_indices")) + } + } + output[["keep_indices"]] <- keep_indices + output[["model_params"]] <- model_params + + # Unpack sampled parameters + if (model_params[["sample_sigma"]]) { + for (i in 1:length(json_object_list)) { + json_object <- json_object_list[[i]] + if (i == 1) { + output[["sigma2_samples"]] <- json_object$get_vector("sigma2_samples", "parameters") + } else { + output[["sigma2_samples"]] <- c(output[["sigma2_samples"]], json_object$get_vector("sigma2_samples", "parameters")) + } + } + } + if (model_params[["sample_tau"]]) { + for (i in 1:length(json_object_list)) { + json_object <- json_object_list[[i]] + if (i == 1) { + output[["tau_samples"]] <- json_object$get_vector("tau_samples", "parameters") + } else { + output[["tau_samples"]] <- c(output[["tau_samples"]], json_object$get_vector("tau_samples", "parameters")) + } + } + } + + # Unpack random effects + if (model_params[["has_rfx"]]) { + output[["rfx_unique_group_ids"]] <- json_object_default$get_string_vector("rfx_unique_group_ids") + output[["rfx_samples"]] <- loadRandomEffectSamplesCombinedJson(json_object_list, 0) + } + + class(output) <- "bartmodel" + return(output) +} + +#' Convert a list of (in-memory) JSON strings that represent BART models to a single combined BART model object +#' which can be used for prediction, etc... 
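+#'
+#' Each JSON string is first parsed into a `CppJson` object (via
+#' `createCppJsonString()`); sample-independent metadata is then taken
+#' from the first model in the list, so all models supplied are assumed
+#' to share the same data preprocessing and model configuration.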
+#' +#' @param json_string_list List of JSON strings which can be parsed to objects of type `CppJson` containing Json representation of a BART model +#' +#' @return Object of type `bartmodel` +#' @export +#' +#' @examples +#' n <- 100 +#' p <- 5 +#' X <- matrix(runif(n*p), ncol = p) +#' f_XW <- ( +#' ((0 <= X[,1]) & (0.25 > X[,1])) * (-7.5) + +#' ((0.25 <= X[,1]) & (0.5 > X[,1])) * (-2.5) + +#' ((0.5 <= X[,1]) & (0.75 > X[,1])) * (2.5) + +#' ((0.75 <= X[,1]) & (1 > X[,1])) * (7.5) +#' ) +#' noise_sd <- 1 +#' y <- f_XW + rnorm(n, 0, noise_sd) +#' test_set_pct <- 0.2 +#' n_test <- round(test_set_pct*n) +#' n_train <- n - n_test +#' test_inds <- sort(sample(1:n, n_test, replace = FALSE)) +#' train_inds <- (1:n)[!((1:n) %in% test_inds)] +#' X_test <- X[test_inds,] +#' X_train <- X[train_inds,] +#' y_test <- y[test_inds] +#' y_train <- y[train_inds] +#' bart_model <- bart(X_train = X_train, y_train = y_train) +#' # bart_json_string_list <- list(saveBARTModelToJsonString(bart_model)) +#' # bart_model_roundtrip <- createBARTModelFromCombinedJsonString(bart_json_string_list) +createBARTModelFromCombinedJsonString <- function(json_string_list){ + # Initialize the BCF model + output <- list() + + # Convert JSON strings + json_object_list <- list() + for (i in 1:length(json_string_list)) { + json_string <- json_string_list[[i]] + json_object_list[[i]] <- createCppJsonString(json_string) + } + + # Unpack the forests + output[["forests"]] <- loadForestContainerCombinedJson(json_object_list, "forest_0") + + # For scalar / preprocessing details which aren't sample-dependent, + # defer to the first json + json_object_default <- json_object_list[[1]] + + # Unpack metadata + train_set_metadata = list() + train_set_metadata[["num_numeric_vars"]] <- json_object_default$get_scalar("num_numeric_vars") + train_set_metadata[["num_ordered_cat_vars"]] <- json_object_default$get_scalar("num_ordered_cat_vars") + train_set_metadata[["num_unordered_cat_vars"]] <- json_object_default$get_scalar("num_unordered_cat_vars") + if (train_set_metadata[["num_numeric_vars"]] > 0) { + train_set_metadata[["numeric_vars"]] <- json_object_default$get_string_vector("numeric_vars") + } + if (train_set_metadata[["num_ordered_cat_vars"]] > 0) { + train_set_metadata[["ordered_cat_vars"]] <- json_object_default$get_string_vector("ordered_cat_vars") + train_set_metadata[["ordered_unique_levels"]] <- json_object_default$get_string_list("ordered_unique_levels", train_set_metadata[["ordered_cat_vars"]]) + } + if (train_set_metadata[["num_unordered_cat_vars"]] > 0) { + train_set_metadata[["unordered_cat_vars"]] <- json_object_default$get_string_vector("unordered_cat_vars") + train_set_metadata[["unordered_unique_levels"]] <- json_object_default$get_string_list("unordered_unique_levels", train_set_metadata[["unordered_cat_vars"]]) + } + output[["train_set_metadata"]] <- train_set_metadata + output[["keep_indices"]] <- json_object_default$get_vector("keep_indices") + + # Unpack model params + model_params = list() + model_params[["outcome_scale"]] <- json_object_default$get_scalar("outcome_scale") + model_params[["outcome_mean"]] <- json_object_default$get_scalar("outcome_mean") + model_params[["sample_sigma"]] <- json_object_default$get_boolean("sample_sigma") + model_params[["sample_tau"]] <- json_object_default$get_boolean("sample_tau") + model_params[["has_rfx"]] <- json_object_default$get_boolean("has_rfx") + model_params[["has_rfx_basis"]] <- json_object_default$get_boolean("has_rfx_basis") + model_params[["num_rfx_basis"]] <- 
json_object_default$get_scalar("num_rfx_basis") + model_params[["num_covariates"]] <- json_object_default$get_scalar("num_covariates") + model_params[["num_basis"]] <- json_object_default$get_scalar("num_basis") + model_params[["requires_basis"]] <- json_object_default$get_boolean("requires_basis") + + # Combine values that are sample-specific + keep_index_offset <- 0 + keep_indices <- c() + for (i in 1:length(json_object_list)) { + json_object <- json_object_list[[i]] + if (i == 1) { + model_params[["num_gfr"]] <- json_object$get_scalar("num_gfr") + model_params[["num_burnin"]] <- json_object$get_scalar("num_burnin") + model_params[["num_mcmc"]] <- json_object$get_scalar("num_mcmc") + model_params[["num_samples"]] <- json_object$get_scalar("num_samples") + keep_indices <- c(keep_indices, keep_index_offset + json_object$get_vector("keep_indices")) + } else { + prev_json <- json_object_list[[i-1]] + model_params[["num_gfr"]] <- model_params[["num_gfr"]] + json_object$get_scalar("num_gfr") + model_params[["num_burnin"]] <- model_params[["num_burnin"]] + json_object$get_scalar("num_burnin") + model_params[["num_mcmc"]] <- model_params[["num_mcmc"]] + json_object$get_scalar("num_mcmc") + model_params[["num_samples"]] <- model_params[["num_samples"]] + json_object$get_scalar("num_samples") + keep_index_offset <- keep_index_offset + prev_json$get_scalar("num_samples") + keep_indices <- c(keep_indices, keep_index_offset + json_object$get_vector("keep_indices")) + } + } + output[["keep_indices"]] <- keep_indices + output[["model_params"]] <- model_params + + # Unpack sampled parameters + if (model_params[["sample_sigma"]]) { + for (i in 1:length(json_object_list)) { + json_object <- json_object_list[[i]] + if (i == 1) { + output[["sigma2_samples"]] <- json_object$get_vector("sigma2_samples", "parameters") + } else { + output[["sigma2_samples"]] <- c(output[["sigma2_samples"]], json_object$get_vector("sigma2_samples", "parameters")) + } + } + } + if (model_params[["sample_tau"]]) { + for (i in 1:length(json_object_list)) { + json_object <- json_object_list[[i]] + if (i == 1) { + output[["tau_samples"]] <- json_object$get_vector("tau_samples", "parameters") + } else { + output[["tau_samples"]] <- c(output[["tau_samples"]], json_object$get_vector("tau_samples", "parameters")) + } + } + } + + # Unpack random effects + if (model_params[["has_rfx"]]) { + output[["rfx_unique_group_ids"]] <- json_object_default$get_string_vector("rfx_unique_group_ids") + output[["rfx_samples"]] <- loadRandomEffectSamplesCombinedJson(json_object_list, 0) + } + + class(output) <- "bartmodel" + return(output) +} diff --git a/R/serialization.R b/R/serialization.R index 6d25e802..4c6ec0cb 100644 --- a/R/serialization.R +++ b/R/serialization.R @@ -408,7 +408,7 @@ loadRandomEffectSamplesCombinedJson <- function(json_object_list, json_rfx_num) #' #' @return `RandomEffectSamples` object #' @export -loadRandomEffectSamplesCombinedJson <- function(json_string_list, json_rfx_num) { +loadRandomEffectSamplesCombinedJsonString <- function(json_string_list, json_rfx_num) { json_rfx_container_label <- paste0("random_effect_container_", json_rfx_num) json_rfx_mapper_label <- paste0("random_effect_label_mapper_", json_rfx_num) json_rfx_groupids_label <- paste0("random_effect_groupids_", json_rfx_num) @@ -416,9 +416,9 @@ loadRandomEffectSamplesCombinedJson <- function(json_string_list, json_rfx_num) for (i in 1:length(json_object_list)) { json_string <- json_string_list[[i]] if (i == 1) { - output$load_from_json(json_object, 
json_rfx_container_label, json_rfx_mapper_label, json_rfx_groupids_label) + output$load_from_json_string(json_string, json_rfx_container_label, json_rfx_mapper_label, json_rfx_groupids_label) } else { - output$append_from_json(json_object, json_rfx_container_label, json_rfx_mapper_label, json_rfx_groupids_label) + output$append_from_json_string(json_string, json_rfx_container_label, json_rfx_mapper_label, json_rfx_groupids_label) } } return(output) diff --git a/_pkgdown.yml b/_pkgdown.yml index f919a864..ec8742fd 100644 --- a/_pkgdown.yml +++ b/_pkgdown.yml @@ -38,6 +38,17 @@ reference: - loadRandomEffectSamplesJson - loadVectorJson - loadScalarJson + - convertBARTModelToJson + - createBARTModelFromCombinedJson + - createBARTModelFromCombinedJsonString + - createBARTModelFromJson + - createBARTModelFromJsonFile + - createBARTModelFromJsonString + - loadRandomEffectSamplesCombinedJson + - loadRandomEffectSamplesCombinedJsonString + - saveBARTModelToJsonFile + - saveBARTModelToJsonString + - saveBCFModelToJsonString - subtitle: Data desc: > diff --git a/man/createBARTModelFromCombinedJson.Rd b/man/createBARTModelFromCombinedJson.Rd new file mode 100644 index 00000000..72c3e675 --- /dev/null +++ b/man/createBARTModelFromCombinedJson.Rd @@ -0,0 +1,44 @@ +% Generated by roxygen2: do not edit by hand +% Please edit documentation in R/bart.R +\name{createBARTModelFromCombinedJson} +\alias{createBARTModelFromCombinedJson} +\title{Convert a list of (in-memory) JSON representations of a BART model to a single combined BART model object +which can be used for prediction, etc...} +\usage{ +createBARTModelFromCombinedJson(json_object_list) +} +\arguments{ +\item{json_object_list}{List of objects of type \code{CppJson} containing Json representation of a BART model} +} +\value{ +Object of type \code{bartmodel} +} +\description{ +Convert a list of (in-memory) JSON representations of a BART model to a single combined BART model object +which can be used for prediction, etc... 
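+Sample-independent metadata (covariate preprocessing information and
+model settings) is taken from the first model in the list; all models
+supplied are therefore assumed to have been sampled with the same data
+preprocessing and model configuration.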
+} +\examples{ +n <- 100 +p <- 5 +X <- matrix(runif(n*p), ncol = p) +f_XW <- ( + ((0 <= X[,1]) & (0.25 > X[,1])) * (-7.5) + + ((0.25 <= X[,1]) & (0.5 > X[,1])) * (-2.5) + + ((0.5 <= X[,1]) & (0.75 > X[,1])) * (2.5) + + ((0.75 <= X[,1]) & (1 > X[,1])) * (7.5) +) +noise_sd <- 1 +y <- f_XW + rnorm(n, 0, noise_sd) +test_set_pct <- 0.2 +n_test <- round(test_set_pct*n) +n_train <- n - n_test +test_inds <- sort(sample(1:n, n_test, replace = FALSE)) +train_inds <- (1:n)[!((1:n) \%in\% test_inds)] +X_test <- X[test_inds,] +X_train <- X[train_inds,] +y_test <- y[test_inds] +y_train <- y[train_inds] +bart_model <- bart(X_train = X_train, y_train = y_train) +# bart_json <- list(convertBARTModelToJson(bart_model)) +# bart_model_roundtrip <- createBARTModelFromCombinedJson(bart_json) +} diff --git a/man/createBARTModelFromCombinedJsonString.Rd b/man/createBARTModelFromCombinedJsonString.Rd new file mode 100644 index 00000000..99c248b7 --- /dev/null +++ b/man/createBARTModelFromCombinedJsonString.Rd @@ -0,0 +1,44 @@ +% Generated by roxygen2: do not edit by hand +% Please edit documentation in R/bart.R +\name{createBARTModelFromCombinedJsonString} +\alias{createBARTModelFromCombinedJsonString} +\title{Convert a list of (in-memory) JSON strings that represent BART models to a single combined BART model object +which can be used for prediction, etc...} +\usage{ +createBARTModelFromCombinedJsonString(json_string_list) +} +\arguments{ +\item{json_string_list}{List of JSON strings which can be parsed to objects of type \code{CppJson} containing Json representation of a BART model} +} +\value{ +Object of type \code{bartmodel} +} +\description{ +Convert a list of (in-memory) JSON strings that represent BART models to a single combined BART model object +which can be used for prediction, etc... 
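+Each JSON string is first parsed into a \code{CppJson} object (via
+\code{createCppJsonString()}); sample-independent metadata is then taken
+from the first model in the list, so all models supplied are assumed to
+share the same data preprocessing and model configuration.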
+} +\examples{ +n <- 100 +p <- 5 +X <- matrix(runif(n*p), ncol = p) +f_XW <- ( + ((0 <= X[,1]) & (0.25 > X[,1])) * (-7.5) + + ((0.25 <= X[,1]) & (0.5 > X[,1])) * (-2.5) + + ((0.5 <= X[,1]) & (0.75 > X[,1])) * (2.5) + + ((0.75 <= X[,1]) & (1 > X[,1])) * (7.5) +) +noise_sd <- 1 +y <- f_XW + rnorm(n, 0, noise_sd) +test_set_pct <- 0.2 +n_test <- round(test_set_pct*n) +n_train <- n - n_test +test_inds <- sort(sample(1:n, n_test, replace = FALSE)) +train_inds <- (1:n)[!((1:n) \%in\% test_inds)] +X_test <- X[test_inds,] +X_train <- X[train_inds,] +y_test <- y[test_inds] +y_train <- y[train_inds] +bart_model <- bart(X_train = X_train, y_train = y_train) +# bart_json_string_list <- list(saveBARTModelToJsonString(bart_model)) +# bart_model_roundtrip <- createBARTModelFromCombinedJsonString(bart_json_string_list) +} diff --git a/man/loadRandomEffectSamplesCombinedJson.Rd b/man/loadRandomEffectSamplesCombinedJson.Rd index ac4c1723..d7ef5705 100644 --- a/man/loadRandomEffectSamplesCombinedJson.Rd +++ b/man/loadRandomEffectSamplesCombinedJson.Rd @@ -4,24 +4,16 @@ \alias{loadRandomEffectSamplesCombinedJson} \title{Combine multiple JSON model objects containing random effects (with the same hierarchy / schema) into a single container} \usage{ -loadRandomEffectSamplesCombinedJson(json_string_list, json_rfx_num) - -loadRandomEffectSamplesCombinedJson(json_string_list, json_rfx_num) +loadRandomEffectSamplesCombinedJson(json_object_list, json_rfx_num) } \arguments{ -\item{json_string_list}{List of objects of class \code{CppJson}} +\item{json_object_list}{List of objects of class \code{CppJson}} \item{json_rfx_num}{Integer index indicating the position of the random effects term to be unpacked} - -\item{json_object_list}{List of objects of class \code{CppJson}} } \value{ -\code{RandomEffectSamples} object - \code{RandomEffectSamples} object } \description{ Combine multiple JSON model objects containing random effects (with the same hierarchy / schema) into a single container - -Combine multiple JSON strings representing model objects containing random effects (with the same hierarchy / schema) into a single container } diff --git a/man/loadRandomEffectSamplesCombinedJsonString.Rd b/man/loadRandomEffectSamplesCombinedJsonString.Rd new file mode 100644 index 00000000..3531b968 --- /dev/null +++ b/man/loadRandomEffectSamplesCombinedJsonString.Rd @@ -0,0 +1,19 @@ +% Generated by roxygen2: do not edit by hand +% Please edit documentation in R/serialization.R +\name{loadRandomEffectSamplesCombinedJsonString} +\alias{loadRandomEffectSamplesCombinedJsonString} +\title{Combine multiple JSON strings representing model objects containing random effects (with the same hierarchy / schema) into a single container} +\usage{ +loadRandomEffectSamplesCombinedJsonString(json_string_list, json_rfx_num) +} +\arguments{ +\item{json_string_list}{List of objects of class \code{CppJson}} + +\item{json_rfx_num}{Integer index indicating the position of the random effects term to be unpacked} +} +\value{ +\code{RandomEffectSamples} object +} +\description{ +Combine multiple JSON strings representing model objects containing random effects (with the same hierarchy / schema) into a single container +} diff --git a/vignettes/MultiChain.Rmd b/vignettes/MultiChain.Rmd index 13275117..9cecaadd 100644 --- a/vignettes/MultiChain.Rmd +++ b/vignettes/MultiChain.Rmd @@ -115,27 +115,30 @@ json_string_list <- list() for (i in 1:num_chains) { json_string_list[[i]] <- saveBARTModelToJsonString(bart_models[[i]]) } -combined_forests <- 
loadForestContainerCombinedJsonString(json_string_list, "forest_0") +combined_bart <- createBARTModelFromCombinedJsonString(json_string_list) ``` We can predict from this combined forest as follows ```{r} -test_dataset <- createForestDataset(as.matrix(X_test), W_test) -yhat_combined <- combined_forests$predict(test_dataset) +yhat_combined <- predict(combined_bart, X_test, W_test)$y_hat ``` Compare to the original $\hat{y}$ values ```{r} -num_samples <- num_gfr+num_burnin+num_mcmc +par(mfrow = c(1,2)) for (i in 1:num_chains) { - offset <- (i-1)*num_samples - inds_start <- offset + 1 + num_burnin + num_gfr - inds_end <- offset + num_samples + offset <- (i-1)*num_mcmc + inds_start <- offset + 1 + inds_end <- offset + num_mcmc plot(rowMeans(bart_models[[i]]$y_hat_test), - rowMeans(yhat_combined[,inds_start:inds_end])) + rowMeans(yhat_combined[,inds_start:inds_end]), + xlab = "original", ylab = "deserialized", + main = paste0("Chain ", i, "\nPredictions")) + abline(0,1,col="red",lty=3,lwd=3) } +par(mfrow = c(1,1)) ``` ## Sampling Multiple Chains in Parallel @@ -160,18 +163,29 @@ cl <- makeCluster(ncores) registerDoParallel(cl) ``` -Run the sampler, storing the resulting BART objects in a list +Note that the `bartmodel` object contains external pointers to forests created by +the `stochtree` shared object, and when `stochtree::bart()` is run in parallel +on independent subprocesses, these pointers are not generally accessible in the +session that kicked off the parallel run. + +To overcome this, you can return a JSON representation of a `bartmodel` in memory +and combine them into a single in-memory `bartmodel` object. + +The first step of this process is to run the sampler in parallel, +storing the resulting BART JSON strings in a list. ```{r} -bart_models <- foreach (i = 1:num_chains) %dopar% { +bart_model_strings <- foreach (i = 1:num_chains) %dopar% { random_seed <- i - stochtree::bart( + bart_model <- stochtree::bart( X_train = X_train, W_train = W_train, y_train = y_train, X_test = X_test, W_test = W_test, num_trees = num_trees, num_gfr = num_gfr, num_burnin = num_burnin, num_mcmc = num_mcmc, sample_sigma = T, sample_tau = T, random_seed = random_seed ) + bart_model_string <- stochtree::saveBARTModelToJsonString(bart_model) + bart_model_string } ``` @@ -185,31 +199,30 @@ Now, if we want to combine the forests from each of these BART models into a single forest, we can do so as follows ```{r} -json_string_list <- list() -for (i in 1:num_chains) { - json_string_list[[i]] <- saveBARTModelToJsonString(bart_models[[i]]) -} -combined_forests <- loadForestContainerCombinedJsonString(json_string_list, "forest_0") +combined_bart <- createBARTModelFromCombinedJsonString(bart_model_strings) ``` We can predict from this combined forest as follows ```{r} -test_dataset <- createForestDataset(as.matrix(X_test), W_test) -yhat_combined <- combined_forests$predict(test_dataset) +yhat_combined <- predict(combined_bart, X_test, W_test)$y_hat ``` -Compare to the original $\hat{y}$ values +Since we don't have access to the original $\hat{y}$ values, we instead +compare average predictions from each chain to the true $y$ values. 
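+Each chain contributes its `num_mcmc` retained draws to `yhat_combined` as a
+contiguous block of columns, with chains stored in order. As a minimal sketch
+(the helper below is purely illustrative, not part of `stochtree`), chain `i`'s
+block can be recovered with the same offset arithmetic used in the next chunk:
+
+```{r}
+# Illustrative helper (assumed layout: chains occupy consecutive
+# blocks of num_mcmc columns of yhat_combined, in chain order)
+chain_columns <- function(i, num_mcmc) {
+  offset <- (i - 1) * num_mcmc
+  (offset + 1):(offset + num_mcmc)
+}
+chain_columns(2, num_mcmc)[1:5]
+```
+
+The next chunk applies this indexing chain by chain: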
```{r} -num_samples <- num_gfr+num_burnin+num_mcmc +par(mfrow = c(1,2)) for (i in 1:num_chains) { - offset <- (i-1)*num_samples - inds_start <- offset + 1 + num_burnin + num_gfr - inds_end <- offset + num_samples - plot(rowMeans(bart_models[[i]]$y_hat_test), - rowMeans(yhat_combined[,inds_start:inds_end])) + offset <- (i-1)*num_mcmc + inds_start <- offset + 1 + inds_end <- offset + num_mcmc + plot(rowMeans(yhat_combined[,inds_start:inds_end]), y_test, + xlab = "predicted", ylab = "actual", + main = paste0("Chain ", i, "\nPredictions")) + abline(0,1,col="red",lty=3,lwd=3) } +par(mfrow = c(1,1)) ``` # References From 20170539b11274aec6e6d8a7470e6b7d781d2788 Mon Sep 17 00:00:00 2001 From: Drew Herren Date: Fri, 23 Aug 2024 23:54:14 -0500 Subject: [PATCH 08/41] Refactored the sampler classes into stateless templated functions --- debug/api_debug.cpp | 18 +- include/stochtree/tree_sampler.h | 854 +++++++++++++++---------------- src/py_stochtree.cpp | 18 +- src/sampler.cpp | 20 +- 4 files changed, 436 insertions(+), 474 deletions(-) diff --git a/debug/api_debug.cpp b/debug/api_debug.cpp index d827d8cb..d7420d5f 100644 --- a/debug/api_debug.cpp +++ b/debug/api_debug.cpp @@ -270,16 +270,13 @@ void sampleGFR(ForestTracker& tracker, TreePrior& tree_prior, ForestContainer& f ForestLeafModel leaf_model_type, Eigen::MatrixXd& leaf_scale_matrix, double global_variance, double leaf_scale, int cutpoint_grid_size) { if (leaf_model_type == ForestLeafModel::kConstant) { GaussianConstantLeafModel leaf_model = GaussianConstantLeafModel(leaf_scale); - GFRForestSampler sampler = GFRForestSampler(cutpoint_grid_size); - sampler.SampleOneIter(tracker, forest_samples, leaf_model, dataset, residual, tree_prior, rng, var_weights_vector, global_variance, feature_types); + GFRSampleOneIter(tracker, forest_samples, leaf_model, dataset, residual, tree_prior, rng, var_weights_vector, global_variance, feature_types, cutpoint_grid_size); } else if (leaf_model_type == ForestLeafModel::kUnivariateRegression) { GaussianUnivariateRegressionLeafModel leaf_model = GaussianUnivariateRegressionLeafModel(leaf_scale); - GFRForestSampler sampler = GFRForestSampler(cutpoint_grid_size); - sampler.SampleOneIter(tracker, forest_samples, leaf_model, dataset, residual, tree_prior, rng, var_weights_vector, global_variance, feature_types); + GFRSampleOneIter(tracker, forest_samples, leaf_model, dataset, residual, tree_prior, rng, var_weights_vector, global_variance, feature_types, cutpoint_grid_size); } else if (leaf_model_type == ForestLeafModel::kMultivariateRegression) { GaussianMultivariateRegressionLeafModel leaf_model = GaussianMultivariateRegressionLeafModel(leaf_scale_matrix); - GFRForestSampler sampler = GFRForestSampler(cutpoint_grid_size); - sampler.SampleOneIter(tracker, forest_samples, leaf_model, dataset, residual, tree_prior, rng, var_weights_vector, global_variance, feature_types); + GFRSampleOneIter(tracker, forest_samples, leaf_model, dataset, residual, tree_prior, rng, var_weights_vector, global_variance, feature_types, cutpoint_grid_size); } } @@ -288,16 +285,13 @@ void sampleMCMC(ForestTracker& tracker, TreePrior& tree_prior, ForestContainer& ForestLeafModel leaf_model_type, Eigen::MatrixXd& leaf_scale_matrix, double global_variance, double leaf_scale, int cutpoint_grid_size) { if (leaf_model_type == ForestLeafModel::kConstant) { GaussianConstantLeafModel leaf_model = GaussianConstantLeafModel(leaf_scale); - MCMCForestSampler sampler = MCMCForestSampler(); - sampler.SampleOneIter(tracker, forest_samples, leaf_model, 
dataset, residual, tree_prior, rng, var_weights_vector, global_variance); + MCMCSampleOneIter(tracker, forest_samples, leaf_model, dataset, residual, tree_prior, rng, var_weights_vector, global_variance); } else if (leaf_model_type == ForestLeafModel::kUnivariateRegression) { GaussianUnivariateRegressionLeafModel leaf_model = GaussianUnivariateRegressionLeafModel(leaf_scale); - MCMCForestSampler sampler = MCMCForestSampler(); - sampler.SampleOneIter(tracker, forest_samples, leaf_model, dataset, residual, tree_prior, rng, var_weights_vector, global_variance); + MCMCSampleOneIter(tracker, forest_samples, leaf_model, dataset, residual, tree_prior, rng, var_weights_vector, global_variance); } else if (leaf_model_type == ForestLeafModel::kMultivariateRegression) { GaussianMultivariateRegressionLeafModel leaf_model = GaussianMultivariateRegressionLeafModel(leaf_scale_matrix); - MCMCForestSampler sampler = MCMCForestSampler(); - sampler.SampleOneIter(tracker, forest_samples, leaf_model, dataset, residual, tree_prior, rng, var_weights_vector, global_variance); + MCMCSampleOneIter(tracker, forest_samples, leaf_model, dataset, residual, tree_prior, rng, var_weights_vector, global_variance); } } diff --git a/include/stochtree/tree_sampler.h b/include/stochtree/tree_sampler.h index 9c9a854e..9db97f02 100644 --- a/include/stochtree/tree_sampler.h +++ b/include/stochtree/tree_sampler.h @@ -234,266 +234,183 @@ static inline void UpdateResidualNewBasis(ForestTracker& tracker, ForestDataset& } template -class MCMCForestSampler { - public: - MCMCForestSampler() {} - ~MCMCForestSampler() {} +static inline void MCMCSampleOneIter(ForestTracker& tracker, ForestContainer& forests, LeafModel& leaf_model, ForestDataset& dataset, + ColumnVector& residual, TreePrior& tree_prior, std::mt19937& gen, std::vector& variable_weights, + double global_variance, bool pre_initialized = false) { + // Previous number of samples + int prev_num_samples = forests.NumSamples(); - void SampleOneIter(ForestTracker& tracker, ForestContainer& forests, LeafModel& leaf_model, ForestDataset& dataset, - ColumnVector& residual, TreePrior& tree_prior, std::mt19937& gen, std::vector& variable_weights, - double global_variance, bool pre_initialized = false) { - // Previous number of samples - int prev_num_samples = forests.NumSamples(); + if ((prev_num_samples == 0) && (!pre_initialized)) { + // Add new forest to the container + forests.AddSamples(1); - if ((prev_num_samples == 0) && (!pre_initialized)) { - // Add new forest to the container - forests.AddSamples(1); - - // Set initial value for each leaf in the forest - double root_pred = ComputeMeanOutcome(residual) / static_cast(forests.NumTrees()); - TreeEnsemble* ensemble = forests.GetEnsemble(0); - leaf_model.SetEnsembleRootPredictedValue(dataset, ensemble, root_pred); - } else if (prev_num_samples > 0) { - // Add new forest to the container - forests.AddSamples(1); - - // Copy previous forest - forests.CopyFromPreviousSample(prev_num_samples, prev_num_samples - 1); - } else { - forests.IncrementSampleCount(); - } + // Set initial value for each leaf in the forest + double root_pred = ComputeMeanOutcome(residual) / static_cast(forests.NumTrees()); + TreeEnsemble* ensemble = forests.GetEnsemble(0); + leaf_model.SetEnsembleRootPredictedValue(dataset, ensemble, root_pred); + } else if (prev_num_samples > 0) { + // Add new forest to the container + forests.AddSamples(1); - // Run the MCMC algorithm for each tree - TreeEnsemble* ensemble = forests.GetEnsemble(prev_num_samples); - Tree* tree; - 
int num_trees = forests.NumTrees(); - for (int i = 0; i < num_trees; i++) { - // Add tree i's predictions back to the residual (thus, training a model on the "partial residual") - tree = ensemble->GetTree(i); - UpdateResidualTree(tracker, dataset, residual, tree, i, leaf_model.RequiresBasis(), plus_op_, false); - - // Sample tree i - tree = ensemble->GetTree(i); - SampleTreeOneIter(tree, tracker, forests, leaf_model, dataset, residual, tree_prior, gen, variable_weights, i, global_variance); - - // Sample leaf parameters for tree i - tree = ensemble->GetTree(i); - leaf_model.SampleLeafParameters(dataset, tracker, residual, tree, i, global_variance, gen); - - // Subtract tree i's predictions back out of the residual - tree = ensemble->GetTree(i); - UpdateResidualTree(tracker, dataset, residual, tree, i, leaf_model.RequiresBasis(), minus_op_, true); - } + // Copy previous forest + forests.CopyFromPreviousSample(prev_num_samples, prev_num_samples - 1); + } else { + forests.IncrementSampleCount(); } - - private: - // Function objects for element-wise addition and subtraction (used in the residual update function which takes std::function as an argument) - std::plus plus_op_; - std::minus minus_op_; - void SampleTreeOneIter(Tree* tree, ForestTracker& tracker, ForestContainer& forests, LeafModel& leaf_model, ForestDataset& dataset, - ColumnVector& residual, TreePrior& tree_prior, std::mt19937& gen, std::vector& variable_weights, - int tree_num, double global_variance) { - // Determine whether it is possible to grow any of the leaves - bool grow_possible = false; - std::vector leaves = tree->GetLeaves(); - for (auto& leaf: leaves) { - if (tracker.UnsortedNodeSize(tree_num, leaf) > 2 * tree_prior.GetMinSamplesLeaf()) { - grow_possible = true; - break; - } - } + // Run the MCMC algorithm for each tree + TreeEnsemble* ensemble = forests.GetEnsemble(prev_num_samples); + Tree* tree; + int num_trees = forests.NumTrees(); + for (int i = 0; i < num_trees; i++) { + // Add tree i's predictions back to the residual (thus, training a model on the "partial residual") + tree = ensemble->GetTree(i); + UpdateResidualTree(tracker, dataset, residual, tree, i, leaf_model.RequiresBasis(), std::plus(), false); + + // Sample tree i + tree = ensemble->GetTree(i); + MCMCSampleTreeOneIter(tree, tracker, forests, leaf_model, dataset, residual, tree_prior, gen, variable_weights, i, global_variance); + + // Sample leaf parameters for tree i + tree = ensemble->GetTree(i); + leaf_model.SampleLeafParameters(dataset, tracker, residual, tree, i, global_variance, gen); + + // Subtract tree i's predictions back out of the residual + tree = ensemble->GetTree(i); + UpdateResidualTree(tracker, dataset, residual, tree, i, leaf_model.RequiresBasis(), std::minus(), true); + } +} - // Determine whether it is possible to prune the tree - bool prune_possible = false; - if (tree->NumValidNodes() > 1) { - prune_possible = true; +template +static inline void MCMCSampleTreeOneIter(Tree* tree, ForestTracker& tracker, ForestContainer& forests, LeafModel& leaf_model, ForestDataset& dataset, + ColumnVector& residual, TreePrior& tree_prior, std::mt19937& gen, std::vector& variable_weights, + int tree_num, double global_variance) { + // Determine whether it is possible to grow any of the leaves + bool grow_possible = false; + std::vector leaves = tree->GetLeaves(); + for (auto& leaf: leaves) { + if (tracker.UnsortedNodeSize(tree_num, leaf) > 2 * tree_prior.GetMinSamplesLeaf()) { + grow_possible = true; + break; } + } - // Determine the relative 
probability of grow vs prune (0 = grow, 1 = prune) - double prob_grow; - std::vector step_probs(2); - if (grow_possible && prune_possible) { - step_probs = {0.5, 0.5}; - prob_grow = 0.5; - } else if (!grow_possible && prune_possible) { - step_probs = {0.0, 1.0}; - prob_grow = 0.0; - } else if (grow_possible && !prune_possible) { - step_probs = {1.0, 0.0}; - prob_grow = 1.0; - } else { - Log::Fatal("In this tree, neither grow nor prune is possible"); - } - std::discrete_distribution<> step_dist(step_probs.begin(), step_probs.end()); + // Determine whether it is possible to prune the tree + bool prune_possible = false; + if (tree->NumValidNodes() > 1) { + prune_possible = true; + } - // Draw a split rule at random - data_size_t step_chosen = step_dist(gen); - bool accept; - - if (step_chosen == 0) { - GrowTreeOneIter(tree, tracker, leaf_model, dataset, residual, tree_prior, gen, tree_num, variable_weights, global_variance, prob_grow); - } else { - PruneTreeOneIter(tree, tracker, leaf_model, dataset, residual, tree_prior, gen, tree_num, global_variance); - } + // Determine the relative probability of grow vs prune (0 = grow, 1 = prune) + double prob_grow; + std::vector step_probs(2); + if (grow_possible && prune_possible) { + step_probs = {0.5, 0.5}; + prob_grow = 0.5; + } else if (!grow_possible && prune_possible) { + step_probs = {0.0, 1.0}; + prob_grow = 0.0; + } else if (grow_possible && !prune_possible) { + step_probs = {1.0, 0.0}; + prob_grow = 1.0; + } else { + Log::Fatal("In this tree, neither grow nor prune is possible"); } + std::discrete_distribution<> step_dist(step_probs.begin(), step_probs.end()); - void GrowTreeOneIter(Tree* tree, ForestTracker& tracker, LeafModel& leaf_model, ForestDataset& dataset, ColumnVector& residual, - TreePrior& tree_prior, std::mt19937& gen, int tree_num, std::vector& variable_weights, - double global_variance, double prob_grow_old) { - // Extract dataset information - data_size_t n = dataset.GetCovariates().rows(); - - // Choose a leaf node at random - int num_leaves = tree->NumLeaves(); - std::vector leaves = tree->GetLeaves(); - std::vector leaf_weights(num_leaves); - std::fill(leaf_weights.begin(), leaf_weights.end(), 1.0/num_leaves); - std::discrete_distribution<> leaf_dist(leaf_weights.begin(), leaf_weights.end()); - int leaf_chosen = leaves[leaf_dist(gen)]; - int leaf_depth = tree->GetDepth(leaf_chosen); - - // Maximum leaf depth - int32_t max_depth = tree_prior.GetMaxDepth(); - - // Terminate early if cannot be split - bool accept; - if ((leaf_depth >= max_depth) && (max_depth != -1)) { - accept = false; - } else { + // Draw a split rule at random + data_size_t step_chosen = step_dist(gen); + bool accept; + + if (step_chosen == 0) { + MCMCGrowTreeOneIter(tree, tracker, leaf_model, dataset, residual, tree_prior, gen, tree_num, variable_weights, global_variance, prob_grow); + } else { + MCMCPruneTreeOneIter(tree, tracker, leaf_model, dataset, residual, tree_prior, gen, tree_num, global_variance); + } +} - // Select a split variable at random - int p = dataset.GetCovariates().cols(); - CHECK_EQ(variable_weights.size(), p); - // std::vector var_weights(p); - // std::fill(var_weights.begin(), var_weights.end(), 1.0/p); - std::discrete_distribution<> var_dist(variable_weights.begin(), variable_weights.end()); - int var_chosen = var_dist(gen); - - // Determine the range of possible cutpoints - // TODO: specialize this for binary / ordered categorical / unordered categorical variables - double var_min, var_max; - VarSplitRange(tracker, dataset, 
tree_num, leaf_chosen, var_chosen, var_min, var_max); - if (var_max <= var_min) { - return; - } - - // Split based on var_min to var_max in a given node - std::uniform_real_distribution split_point_dist(var_min, var_max); - double split_point_chosen = split_point_dist(gen); - - // Create a split object - TreeSplit split = TreeSplit(split_point_chosen); - - // Compute the marginal likelihood of split and no split, given the leaf prior - std::tuple split_eval = leaf_model.EvaluateProposedSplit(dataset, tracker, residual, split, tree_num, leaf_chosen, var_chosen, global_variance); - double split_log_marginal_likelihood = std::get<0>(split_eval); - double no_split_log_marginal_likelihood = std::get<1>(split_eval); - int32_t left_n = std::get<2>(split_eval); - int32_t right_n = std::get<3>(split_eval); - - // Determine probability of growing the split node and its two new left and right nodes - double pg = tree_prior.GetAlpha() * std::pow(1+leaf_depth, -tree_prior.GetBeta()); - double pgl = tree_prior.GetAlpha() * std::pow(1+leaf_depth+1, -tree_prior.GetBeta()); - double pgr = tree_prior.GetAlpha() * std::pow(1+leaf_depth+1, -tree_prior.GetBeta()); - - // Determine whether a "grow" move is possible from the newly formed tree - // in order to compute the probability of choosing "prune" from the new tree - // (which is always possible by construction) - bool non_constant = NodesNonConstantAfterSplit(dataset, tracker, split, tree_num, leaf_chosen, var_chosen); - bool min_samples_left_check = left_n >= 2*tree_prior.GetMinSamplesLeaf(); - bool min_samples_right_check = right_n >= 2*tree_prior.GetMinSamplesLeaf(); - double prob_prune_new; - if (non_constant && (min_samples_left_check || min_samples_right_check)) { - prob_prune_new = 0.5; - } else { - prob_prune_new = 1.0; - } +template +static inline void MCMCGrowTreeOneIter(Tree* tree, ForestTracker& tracker, LeafModel& leaf_model, ForestDataset& dataset, ColumnVector& residual, + TreePrior& tree_prior, std::mt19937& gen, int tree_num, std::vector& variable_weights, + double global_variance, double prob_grow_old) { + // Extract dataset information + data_size_t n = dataset.GetCovariates().rows(); - // Determine the number of leaves in the current tree and leaf parents in the proposed tree - int num_leaf_parents = tree->NumLeafParents(); - double p_leaf = 1/static_cast(num_leaves); - double p_leaf_parent = 1/static_cast(num_leaf_parents+1); - - // Compute the final MH ratio - double log_mh_ratio = ( - std::log(pg) + std::log(1-pgl) + std::log(1-pgr) - std::log(1-pg) + std::log(prob_prune_new) + - std::log(p_leaf_parent) - std::log(prob_grow_old) - std::log(p_leaf) - no_split_log_marginal_likelihood + split_log_marginal_likelihood - ); - // Threshold at 0 - if (log_mh_ratio > 0) { - log_mh_ratio = 0; - } + // Choose a leaf node at random + int num_leaves = tree->NumLeaves(); + std::vector leaves = tree->GetLeaves(); + std::vector leaf_weights(num_leaves); + std::fill(leaf_weights.begin(), leaf_weights.end(), 1.0/num_leaves); + std::discrete_distribution<> leaf_dist(leaf_weights.begin(), leaf_weights.end()); + int leaf_chosen = leaves[leaf_dist(gen)]; + int leaf_depth = tree->GetDepth(leaf_chosen); + + // Maximum leaf depth + int32_t max_depth = tree_prior.GetMaxDepth(); + + // Terminate early if cannot be split + bool accept; + if ((leaf_depth >= max_depth) && (max_depth != -1)) { + accept = false; + } else { - // Draw a uniform random variable and accept/reject the proposal on this basis - std::uniform_real_distribution mh_accept(0.0, 1.0); - double 
log_acceptance_prob = std::log(mh_accept(gen)); - if (log_acceptance_prob <= log_mh_ratio) { - accept = true; - AddSplitToModel(tracker, dataset, tree_prior, split, gen, tree, tree_num, leaf_chosen, var_chosen, false); - } else { - accept = false; - } + // Select a split variable at random + int p = dataset.GetCovariates().cols(); + CHECK_EQ(variable_weights.size(), p); + // std::vector var_weights(p); + // std::fill(var_weights.begin(), var_weights.end(), 1.0/p); + std::discrete_distribution<> var_dist(variable_weights.begin(), variable_weights.end()); + int var_chosen = var_dist(gen); + + // Determine the range of possible cutpoints + // TODO: specialize this for binary / ordered categorical / unordered categorical variables + double var_min, var_max; + VarSplitRange(tracker, dataset, tree_num, leaf_chosen, var_chosen, var_min, var_max); + if (var_max <= var_min) { + return; } - } - - void PruneTreeOneIter(Tree* tree, ForestTracker& tracker, LeafModel& leaf_model, ForestDataset& dataset, ColumnVector& residual, - TreePrior& tree_prior, std::mt19937& gen, int tree_num, double global_variance) { - // Choose a "leaf parent" node at random - int num_leaves = tree->NumLeaves(); - int num_leaf_parents = tree->NumLeafParents(); - std::vector leaf_parents = tree->GetLeafParents(); - std::vector leaf_parent_weights(num_leaf_parents); - std::fill(leaf_parent_weights.begin(), leaf_parent_weights.end(), 1.0/num_leaf_parents); - std::discrete_distribution<> leaf_parent_dist(leaf_parent_weights.begin(), leaf_parent_weights.end()); - int leaf_parent_chosen = leaf_parents[leaf_parent_dist(gen)]; - int leaf_parent_depth = tree->GetDepth(leaf_parent_chosen); - int left_node = tree->LeftChild(leaf_parent_chosen); - int right_node = tree->RightChild(leaf_parent_chosen); - int feature_split = tree->SplitIndex(leaf_parent_chosen); - // Compute the marginal likelihood for the leaf parent and its left and right nodes - std::tuple split_eval = leaf_model.EvaluateExistingSplit(dataset, tracker, residual, global_variance, tree_num, leaf_parent_chosen, left_node, right_node); + // Split based on var_min to var_max in a given node + std::uniform_real_distribution split_point_dist(var_min, var_max); + double split_point_chosen = split_point_dist(gen); + + // Create a split object + TreeSplit split = TreeSplit(split_point_chosen); + + // Compute the marginal likelihood of split and no split, given the leaf prior + std::tuple split_eval = leaf_model.EvaluateProposedSplit(dataset, tracker, residual, split, tree_num, leaf_chosen, var_chosen, global_variance); double split_log_marginal_likelihood = std::get<0>(split_eval); double no_split_log_marginal_likelihood = std::get<1>(split_eval); int32_t left_n = std::get<2>(split_eval); int32_t right_n = std::get<3>(split_eval); // Determine probability of growing the split node and its two new left and right nodes - double pg = tree_prior.GetAlpha() * std::pow(1+leaf_parent_depth, -tree_prior.GetBeta()); - double pgl = tree_prior.GetAlpha() * std::pow(1+leaf_parent_depth+1, -tree_prior.GetBeta()); - double pgr = tree_prior.GetAlpha() * std::pow(1+leaf_parent_depth+1, -tree_prior.GetBeta()); + double pg = tree_prior.GetAlpha() * std::pow(1+leaf_depth, -tree_prior.GetBeta()); + double pgl = tree_prior.GetAlpha() * std::pow(1+leaf_depth+1, -tree_prior.GetBeta()); + double pgr = tree_prior.GetAlpha() * std::pow(1+leaf_depth+1, -tree_prior.GetBeta()); - // Determine whether a "prune" move is possible from the new tree, - // in order to compute the probability of choosing "grow" from 
the new tree + // Determine whether a "grow" move is possible from the newly formed tree + // in order to compute the probability of choosing "prune" from the new tree // (which is always possible by construction) - bool non_root_tree = tree->NumNodes() > 1; - double prob_grow_new; - if (non_root_tree) { - prob_grow_new = 0.5; - } else { - prob_grow_new = 1.0; - } - - // Determine whether a "grow" move was possible from the old tree, - // in order to compute the probability of choosing "prune" from the old tree - bool non_constant_left = NodeNonConstant(dataset, tracker, tree_num, left_node); - bool non_constant_right = NodeNonConstant(dataset, tracker, tree_num, right_node); - double prob_prune_old; - if (non_constant_left && non_constant_right) { - prob_prune_old = 0.5; + bool non_constant = NodesNonConstantAfterSplit(dataset, tracker, split, tree_num, leaf_chosen, var_chosen); + bool min_samples_left_check = left_n >= 2*tree_prior.GetMinSamplesLeaf(); + bool min_samples_right_check = right_n >= 2*tree_prior.GetMinSamplesLeaf(); + double prob_prune_new; + if (non_constant && (min_samples_left_check || min_samples_right_check)) { + prob_prune_new = 0.5; } else { - prob_prune_old = 1.0; + prob_prune_new = 1.0; } // Determine the number of leaves in the current tree and leaf parents in the proposed tree - double p_leaf = 1/static_cast(num_leaves-1); - double p_leaf_parent = 1/static_cast(num_leaf_parents); + int num_leaf_parents = tree->NumLeafParents(); + double p_leaf = 1/static_cast(num_leaves); + double p_leaf_parent = 1/static_cast(num_leaf_parents+1); // Compute the final MH ratio double log_mh_ratio = ( - std::log(1-pg) - std::log(pg) - std::log(1-pgl) - std::log(1-pgr) + std::log(prob_prune_old) + - std::log(p_leaf) - std::log(prob_grow_new) - std::log(p_leaf_parent) + no_split_log_marginal_likelihood - split_log_marginal_likelihood + std::log(pg) + std::log(1-pgl) + std::log(1-pgr) - std::log(1-pg) + std::log(prob_prune_new) + + std::log(p_leaf_parent) - std::log(prob_grow_old) - std::log(p_leaf) - no_split_log_marginal_likelihood + split_log_marginal_likelihood ); // Threshold at 0 if (log_mh_ratio > 0) { @@ -501,242 +418,305 @@ class MCMCForestSampler { } // Draw a uniform random variable and accept/reject the proposal on this basis - bool accept; std::uniform_real_distribution mh_accept(0.0, 1.0); double log_acceptance_prob = std::log(mh_accept(gen)); if (log_acceptance_prob <= log_mh_ratio) { accept = true; - RemoveSplitFromModel(tracker, dataset, tree_prior, gen, tree, tree_num, leaf_parent_chosen, left_node, right_node, false); + AddSplitToModel(tracker, dataset, tree_prior, split, gen, tree, tree_num, leaf_chosen, var_chosen, false); } else { accept = false; } } -}; +} template -class GFRForestSampler { - public: - GFRForestSampler() {cutpoint_grid_size_ = 500;} - GFRForestSampler(int cutpoint_grid_size) {cutpoint_grid_size_ = cutpoint_grid_size;} - ~GFRForestSampler() {} - - void SampleOneIter(ForestTracker& tracker, ForestContainer& forests, LeafModel& leaf_model, ForestDataset& dataset, - ColumnVector& residual, TreePrior& tree_prior, std::mt19937& gen, std::vector& variable_weights, - double global_variance, std::vector& feature_types, bool pre_initialized = false) { - // Previous number of samples - int prev_num_samples = forests.NumSamples(); - - if ((prev_num_samples == 0) && (!pre_initialized)) { - // Add new forest to the container - forests.AddSamples(1); - - // Set initial value for each leaf in the forest - double root_pred = ComputeMeanOutcome(residual) / 
static_cast(forests.NumTrees()); - TreeEnsemble* ensemble = forests.GetEnsemble(0); - leaf_model.SetEnsembleRootPredictedValue(dataset, ensemble, root_pred); - } else if (prev_num_samples > 0) { - // Add new forest to the container - forests.AddSamples(1); - - // NOTE: only doing this for the simplicity of the partial residual step - // We could alternatively "reach back" to the tree predictions from a previous - // sample (whenever there is more than one sample). This is cleaner / quicker - // to implement during this refactor. - forests.CopyFromPreviousSample(prev_num_samples, prev_num_samples - 1); - } else { - forests.IncrementSampleCount(); - } - - // Run the GFR algorithm for each tree - TreeEnsemble* ensemble = forests.GetEnsemble(prev_num_samples); - int num_trees = forests.NumTrees(); - for (int i = 0; i < num_trees; i++) { - // Add tree i's predictions back to the residual (thus, training a model on the "partial residual") - Tree* tree = ensemble->GetTree(i); - UpdateResidualTree(tracker, dataset, residual, tree, i, leaf_model.RequiresBasis(), plus_op_, false); - - // Reset the tree and sample trackers - ensemble->ResetInitTree(i); - tracker.ResetRoot(dataset.GetCovariates(), feature_types, i); - tree = ensemble->GetTree(i); - - // Sample tree i - SampleTreeOneIter(tree, tracker, forests, leaf_model, dataset, residual, tree_prior, gen, variable_weights, i, global_variance, feature_types); - - // Sample leaf parameters for tree i - tree = ensemble->GetTree(i); - leaf_model.SampleLeafParameters(dataset, tracker, residual, tree, i, global_variance, gen); - - // Subtract tree i's predictions back out of the residual - UpdateResidualTree(tracker, dataset, residual, tree, i, leaf_model.RequiresBasis(), minus_op_, true); - } +static inline void MCMCPruneTreeOneIter(Tree* tree, ForestTracker& tracker, LeafModel& leaf_model, ForestDataset& dataset, ColumnVector& residual, + TreePrior& tree_prior, std::mt19937& gen, int tree_num, double global_variance) { + // Choose a "leaf parent" node at random + int num_leaves = tree->NumLeaves(); + int num_leaf_parents = tree->NumLeafParents(); + std::vector leaf_parents = tree->GetLeafParents(); + std::vector leaf_parent_weights(num_leaf_parents); + std::fill(leaf_parent_weights.begin(), leaf_parent_weights.end(), 1.0/num_leaf_parents); + std::discrete_distribution<> leaf_parent_dist(leaf_parent_weights.begin(), leaf_parent_weights.end()); + int leaf_parent_chosen = leaf_parents[leaf_parent_dist(gen)]; + int leaf_parent_depth = tree->GetDepth(leaf_parent_chosen); + int left_node = tree->LeftChild(leaf_parent_chosen); + int right_node = tree->RightChild(leaf_parent_chosen); + int feature_split = tree->SplitIndex(leaf_parent_chosen); + + // Compute the marginal likelihood for the leaf parent and its left and right nodes + std::tuple split_eval = leaf_model.EvaluateExistingSplit(dataset, tracker, residual, global_variance, tree_num, leaf_parent_chosen, left_node, right_node); + double split_log_marginal_likelihood = std::get<0>(split_eval); + double no_split_log_marginal_likelihood = std::get<1>(split_eval); + int32_t left_n = std::get<2>(split_eval); + int32_t right_n = std::get<3>(split_eval); + + // Determine probability of growing the split node and its two new left and right nodes + double pg = tree_prior.GetAlpha() * std::pow(1+leaf_parent_depth, -tree_prior.GetBeta()); + double pgl = tree_prior.GetAlpha() * std::pow(1+leaf_parent_depth+1, -tree_prior.GetBeta()); + double pgr = tree_prior.GetAlpha() * std::pow(1+leaf_parent_depth+1, 
-tree_prior.GetBeta()); + + // Determine whether a "prune" move is possible from the new tree, + // in order to compute the probability of choosing "grow" from the new tree + // (which is always possible by construction) + bool non_root_tree = tree->NumNodes() > 1; + double prob_grow_new; + if (non_root_tree) { + prob_grow_new = 0.5; + } else { + prob_grow_new = 1.0; + } + + // Determine whether a "grow" move was possible from the old tree, + // in order to compute the probability of choosing "prune" from the old tree + bool non_constant_left = NodeNonConstant(dataset, tracker, tree_num, left_node); + bool non_constant_right = NodeNonConstant(dataset, tracker, tree_num, right_node); + double prob_prune_old; + if (non_constant_left && non_constant_right) { + prob_prune_old = 0.5; + } else { + prob_prune_old = 1.0; + } + + // Determine the number of leaves in the current tree and leaf parents in the proposed tree + double p_leaf = 1/static_cast(num_leaves-1); + double p_leaf_parent = 1/static_cast(num_leaf_parents); + + // Compute the final MH ratio + double log_mh_ratio = ( + std::log(1-pg) - std::log(pg) - std::log(1-pgl) - std::log(1-pgr) + std::log(prob_prune_old) + + std::log(p_leaf) - std::log(prob_grow_new) - std::log(p_leaf_parent) + no_split_log_marginal_likelihood - split_log_marginal_likelihood + ); + // Threshold at 0 + if (log_mh_ratio > 0) { + log_mh_ratio = 0; } - private: - // Maximum cutpoint grid size in the enumeration of possible splits - int cutpoint_grid_size_; + // Draw a uniform random variable and accept/reject the proposal on this basis + bool accept; + std::uniform_real_distribution mh_accept(0.0, 1.0); + double log_acceptance_prob = std::log(mh_accept(gen)); + if (log_acceptance_prob <= log_mh_ratio) { + accept = true; + RemoveSplitFromModel(tracker, dataset, tree_prior, gen, tree, tree_num, leaf_parent_chosen, left_node, right_node, false); + } else { + accept = false; + } +} + +template +static inline void GFRSampleOneIter(ForestTracker& tracker, ForestContainer& forests, LeafModel& leaf_model, ForestDataset& dataset, + ColumnVector& residual, TreePrior& tree_prior, std::mt19937& gen, std::vector& variable_weights, + double global_variance, std::vector& feature_types, int cutpoint_grid_size = 500, + bool pre_initialized = false) { + // Previous number of samples + int prev_num_samples = forests.NumSamples(); - // Function objects for element-wise addition and subtraction (used in the residual update function which takes std::function as an argument) - std::plus plus_op_; - std::minus minus_op_; + if ((prev_num_samples == 0) && (!pre_initialized)) { + // Add new forest to the container + forests.AddSamples(1); + + // Set initial value for each leaf in the forest + double root_pred = ComputeMeanOutcome(residual) / static_cast(forests.NumTrees()); + TreeEnsemble* ensemble = forests.GetEnsemble(0); + leaf_model.SetEnsembleRootPredictedValue(dataset, ensemble, root_pred); + } else if (prev_num_samples > 0) { + // Add new forest to the container + forests.AddSamples(1); + + // NOTE: only doing this for the simplicity of the partial residual step + // We could alternatively "reach back" to the tree predictions from a previous + // sample (whenever there is more than one sample). This is cleaner / quicker + // to implement during this refactor. 
+ forests.CopyFromPreviousSample(prev_num_samples, prev_num_samples - 1); + } else { + forests.IncrementSampleCount(); + } - void SampleTreeOneIter(Tree* tree, ForestTracker& tracker, ForestContainer& forests, LeafModel& leaf_model, ForestDataset& dataset, - ColumnVector& residual, TreePrior& tree_prior, std::mt19937& gen, std::vector& variable_weights, - int tree_num, double global_variance, std::vector& feature_types) { - int root_id = Tree::kRoot; - int curr_node_id; - data_size_t curr_node_begin; - data_size_t curr_node_end; - data_size_t n = dataset.GetCovariates().rows(); - // Mapping from node id to start and end points of sorted indices - std::unordered_map> node_index_map; - node_index_map.insert({root_id, std::make_pair(0, n)}); - std::pair begin_end; - // Add root node to the split queue - std::deque split_queue; - split_queue.push_back(Tree::kRoot); - // Run the "GrowFromRoot" procedure using a stack in place of recursion - while (!split_queue.empty()) { - // Remove the next node from the queue - curr_node_id = split_queue.front(); - split_queue.pop_front(); - // Determine the beginning and ending indices of the left and right nodes - begin_end = node_index_map[curr_node_id]; - curr_node_begin = begin_end.first; - curr_node_end = begin_end.second; - // Draw a split rule at random - SampleSplitRule(tree, tracker, leaf_model, dataset, residual, tree_prior, gen, tree_num, global_variance, cutpoint_grid_size_, - node_index_map, split_queue, curr_node_id, curr_node_begin, curr_node_end, variable_weights, feature_types); - } + // Run the GFR algorithm for each tree + TreeEnsemble* ensemble = forests.GetEnsemble(prev_num_samples); + int num_trees = forests.NumTrees(); + for (int i = 0; i < num_trees; i++) { + // Add tree i's predictions back to the residual (thus, training a model on the "partial residual") + Tree* tree = ensemble->GetTree(i); + UpdateResidualTree(tracker, dataset, residual, tree, i, leaf_model.RequiresBasis(), std::plus(), false); + + // Reset the tree and sample trackers + ensemble->ResetInitTree(i); + tracker.ResetRoot(dataset.GetCovariates(), feature_types, i); + tree = ensemble->GetTree(i); + + // Sample tree i + GFRSampleTreeOneIter(tree, tracker, forests, leaf_model, dataset, residual, tree_prior, gen, variable_weights, i, global_variance, feature_types, cutpoint_grid_size); + + // Sample leaf parameters for tree i + tree = ensemble->GetTree(i); + leaf_model.SampleLeafParameters(dataset, tracker, residual, tree, i, global_variance, gen); + + // Subtract tree i's predictions back out of the residual + UpdateResidualTree(tracker, dataset, residual, tree, i, leaf_model.RequiresBasis(), std::minus(), true); } +} - void SampleSplitRule(Tree* tree, ForestTracker& tracker, LeafModel& leaf_model, ForestDataset& dataset, ColumnVector& residual, - TreePrior& tree_prior, std::mt19937& gen, int tree_num, double global_variance, int cutpoint_grid_size, - std::unordered_map>& node_index_map, std::deque& split_queue, - int node_id, data_size_t node_begin, data_size_t node_end, std::vector& variable_weights, - std::vector& feature_types) { - // Leaf depth - int leaf_depth = tree->GetDepth(node_id); - - // Maximum leaf depth - int32_t max_depth = tree_prior.GetMaxDepth(); +template +static inline void GFRSampleTreeOneIter(Tree* tree, ForestTracker& tracker, ForestContainer& forests, LeafModel& leaf_model, ForestDataset& dataset, + ColumnVector& residual, TreePrior& tree_prior, std::mt19937& gen, std::vector& variable_weights, + int tree_num, double global_variance, std::vector& 
feature_types, int cutpoint_grid_size) { + int root_id = Tree::kRoot; + int curr_node_id; + data_size_t curr_node_begin; + data_size_t curr_node_end; + data_size_t n = dataset.GetCovariates().rows(); + // Mapping from node id to start and end points of sorted indices + std::unordered_map> node_index_map; + node_index_map.insert({root_id, std::make_pair(0, n)}); + std::pair begin_end; + // Add root node to the split queue + std::deque split_queue; + split_queue.push_back(Tree::kRoot); + // Run the "GrowFromRoot" procedure using a stack in place of recursion + while (!split_queue.empty()) { + // Remove the next node from the queue + curr_node_id = split_queue.front(); + split_queue.pop_front(); + // Determine the beginning and ending indices of the left and right nodes + begin_end = node_index_map[curr_node_id]; + curr_node_begin = begin_end.first; + curr_node_end = begin_end.second; + // Draw a split rule at random + SampleSplitRule(tree, tracker, leaf_model, dataset, residual, tree_prior, gen, tree_num, global_variance, cutpoint_grid_size, + node_index_map, split_queue, curr_node_id, curr_node_begin, curr_node_end, variable_weights, feature_types); + } +} - if ((max_depth == -1) || (leaf_depth < max_depth)) { +template +static inline void SampleSplitRule(Tree* tree, ForestTracker& tracker, LeafModel& leaf_model, ForestDataset& dataset, ColumnVector& residual, + TreePrior& tree_prior, std::mt19937& gen, int tree_num, double global_variance, int cutpoint_grid_size, + std::unordered_map>& node_index_map, std::deque& split_queue, + int node_id, data_size_t node_begin, data_size_t node_end, std::vector& variable_weights, + std::vector& feature_types) { + // Leaf depth + int leaf_depth = tree->GetDepth(node_id); + + // Maximum leaf depth + int32_t max_depth = tree_prior.GetMaxDepth(); + + if ((max_depth == -1) || (leaf_depth < max_depth)) { + + // Cutpoint enumeration + std::vector log_cutpoint_evaluations; + std::vector cutpoint_features; + std::vector cutpoint_values; + std::vector cutpoint_feature_types; + StochTree::data_size_t valid_cutpoint_count; + CutpointGridContainer cutpoint_grid_container(dataset.GetCovariates(), residual.GetData(), cutpoint_grid_size); + EvaluateCutpoints(tree, tracker, leaf_model, dataset, residual, tree_prior, gen, tree_num, global_variance, + cutpoint_grid_size, node_id, node_begin, node_end, log_cutpoint_evaluations, cutpoint_features, + cutpoint_values, cutpoint_feature_types, valid_cutpoint_count, variable_weights, feature_types, + cutpoint_grid_container); + // TODO: maybe add some checks here? 
+ + // Convert log marginal likelihood to marginal likelihood, normalizing by the maximum log-likelihood + double largest_mll = *std::max_element(log_cutpoint_evaluations.begin(), log_cutpoint_evaluations.end()); + std::vector cutpoint_evaluations(log_cutpoint_evaluations.size()); + for (data_size_t i = 0; i < log_cutpoint_evaluations.size(); i++){ + cutpoint_evaluations[i] = std::exp(log_cutpoint_evaluations[i] - largest_mll); + } - // Cutpoint enumeration - std::vector log_cutpoint_evaluations; - std::vector cutpoint_features; - std::vector cutpoint_values; - std::vector cutpoint_feature_types; - StochTree::data_size_t valid_cutpoint_count; - CutpointGridContainer cutpoint_grid_container(dataset.GetCovariates(), residual.GetData(), cutpoint_grid_size); - EvaluateCutpoints(tree, tracker, leaf_model, dataset, residual, tree_prior, gen, tree_num, global_variance, - cutpoint_grid_size, node_id, node_begin, node_end, log_cutpoint_evaluations, cutpoint_features, - cutpoint_values, cutpoint_feature_types, valid_cutpoint_count, variable_weights, feature_types, - cutpoint_grid_container); - // TODO: maybe add some checks here? + // Sample the split (including a "no split" option) + std::discrete_distribution split_dist(cutpoint_evaluations.begin(), cutpoint_evaluations.end()); + data_size_t split_chosen = split_dist(gen); + + if (split_chosen == valid_cutpoint_count){ + // "No split" sampled, don't split or add any nodes to split queue + return; + } else { + // Split sampled + int feature_split = cutpoint_features[split_chosen]; + FeatureType feature_type = cutpoint_feature_types[split_chosen]; + double split_value = cutpoint_values[split_chosen]; + // Perform all of the relevant "split" operations in the model, tree and training dataset - // Convert log marginal likelihood to marginal likelihood, normalizing by the maximum log-likelihood - double largest_mll = *std::max_element(log_cutpoint_evaluations.begin(), log_cutpoint_evaluations.end()); - std::vector cutpoint_evaluations(log_cutpoint_evaluations.size()); - for (data_size_t i = 0; i < log_cutpoint_evaluations.size(); i++){ - cutpoint_evaluations[i] = std::exp(log_cutpoint_evaluations[i] - largest_mll); - } + // Compute node sample size + data_size_t node_n = node_end - node_begin; - // Sample the split (including a "no split" option) - std::discrete_distribution split_dist(cutpoint_evaluations.begin(), cutpoint_evaluations.end()); - data_size_t split_chosen = split_dist(gen); + // Actual numeric cutpoint used for ordered categorical and numeric features + double split_value_numeric; + TreeSplit tree_split; - if (split_chosen == valid_cutpoint_count){ - // "No split" sampled, don't split or add any nodes to split queue - return; + // We will use these later in the model expansion + data_size_t left_n = 0; + data_size_t right_n = 0; + data_size_t sort_idx; + double feature_value; + bool split_true; + + if (feature_type == FeatureType::kUnorderedCategorical) { + // Determine the number of categories available in a categorical split and the set of categories that route observations to the left node after split + int num_categories; + std::vector categories = cutpoint_grid_container.CutpointVector(static_cast(split_value), feature_split); + tree_split = TreeSplit(categories); + } else if (feature_type == FeatureType::kOrderedCategorical) { + // Convert the bin split to an actual split value + split_value_numeric = cutpoint_grid_container.CutpointValue(static_cast(split_value), feature_split); + tree_split = TreeSplit(split_value_numeric); + } 
else if (feature_type == FeatureType::kNumeric) { + // Convert the bin split to an actual split value + split_value_numeric = cutpoint_grid_container.CutpointValue(static_cast(split_value), feature_split); + tree_split = TreeSplit(split_value_numeric); } else { - // Split sampled - int feature_split = cutpoint_features[split_chosen]; - FeatureType feature_type = cutpoint_feature_types[split_chosen]; - double split_value = cutpoint_values[split_chosen]; - // Perform all of the relevant "split" operations in the model, tree and training dataset - - // Compute node sample size - data_size_t node_n = node_end - node_begin; - - // Actual numeric cutpoint used for ordered categorical and numeric features - double split_value_numeric; - TreeSplit tree_split; - - // We will use these later in the model expansion - data_size_t left_n = 0; - data_size_t right_n = 0; - data_size_t sort_idx; - double feature_value; - bool split_true; - - if (feature_type == FeatureType::kUnorderedCategorical) { - // Determine the number of categories available in a categorical split and the set of categories that route observations to the left node after split - int num_categories; - std::vector categories = cutpoint_grid_container.CutpointVector(static_cast(split_value), feature_split); - tree_split = TreeSplit(categories); - } else if (feature_type == FeatureType::kOrderedCategorical) { - // Convert the bin split to an actual split value - split_value_numeric = cutpoint_grid_container.CutpointValue(static_cast(split_value), feature_split); - tree_split = TreeSplit(split_value_numeric); - } else if (feature_type == FeatureType::kNumeric) { - // Convert the bin split to an actual split value - split_value_numeric = cutpoint_grid_container.CutpointValue(static_cast(split_value), feature_split); - tree_split = TreeSplit(split_value_numeric); - } else { - Log::Fatal("Invalid split type"); - } - - // Add split to tree and trackers - AddSplitToModel(tracker, dataset, tree_prior, tree_split, gen, tree, tree_num, node_id, feature_split, true); - - // Determine the number of observation in the newly created left node - int left_node = tree->LeftChild(node_id); - int right_node = tree->RightChild(node_id); - auto left_begin_iter = tracker.SortedNodeBeginIterator(left_node, feature_split); - auto left_end_iter = tracker.SortedNodeEndIterator(left_node, feature_split); - for (auto i = left_begin_iter; i < left_end_iter; i++) { - left_n += 1; - } + Log::Fatal("Invalid split type"); + } + + // Add split to tree and trackers + AddSplitToModel(tracker, dataset, tree_prior, tree_split, gen, tree, tree_num, node_id, feature_split, true); + + // Determine the number of observation in the newly created left node + int left_node = tree->LeftChild(node_id); + int right_node = tree->RightChild(node_id); + auto left_begin_iter = tracker.SortedNodeBeginIterator(left_node, feature_split); + auto left_end_iter = tracker.SortedNodeEndIterator(left_node, feature_split); + for (auto i = left_begin_iter; i < left_end_iter; i++) { + left_n += 1; + } - // Add the begin and end indices for the new left and right nodes to node_index_map - node_index_map.insert({left_node, std::make_pair(node_begin, node_begin + left_n)}); - node_index_map.insert({right_node, std::make_pair(node_begin + left_n, node_end)}); + // Add the begin and end indices for the new left and right nodes to node_index_map + node_index_map.insert({left_node, std::make_pair(node_begin, node_begin + left_n)}); + node_index_map.insert({right_node, std::make_pair(node_begin + left_n, 
node_end)}); - // Add the left and right nodes to the split tracker - split_queue.push_front(right_node); - split_queue.push_front(left_node); - } + // Add the left and right nodes to the split tracker + split_queue.push_front(right_node); + split_queue.push_front(left_node); } } +} - void EvaluateCutpoints(Tree* tree, ForestTracker& tracker, LeafModel& leaf_model, ForestDataset& dataset, ColumnVector& residual, TreePrior& tree_prior, - std::mt19937& gen, int tree_num, double global_variance, int cutpoint_grid_size, int node_id, data_size_t node_begin, data_size_t node_end, - std::vector& log_cutpoint_evaluations, std::vector& cutpoint_features, std::vector& cutpoint_values, - std::vector& cutpoint_feature_types, data_size_t& valid_cutpoint_count, std::vector& variable_weights, - std::vector& feature_types, CutpointGridContainer& cutpoint_grid_container) { - // Evaluate all possible cutpoints according to the leaf node model, - // recording their log-likelihood and other split information in a series of vectors. - // The last element of these vectors concerns the "no-split" option. - leaf_model.EvaluateAllPossibleSplits(dataset, tracker, residual, tree_prior, global_variance, tree_num, node_id, log_cutpoint_evaluations, - cutpoint_features, cutpoint_values, cutpoint_feature_types, valid_cutpoint_count, - cutpoint_grid_container, node_begin, node_end, variable_weights, feature_types); - - // Compute an adjustment to reflect the no split prior probability and the number of cutpoints - double bart_prior_no_split_adj; - double alpha = tree_prior.GetAlpha(); - double beta = tree_prior.GetBeta(); - int node_depth = tree->GetDepth(node_id); - if (valid_cutpoint_count == 0) { - bart_prior_no_split_adj = std::log(((std::pow(1+node_depth, beta))/alpha) - 1.0); - } else { - bart_prior_no_split_adj = std::log(((std::pow(1+node_depth, beta))/alpha) - 1.0) + std::log(valid_cutpoint_count); - } - log_cutpoint_evaluations[log_cutpoint_evaluations.size()-1] += bart_prior_no_split_adj; +template +static inline void EvaluateCutpoints(Tree* tree, ForestTracker& tracker, LeafModel& leaf_model, ForestDataset& dataset, ColumnVector& residual, TreePrior& tree_prior, + std::mt19937& gen, int tree_num, double global_variance, int cutpoint_grid_size, int node_id, data_size_t node_begin, data_size_t node_end, + std::vector& log_cutpoint_evaluations, std::vector& cutpoint_features, std::vector& cutpoint_values, + std::vector& cutpoint_feature_types, data_size_t& valid_cutpoint_count, std::vector& variable_weights, + std::vector& feature_types, CutpointGridContainer& cutpoint_grid_container) { + // Evaluate all possible cutpoints according to the leaf node model, + // recording their log-likelihood and other split information in a series of vectors. + // The last element of these vectors concerns the "no-split" option. 
+ leaf_model.EvaluateAllPossibleSplits(dataset, tracker, residual, tree_prior, global_variance, tree_num, node_id, log_cutpoint_evaluations, + cutpoint_features, cutpoint_values, cutpoint_feature_types, valid_cutpoint_count, + cutpoint_grid_container, node_begin, node_end, variable_weights, feature_types); + + // Compute an adjustment to reflect the no split prior probability and the number of cutpoints + double bart_prior_no_split_adj; + double alpha = tree_prior.GetAlpha(); + double beta = tree_prior.GetBeta(); + int node_depth = tree->GetDepth(node_id); + if (valid_cutpoint_count == 0) { + bart_prior_no_split_adj = std::log(((std::pow(1+node_depth, beta))/alpha) - 1.0); + } else { + bart_prior_no_split_adj = std::log(((std::pow(1+node_depth, beta))/alpha) - 1.0) + std::log(valid_cutpoint_count); } - -}; + log_cutpoint_evaluations[log_cutpoint_evaluations.size()-1] += bart_prior_no_split_adj; +} } // namespace StochTree diff --git a/src/py_stochtree.cpp b/src/py_stochtree.cpp index 3c8ca606..47e9e26b 100644 --- a/src/py_stochtree.cpp +++ b/src/py_stochtree.cpp @@ -512,16 +512,13 @@ class ForestSamplerCpp { Eigen::MatrixXd& leaf_scale_matrix, double global_variance, double leaf_scale, int cutpoint_grid_size, bool pre_initialized) { if (leaf_model_enum == ForestLeafModel::kConstant) { StochTree::GaussianConstantLeafModel leaf_model = StochTree::GaussianConstantLeafModel(leaf_scale); - StochTree::GFRForestSampler sampler = StochTree::GFRForestSampler(cutpoint_grid_size); - sampler.SampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, feature_types, pre_initialized); + GFRSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, feature_types, cutpoint_grid_size, pre_initialized); } else if (leaf_model_enum == ForestLeafModel::kUnivariateRegression) { StochTree::GaussianUnivariateRegressionLeafModel leaf_model = StochTree::GaussianUnivariateRegressionLeafModel(leaf_scale); - StochTree::GFRForestSampler sampler = StochTree::GFRForestSampler(cutpoint_grid_size); - sampler.SampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, feature_types, pre_initialized); + GFRSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, feature_types, cutpoint_grid_size, pre_initialized); } else if (leaf_model_enum == ForestLeafModel::kMultivariateRegression) { StochTree::GaussianMultivariateRegressionLeafModel leaf_model = StochTree::GaussianMultivariateRegressionLeafModel(leaf_scale_matrix); - StochTree::GFRForestSampler sampler = StochTree::GFRForestSampler(cutpoint_grid_size); - sampler.SampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, feature_types, pre_initialized); + GFRSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, feature_types, cutpoint_grid_size, pre_initialized); } } @@ -530,16 +527,13 @@ class ForestSamplerCpp { Eigen::MatrixXd& leaf_scale_matrix, double global_variance, double leaf_scale, int cutpoint_grid_size, bool pre_initialized) { if (leaf_model_enum == ForestLeafModel::kConstant) { StochTree::GaussianConstantLeafModel leaf_model = 
StochTree::GaussianConstantLeafModel(leaf_scale); - StochTree::MCMCForestSampler sampler = StochTree::MCMCForestSampler(); - sampler.SampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, pre_initialized); + MCMCSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, pre_initialized); } else if (leaf_model_enum == ForestLeafModel::kUnivariateRegression) { StochTree::GaussianUnivariateRegressionLeafModel leaf_model = StochTree::GaussianUnivariateRegressionLeafModel(leaf_scale); - StochTree::MCMCForestSampler sampler = StochTree::MCMCForestSampler(); - sampler.SampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, pre_initialized); + MCMCSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, pre_initialized); } else if (leaf_model_enum == ForestLeafModel::kMultivariateRegression) { StochTree::GaussianMultivariateRegressionLeafModel leaf_model = StochTree::GaussianMultivariateRegressionLeafModel(leaf_scale_matrix); - StochTree::MCMCForestSampler sampler = StochTree::MCMCForestSampler(); - sampler.SampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, pre_initialized); + MCMCSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, pre_initialized); } } }; diff --git a/src/sampler.cpp b/src/sampler.cpp index 0edf6a7a..bfb0fe6e 100644 --- a/src/sampler.cpp +++ b/src/sampler.cpp @@ -61,16 +61,13 @@ void sample_gfr_one_iteration_cpp(cpp11::external_pointer sampler = StochTree::GFRForestSampler(cutpoint_grid_size); - sampler.SampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, feature_types_, pre_initialized); + GFRSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, feature_types_, cutpoint_grid_size, pre_initialized); } else if (leaf_model_enum == ForestLeafModel::kUnivariateRegression) { StochTree::GaussianUnivariateRegressionLeafModel leaf_model = StochTree::GaussianUnivariateRegressionLeafModel(leaf_scale); - StochTree::GFRForestSampler sampler = StochTree::GFRForestSampler(cutpoint_grid_size); - sampler.SampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, feature_types_, pre_initialized); + GFRSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, feature_types_, cutpoint_grid_size, pre_initialized); } else if (leaf_model_enum == ForestLeafModel::kMultivariateRegression) { StochTree::GaussianMultivariateRegressionLeafModel leaf_model = StochTree::GaussianMultivariateRegressionLeafModel(leaf_scale_matrix); - StochTree::GFRForestSampler sampler = StochTree::GFRForestSampler(cutpoint_grid_size); - sampler.SampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, feature_types_, pre_initialized); + GFRSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, 
var_weights_vector, global_variance, feature_types_, cutpoint_grid_size, pre_initialized); } } @@ -125,16 +122,13 @@ void sample_mcmc_one_iteration_cpp(cpp11::external_pointer sampler = StochTree::MCMCForestSampler(); - sampler.SampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, pre_initialized); + MCMCSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, pre_initialized); } else if (leaf_model_enum == ForestLeafModel::kUnivariateRegression) { StochTree::GaussianUnivariateRegressionLeafModel leaf_model = StochTree::GaussianUnivariateRegressionLeafModel(leaf_scale); - StochTree::MCMCForestSampler sampler = StochTree::MCMCForestSampler(); - sampler.SampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, pre_initialized); + MCMCSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, pre_initialized); } else if (leaf_model_enum == ForestLeafModel::kMultivariateRegression) { - StochTree::GaussianMultivariateRegressionLeafModel leaf_model = StochTree::GaussianMultivariateRegressionLeafModel(leaf_scale_matrix); - StochTree::MCMCForestSampler sampler = StochTree::MCMCForestSampler(); - sampler.SampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, pre_initialized); + StochTree::GaussianUnivariateRegressionLeafModel leaf_model = StochTree::GaussianMultivariateRegressionLeafModel(leaf_scale_matrix); + MCMCSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, pre_initialized); } } From c3bfa66cf86bc1c23f3e011c437b9e111987b98c Mon Sep 17 00:00:00 2001 From: Drew Herren Date: Sat, 24 Aug 2024 00:05:57 -0500 Subject: [PATCH 09/41] Fixed R package bug and rearranged tree_sampler header file --- include/stochtree/tree_sampler.h | 470 +++++++++++++++---------------- src/sampler.cpp | 4 +- 2 files changed, 237 insertions(+), 237 deletions(-) diff --git a/include/stochtree/tree_sampler.h b/include/stochtree/tree_sampler.h index 9db97f02..302ae6bf 100644 --- a/include/stochtree/tree_sampler.h +++ b/include/stochtree/tree_sampler.h @@ -234,9 +234,169 @@ static inline void UpdateResidualNewBasis(ForestTracker& tracker, ForestDataset& } template -static inline void MCMCSampleOneIter(ForestTracker& tracker, ForestContainer& forests, LeafModel& leaf_model, ForestDataset& dataset, - ColumnVector& residual, TreePrior& tree_prior, std::mt19937& gen, std::vector& variable_weights, - double global_variance, bool pre_initialized = false) { +static inline void EvaluateCutpoints(Tree* tree, ForestTracker& tracker, LeafModel& leaf_model, ForestDataset& dataset, ColumnVector& residual, TreePrior& tree_prior, + std::mt19937& gen, int tree_num, double global_variance, int cutpoint_grid_size, int node_id, data_size_t node_begin, data_size_t node_end, + std::vector& log_cutpoint_evaluations, std::vector& cutpoint_features, std::vector& cutpoint_values, + std::vector& cutpoint_feature_types, data_size_t& valid_cutpoint_count, std::vector& variable_weights, + std::vector& feature_types, CutpointGridContainer& cutpoint_grid_container) { + // Evaluate all possible cutpoints according to the leaf node model, + // recording their log-likelihood and other split information in a series of vectors. 
+ // The last element of these vectors concerns the "no-split" option. + leaf_model.EvaluateAllPossibleSplits(dataset, tracker, residual, tree_prior, global_variance, tree_num, node_id, log_cutpoint_evaluations, + cutpoint_features, cutpoint_values, cutpoint_feature_types, valid_cutpoint_count, + cutpoint_grid_container, node_begin, node_end, variable_weights, feature_types); + + // Compute an adjustment to reflect the no split prior probability and the number of cutpoints + double bart_prior_no_split_adj; + double alpha = tree_prior.GetAlpha(); + double beta = tree_prior.GetBeta(); + int node_depth = tree->GetDepth(node_id); + if (valid_cutpoint_count == 0) { + bart_prior_no_split_adj = std::log(((std::pow(1+node_depth, beta))/alpha) - 1.0); + } else { + bart_prior_no_split_adj = std::log(((std::pow(1+node_depth, beta))/alpha) - 1.0) + std::log(valid_cutpoint_count); + } + log_cutpoint_evaluations[log_cutpoint_evaluations.size()-1] += bart_prior_no_split_adj; +} + +template +static inline void SampleSplitRule(Tree* tree, ForestTracker& tracker, LeafModel& leaf_model, ForestDataset& dataset, ColumnVector& residual, + TreePrior& tree_prior, std::mt19937& gen, int tree_num, double global_variance, int cutpoint_grid_size, + std::unordered_map>& node_index_map, std::deque& split_queue, + int node_id, data_size_t node_begin, data_size_t node_end, std::vector& variable_weights, + std::vector& feature_types) { + // Leaf depth + int leaf_depth = tree->GetDepth(node_id); + + // Maximum leaf depth + int32_t max_depth = tree_prior.GetMaxDepth(); + + if ((max_depth == -1) || (leaf_depth < max_depth)) { + + // Cutpoint enumeration + std::vector log_cutpoint_evaluations; + std::vector cutpoint_features; + std::vector cutpoint_values; + std::vector cutpoint_feature_types; + StochTree::data_size_t valid_cutpoint_count; + CutpointGridContainer cutpoint_grid_container(dataset.GetCovariates(), residual.GetData(), cutpoint_grid_size); + EvaluateCutpoints(tree, tracker, leaf_model, dataset, residual, tree_prior, gen, tree_num, global_variance, + cutpoint_grid_size, node_id, node_begin, node_end, log_cutpoint_evaluations, cutpoint_features, + cutpoint_values, cutpoint_feature_types, valid_cutpoint_count, variable_weights, feature_types, + cutpoint_grid_container); + // TODO: maybe add some checks here? 
+ + // Convert log marginal likelihood to marginal likelihood, normalizing by the maximum log-likelihood + double largest_mll = *std::max_element(log_cutpoint_evaluations.begin(), log_cutpoint_evaluations.end()); + std::vector cutpoint_evaluations(log_cutpoint_evaluations.size()); + for (data_size_t i = 0; i < log_cutpoint_evaluations.size(); i++){ + cutpoint_evaluations[i] = std::exp(log_cutpoint_evaluations[i] - largest_mll); + } + + // Sample the split (including a "no split" option) + std::discrete_distribution split_dist(cutpoint_evaluations.begin(), cutpoint_evaluations.end()); + data_size_t split_chosen = split_dist(gen); + + if (split_chosen == valid_cutpoint_count){ + // "No split" sampled, don't split or add any nodes to split queue + return; + } else { + // Split sampled + int feature_split = cutpoint_features[split_chosen]; + FeatureType feature_type = cutpoint_feature_types[split_chosen]; + double split_value = cutpoint_values[split_chosen]; + // Perform all of the relevant "split" operations in the model, tree and training dataset + + // Compute node sample size + data_size_t node_n = node_end - node_begin; + + // Actual numeric cutpoint used for ordered categorical and numeric features + double split_value_numeric; + TreeSplit tree_split; + + // We will use these later in the model expansion + data_size_t left_n = 0; + data_size_t right_n = 0; + data_size_t sort_idx; + double feature_value; + bool split_true; + + if (feature_type == FeatureType::kUnorderedCategorical) { + // Determine the number of categories available in a categorical split and the set of categories that route observations to the left node after split + int num_categories; + std::vector categories = cutpoint_grid_container.CutpointVector(static_cast(split_value), feature_split); + tree_split = TreeSplit(categories); + } else if (feature_type == FeatureType::kOrderedCategorical) { + // Convert the bin split to an actual split value + split_value_numeric = cutpoint_grid_container.CutpointValue(static_cast(split_value), feature_split); + tree_split = TreeSplit(split_value_numeric); + } else if (feature_type == FeatureType::kNumeric) { + // Convert the bin split to an actual split value + split_value_numeric = cutpoint_grid_container.CutpointValue(static_cast(split_value), feature_split); + tree_split = TreeSplit(split_value_numeric); + } else { + Log::Fatal("Invalid split type"); + } + + // Add split to tree and trackers + AddSplitToModel(tracker, dataset, tree_prior, tree_split, gen, tree, tree_num, node_id, feature_split, true); + + // Determine the number of observation in the newly created left node + int left_node = tree->LeftChild(node_id); + int right_node = tree->RightChild(node_id); + auto left_begin_iter = tracker.SortedNodeBeginIterator(left_node, feature_split); + auto left_end_iter = tracker.SortedNodeEndIterator(left_node, feature_split); + for (auto i = left_begin_iter; i < left_end_iter; i++) { + left_n += 1; + } + + // Add the begin and end indices for the new left and right nodes to node_index_map + node_index_map.insert({left_node, std::make_pair(node_begin, node_begin + left_n)}); + node_index_map.insert({right_node, std::make_pair(node_begin + left_n, node_end)}); + + // Add the left and right nodes to the split tracker + split_queue.push_front(right_node); + split_queue.push_front(left_node); + } + } +} + +template +static inline void GFRSampleTreeOneIter(Tree* tree, ForestTracker& tracker, ForestContainer& forests, LeafModel& leaf_model, ForestDataset& dataset, + ColumnVector& residual, 
TreePrior& tree_prior, std::mt19937& gen, std::vector& variable_weights, + int tree_num, double global_variance, std::vector& feature_types, int cutpoint_grid_size) { + int root_id = Tree::kRoot; + int curr_node_id; + data_size_t curr_node_begin; + data_size_t curr_node_end; + data_size_t n = dataset.GetCovariates().rows(); + // Mapping from node id to start and end points of sorted indices + std::unordered_map> node_index_map; + node_index_map.insert({root_id, std::make_pair(0, n)}); + std::pair begin_end; + // Add root node to the split queue + std::deque split_queue; + split_queue.push_back(Tree::kRoot); + // Run the "GrowFromRoot" procedure using a stack in place of recursion + while (!split_queue.empty()) { + // Remove the next node from the queue + curr_node_id = split_queue.front(); + split_queue.pop_front(); + // Determine the beginning and ending indices of the left and right nodes + begin_end = node_index_map[curr_node_id]; + curr_node_begin = begin_end.first; + curr_node_end = begin_end.second; + // Draw a split rule at random + SampleSplitRule(tree, tracker, leaf_model, dataset, residual, tree_prior, gen, tree_num, global_variance, cutpoint_grid_size, + node_index_map, split_queue, curr_node_id, curr_node_begin, curr_node_end, variable_weights, feature_types); + } +} + +template +static inline void GFRSampleOneIter(ForestTracker& tracker, ForestContainer& forests, LeafModel& leaf_model, ForestDataset& dataset, + ColumnVector& residual, TreePrior& tree_prior, std::mt19937& gen, std::vector& variable_weights, + double global_variance, std::vector& feature_types, int cutpoint_grid_size = 500, + bool pre_initialized = false) { // Previous number of samples int prev_num_samples = forests.NumSamples(); @@ -251,84 +411,41 @@ static inline void MCMCSampleOneIter(ForestTracker& tracker, ForestContainer& fo } else if (prev_num_samples > 0) { // Add new forest to the container forests.AddSamples(1); - - // Copy previous forest + + // NOTE: only doing this for the simplicity of the partial residual step + // We could alternatively "reach back" to the tree predictions from a previous + // sample (whenever there is more than one sample). This is cleaner / quicker + // to implement during this refactor. 
forests.CopyFromPreviousSample(prev_num_samples, prev_num_samples - 1); } else { forests.IncrementSampleCount(); } - // Run the MCMC algorithm for each tree + // Run the GFR algorithm for each tree TreeEnsemble* ensemble = forests.GetEnsemble(prev_num_samples); - Tree* tree; int num_trees = forests.NumTrees(); for (int i = 0; i < num_trees; i++) { // Add tree i's predictions back to the residual (thus, training a model on the "partial residual") - tree = ensemble->GetTree(i); + Tree* tree = ensemble->GetTree(i); UpdateResidualTree(tracker, dataset, residual, tree, i, leaf_model.RequiresBasis(), std::plus(), false); - // Sample tree i + // Reset the tree and sample trackers + ensemble->ResetInitTree(i); + tracker.ResetRoot(dataset.GetCovariates(), feature_types, i); tree = ensemble->GetTree(i); - MCMCSampleTreeOneIter(tree, tracker, forests, leaf_model, dataset, residual, tree_prior, gen, variable_weights, i, global_variance); + + // Sample tree i + GFRSampleTreeOneIter(tree, tracker, forests, leaf_model, dataset, residual, tree_prior, gen, variable_weights, i, global_variance, feature_types, cutpoint_grid_size); // Sample leaf parameters for tree i tree = ensemble->GetTree(i); leaf_model.SampleLeafParameters(dataset, tracker, residual, tree, i, global_variance, gen); // Subtract tree i's predictions back out of the residual - tree = ensemble->GetTree(i); UpdateResidualTree(tracker, dataset, residual, tree, i, leaf_model.RequiresBasis(), std::minus(), true); } } -template -static inline void MCMCSampleTreeOneIter(Tree* tree, ForestTracker& tracker, ForestContainer& forests, LeafModel& leaf_model, ForestDataset& dataset, - ColumnVector& residual, TreePrior& tree_prior, std::mt19937& gen, std::vector& variable_weights, - int tree_num, double global_variance) { - // Determine whether it is possible to grow any of the leaves - bool grow_possible = false; - std::vector leaves = tree->GetLeaves(); - for (auto& leaf: leaves) { - if (tracker.UnsortedNodeSize(tree_num, leaf) > 2 * tree_prior.GetMinSamplesLeaf()) { - grow_possible = true; - break; - } - } - - // Determine whether it is possible to prune the tree - bool prune_possible = false; - if (tree->NumValidNodes() > 1) { - prune_possible = true; - } - - // Determine the relative probability of grow vs prune (0 = grow, 1 = prune) - double prob_grow; - std::vector step_probs(2); - if (grow_possible && prune_possible) { - step_probs = {0.5, 0.5}; - prob_grow = 0.5; - } else if (!grow_possible && prune_possible) { - step_probs = {0.0, 1.0}; - prob_grow = 0.0; - } else if (grow_possible && !prune_possible) { - step_probs = {1.0, 0.0}; - prob_grow = 1.0; - } else { - Log::Fatal("In this tree, neither grow nor prune is possible"); - } - std::discrete_distribution<> step_dist(step_probs.begin(), step_probs.end()); - - // Draw a split rule at random - data_size_t step_chosen = step_dist(gen); - bool accept; - - if (step_chosen == 0) { - MCMCGrowTreeOneIter(tree, tracker, leaf_model, dataset, residual, tree_prior, gen, tree_num, variable_weights, global_variance, prob_grow); - } else { - MCMCPruneTreeOneIter(tree, tracker, leaf_model, dataset, residual, tree_prior, gen, tree_num, global_variance); - } -} - template static inline void MCMCGrowTreeOneIter(Tree* tree, ForestTracker& tracker, LeafModel& leaf_model, ForestDataset& dataset, ColumnVector& residual, TreePrior& tree_prior, std::mt19937& gen, int tree_num, std::vector& variable_weights, @@ -506,10 +623,57 @@ static inline void MCMCPruneTreeOneIter(Tree* tree, ForestTracker& tracker, Leaf } 
template -static inline void GFRSampleOneIter(ForestTracker& tracker, ForestContainer& forests, LeafModel& leaf_model, ForestDataset& dataset, - ColumnVector& residual, TreePrior& tree_prior, std::mt19937& gen, std::vector& variable_weights, - double global_variance, std::vector& feature_types, int cutpoint_grid_size = 500, - bool pre_initialized = false) { +static inline void MCMCSampleTreeOneIter(Tree* tree, ForestTracker& tracker, ForestContainer& forests, LeafModel& leaf_model, ForestDataset& dataset, + ColumnVector& residual, TreePrior& tree_prior, std::mt19937& gen, std::vector& variable_weights, + int tree_num, double global_variance) { + // Determine whether it is possible to grow any of the leaves + bool grow_possible = false; + std::vector leaves = tree->GetLeaves(); + for (auto& leaf: leaves) { + if (tracker.UnsortedNodeSize(tree_num, leaf) > 2 * tree_prior.GetMinSamplesLeaf()) { + grow_possible = true; + break; + } + } + + // Determine whether it is possible to prune the tree + bool prune_possible = false; + if (tree->NumValidNodes() > 1) { + prune_possible = true; + } + + // Determine the relative probability of grow vs prune (0 = grow, 1 = prune) + double prob_grow; + std::vector step_probs(2); + if (grow_possible && prune_possible) { + step_probs = {0.5, 0.5}; + prob_grow = 0.5; + } else if (!grow_possible && prune_possible) { + step_probs = {0.0, 1.0}; + prob_grow = 0.0; + } else if (grow_possible && !prune_possible) { + step_probs = {1.0, 0.0}; + prob_grow = 1.0; + } else { + Log::Fatal("In this tree, neither grow nor prune is possible"); + } + std::discrete_distribution<> step_dist(step_probs.begin(), step_probs.end()); + + // Draw a split rule at random + data_size_t step_chosen = step_dist(gen); + bool accept; + + if (step_chosen == 0) { + MCMCGrowTreeOneIter(tree, tracker, leaf_model, dataset, residual, tree_prior, gen, tree_num, variable_weights, global_variance, prob_grow); + } else { + MCMCPruneTreeOneIter(tree, tracker, leaf_model, dataset, residual, tree_prior, gen, tree_num, global_variance); + } +} + +template +static inline void MCMCSampleOneIter(ForestTracker& tracker, ForestContainer& forests, LeafModel& leaf_model, ForestDataset& dataset, + ColumnVector& residual, TreePrior& tree_prior, std::mt19937& gen, std::vector& variable_weights, + double global_variance, bool pre_initialized = false) { // Previous number of samples int prev_num_samples = forests.NumSamples(); @@ -524,200 +688,36 @@ static inline void GFRSampleOneIter(ForestTracker& tracker, ForestContainer& for } else if (prev_num_samples > 0) { // Add new forest to the container forests.AddSamples(1); - - // NOTE: only doing this for the simplicity of the partial residual step - // We could alternatively "reach back" to the tree predictions from a previous - // sample (whenever there is more than one sample). This is cleaner / quicker - // to implement during this refactor. 
+ + // Copy previous forest forests.CopyFromPreviousSample(prev_num_samples, prev_num_samples - 1); } else { forests.IncrementSampleCount(); } - // Run the GFR algorithm for each tree + // Run the MCMC algorithm for each tree TreeEnsemble* ensemble = forests.GetEnsemble(prev_num_samples); + Tree* tree; int num_trees = forests.NumTrees(); for (int i = 0; i < num_trees; i++) { // Add tree i's predictions back to the residual (thus, training a model on the "partial residual") - Tree* tree = ensemble->GetTree(i); - UpdateResidualTree(tracker, dataset, residual, tree, i, leaf_model.RequiresBasis(), std::plus(), false); - - // Reset the tree and sample trackers - ensemble->ResetInitTree(i); - tracker.ResetRoot(dataset.GetCovariates(), feature_types, i); tree = ensemble->GetTree(i); + UpdateResidualTree(tracker, dataset, residual, tree, i, leaf_model.RequiresBasis(), std::plus(), false); // Sample tree i - GFRSampleTreeOneIter(tree, tracker, forests, leaf_model, dataset, residual, tree_prior, gen, variable_weights, i, global_variance, feature_types, cutpoint_grid_size); + tree = ensemble->GetTree(i); + MCMCSampleTreeOneIter(tree, tracker, forests, leaf_model, dataset, residual, tree_prior, gen, variable_weights, i, global_variance); // Sample leaf parameters for tree i tree = ensemble->GetTree(i); leaf_model.SampleLeafParameters(dataset, tracker, residual, tree, i, global_variance, gen); // Subtract tree i's predictions back out of the residual + tree = ensemble->GetTree(i); UpdateResidualTree(tracker, dataset, residual, tree, i, leaf_model.RequiresBasis(), std::minus(), true); } } -template -static inline void GFRSampleTreeOneIter(Tree* tree, ForestTracker& tracker, ForestContainer& forests, LeafModel& leaf_model, ForestDataset& dataset, - ColumnVector& residual, TreePrior& tree_prior, std::mt19937& gen, std::vector& variable_weights, - int tree_num, double global_variance, std::vector& feature_types, int cutpoint_grid_size) { - int root_id = Tree::kRoot; - int curr_node_id; - data_size_t curr_node_begin; - data_size_t curr_node_end; - data_size_t n = dataset.GetCovariates().rows(); - // Mapping from node id to start and end points of sorted indices - std::unordered_map> node_index_map; - node_index_map.insert({root_id, std::make_pair(0, n)}); - std::pair begin_end; - // Add root node to the split queue - std::deque split_queue; - split_queue.push_back(Tree::kRoot); - // Run the "GrowFromRoot" procedure using a stack in place of recursion - while (!split_queue.empty()) { - // Remove the next node from the queue - curr_node_id = split_queue.front(); - split_queue.pop_front(); - // Determine the beginning and ending indices of the left and right nodes - begin_end = node_index_map[curr_node_id]; - curr_node_begin = begin_end.first; - curr_node_end = begin_end.second; - // Draw a split rule at random - SampleSplitRule(tree, tracker, leaf_model, dataset, residual, tree_prior, gen, tree_num, global_variance, cutpoint_grid_size, - node_index_map, split_queue, curr_node_id, curr_node_begin, curr_node_end, variable_weights, feature_types); - } -} - -template -static inline void SampleSplitRule(Tree* tree, ForestTracker& tracker, LeafModel& leaf_model, ForestDataset& dataset, ColumnVector& residual, - TreePrior& tree_prior, std::mt19937& gen, int tree_num, double global_variance, int cutpoint_grid_size, - std::unordered_map>& node_index_map, std::deque& split_queue, - int node_id, data_size_t node_begin, data_size_t node_end, std::vector& variable_weights, - std::vector& feature_types) { - // Leaf depth - 
int leaf_depth = tree->GetDepth(node_id); - - // Maximum leaf depth - int32_t max_depth = tree_prior.GetMaxDepth(); - - if ((max_depth == -1) || (leaf_depth < max_depth)) { - - // Cutpoint enumeration - std::vector log_cutpoint_evaluations; - std::vector cutpoint_features; - std::vector cutpoint_values; - std::vector cutpoint_feature_types; - StochTree::data_size_t valid_cutpoint_count; - CutpointGridContainer cutpoint_grid_container(dataset.GetCovariates(), residual.GetData(), cutpoint_grid_size); - EvaluateCutpoints(tree, tracker, leaf_model, dataset, residual, tree_prior, gen, tree_num, global_variance, - cutpoint_grid_size, node_id, node_begin, node_end, log_cutpoint_evaluations, cutpoint_features, - cutpoint_values, cutpoint_feature_types, valid_cutpoint_count, variable_weights, feature_types, - cutpoint_grid_container); - // TODO: maybe add some checks here? - - // Convert log marginal likelihood to marginal likelihood, normalizing by the maximum log-likelihood - double largest_mll = *std::max_element(log_cutpoint_evaluations.begin(), log_cutpoint_evaluations.end()); - std::vector cutpoint_evaluations(log_cutpoint_evaluations.size()); - for (data_size_t i = 0; i < log_cutpoint_evaluations.size(); i++){ - cutpoint_evaluations[i] = std::exp(log_cutpoint_evaluations[i] - largest_mll); - } - - // Sample the split (including a "no split" option) - std::discrete_distribution split_dist(cutpoint_evaluations.begin(), cutpoint_evaluations.end()); - data_size_t split_chosen = split_dist(gen); - - if (split_chosen == valid_cutpoint_count){ - // "No split" sampled, don't split or add any nodes to split queue - return; - } else { - // Split sampled - int feature_split = cutpoint_features[split_chosen]; - FeatureType feature_type = cutpoint_feature_types[split_chosen]; - double split_value = cutpoint_values[split_chosen]; - // Perform all of the relevant "split" operations in the model, tree and training dataset - - // Compute node sample size - data_size_t node_n = node_end - node_begin; - - // Actual numeric cutpoint used for ordered categorical and numeric features - double split_value_numeric; - TreeSplit tree_split; - - // We will use these later in the model expansion - data_size_t left_n = 0; - data_size_t right_n = 0; - data_size_t sort_idx; - double feature_value; - bool split_true; - - if (feature_type == FeatureType::kUnorderedCategorical) { - // Determine the number of categories available in a categorical split and the set of categories that route observations to the left node after split - int num_categories; - std::vector categories = cutpoint_grid_container.CutpointVector(static_cast(split_value), feature_split); - tree_split = TreeSplit(categories); - } else if (feature_type == FeatureType::kOrderedCategorical) { - // Convert the bin split to an actual split value - split_value_numeric = cutpoint_grid_container.CutpointValue(static_cast(split_value), feature_split); - tree_split = TreeSplit(split_value_numeric); - } else if (feature_type == FeatureType::kNumeric) { - // Convert the bin split to an actual split value - split_value_numeric = cutpoint_grid_container.CutpointValue(static_cast(split_value), feature_split); - tree_split = TreeSplit(split_value_numeric); - } else { - Log::Fatal("Invalid split type"); - } - - // Add split to tree and trackers - AddSplitToModel(tracker, dataset, tree_prior, tree_split, gen, tree, tree_num, node_id, feature_split, true); - - // Determine the number of observation in the newly created left node - int left_node = tree->LeftChild(node_id); - 
int right_node = tree->RightChild(node_id); - auto left_begin_iter = tracker.SortedNodeBeginIterator(left_node, feature_split); - auto left_end_iter = tracker.SortedNodeEndIterator(left_node, feature_split); - for (auto i = left_begin_iter; i < left_end_iter; i++) { - left_n += 1; - } - - // Add the begin and end indices for the new left and right nodes to node_index_map - node_index_map.insert({left_node, std::make_pair(node_begin, node_begin + left_n)}); - node_index_map.insert({right_node, std::make_pair(node_begin + left_n, node_end)}); - - // Add the left and right nodes to the split tracker - split_queue.push_front(right_node); - split_queue.push_front(left_node); - } - } -} - -template -static inline void EvaluateCutpoints(Tree* tree, ForestTracker& tracker, LeafModel& leaf_model, ForestDataset& dataset, ColumnVector& residual, TreePrior& tree_prior, - std::mt19937& gen, int tree_num, double global_variance, int cutpoint_grid_size, int node_id, data_size_t node_begin, data_size_t node_end, - std::vector& log_cutpoint_evaluations, std::vector& cutpoint_features, std::vector& cutpoint_values, - std::vector& cutpoint_feature_types, data_size_t& valid_cutpoint_count, std::vector& variable_weights, - std::vector& feature_types, CutpointGridContainer& cutpoint_grid_container) { - // Evaluate all possible cutpoints according to the leaf node model, - // recording their log-likelihood and other split information in a series of vectors. - // The last element of these vectors concerns the "no-split" option. - leaf_model.EvaluateAllPossibleSplits(dataset, tracker, residual, tree_prior, global_variance, tree_num, node_id, log_cutpoint_evaluations, - cutpoint_features, cutpoint_values, cutpoint_feature_types, valid_cutpoint_count, - cutpoint_grid_container, node_begin, node_end, variable_weights, feature_types); - - // Compute an adjustment to reflect the no split prior probability and the number of cutpoints - double bart_prior_no_split_adj; - double alpha = tree_prior.GetAlpha(); - double beta = tree_prior.GetBeta(); - int node_depth = tree->GetDepth(node_id); - if (valid_cutpoint_count == 0) { - bart_prior_no_split_adj = std::log(((std::pow(1+node_depth, beta))/alpha) - 1.0); - } else { - bart_prior_no_split_adj = std::log(((std::pow(1+node_depth, beta))/alpha) - 1.0) + std::log(valid_cutpoint_count); - } - log_cutpoint_evaluations[log_cutpoint_evaluations.size()-1] += bart_prior_no_split_adj; -} - } // namespace StochTree #endif // STOCHTREE_TREE_SAMPLER_H_ \ No newline at end of file diff --git a/src/sampler.cpp b/src/sampler.cpp index bfb0fe6e..2fc241e6 100644 --- a/src/sampler.cpp +++ b/src/sampler.cpp @@ -127,8 +127,8 @@ void sample_mcmc_one_iteration_cpp(cpp11::external_pointer(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, pre_initialized); } else if (leaf_model_enum == ForestLeafModel::kMultivariateRegression) { - StochTree::GaussianUnivariateRegressionLeafModel leaf_model = StochTree::GaussianMultivariateRegressionLeafModel(leaf_scale_matrix); - MCMCSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, pre_initialized); + StochTree::GaussianMultivariateRegressionLeafModel leaf_model = StochTree::GaussianMultivariateRegressionLeafModel(leaf_scale_matrix); + MCMCSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, pre_initialized); } } From 
From e934db26d2a52ae665a1e5ec2d2428c3739d2bad Mon Sep 17 00:00:00 2001
From: Drew Herren
Date: Sat, 24 Aug 2024 00:12:42 -0500
Subject: [PATCH 10/41] Added StochTree scope to sampler function calls

---
 src/py_stochtree.cpp | 12 ++++++------
 src/sampler.cpp      | 12 ++++++------
 2 files changed, 12 insertions(+), 12 deletions(-)

diff --git a/src/py_stochtree.cpp b/src/py_stochtree.cpp
index 47e9e26b..7025d8a9 100644
--- a/src/py_stochtree.cpp
+++ b/src/py_stochtree.cpp
@@ -512,13 +512,13 @@ class ForestSamplerCpp {
                 Eigen::MatrixXd& leaf_scale_matrix, double global_variance, double leaf_scale, int cutpoint_grid_size, bool pre_initialized) {
     if (leaf_model_enum == ForestLeafModel::kConstant) {
       StochTree::GaussianConstantLeafModel leaf_model = StochTree::GaussianConstantLeafModel(leaf_scale);
-      GFRSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, feature_types, cutpoint_grid_size, pre_initialized);
+      StochTree::GFRSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, feature_types, cutpoint_grid_size, pre_initialized);
     } else if (leaf_model_enum == ForestLeafModel::kUnivariateRegression) {
       StochTree::GaussianUnivariateRegressionLeafModel leaf_model = StochTree::GaussianUnivariateRegressionLeafModel(leaf_scale);
-      GFRSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, feature_types, cutpoint_grid_size, pre_initialized);
+      StochTree::GFRSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, feature_types, cutpoint_grid_size, pre_initialized);
     } else if (leaf_model_enum == ForestLeafModel::kMultivariateRegression) {
       StochTree::GaussianMultivariateRegressionLeafModel leaf_model = StochTree::GaussianMultivariateRegressionLeafModel(leaf_scale_matrix);
-      GFRSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, feature_types, cutpoint_grid_size, pre_initialized);
+      StochTree::GFRSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, feature_types, cutpoint_grid_size, pre_initialized);
     }
   }
 
@@ -527,13 +527,13 @@ class ForestSamplerCpp {
                 Eigen::MatrixXd& leaf_scale_matrix, double global_variance, double leaf_scale, int cutpoint_grid_size, bool pre_initialized) {
     if (leaf_model_enum == ForestLeafModel::kConstant) {
       StochTree::GaussianConstantLeafModel leaf_model = StochTree::GaussianConstantLeafModel(leaf_scale);
-      MCMCSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, pre_initialized);
+      StochTree::MCMCSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, pre_initialized);
     } else if (leaf_model_enum == ForestLeafModel::kUnivariateRegression) {
       StochTree::GaussianUnivariateRegressionLeafModel leaf_model = StochTree::GaussianUnivariateRegressionLeafModel(leaf_scale);
-      MCMCSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, pre_initialized);
+      StochTree::MCMCSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, pre_initialized);
     } else if (leaf_model_enum == ForestLeafModel::kMultivariateRegression) {
       StochTree::GaussianMultivariateRegressionLeafModel leaf_model = StochTree::GaussianMultivariateRegressionLeafModel(leaf_scale_matrix);
-      MCMCSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, pre_initialized);
+      StochTree::MCMCSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, pre_initialized);
     }
   }
 };
diff --git a/src/sampler.cpp b/src/sampler.cpp
index 2fc241e6..1229d6f0 100644
--- a/src/sampler.cpp
+++ b/src/sampler.cpp
@@ -61,13 +61,13 @@ void sample_gfr_one_iteration_cpp(cpp11::external_pointer<StochTree::ForestDataset> data,
   if (leaf_model_enum == ForestLeafModel::kConstant) {
     StochTree::GaussianConstantLeafModel leaf_model = StochTree::GaussianConstantLeafModel(leaf_scale);
-    GFRSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, feature_types_, cutpoint_grid_size, pre_initialized);
+    StochTree::GFRSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, feature_types_, cutpoint_grid_size, pre_initialized);
   } else if (leaf_model_enum == ForestLeafModel::kUnivariateRegression) {
     StochTree::GaussianUnivariateRegressionLeafModel leaf_model = StochTree::GaussianUnivariateRegressionLeafModel(leaf_scale);
-    GFRSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, feature_types_, cutpoint_grid_size, pre_initialized);
+    StochTree::GFRSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, feature_types_, cutpoint_grid_size, pre_initialized);
   } else if (leaf_model_enum == ForestLeafModel::kMultivariateRegression) {
     StochTree::GaussianMultivariateRegressionLeafModel leaf_model = StochTree::GaussianMultivariateRegressionLeafModel(leaf_scale_matrix);
-    GFRSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, feature_types_, cutpoint_grid_size, pre_initialized);
+    StochTree::GFRSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, feature_types_, cutpoint_grid_size, pre_initialized);
   }
 }
 
@@ -122,13 +122,13 @@ void sample_mcmc_one_iteration_cpp(cpp11::external_pointer<StochTree::ForestDataset> data,
   if (leaf_model_enum == ForestLeafModel::kConstant) {
     StochTree::GaussianConstantLeafModel leaf_model = StochTree::GaussianConstantLeafModel(leaf_scale);
-    MCMCSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, pre_initialized);
+    StochTree::MCMCSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, pre_initialized);
   } else if (leaf_model_enum == ForestLeafModel::kUnivariateRegression) {
     StochTree::GaussianUnivariateRegressionLeafModel leaf_model = StochTree::GaussianUnivariateRegressionLeafModel(leaf_scale);
-    MCMCSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, pre_initialized);
+    StochTree::MCMCSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, pre_initialized);
   } else if (leaf_model_enum == ForestLeafModel::kMultivariateRegression) {
     StochTree::GaussianMultivariateRegressionLeafModel leaf_model = StochTree::GaussianMultivariateRegressionLeafModel(leaf_scale_matrix);
-    MCMCSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, pre_initialized);
+    StochTree::MCMCSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, pre_initialized);
  }
 }

From 9646a0844488e2ef3db58284764ff720b09a593b Mon Sep 17 00:00:00 2001
From: Drew Herren
Date: Tue, 27 Aug 2024 00:46:12 -0500
Subject: [PATCH 11/41] Refactor sampler iteration to avoid incremental object creation

---
 debug/README.md                  |  15 +-
 debug/api_debug.cpp              | 121 ++++----
 include/stochtree/leaf_model.h   | 155 ++++++++--
 include/stochtree/meta.h         |  10 +-
 include/stochtree/tree_sampler.h | 248 ++++++++++++---
 src/leaf_model.cpp               | 501 -------------------------------
 src/py_stochtree.cpp             |  12 +-
 src/sampler.cpp                  |  12 +-
 8 files changed, 444 insertions(+), 630 deletions(-)

diff --git a/debug/README.md b/debug/README.md
index 907a4ec0..e740b4ef 100644
--- a/debug/README.md
+++ b/debug/README.md
@@ -4,12 +4,19 @@ This subdirectory contains a debug program for the C++ codebase.
 
 The program takes several command line arguments (in order):
 
 1. Which data-generating process (DGP) to run (integer-coded, see below for a detailed description)
-2. Whether or not to include random effects (0 = no, 1 = yes)
-3. Number of grow-from-root (GFR) samples
-4. Number of MCMC samples
-5. Seed for random number generator (-1 means we defer to C++ `std::random_device`)
+2. Which leaf model to sample (integer-coded, see below for a detailed description)
+3. Whether or not to include random effects (0 = no, 1 = yes)
+4. Number of grow-from-root (GFR) samples
+5. Number of MCMC samples
+6. Seed for random number generator (-1 means we defer to C++ `std::random_device`)
 
 The DGPs are numbered as follows:
 
 0. Simple leaf regression model with a univariate basis for the leaf model
 1. Constant leaf model with a large number of deep interactions between features
+
+The models are numbered as follows:
+
+0. Constant leaf tree model (the "classic" BART / XBART model)
+1. "Univariate basis" leaf regression model
+2. "Multivariate basis" leaf regression model
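(With the expanded argument list documented above, a typical invocation of the debug program would look like `./api_debug 0 1 0 10 100 -1`: DGP 0, the univariate-basis leaf model, no random effects, 10 GFR draws, 100 MCMC draws, and a seed deferred to `std::random_device`. The binary name depends on the local build target and is only an assumption here.)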
"Multivariate basis" leaf regression model diff --git a/debug/api_debug.cpp b/debug/api_debug.cpp index d7420d5f..5d84c00b 100644 --- a/debug/api_debug.cpp +++ b/debug/api_debug.cpp @@ -16,16 +16,11 @@ #include #include #include +#include #include namespace StochTree{ -enum ForestLeafModel { - kConstant, - kUnivariateRegression, - kMultivariateRegression -}; - void GenerateDGP1(std::vector& covariates, std::vector& basis, std::vector& outcome, std::vector& rfx_basis, std::vector& rfx_groups, std::vector& feature_types, std::mt19937& gen, int& n, int& x_cols, int& omega_cols, int& y_cols, int& rfx_basis_cols, int& num_rfx_groups, bool rfx_included, int random_seed = -1) { // Data dimensions n = 1000; @@ -265,37 +260,37 @@ void OutcomeOffsetScale(ColumnVector& residual, double& outcome_offset, double& } } -void sampleGFR(ForestTracker& tracker, TreePrior& tree_prior, ForestContainer& forest_samples, ForestDataset& dataset, - ColumnVector& residual, std::mt19937& rng, std::vector& feature_types, std::vector& var_weights_vector, - ForestLeafModel leaf_model_type, Eigen::MatrixXd& leaf_scale_matrix, double global_variance, double leaf_scale, int cutpoint_grid_size) { - if (leaf_model_type == ForestLeafModel::kConstant) { - GaussianConstantLeafModel leaf_model = GaussianConstantLeafModel(leaf_scale); - GFRSampleOneIter(tracker, forest_samples, leaf_model, dataset, residual, tree_prior, rng, var_weights_vector, global_variance, feature_types, cutpoint_grid_size); - } else if (leaf_model_type == ForestLeafModel::kUnivariateRegression) { - GaussianUnivariateRegressionLeafModel leaf_model = GaussianUnivariateRegressionLeafModel(leaf_scale); - GFRSampleOneIter(tracker, forest_samples, leaf_model, dataset, residual, tree_prior, rng, var_weights_vector, global_variance, feature_types, cutpoint_grid_size); - } else if (leaf_model_type == ForestLeafModel::kMultivariateRegression) { - GaussianMultivariateRegressionLeafModel leaf_model = GaussianMultivariateRegressionLeafModel(leaf_scale_matrix); - GFRSampleOneIter(tracker, forest_samples, leaf_model, dataset, residual, tree_prior, rng, var_weights_vector, global_variance, feature_types, cutpoint_grid_size); - } -} - -void sampleMCMC(ForestTracker& tracker, TreePrior& tree_prior, ForestContainer& forest_samples, ForestDataset& dataset, - ColumnVector& residual, std::mt19937& rng, std::vector& feature_types, std::vector& var_weights_vector, - ForestLeafModel leaf_model_type, Eigen::MatrixXd& leaf_scale_matrix, double global_variance, double leaf_scale, int cutpoint_grid_size) { - if (leaf_model_type == ForestLeafModel::kConstant) { - GaussianConstantLeafModel leaf_model = GaussianConstantLeafModel(leaf_scale); - MCMCSampleOneIter(tracker, forest_samples, leaf_model, dataset, residual, tree_prior, rng, var_weights_vector, global_variance); - } else if (leaf_model_type == ForestLeafModel::kUnivariateRegression) { - GaussianUnivariateRegressionLeafModel leaf_model = GaussianUnivariateRegressionLeafModel(leaf_scale); - MCMCSampleOneIter(tracker, forest_samples, leaf_model, dataset, residual, tree_prior, rng, var_weights_vector, global_variance); - } else if (leaf_model_type == ForestLeafModel::kMultivariateRegression) { - GaussianMultivariateRegressionLeafModel leaf_model = GaussianMultivariateRegressionLeafModel(leaf_scale_matrix); - MCMCSampleOneIter(tracker, forest_samples, leaf_model, dataset, residual, tree_prior, rng, var_weights_vector, global_variance); - } -} - -void RunDebug(int dgp_num = 0, bool rfx_included = false, int num_gfr = 10, int num_mcmc = 
100, int random_seed = -1) { +// void sampleGFR(ForestTracker& tracker, TreePrior& tree_prior, ForestContainer& forest_samples, ForestDataset& dataset, +// ColumnVector& residual, std::mt19937& rng, std::vector& feature_types, std::vector& var_weights_vector, +// ForestLeafModel leaf_model_type, Eigen::MatrixXd& leaf_scale_matrix, double global_variance, double leaf_scale, int cutpoint_grid_size) { +// if (leaf_model_type == ForestLeafModel::kConstant) { +// GaussianConstantLeafModel leaf_model = GaussianConstantLeafModel(leaf_scale); +// GFRSampleOneIter(tracker, forest_samples, leaf_model, dataset, residual, tree_prior, rng, var_weights_vector, global_variance, feature_types, cutpoint_grid_size); +// } else if (leaf_model_type == ForestLeafModel::kUnivariateRegression) { +// GaussianUnivariateRegressionLeafModel leaf_model = GaussianUnivariateRegressionLeafModel(leaf_scale); +// GFRSampleOneIter(tracker, forest_samples, leaf_model, dataset, residual, tree_prior, rng, var_weights_vector, global_variance, feature_types, cutpoint_grid_size); +// } else if (leaf_model_type == ForestLeafModel::kMultivariateRegression) { +// GaussianMultivariateRegressionLeafModel leaf_model = GaussianMultivariateRegressionLeafModel(leaf_scale_matrix); +// GFRSampleOneIter(tracker, forest_samples, leaf_model, dataset, residual, tree_prior, rng, var_weights_vector, global_variance, feature_types, cutpoint_grid_size); +// } +// } + +// void sampleMCMC(ForestTracker& tracker, TreePrior& tree_prior, ForestContainer& forest_samples, ForestDataset& dataset, +// ColumnVector& residual, std::mt19937& rng, std::vector& feature_types, std::vector& var_weights_vector, +// ForestLeafModel leaf_model_type, Eigen::MatrixXd& leaf_scale_matrix, double global_variance, double leaf_scale, int cutpoint_grid_size) { +// if (leaf_model_type == ForestLeafModel::kConstant) { +// GaussianConstantLeafModel leaf_model = GaussianConstantLeafModel(leaf_scale); +// MCMCSampleOneIter(tracker, forest_samples, leaf_model, dataset, residual, tree_prior, rng, var_weights_vector, global_variance); +// } else if (leaf_model_type == ForestLeafModel::kUnivariateRegression) { +// GaussianUnivariateRegressionLeafModel leaf_model = GaussianUnivariateRegressionLeafModel(leaf_scale); +// MCMCSampleOneIter(tracker, forest_samples, leaf_model, dataset, residual, tree_prior, rng, var_weights_vector, global_variance); +// } else if (leaf_model_type == ForestLeafModel::kMultivariateRegression) { +// GaussianMultivariateRegressionLeafModel leaf_model = GaussianMultivariateRegressionLeafModel(leaf_scale_matrix); +// MCMCSampleOneIter(tracker, forest_samples, leaf_model, dataset, residual, tree_prior, rng, var_weights_vector, global_variance); +// } +// } + +void RunDebug(int dgp_num = 0, ModelType model_type = kConstantLeafGaussian, bool rfx_included = false, int num_gfr = 10, int num_mcmc = 100, int random_seed = -1) { // Flag the data as row-major bool row_major = true; @@ -326,24 +321,26 @@ void RunDebug(int dgp_num = 0, bool rfx_included = false, int num_gfr = 10, int std::vector rfx_groups; std::vector feature_types; + // Check for DGP : ModelType compatibility + if ((model_type != kConstantLeafGaussian) && (dgp_num == 1)) { + Log::Fatal("dgp 2 is only compatible with a constant leaf model"); + } + // Generate the data int output_dimension; bool is_leaf_constant; - ForestLeafModel leaf_model_type; if (dgp_num == 0) { GenerateDGP1(covariates_raw, basis_raw, outcome_raw, rfx_basis_raw, rfx_groups, feature_types, gen, n, x_cols, omega_cols, y_cols, 
rfx_basis_cols, num_rfx_groups, rfx_included, random_seed); dataset.AddCovariates(covariates_raw.data(), n, x_cols, row_major); dataset.AddBasis(basis_raw.data(), n, omega_cols, row_major); output_dimension = 1; is_leaf_constant = false; - leaf_model_type = ForestLeafModel::kUnivariateRegression; } else if (dgp_num == 1) { GenerateDGP2(covariates_raw, basis_raw, outcome_raw, rfx_basis_raw, rfx_groups, feature_types, gen, n, x_cols, omega_cols, y_cols, rfx_basis_cols, num_rfx_groups, rfx_included, random_seed); dataset.AddCovariates(covariates_raw.data(), n, x_cols, row_major); output_dimension = 1; is_leaf_constant = true; - leaf_model_type = ForestLeafModel::kConstant; } else { Log::Fatal("Invalid dgp_num"); @@ -441,6 +438,9 @@ void RunDebug(int dgp_num = 0, bool rfx_included = false, int num_gfr = 10, int std::vector global_variance_samples{}; std::vector leaf_variance_samples{}; + // Prepare the samplers + LeafModelVariant leaf_model = leafModelFactory(model_type, leaf_scale, leaf_scale_matrix); + // Run the GFR sampler if (num_gfr > 0) { for (int i = 0; i < num_gfr; i++) { @@ -454,8 +454,13 @@ void RunDebug(int dgp_num = 0, bool rfx_included = false, int num_gfr = 10, int } // Sample tree ensemble - sampleGFR(tracker, tree_prior, forest_samples, dataset, residual, gen, feature_types, variable_weights, - leaf_model_type, leaf_scale_matrix, global_variance, leaf_scale, cutpoint_grid_size); + if (model_type == ModelType::kConstantLeafGaussian) { + GFRSampleOneIter(tracker, forest_samples, std::get(leaf_model), dataset, residual, tree_prior, gen, variable_weights, global_variance, feature_types, cutpoint_grid_size, false); + } else if (model_type == ModelType::kUnivariateRegressionLeafGaussian) { + GFRSampleOneIter(tracker, forest_samples, std::get(leaf_model), dataset, residual, tree_prior, gen, variable_weights, global_variance, feature_types, cutpoint_grid_size, false); + } else if (model_type == ModelType::kMultivariateRegressionLeafGaussian) { + GFRSampleOneIter(tracker, forest_samples, std::get(leaf_model), dataset, residual, tree_prior, gen, variable_weights, global_variance, feature_types, cutpoint_grid_size, false, omega_cols); + } if (rfx_included) { // Sample random effects @@ -484,8 +489,13 @@ void RunDebug(int dgp_num = 0, bool rfx_included = false, int num_gfr = 10, int } // Sample tree ensemble - sampleMCMC(tracker, tree_prior, forest_samples, dataset, residual, gen, feature_types, variable_weights, - leaf_model_type, leaf_scale_matrix, global_variance, leaf_scale, cutpoint_grid_size); + if (model_type == ModelType::kConstantLeafGaussian) { + MCMCSampleOneIter(tracker, forest_samples, std::get(leaf_model), dataset, residual, tree_prior, gen, variable_weights, global_variance, false); + } else if (model_type == ModelType::kUnivariateRegressionLeafGaussian) { + MCMCSampleOneIter(tracker, forest_samples, std::get(leaf_model), dataset, residual, tree_prior, gen, variable_weights, global_variance, false); + } else if (model_type == ModelType::kMultivariateRegressionLeafGaussian) { + MCMCSampleOneIter(tracker, forest_samples, std::get(leaf_model), dataset, residual, tree_prior, gen, variable_weights, global_variance, false, omega_cols); + } if (rfx_included) { // Sample random effects @@ -531,24 +541,29 @@ int main(int argc, char* argv[]) { if ((dgp_num != 0) && (dgp_num != 1)) { StochTree::Log::Fatal("The first command line argument must be 0 or 1"); } - int rfx_int = std::stoi(argv[2]); + int model_type_int = static_cast(std::stoi(argv[2])); + if ((model_type_int != 0) && 
(model_type_int != 1) && (model_type_int != 2)) { + StochTree::Log::Fatal("The second command line argument must be 0, 1, or 2"); + } + StochTree::ModelType model_type = static_cast(model_type_int); + int rfx_int = std::stoi(argv[3]); if ((rfx_int != 0) && (rfx_int != 1)) { - StochTree::Log::Fatal("The second command line argument must be 0 or 1"); + StochTree::Log::Fatal("The third command line argument must be 0 or 1"); } bool rfx_included = static_cast(rfx_int); - int num_gfr = std::stoi(argv[3]); + int num_gfr = std::stoi(argv[4]); if (num_gfr < 0) { - StochTree::Log::Fatal("The third command line argument must be >= 0"); + StochTree::Log::Fatal("The fourth command line argument must be >= 0"); } - int num_mcmc = std::stoi(argv[4]); + int num_mcmc = std::stoi(argv[5]); if (num_mcmc < 0) { - StochTree::Log::Fatal("The fourth command line argument must be >= 0"); + StochTree::Log::Fatal("The fifth command line argument must be >= 0"); } - int random_seed = std::stoi(argv[5]); + int random_seed = std::stoi(argv[6]); if (random_seed < -1) { - StochTree::Log::Fatal("The fifth command line argument must be >= -0"); + StochTree::Log::Fatal("The sixth command line argument must be >= -0"); } // Run the debug program - StochTree::RunDebug(dgp_num, rfx_included, num_gfr, num_mcmc); + StochTree::RunDebug(dgp_num, model_type, rfx_included, num_gfr, num_mcmc); } diff --git a/include/stochtree/leaf_model.h b/include/stochtree/leaf_model.h index 3ea7a8bb..f006566f 100644 --- a/include/stochtree/leaf_model.h +++ b/include/stochtree/leaf_model.h @@ -20,6 +20,12 @@ namespace StochTree { +enum ModelType { + kConstantLeafGaussian, + kUnivariateRegressionLeafGaussian, + kMultivariateRegressionLeafGaussian +}; + /*! \brief Sufficient statistic and associated operations for gaussian homoskedastic constant leaf outcome model */ class GaussianConstantSuffStat { public: @@ -67,12 +73,6 @@ class GaussianConstantLeafModel { public: GaussianConstantLeafModel(double tau) {tau_ = tau; normal_sampler_ = UnivariateNormalSampler();} ~GaussianConstantLeafModel() {} - std::tuple EvaluateProposedSplit(ForestDataset& dataset, ForestTracker& tracker, ColumnVector& residual, TreeSplit& split, int tree_num, int leaf_num, int split_feature, double global_variance); - std::tuple EvaluateExistingSplit(ForestDataset& dataset, ForestTracker& tracker, ColumnVector& residual, double global_variance, int tree_num, int split_node_id, int left_node_id, int right_node_id); - void EvaluateAllPossibleSplits(ForestDataset& dataset, ForestTracker& tracker, ColumnVector& residual, TreePrior& tree_prior, double global_variance, int tree_num, int split_node_id, - std::vector& log_cutpoint_evaluations, std::vector& cutpoint_features, std::vector& cutpoint_values, std::vector& cutpoint_feature_types, - data_size_t& valid_cutpoint_count, CutpointGridContainer& cutpoint_grid_container, data_size_t node_begin, data_size_t node_end, std::vector& variable_weights, - std::vector& feature_types); double SplitLogMarginalLikelihood(GaussianConstantSuffStat& left_stat, GaussianConstantSuffStat& right_stat, double global_variance); double NoSplitLogMarginalLikelihood(GaussianConstantSuffStat& suff_stat, double global_variance); double PosteriorParameterMean(GaussianConstantSuffStat& suff_stat, double global_variance); @@ -133,12 +133,6 @@ class GaussianUnivariateRegressionLeafModel { public: GaussianUnivariateRegressionLeafModel(double tau) {tau_ = tau; normal_sampler_ = UnivariateNormalSampler();} ~GaussianUnivariateRegressionLeafModel() {} - std::tuple 
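The RunDebug changes above replace branch-by-branch model construction with a single std::variant built once up front, dispatched later via std::get. A minimal self-contained illustration of the pattern (the types and factory here are simplified stand-ins, not the library's actual classes):

    #include <iostream>
    #include <variant>

    struct ConstantModel { double tau; };
    struct RegressionModel { double tau; };
    using ModelVariant = std::variant<ConstantModel, RegressionModel>;

    enum ModelType { kConstant, kRegression };

    // Factory returns the variant; callers recover the concrete type with
    // std::get<T>, which throws std::bad_variant_access on a mismatch.
    ModelVariant modelFactory(ModelType type, double tau) {
      if (type == kConstant) return ConstantModel{tau};
      return RegressionModel{tau};
    }

    int main() {
      ModelVariant m = modelFactory(kRegression, 0.5);
      std::cout << std::get<RegressionModel>(m).tau << "\n";  // prints 0.5
      return 0;
    }

Constructing the model once and handing `std::get<T>(leaf_model)` to the templated samplers is what lets this refactor avoid re-creating a leaf model object on every sampler iteration.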
diff --git a/include/stochtree/leaf_model.h b/include/stochtree/leaf_model.h
index 3ea7a8bb..f006566f 100644
--- a/include/stochtree/leaf_model.h
+++ b/include/stochtree/leaf_model.h
@@ -20,6 +20,12 @@
 
 namespace StochTree {
 
+enum ModelType {
+  kConstantLeafGaussian, 
+  kUnivariateRegressionLeafGaussian, 
+  kMultivariateRegressionLeafGaussian
+};
+
 /*! \brief Sufficient statistic and associated operations for gaussian homoskedastic constant leaf outcome model */
 class GaussianConstantSuffStat {
  public:
@@ -67,12 +73,6 @@ class GaussianConstantLeafModel {
  public:
   GaussianConstantLeafModel(double tau) {tau_ = tau; normal_sampler_ = UnivariateNormalSampler();}
   ~GaussianConstantLeafModel() {}
-  std::tuple<double, double, data_size_t, data_size_t> EvaluateProposedSplit(ForestDataset& dataset, ForestTracker& tracker, ColumnVector& residual, TreeSplit& split, int tree_num, int leaf_num, int split_feature, double global_variance);
-  std::tuple<double, double, data_size_t, data_size_t> EvaluateExistingSplit(ForestDataset& dataset, ForestTracker& tracker, ColumnVector& residual, double global_variance, int tree_num, int split_node_id, int left_node_id, int right_node_id);
-  void EvaluateAllPossibleSplits(ForestDataset& dataset, ForestTracker& tracker, ColumnVector& residual, TreePrior& tree_prior, double global_variance, int tree_num, int split_node_id, 
-                                 std::vector<double>& log_cutpoint_evaluations, std::vector<int>& cutpoint_features, std::vector<double>& cutpoint_values, std::vector<FeatureType>& cutpoint_feature_types, 
-                                 data_size_t& valid_cutpoint_count, CutpointGridContainer& cutpoint_grid_container, data_size_t node_begin, data_size_t node_end, std::vector<double>& variable_weights, 
-                                 std::vector<FeatureType>& feature_types);
   double SplitLogMarginalLikelihood(GaussianConstantSuffStat& left_stat, GaussianConstantSuffStat& right_stat, double global_variance);
   double NoSplitLogMarginalLikelihood(GaussianConstantSuffStat& suff_stat, double global_variance);
   double PosteriorParameterMean(GaussianConstantSuffStat& suff_stat, double global_variance);
@@ -133,12 +133,6 @@ class GaussianUnivariateRegressionLeafModel {
  public:
   GaussianUnivariateRegressionLeafModel(double tau) {tau_ = tau; normal_sampler_ = UnivariateNormalSampler();}
   ~GaussianUnivariateRegressionLeafModel() {}
-  std::tuple<double, double, data_size_t, data_size_t> EvaluateProposedSplit(ForestDataset& dataset, ForestTracker& tracker, ColumnVector& residual, TreeSplit& split, int tree_num, int leaf_num, int split_feature, double global_variance);
-  std::tuple<double, double, data_size_t, data_size_t> EvaluateExistingSplit(ForestDataset& dataset, ForestTracker& tracker, ColumnVector& residual, double global_variance, int tree_num, int split_node_id, int left_node_id, int right_node_id);
-  void EvaluateAllPossibleSplits(ForestDataset& dataset, ForestTracker& tracker, ColumnVector& residual, TreePrior& tree_prior, double global_variance, int tree_num, int split_node_id, 
-                                 std::vector<double>& log_cutpoint_evaluations, std::vector<int>& cutpoint_features, std::vector<double>& cutpoint_values, std::vector<FeatureType>& cutpoint_feature_types, 
-                                 data_size_t& valid_cutpoint_count, CutpointGridContainer& cutpoint_grid_container, data_size_t node_begin, data_size_t node_end, std::vector<double>& variable_weights, 
-                                 std::vector<FeatureType>& feature_types);
   double SplitLogMarginalLikelihood(GaussianUnivariateRegressionSuffStat& left_stat, GaussianUnivariateRegressionSuffStat& right_stat, double global_variance);
   double NoSplitLogMarginalLikelihood(GaussianUnivariateRegressionSuffStat& suff_stat, double global_variance);
   double PosteriorParameterMean(GaussianUnivariateRegressionSuffStat& suff_stat, double global_variance);
@@ -201,12 +195,6 @@ class GaussianMultivariateRegressionLeafModel {
  public:
   GaussianMultivariateRegressionLeafModel(Eigen::MatrixXd& Sigma_0) {Sigma_0_ = Sigma_0; multivariate_normal_sampler_ = MultivariateNormalSampler();}
   ~GaussianMultivariateRegressionLeafModel() {}
-  std::tuple<double, double, data_size_t, data_size_t> EvaluateProposedSplit(ForestDataset& dataset, ForestTracker& tracker, ColumnVector& residual, TreeSplit& split, int tree_num, int leaf_num, int split_feature, double global_variance);
-  std::tuple<double, double, data_size_t, data_size_t> EvaluateExistingSplit(ForestDataset& dataset, ForestTracker& tracker, ColumnVector& residual, double global_variance, int tree_num, int split_node_id, int left_node_id, int right_node_id);
-  void EvaluateAllPossibleSplits(ForestDataset& dataset, ForestTracker& tracker, ColumnVector& residual, TreePrior& tree_prior, double global_variance, int tree_num, int split_node_id, 
-                                 std::vector<double>& log_cutpoint_evaluations, std::vector<int>& cutpoint_features, std::vector<double>& cutpoint_values, std::vector<FeatureType>& cutpoint_feature_types, 
-                                 data_size_t& valid_cutpoint_count, CutpointGridContainer& cutpoint_grid_container, data_size_t node_begin, data_size_t node_end, std::vector<double>& variable_weights, 
-                                 std::vector<FeatureType>& feature_types);
   double SplitLogMarginalLikelihood(GaussianMultivariateRegressionSuffStat& left_stat, GaussianMultivariateRegressionSuffStat& right_stat, double global_variance);
   double NoSplitLogMarginalLikelihood(GaussianMultivariateRegressionSuffStat& suff_stat, double global_variance);
   Eigen::VectorXd PosteriorParameterMean(GaussianMultivariateRegressionSuffStat& suff_stat, double global_variance);
@@ -220,6 +208,137 @@ class GaussianMultivariateRegressionLeafModel {
   MultivariateNormalSampler multivariate_normal_sampler_;
 };
 
+using SuffStatVariant = std::variant<GaussianConstantSuffStat, GaussianUnivariateRegressionSuffStat, GaussianMultivariateRegressionSuffStat>;
+
+using LeafModelVariant = std::variant<GaussianConstantLeafModel, GaussianUnivariateRegressionLeafModel, GaussianMultivariateRegressionLeafModel>;
+
+template <typename SuffStatType, typename... SuffStatConstructorArgs>
+static inline SuffStatVariant createSuffStat(SuffStatConstructorArgs... leaf_suff_stat_args) {
+  return SuffStatType(leaf_suff_stat_args...);
+}
+
+template <typename LeafModelType, typename... LeafModelConstructorArgs>
+static inline LeafModelVariant createLeafModel(LeafModelConstructorArgs... leaf_model_args) {
+  return LeafModelType(leaf_model_args...);
+}
+
+static inline SuffStatVariant suffStatFactory(ModelType model_type, int basis_dim = 0) {
+  if (model_type == kConstantLeafGaussian) {
+    return createSuffStat<GaussianConstantSuffStat>();
+  } else if (model_type == kUnivariateRegressionLeafGaussian) {
+    return createSuffStat<GaussianUnivariateRegressionSuffStat>();
+  } else {
+    return createSuffStat<GaussianMultivariateRegressionSuffStat>(basis_dim);
+  }
+}
+
+static inline LeafModelVariant leafModelFactory(ModelType model_type, double tau, Eigen::MatrixXd& Sigma0) {
+  if (model_type == kConstantLeafGaussian) {
+    return createLeafModel<GaussianConstantLeafModel>(tau);
+  } else if (model_type == kUnivariateRegressionLeafGaussian) {
+    return createLeafModel<GaussianUnivariateRegressionLeafModel>(tau);
+  } else {
+    return createLeafModel<GaussianMultivariateRegressionLeafModel>(Sigma0);
+  }
+}
+
+template <typename SuffStatType>
+static inline void AccumulateSuffStatProposed(SuffStatType& node_suff_stat, SuffStatType& left_suff_stat, SuffStatType& right_suff_stat, ForestDataset& dataset, ForestTracker& tracker, 
+                                              ColumnVector& residual, double global_variance, TreeSplit& split, int tree_num, int leaf_num, int split_feature) {
+  // Acquire iterators
+  auto node_begin_iter = tracker.UnsortedNodeBeginIterator(tree_num, leaf_num);
+  auto node_end_iter = tracker.UnsortedNodeEndIterator(tree_num, leaf_num);
+  
+  // Accumulate sufficient statistics
+  for (auto i = node_begin_iter; i != node_end_iter; i++) {
+    auto idx = *i;
+    double feature_value = dataset.CovariateValue(idx, split_feature);
+    node_suff_stat.IncrementSuffStat(dataset, residual.GetData(), idx);
+    if (split.SplitTrue(feature_value)) {
+      left_suff_stat.IncrementSuffStat(dataset, residual.GetData(), idx);
+    } else {
+      right_suff_stat.IncrementSuffStat(dataset, residual.GetData(), idx);
+    }
+  }
+}
+
+template <typename SuffStatType>
+static inline void AccumulateSuffStatExisting(SuffStatType& node_suff_stat, SuffStatType& left_suff_stat, SuffStatType& right_suff_stat, ForestDataset& dataset, ForestTracker& tracker, 
+                                              ColumnVector& residual, double global_variance, int tree_num, int split_node_id, int left_node_id, int right_node_id) {
+  // Acquire iterators
+  auto left_node_begin_iter = tracker.UnsortedNodeBeginIterator(tree_num, left_node_id);
+  auto left_node_end_iter = tracker.UnsortedNodeEndIterator(tree_num, left_node_id);
+  auto right_node_begin_iter = tracker.UnsortedNodeBeginIterator(tree_num, right_node_id);
+  auto right_node_end_iter = tracker.UnsortedNodeEndIterator(tree_num, right_node_id);
+  
+  // Accumulate sufficient statistics for the left and split nodes
+  for (auto i = left_node_begin_iter; i != left_node_end_iter; i++) {
+    auto idx = *i;
+    left_suff_stat.IncrementSuffStat(dataset, residual.GetData(), idx);
+    node_suff_stat.IncrementSuffStat(dataset, residual.GetData(), idx);
+  }
+  
+  // Accumulate sufficient statistics for the right and split nodes
+  for (auto i = right_node_begin_iter; i != right_node_end_iter; i++) {
+    auto idx = *i;
+    right_suff_stat.IncrementSuffStat(dataset, residual.GetData(), idx);
+    node_suff_stat.IncrementSuffStat(dataset, residual.GetData(), idx);
+  }
+}
+
+template <typename SuffStatType, bool sorted>
+static inline void AccumulateSingleNodeSuffStat(SuffStatType& node_suff_stat, ForestDataset& dataset, ForestTracker& tracker, ColumnVector& residual, int tree_num, int node_id) {
+  // Acquire iterators
+  std::vector<data_size_t>::iterator node_begin_iter;
+  std::vector<data_size_t>::iterator node_end_iter;
+  if (sorted) {
+    // Default to the first feature if we're using the presort tracker
+    node_begin_iter = tracker.SortedNodeBeginIterator(node_id, 0);
+    node_end_iter = tracker.SortedNodeEndIterator(node_id, 0);
+  } else {
+    node_begin_iter = tracker.UnsortedNodeBeginIterator(tree_num, node_id);
+    node_end_iter = tracker.UnsortedNodeEndIterator(tree_num, node_id);
+  }
+  
+  // Accumulate sufficient statistics
+  for (auto i = node_begin_iter; i != node_end_iter; i++) {
+    auto idx = *i;
+    node_suff_stat.IncrementSuffStat(dataset, residual.GetData(), idx);
+  }
+}
+
+template <typename SuffStatType>
+static inline void AccumulateCutpointBinSuffStat(SuffStatType& left_suff_stat, ForestTracker& tracker, CutpointGridContainer& cutpoint_grid_container, 
+                                                 ForestDataset& dataset, ColumnVector& residual, double global_variance, int tree_num, int node_id, 
+                                                 int feature_num, int cutpoint_num) {
+  // Acquire iterators
+  auto node_begin_iter = tracker.SortedNodeBeginIterator(node_id, feature_num);
+  auto node_end_iter = tracker.SortedNodeEndIterator(node_id, feature_num);
+  
+  // Determine node start point
+  data_size_t node_begin = tracker.SortedNodeBegin(node_id, feature_num);
+  
+  // Determine cutpoint bin start and end points
+  data_size_t current_bin_begin = cutpoint_grid_container.BinStartIndex(cutpoint_num, feature_num);
+  data_size_t current_bin_size = cutpoint_grid_container.BinLength(cutpoint_num, feature_num);
+  data_size_t next_bin_begin = cutpoint_grid_container.BinStartIndex(cutpoint_num + 1, feature_num);
+  
+  // Cutpoint specific iterators
+  // TODO: fix the hack of having to subtract off node_begin, probably by cleaning up the CutpointGridContainer interface
+  auto cutpoint_begin_iter = node_begin_iter + (current_bin_begin - node_begin);
+  auto cutpoint_end_iter = node_begin_iter + (next_bin_begin - node_begin);
+  
+  // Accumulate sufficient statistics
+  for (auto i = cutpoint_begin_iter; i != cutpoint_end_iter; i++) {
+    auto idx = *i;
+    left_suff_stat.IncrementSuffStat(dataset, residual.GetData(), idx);
+  }
+}
+
 } // namespace StochTree
 
 #endif // STOCHTREE_LEAF_MODEL_H_
diff --git a/include/stochtree/meta.h b/include/stochtree/meta.h
index b77179ec..f078777c 100644
--- a/include/stochtree/meta.h
+++ b/include/stochtree/meta.h
@@ -41,11 +41,11 @@ enum ForestLeafVarianceType {
   kFixed
 };
 
-enum ForestLeafPriorType {
-  kConstantLeafGaussian,
-  kUnivariateRegressionLeafGaussian,
-  kMultivariateRegressionLeafGaussian
-};
+// enum ForestLeafPriorType {
+//   kConstantLeafGaussian,
+//   kUnivariateRegressionLeafGaussian,
+//   kMultivariateRegressionLeafGaussian
+// };
 
 enum ForestSampler {
   kMCMC,
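The `AccumulateSingleNodeSuffStat` template in the leaf_model.h diff above uses a bool non-type template parameter to pick an index source at compile time. A minimal runnable stand-in for that pattern (the names and data here are illustrative, not the library's):

    #include <iostream>
    #include <vector>

    // A compile-time flag selects between two index sources, mirroring how
    // the diff chooses the sorted (presort) tracker vs. the unsorted tracker.
    template <bool sorted>
    int SumIndices(const std::vector<int>& sorted_idx, const std::vector<int>& unsorted_idx) {
      const std::vector<int>& idx = sorted ? sorted_idx : unsorted_idx;
      int total = 0;
      for (int i : idx) total += i;  // stand-in for IncrementSuffStat over node indices
      return total;
    }

    int main() {
      std::vector<int> s{1, 2, 3}, u{4, 5};
      std::cout << SumIndices<true>(s, u) << " " << SumIndices<false>(s, u) << "\n";  // 6 9
      return 0;
    }

Because the flag is a template parameter, GFR code paths (which need the presorted tracker) and MCMC code paths (which do not) each get their own instantiation without a per-observation runtime check.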
diff --git a/include/stochtree/tree_sampler.h b/include/stochtree/tree_sampler.h
index 302ae6bf..b75b6b00 100644
--- a/include/stochtree/tree_sampler.h
+++ b/include/stochtree/tree_sampler.h
@@ -6,6 +6,7 @@
 #include
 #include
 #include
+#include
 #include
 #include
 
@@ -111,7 +112,8 @@ static inline bool NodeNonConstant(ForestDataset& dataset, ForestTracker& tracke
   return false;
 }
 
-static inline void AddSplitToModel(ForestTracker& tracker, ForestDataset& dataset, TreePrior& tree_prior, TreeSplit& split, std::mt19937& gen, Tree* tree, int tree_num, int leaf_node, int feature_split, bool keep_sorted = false) {
+static inline void AddSplitToModel(ForestTracker& tracker, ForestDataset& dataset, TreePrior& tree_prior, TreeSplit& split, std::mt19937& gen, Tree* tree, 
+                                   int tree_num, int leaf_node, int feature_split, bool keep_sorted = false) {
   // Use zeros as a "temporary" leaf values since we draw leaf parameters after tree sampling is complete
   if (tree->OutputDimension() > 1) {
     std::vector<double> temp_leaf_values(tree->OutputDimension(), 0.);
@@ -127,7 +129,8 @@ static inline void AddSplitToModel(ForestTracker& tracker, ForestDataset& datase
   tracker.AddSplit(dataset.GetCovariates(), split, feature_split, tree_num, leaf_node, left_node, right_node, keep_sorted);
 }
 
-static inline void RemoveSplitFromModel(ForestTracker& tracker, ForestDataset& dataset, TreePrior& tree_prior, std::mt19937& gen, Tree* tree, int tree_num, int leaf_node, int left_node, int right_node, bool keep_sorted = false) {
+static inline void RemoveSplitFromModel(ForestTracker& tracker, ForestDataset& dataset, TreePrior& tree_prior, std::mt19937& gen, Tree* tree, 
+                                        int tree_num, int leaf_node, int left_node, int right_node, bool keep_sorted = false) {
   // Use zeros as a "temporary" leaf values since we draw leaf parameters after tree sampling is complete
   if (tree->OutputDimension() > 1) {
     std::vector<double> temp_leaf_values(tree->OutputDimension(), 0.);
@@ -150,7 +153,8 @@ static inline double ComputeMeanOutcome(ColumnVector& residual) {
   return total_outcome / static_cast<double>(n);
 }
 
-static inline void UpdateResidualEntireForest(ForestTracker& tracker, ForestDataset& dataset, ColumnVector& residual, TreeEnsemble* forest, bool requires_basis, std::function<double(double, double)> op) {
+static inline void UpdateResidualEntireForest(ForestTracker& tracker, ForestDataset& dataset, ColumnVector& residual, TreeEnsemble* forest, 
+                                              bool requires_basis, std::function<double(double, double)> op) {
   data_size_t n = dataset.GetCovariates().rows();
   double tree_pred = 0.;
   double pred_value = 0.;
@@ -175,7 +179,8 @@ static inline void UpdateResidualEntireForest(ForestTracker& tracker, ForestData
   }
 }
 
-static inline void UpdateResidualTree(ForestTracker& tracker, ForestDataset& dataset, ColumnVector& residual, Tree* tree, int tree_num, bool requires_basis, std::function<double(double, double)> op, bool tree_new) {
+static inline void UpdateResidualTree(ForestTracker& tracker, ForestDataset& dataset, ColumnVector& residual, Tree* tree, int tree_num, 
+                                      bool requires_basis, std::function<double(double, double)> op, bool tree_new) {
   data_size_t n = dataset.GetCovariates().rows();
   double pred_value;
   int32_t leaf_pred;
@@ -233,19 +238,168 @@ static inline void UpdateResidualNewBasis(ForestTracker& tracker, ForestDataset&
   }
 }
 
-template <typename LeafModel>
+template <typename LeafModel, typename LeafSuffStat, typename... LeafSuffStatConstructorArgs>
+static inline std::tuple<double, double, data_size_t, data_size_t> EvaluateProposedSplit(
+    ForestDataset& dataset, ForestTracker& tracker, ColumnVector& residual, LeafModel& leaf_model, 
+    TreeSplit& split, int tree_num, int leaf_num, int split_feature, double global_variance, 
+    LeafSuffStatConstructorArgs&... leaf_suff_stat_args
+) {
+  // Initialize sufficient statistics
+  LeafSuffStat node_suff_stat = LeafSuffStat(leaf_suff_stat_args...);
+  LeafSuffStat left_suff_stat = LeafSuffStat(leaf_suff_stat_args...);
+  LeafSuffStat right_suff_stat = LeafSuffStat(leaf_suff_stat_args...);
+
+  // Accumulate sufficient statistics
+  AccumulateSuffStatProposed(node_suff_stat, left_suff_stat, right_suff_stat, dataset, tracker, 
+                             residual, global_variance, split, tree_num, leaf_num, split_feature);
+  data_size_t left_n = left_suff_stat.n;
+  data_size_t right_n = right_suff_stat.n;
+
+  // Evaluate split
+  double split_log_ml = leaf_model.SplitLogMarginalLikelihood(left_suff_stat, right_suff_stat, global_variance);
+  double no_split_log_ml = leaf_model.NoSplitLogMarginalLikelihood(node_suff_stat, global_variance);
+
+  return std::tuple<double, double, data_size_t, data_size_t>(split_log_ml, no_split_log_ml, left_n, right_n);
+}
+
+template <typename LeafModel, typename LeafSuffStat, typename... LeafSuffStatConstructorArgs>
+static inline std::tuple<double, double, data_size_t, data_size_t> EvaluateExistingSplit(
+    ForestDataset& dataset, ForestTracker& tracker, ColumnVector& residual, LeafModel& leaf_model, 
+    double global_variance, int tree_num, int split_node_id, int left_node_id, int right_node_id, 
+    LeafSuffStatConstructorArgs&... leaf_suff_stat_args
+) {
+  // Initialize sufficient statistics
+  LeafSuffStat node_suff_stat = LeafSuffStat(leaf_suff_stat_args...);
+  LeafSuffStat left_suff_stat = LeafSuffStat(leaf_suff_stat_args...);
+  LeafSuffStat right_suff_stat = LeafSuffStat(leaf_suff_stat_args...);
+
+  // Accumulate sufficient statistics
+  AccumulateSuffStatExisting(node_suff_stat, left_suff_stat, right_suff_stat, dataset, tracker, 
+                             residual, global_variance, tree_num, split_node_id, left_node_id, right_node_id);
+  data_size_t left_n = left_suff_stat.n;
+  data_size_t right_n = right_suff_stat.n;
+
+  // Evaluate split
+  double split_log_ml = leaf_model.SplitLogMarginalLikelihood(left_suff_stat, right_suff_stat, global_variance);
+  double no_split_log_ml = leaf_model.NoSplitLogMarginalLikelihood(node_suff_stat, global_variance);
+
+  return std::tuple<double, double, data_size_t, data_size_t>(split_log_ml, no_split_log_ml, left_n, right_n);
+}
+
+template <typename LeafModel, typename LeafSuffStat, typename... LeafSuffStatConstructorArgs>
+static inline void EvaluateAllPossibleSplits(
+    ForestDataset& dataset, ForestTracker& tracker, ColumnVector& residual, TreePrior& tree_prior, LeafModel& leaf_model, double global_variance, int tree_num, int split_node_id, 
+    std::vector<double>& log_cutpoint_evaluations, std::vector<int>& cutpoint_features, std::vector<double>& cutpoint_values, std::vector<FeatureType>& cutpoint_feature_types, 
+    data_size_t& valid_cutpoint_count, CutpointGridContainer& cutpoint_grid_container, data_size_t node_begin, data_size_t node_end, std::vector<double>& variable_weights, 
+    std::vector<FeatureType>& feature_types, LeafSuffStatConstructorArgs&... leaf_suff_stat_args
+) {
+  // Initialize sufficient statistics
+  LeafSuffStat node_suff_stat = LeafSuffStat(leaf_suff_stat_args...);
+  LeafSuffStat left_suff_stat = LeafSuffStat(leaf_suff_stat_args...);
+  LeafSuffStat right_suff_stat = LeafSuffStat(leaf_suff_stat_args...);
+
+  // Accumulate aggregate sufficient statistic for the node to be split
+  AccumulateSingleNodeSuffStat<LeafSuffStat, true>(node_suff_stat, dataset, tracker, residual, tree_num, split_node_id);
+
+  // Compute the "no split" log marginal likelihood
+  double no_split_log_ml = leaf_model.NoSplitLogMarginalLikelihood(node_suff_stat, global_variance);
+
+  // Unpack data
+  Eigen::MatrixXd covariates = dataset.GetCovariates();
+  Eigen::VectorXd outcome = residual.GetData();
+  Eigen::VectorXd var_weights;
+  bool has_weights = dataset.HasVarWeights();
+  if (has_weights) var_weights = dataset.GetVarWeights();
+
+  // Minimum size of newly created leaf nodes (used to rule out invalid splits)
+  int32_t min_samples_in_leaf = tree_prior.GetMinSamplesLeaf();
+
+  // Compute sufficient statistics for each possible split
+  data_size_t num_cutpoints = 0;
+  bool valid_split = false;
+  data_size_t node_row_iter;
+  data_size_t current_bin_begin, current_bin_size, next_bin_begin;
+  data_size_t feature_sort_idx;
+  data_size_t row_iter_idx;
+  double outcome_val, outcome_val_sq;
+  FeatureType feature_type;
+  double feature_value = 0.0;
+  double cutoff_value = 0.0;
+  double log_split_eval = 0.0;
+  double split_log_ml;
+  for (int j = 0; j < covariates.cols(); j++) {
+
+    if (std::abs(variable_weights.at(j)) > kEpsilon) {
+      // Enumerate cutpoint strides
+      cutpoint_grid_container.CalculateStrides(covariates, outcome, tracker.GetSortedNodeSampleTracker(), split_node_id, node_begin, node_end, j, feature_types);
+
+      // Reset sufficient statistics
+      left_suff_stat.ResetSuffStat();
+      right_suff_stat.ResetSuffStat();
+
+      // Iterate through possible cutpoints
+      int32_t num_feature_cutpoints = cutpoint_grid_container.NumCutpoints(j);
+      feature_type = feature_types[j];
+      // Since we partition an entire cutpoint bin to the left, we must stop one bin before the total number of cutpoint bins
+      for (data_size_t cutpoint_idx = 0; cutpoint_idx < (num_feature_cutpoints - 1); cutpoint_idx++) {
+        current_bin_begin = cutpoint_grid_container.BinStartIndex(cutpoint_idx, j);
+        current_bin_size = cutpoint_grid_container.BinLength(cutpoint_idx, j);
+        next_bin_begin = cutpoint_grid_container.BinStartIndex(cutpoint_idx + 1, j);
+
+        // Accumulate sufficient statistics for the left node
+        AccumulateCutpointBinSuffStat(left_suff_stat, tracker, cutpoint_grid_container, dataset, residual, 
+                                      global_variance, tree_num, split_node_id, j, cutpoint_idx);
+
+        // Compute the corresponding right node sufficient statistics
+        right_suff_stat.SubtractSuffStat(node_suff_stat, left_suff_stat);
+
+        // Store the bin index as the "cutpoint value" - we can use this to query the actual split 
+        // value or the set of split categories later on once a split is chosen
+        cutoff_value = cutpoint_idx;
+
+        // Only include cutpoint for consideration if it defines a valid split in the training data
+        valid_split = (left_suff_stat.SampleGreaterThanEqual(min_samples_in_leaf) && 
+                       right_suff_stat.SampleGreaterThanEqual(min_samples_in_leaf));
+        if (valid_split) {
+          num_cutpoints++;
+          // Add to split rule vector
+          cutpoint_feature_types.push_back(feature_type);
+          cutpoint_features.push_back(j);
+          cutpoint_values.push_back(cutoff_value);
+          // Add the log marginal likelihood of the split to the split eval vector 
+          split_log_ml = leaf_model.SplitLogMarginalLikelihood(left_suff_stat, right_suff_stat, global_variance);
+          log_cutpoint_evaluations.push_back(split_log_ml);
+        }
+      }
+    }
+
+  }
+
+  // Add the log marginal likelihood of the "no-split" option (adjusted for tree prior and cutpoint size per the XBART paper)
+  cutpoint_features.push_back(-1);
+  cutpoint_values.push_back(std::numeric_limits<double>::max());
+  cutpoint_feature_types.push_back(FeatureType::kNumeric);
+  log_cutpoint_evaluations.push_back(no_split_log_ml);
+
+  // Update valid cutpoint count
+  valid_cutpoint_count = num_cutpoints;
+}
+
+template <typename LeafModel, typename LeafSuffStat, typename... LeafSuffStatConstructorArgs>
 static inline void EvaluateCutpoints(Tree* tree, ForestTracker& tracker, LeafModel& leaf_model, ForestDataset& dataset, ColumnVector& residual, TreePrior& tree_prior,
                                      std::mt19937& gen, int tree_num, double global_variance, int cutpoint_grid_size, int node_id, data_size_t node_begin, data_size_t node_end,
                                      std::vector<double>& log_cutpoint_evaluations, std::vector<int>& cutpoint_features, std::vector<double>& cutpoint_values,
                                      std::vector<FeatureType>& cutpoint_feature_types, data_size_t& valid_cutpoint_count, std::vector<double>& variable_weights,
-                                     std::vector<FeatureType>& feature_types, CutpointGridContainer& cutpoint_grid_container) {
+                                     std::vector<FeatureType>& feature_types, CutpointGridContainer& cutpoint_grid_container, LeafSuffStatConstructorArgs&... leaf_suff_stat_args) {
   // Evaluate all possible cutpoints according to the leaf node model,
   // recording their log-likelihood and other split information in a series of vectors.
   // The last element of these vectors concerns the "no-split" option.
-  leaf_model.EvaluateAllPossibleSplits(dataset, tracker, residual, tree_prior, global_variance, tree_num, node_id, log_cutpoint_evaluations,
-                                       cutpoint_features, cutpoint_values, cutpoint_feature_types, valid_cutpoint_count,
-                                       cutpoint_grid_container, node_begin, node_end, variable_weights, feature_types);
-
+  EvaluateAllPossibleSplits<LeafModel, LeafSuffStat>(
+      dataset, tracker, residual, tree_prior, leaf_model, global_variance, tree_num, node_id, log_cutpoint_evaluations, 
+      cutpoint_features, cutpoint_values, cutpoint_feature_types, valid_cutpoint_count, cutpoint_grid_container, 
+      node_begin, node_end, variable_weights, feature_types, leaf_suff_stat_args...
+  );
+  
   // Compute an adjustment to reflect the no split prior probability and the number of cutpoints
   double bart_prior_no_split_adj;
   double alpha = tree_prior.GetAlpha();
   double beta = tree_prior.GetBeta();
@@ -259,12 +413,12 @@ static inline void EvaluateCutpoints(Tree* tree, ForestTracker& tracker, LeafMod
   log_cutpoint_evaluations[log_cutpoint_evaluations.size()-1] += bart_prior_no_split_adj;
 }
 
-template <typename LeafModel>
+template <typename LeafModel, typename LeafSuffStat, typename... LeafSuffStatConstructorArgs>
 static inline void SampleSplitRule(Tree* tree, ForestTracker& tracker, LeafModel& leaf_model, ForestDataset& dataset,
                                    ColumnVector& residual, TreePrior& tree_prior, std::mt19937& gen, int tree_num, double global_variance,
                                    int cutpoint_grid_size, std::unordered_map<int, std::pair<data_size_t, data_size_t>>& node_index_map,
                                    std::deque<int>& split_queue, int node_id, data_size_t node_begin, data_size_t node_end, std::vector<double>& variable_weights,
-                                   std::vector<FeatureType>& feature_types) {
+                                   std::vector<FeatureType>& feature_types, LeafSuffStatConstructorArgs&... leaf_suff_stat_args) {
   // Leaf depth
   int leaf_depth = tree->GetDepth(node_id);
 
@@ -280,10 +434,12 @@ static inline void SampleSplitRule(Tree* tree, ForestTracker& tracker, LeafModel
   std::vector<FeatureType> cutpoint_feature_types;
   StochTree::data_size_t valid_cutpoint_count;
   CutpointGridContainer cutpoint_grid_container(dataset.GetCovariates(), residual.GetData(), cutpoint_grid_size);
-  EvaluateCutpoints(tree, tracker, leaf_model, dataset, residual, tree_prior, gen, tree_num, global_variance,
-                    cutpoint_grid_size, node_id, node_begin, node_end, log_cutpoint_evaluations, cutpoint_features,
-                    cutpoint_values, cutpoint_feature_types, valid_cutpoint_count, variable_weights, feature_types,
-                    cutpoint_grid_container);
+  EvaluateCutpoints<LeafModel, LeafSuffStat>(
+      tree, tracker, leaf_model, dataset, residual, tree_prior, gen, tree_num, global_variance, 
+      cutpoint_grid_size, node_id, node_begin, node_end, log_cutpoint_evaluations, cutpoint_features, 
+      cutpoint_values, cutpoint_feature_types, valid_cutpoint_count, variable_weights, feature_types, 
+      cutpoint_grid_container, leaf_suff_stat_args...
+  );
   // TODO: maybe add some checks here?
 
   // Convert log marginal likelihood to marginal likelihood, normalizing by the maximum log-likelihood
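The no-split adjustment in EvaluateCutpoints above encodes the tree prior: with split probability alpha * (1 + depth)^(-beta), the log prior odds of not splitting are log((1 + depth)^beta / alpha - 1), plus log of the number of valid cutpoints to account for the uniform prior over candidate splits (per the XBART paper, as the diff's comment notes). A standalone numeric check of that formula (the parameter values here are illustrative only):

    #include <cmath>
    #include <cstdio>

    int main() {
      double alpha = 0.95, beta = 2.0;   // commonly used BART prior defaults
      int depth = 1, n_cutpoints = 100;
      // Log prior odds of "no split" at this depth, plus the cutpoint-count correction
      double adj = std::log(std::pow(1 + depth, beta) / alpha - 1.0) + std::log(static_cast<double>(n_cutpoints));
      std::printf("no-split adjustment: %f\n", adj);  // log(4/0.95 - 1) + log(100), roughly 5.77
      return 0;
    }

Because this term is added to the last entry of `log_cutpoint_evaluations`, the subsequent exponentiate-and-normalize step weighs "no split" against every candidate cutpoint on a common scale.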
@@ -361,10 +517,11 @@ static inline void SampleSplitRule(Tree* tree, ForestTracker& tracker, LeafModel
   }
 }
 
-template <typename LeafModel>
+template <typename LeafModel, typename LeafSuffStat, typename... LeafSuffStatConstructorArgs>
 static inline void GFRSampleTreeOneIter(Tree* tree, ForestTracker& tracker, ForestContainer& forests, LeafModel& leaf_model,
                                         ForestDataset& dataset, ColumnVector& residual, TreePrior& tree_prior, std::mt19937& gen, std::vector<double>& variable_weights,
-                                        int tree_num, double global_variance, std::vector<FeatureType>& feature_types, int cutpoint_grid_size) {
+                                        int tree_num, double global_variance, std::vector<FeatureType>& feature_types, int cutpoint_grid_size, 
+                                        LeafSuffStatConstructorArgs&... leaf_suff_stat_args) {
   int root_id = Tree::kRoot;
   int curr_node_id;
   data_size_t curr_node_begin;
@@ -387,16 +544,18 @@ static inline void GFRSampleTreeOneIter(Tree* tree, ForestTracker& tracker, Fore
     curr_node_begin = begin_end.first;
     curr_node_end = begin_end.second;
     // Draw a split rule at random
-    SampleSplitRule(tree, tracker, leaf_model, dataset, residual, tree_prior, gen, tree_num, global_variance, cutpoint_grid_size,
-                    node_index_map, split_queue, curr_node_id, curr_node_begin, curr_node_end, variable_weights, feature_types);
+    SampleSplitRule<LeafModel, LeafSuffStat>(
+        tree, tracker, leaf_model, dataset, residual, tree_prior, gen, tree_num, global_variance, cutpoint_grid_size, 
+        node_index_map, split_queue, curr_node_id, curr_node_begin, curr_node_end, variable_weights, feature_types, 
+        leaf_suff_stat_args...);
   }
 }
 
-template <typename LeafModel>
+template <typename LeafModel, typename LeafSuffStat, typename... LeafSuffStatConstructorArgs>
 static inline void GFRSampleOneIter(ForestTracker& tracker, ForestContainer& forests, LeafModel& leaf_model, ForestDataset& dataset,
                                     ColumnVector& residual, TreePrior& tree_prior, std::mt19937& gen, std::vector<double>& variable_weights,
-                                    double global_variance, std::vector<FeatureType>& feature_types, int cutpoint_grid_size = 500,
-                                    bool pre_initialized = false) {
+                                    double global_variance, std::vector<FeatureType>& feature_types, int cutpoint_grid_size, 
+                                    bool pre_initialized, LeafSuffStatConstructorArgs&... leaf_suff_stat_args) {
   // Previous number of samples
   int prev_num_samples = forests.NumSamples();
 
@@ -435,7 +594,11 @@ static inline void GFRSampleOneIter(ForestTracker& tracker, ForestContainer& for
     tree = ensemble->GetTree(i);
 
     // Sample tree i
-    GFRSampleTreeOneIter(tree, tracker, forests, leaf_model, dataset, residual, tree_prior, gen, variable_weights, i, global_variance, feature_types, cutpoint_grid_size);
+    GFRSampleTreeOneIter<LeafModel, LeafSuffStat>(
+        tree, tracker, forests, leaf_model, dataset, residual, tree_prior, gen, 
+        variable_weights, i, global_variance, feature_types, cutpoint_grid_size, 
+        leaf_suff_stat_args...
+    );
 
     // Sample leaf parameters for tree i
     tree = ensemble->GetTree(i);
@@ -446,10 +609,10 @@ static inline void GFRSampleOneIter(ForestTracker& tracker, ForestContainer& for
   }
 }
 
-template <typename LeafModel>
+template <typename LeafModel, typename LeafSuffStat, typename... LeafSuffStatConstructorArgs>
 static inline void MCMCGrowTreeOneIter(Tree* tree, ForestTracker& tracker, LeafModel& leaf_model, ForestDataset& dataset,
                                        ColumnVector& residual, TreePrior& tree_prior, std::mt19937& gen, int tree_num, std::vector<double>& variable_weights,
-                                       double global_variance, double prob_grow_old) {
+                                       double global_variance, double prob_grow_old, LeafSuffStatConstructorArgs&... leaf_suff_stat_args) {
   // Extract dataset information
   data_size_t n = dataset.GetCovariates().rows();
 
@@ -495,7 +658,9 @@ static inline void MCMCGrowTreeOneIter(Tree* tree, ForestTracker& tracker, LeafM
   TreeSplit split = TreeSplit(split_point_chosen);
 
   // Compute the marginal likelihood of split and no split, given the leaf prior
-  std::tuple<double, double, data_size_t, data_size_t> split_eval = leaf_model.EvaluateProposedSplit(dataset, tracker, residual, split, tree_num, leaf_chosen, var_chosen, global_variance);
+  std::tuple<double, double, data_size_t, data_size_t> split_eval = EvaluateProposedSplit<LeafModel, LeafSuffStat>(
+      dataset, tracker, residual, leaf_model, split, tree_num, leaf_chosen, var_chosen, global_variance, leaf_suff_stat_args...
+  );
   double split_log_marginal_likelihood = std::get<0>(split_eval);
   double no_split_log_marginal_likelihood = std::get<1>(split_eval);
   int32_t left_n = std::get<2>(split_eval);
@@ -546,9 +711,9 @@ static inline void MCMCGrowTreeOneIter(Tree* tree, ForestTracker& tracker, LeafM
   }
 }
 
-template <typename LeafModel>
+template <typename LeafModel, typename LeafSuffStat, typename... LeafSuffStatConstructorArgs>
 static inline void MCMCPruneTreeOneIter(Tree* tree, ForestTracker& tracker, LeafModel& leaf_model, ForestDataset& dataset, ColumnVector& residual,
-                                        TreePrior& tree_prior, std::mt19937& gen, int tree_num, double global_variance) {
+                                        TreePrior& tree_prior, std::mt19937& gen, int tree_num, double global_variance, LeafSuffStatConstructorArgs&... leaf_suff_stat_args) {
   // Choose a "leaf parent" node at random
   int num_leaves = tree->NumLeaves();
   int num_leaf_parents = tree->NumLeafParents();
@@ -563,7 +728,9 @@ static inline void MCMCPruneTreeOneIter(Tree* tree, ForestTracker& tracker, Leaf
   int feature_split = tree->SplitIndex(leaf_parent_chosen);
 
   // Compute the marginal likelihood for the leaf parent and its left and right nodes
-  std::tuple<double, double, data_size_t, data_size_t> split_eval = leaf_model.EvaluateExistingSplit(dataset, tracker, residual, global_variance, tree_num, leaf_parent_chosen, left_node, right_node);
+  std::tuple<double, double, data_size_t, data_size_t> split_eval = EvaluateExistingSplit<LeafModel, LeafSuffStat>(
+      dataset, tracker, residual, leaf_model, global_variance, tree_num, leaf_parent_chosen, left_node, right_node, leaf_suff_stat_args...
+  );
   double split_log_marginal_likelihood = std::get<0>(split_eval);
   double no_split_log_marginal_likelihood = std::get<1>(split_eval);
   int32_t left_n = std::get<2>(split_eval);
@@ -622,10 +789,10 @@ static inline void MCMCPruneTreeOneIter(Tree* tree, ForestTracker& tracker, Leaf
   }
 }
 
-template <typename LeafModel>
+template <typename LeafModel, typename LeafSuffStat, typename... LeafSuffStatConstructorArgs>
 static inline void MCMCSampleTreeOneIter(Tree* tree, ForestTracker& tracker, ForestContainer& forests, LeafModel& leaf_model,
                                          ForestDataset& dataset, ColumnVector& residual, TreePrior& tree_prior, std::mt19937& gen, std::vector<double>& variable_weights,
-                                         int tree_num, double global_variance) {
+                                         int tree_num, double global_variance, LeafSuffStatConstructorArgs&... leaf_suff_stat_args) {
   // Determine whether it is possible to grow any of the leaves
   bool grow_possible = false;
   std::vector<int> leaves = tree->GetLeaves();
@@ -664,16 +831,20 @@ static inline void MCMCSampleTreeOneIter(Tree* tree, ForestTracker& tracker, For
   bool accept;
   if (step_chosen == 0) {
-    MCMCGrowTreeOneIter(tree, tracker, leaf_model, dataset, residual, tree_prior, gen, tree_num, variable_weights, global_variance, prob_grow);
+    MCMCGrowTreeOneIter<LeafModel, LeafSuffStat>(
+        tree, tracker, leaf_model, dataset, residual, tree_prior, gen, tree_num, variable_weights, global_variance, prob_grow, leaf_suff_stat_args...
+    );
   } else {
-    MCMCPruneTreeOneIter(tree, tracker, leaf_model, dataset, residual, tree_prior, gen, tree_num, global_variance);
+    MCMCPruneTreeOneIter<LeafModel, LeafSuffStat>(
+        tree, tracker, leaf_model, dataset, residual, tree_prior, gen, tree_num, global_variance, leaf_suff_stat_args...
+    );
   }
 }
 
-template <typename LeafModel>
+template <typename LeafModel, typename LeafSuffStat, typename... LeafSuffStatConstructorArgs>
 static inline void MCMCSampleOneIter(ForestTracker& tracker, ForestContainer& forests, LeafModel& leaf_model, ForestDataset& dataset,
                                      ColumnVector& residual, TreePrior& tree_prior, std::mt19937& gen, std::vector<double>& variable_weights,
-                                     double global_variance, bool pre_initialized = false) {
+                                     double global_variance, bool pre_initialized, LeafSuffStatConstructorArgs&... leaf_suff_stat_args) {
   // Previous number of samples
   int prev_num_samples = forests.NumSamples();
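Throughout the refactor above, the sufficient-statistic type and its constructor arguments travel through the samplers as a trailing template parameter pack, so each call site can construct fresh statistics in place (only the multivariate model needs an extra argument, the basis dimension). A minimal runnable sketch of that forwarding pattern, with simplified stand-in types rather than the library's:

    #include <iostream>

    struct ScalarSuffStat {
      double sum = 0.0;
    };

    struct VectorSuffStat {
      int dim;
      explicit VectorSuffStat(int basis_dim) : dim(basis_dim) {}
    };

    // Mirrors the diff: the suff stat type and its constructor arguments are
    // template parameters, so statistics are built in place per iteration
    // with no virtual dispatch and no reusable mutable state.
    template <typename SuffStat, typename... SuffStatArgs>
    void SampleOneIter(SuffStatArgs&... suff_stat_args) {
      SuffStat node_stat = SuffStat(suff_stat_args...);  // fresh statistics each call
      // ... accumulate over node observations and evaluate splits with node_stat ...
      (void)node_stat;
    }

    int main() {
      SampleOneIter<ScalarSuffStat>();             // no constructor args needed
      int omega_cols = 3;
      SampleOneIter<VectorSuffStat>(omega_cols);   // pack forwards the basis dimension
      std::cout << "ok\n";
      return 0;
    }

This is why the RunDebug dispatch earlier in the patch can pass `omega_cols` as a trailing argument only in the multivariate branch.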
@@ -706,7 +877,10 @@ static inline void MCMCSampleOneIter(ForestTracker& tracker, ForestContainer& fo
     // Sample tree i
     tree = ensemble->GetTree(i);
-    MCMCSampleTreeOneIter(tree, tracker, forests, leaf_model, dataset, residual, tree_prior, gen, variable_weights, i, global_variance);
+    MCMCSampleTreeOneIter<LeafModel, LeafSuffStat>(
+        tree, tracker, forests, leaf_model, dataset, residual, tree_prior, gen, variable_weights, i, 
+        global_variance, leaf_suff_stat_args...
+    );
 
     // Sample leaf parameters for tree i
     tree = ensemble->GetTree(i);
diff --git a/src/leaf_model.cpp b/src/leaf_model.cpp
index 797e3758..a3ae9b38 100644
--- a/src/leaf_model.cpp
+++ b/src/leaf_model.cpp
@@ -2,234 +2,6 @@
 
 namespace StochTree {
 
-template <typename SuffStatType>
-void AccumulateSuffStatProposed(SuffStatType& node_suff_stat, SuffStatType& left_suff_stat, SuffStatType& right_suff_stat, ForestDataset& dataset, ForestTracker& tracker,
-                                ColumnVector& residual, double global_variance, TreeSplit& split, int tree_num, int leaf_num, int split_feature) {
-  // Acquire iterators
-  auto node_begin_iter = tracker.UnsortedNodeBeginIterator(tree_num, leaf_num);
-  auto node_end_iter = tracker.UnsortedNodeEndIterator(tree_num, leaf_num);
-
-  // Accumulate sufficient statistics
-  for (auto i = node_begin_iter; i != node_end_iter; i++) {
-    auto idx = *i;
-    double feature_value = dataset.CovariateValue(idx, split_feature);
-    node_suff_stat.IncrementSuffStat(dataset, residual.GetData(), idx);
-    if (split.SplitTrue(feature_value)) {
-      left_suff_stat.IncrementSuffStat(dataset, residual.GetData(), idx);
-    } else {
-      right_suff_stat.IncrementSuffStat(dataset, residual.GetData(), idx);
-    }
-  }
-}
-
-template <typename SuffStatType>
-void AccumulateSuffStatExisting(SuffStatType& node_suff_stat, SuffStatType& left_suff_stat, SuffStatType& right_suff_stat, ForestDataset& dataset, ForestTracker& tracker,
-                                ColumnVector& residual, double global_variance, int tree_num, int split_node_id, int left_node_id, int right_node_id) {
-  // Acquire iterators
-  auto left_node_begin_iter = tracker.UnsortedNodeBeginIterator(tree_num, left_node_id);
-  auto left_node_end_iter = tracker.UnsortedNodeEndIterator(tree_num, left_node_id);
-  auto right_node_begin_iter = tracker.UnsortedNodeBeginIterator(tree_num, right_node_id);
-  auto right_node_end_iter = tracker.UnsortedNodeEndIterator(tree_num, right_node_id);
-
-  // Accumulate sufficient statistics for the left and split nodes
-  for (auto i = left_node_begin_iter; i != left_node_end_iter; i++) {
-    auto idx = *i;
-    left_suff_stat.IncrementSuffStat(dataset, residual.GetData(), idx);
-    node_suff_stat.IncrementSuffStat(dataset, residual.GetData(), idx);
-  }
-
-  // Accumulate sufficient statistics for the right and split nodes
-  for (auto i = right_node_begin_iter; i != right_node_end_iter; i++) {
-    auto idx = *i;
-    right_suff_stat.IncrementSuffStat(dataset, residual.GetData(), idx);
-    node_suff_stat.IncrementSuffStat(dataset, residual.GetData(), idx);
-  }
-}
-
-template <typename SuffStatType, bool sorted>
-void AccumulateSingleNodeSuffStat(SuffStatType& node_suff_stat, ForestDataset& dataset, ForestTracker& tracker, ColumnVector& residual, int tree_num, int node_id) {
-  // Acquire iterators
-  std::vector<data_size_t>::iterator node_begin_iter;
-  std::vector<data_size_t>::iterator node_end_iter;
-  if (sorted) {
-    // Default to the first feature if we're using the presort tracker
-    node_begin_iter = tracker.SortedNodeBeginIterator(node_id, 0);
-    node_end_iter = tracker.SortedNodeEndIterator(node_id, 0);
-  } else {
-    node_begin_iter = tracker.UnsortedNodeBeginIterator(tree_num, node_id);
-    node_end_iter = tracker.UnsortedNodeEndIterator(tree_num, node_id);
-  }
-
-  // Accumulate sufficient statistics
-  for (auto i = node_begin_iter; i != node_end_iter; i++) {
-    auto idx = *i;
-    node_suff_stat.IncrementSuffStat(dataset, residual.GetData(), idx);
-  }
-}
-
-template <typename SuffStatType>
-void AccumulateCutpointBinSuffStat(SuffStatType& left_suff_stat, ForestTracker& tracker, CutpointGridContainer& cutpoint_grid_container,
-                                   ForestDataset& dataset, ColumnVector& residual, double global_variance, int tree_num, int node_id,
-                                   int feature_num, int cutpoint_num) {
-  // Acquire iterators
-  auto node_begin_iter = tracker.SortedNodeBeginIterator(node_id, feature_num);
-  auto node_end_iter = tracker.SortedNodeEndIterator(node_id, feature_num);
-
-  // Determine node start point
-  data_size_t node_begin = tracker.SortedNodeBegin(node_id, feature_num);
-
-  // Determine cutpoint bin start and end points
-  data_size_t current_bin_begin = cutpoint_grid_container.BinStartIndex(cutpoint_num, feature_num);
-  data_size_t current_bin_size = cutpoint_grid_container.BinLength(cutpoint_num, feature_num);
-  data_size_t next_bin_begin = cutpoint_grid_container.BinStartIndex(cutpoint_num + 1, feature_num);
-
-  // Cutpoint specific iterators
-  // TODO: fix the hack of having to subtract off node_begin, probably by cleaning up the CutpointGridContainer interface
-  auto cutpoint_begin_iter = node_begin_iter + (current_bin_begin - node_begin);
-  auto cutpoint_end_iter = node_begin_iter + (next_bin_begin - node_begin);
-
-  // Accumulate sufficient statistics
-  for (auto i = cutpoint_begin_iter; i != cutpoint_end_iter; i++) {
-    auto idx = *i;
-    left_suff_stat.IncrementSuffStat(dataset, residual.GetData(), idx);
-  }
-}
-
-std::tuple<double, double, data_size_t, data_size_t> GaussianConstantLeafModel::EvaluateProposedSplit(ForestDataset& dataset, ForestTracker& tracker, ColumnVector& residual,
-                                                                                                      TreeSplit& split, int tree_num, int leaf_num, int split_feature, double global_variance) {
-  // Initialize sufficient statistics
-  GaussianConstantSuffStat node_suff_stat = GaussianConstantSuffStat();
-  GaussianConstantSuffStat left_suff_stat = GaussianConstantSuffStat();
-  GaussianConstantSuffStat right_suff_stat = GaussianConstantSuffStat();
-
-  // Accumulate sufficient statistics
-  AccumulateSuffStatProposed(node_suff_stat, left_suff_stat, right_suff_stat, dataset, tracker,
-                             residual, global_variance, split, tree_num, leaf_num, split_feature);
-  data_size_t left_n = left_suff_stat.n;
-  data_size_t right_n = right_suff_stat.n;
-
-  // Evaluate split
-  double split_log_ml = SplitLogMarginalLikelihood(left_suff_stat, right_suff_stat, global_variance);
-  double no_split_log_ml = NoSplitLogMarginalLikelihood(node_suff_stat, global_variance);
-
-  return std::tuple<double, double, data_size_t, data_size_t>(split_log_ml, no_split_log_ml, left_n, right_n);
-}
-
-std::tuple<double, double, data_size_t, data_size_t> GaussianConstantLeafModel::EvaluateExistingSplit(ForestDataset& dataset, ForestTracker& tracker, ColumnVector& residual, double global_variance,
-                                                                                                      int tree_num, int split_node_id, int left_node_id, int right_node_id) {
-  // Initialize sufficient statistics
-  GaussianConstantSuffStat node_suff_stat = GaussianConstantSuffStat();
-  GaussianConstantSuffStat left_suff_stat = GaussianConstantSuffStat();
-  GaussianConstantSuffStat right_suff_stat = GaussianConstantSuffStat();
-
-  // Accumulate sufficient statistics
-  AccumulateSuffStatExisting(node_suff_stat, left_suff_stat, right_suff_stat, dataset, tracker,
-                             residual, global_variance, tree_num, split_node_id, left_node_id, right_node_id);
-  data_size_t left_n
= left_suff_stat.n; - data_size_t right_n = right_suff_stat.n; - - // Evaluate split - double split_log_ml = SplitLogMarginalLikelihood(left_suff_stat, right_suff_stat, global_variance); - double no_split_log_ml = NoSplitLogMarginalLikelihood(node_suff_stat, global_variance); - - return std::tuple(split_log_ml, no_split_log_ml, left_n, right_n); -} - -void GaussianConstantLeafModel::EvaluateAllPossibleSplits(ForestDataset& dataset, ForestTracker& tracker, ColumnVector& residual, TreePrior& tree_prior, double global_variance, int tree_num, int node_id, std::vector& log_cutpoint_evaluations, - std::vector& cutpoint_features, std::vector& cutpoint_values, std::vector& cutpoint_feature_types, data_size_t& valid_cutpoint_count, - CutpointGridContainer& cutpoint_grid_container, data_size_t node_begin, data_size_t node_end, std::vector& variable_weights, std::vector& feature_types) { - // Initialize sufficient statistics - GaussianConstantSuffStat node_suff_stat = GaussianConstantSuffStat(); - GaussianConstantSuffStat left_suff_stat = GaussianConstantSuffStat(); - GaussianConstantSuffStat right_suff_stat = GaussianConstantSuffStat(); - - // Accumulate aggregate sufficient statistic for the node to be split - AccumulateSingleNodeSuffStat(node_suff_stat, dataset, tracker, residual, tree_num, node_id); - - // Compute the "no split" log marginal likelihood - double no_split_log_ml = NoSplitLogMarginalLikelihood(node_suff_stat, global_variance); - - // Unpack data - Eigen::MatrixXd covariates = dataset.GetCovariates(); - Eigen::VectorXd outcome = residual.GetData(); - Eigen::VectorXd var_weights; - bool has_weights = dataset.HasVarWeights(); - if (has_weights) var_weights = dataset.GetVarWeights(); - - // Minimum size of newly created leaf nodes (used to rule out invalid splits) - int32_t min_samples_in_leaf = tree_prior.GetMinSamplesLeaf(); - - // Compute sufficient statistics for each possible split - data_size_t num_cutpoints = 0; - bool valid_split = false; - data_size_t node_row_iter; - data_size_t current_bin_begin, current_bin_size, next_bin_begin; - data_size_t feature_sort_idx; - data_size_t row_iter_idx; - double outcome_val, outcome_val_sq; - FeatureType feature_type; - double feature_value = 0.0; - double cutoff_value = 0.0; - double log_split_eval = 0.0; - double split_log_ml; - for (int j = 0; j < covariates.cols(); j++) { - - if (std::abs(variable_weights.at(j)) > kEpsilon) { - // Enumerate cutpoint strides - cutpoint_grid_container.CalculateStrides(covariates, outcome, tracker.GetSortedNodeSampleTracker(), node_id, node_begin, node_end, j, feature_types); - - // Reset sufficient statistics - left_suff_stat.ResetSuffStat(); - right_suff_stat.ResetSuffStat(); - - // Iterate through possible cutpoints - int32_t num_feature_cutpoints = cutpoint_grid_container.NumCutpoints(j); - feature_type = feature_types[j]; - // Since we partition an entire cutpoint bin to the left, we must stop one bin before the total number of cutpoint bins - for (data_size_t cutpoint_idx = 0; cutpoint_idx < (num_feature_cutpoints - 1); cutpoint_idx++) { - current_bin_begin = cutpoint_grid_container.BinStartIndex(cutpoint_idx, j); - current_bin_size = cutpoint_grid_container.BinLength(cutpoint_idx, j); - next_bin_begin = cutpoint_grid_container.BinStartIndex(cutpoint_idx + 1, j); - - // Accumulate sufficient statistics for the left node - AccumulateCutpointBinSuffStat(left_suff_stat, tracker, cutpoint_grid_container, dataset, residual, - global_variance, tree_num, node_id, j, cutpoint_idx); - - // Compute the 
corresponding right node sufficient statistics - right_suff_stat.SubtractSuffStat(node_suff_stat, left_suff_stat); - - // Store the bin index as the "cutpoint value" - we can use this to query the actual split - // value or the set of split categories later on once a split is chose - cutoff_value = cutpoint_idx; - - // Only include cutpoint for consideration if it defines a valid split in the training data - valid_split = (left_suff_stat.SampleGreaterThanEqual(min_samples_in_leaf) && - right_suff_stat.SampleGreaterThanEqual(min_samples_in_leaf)); - if (valid_split) { - num_cutpoints++; - // Add to split rule vector - cutpoint_feature_types.push_back(feature_type); - cutpoint_features.push_back(j); - cutpoint_values.push_back(cutoff_value); - // Add the log marginal likelihood of the split to the split eval vector - split_log_ml = SplitLogMarginalLikelihood(left_suff_stat, right_suff_stat, global_variance); - log_cutpoint_evaluations.push_back(split_log_ml); - } - } - } - - } - - // Add the log marginal likelihood of the "no-split" option (adjusted for tree prior and cutpoint size per the XBART paper) - cutpoint_features.push_back(-1); - cutpoint_values.push_back(std::numeric_limits::max()); - cutpoint_feature_types.push_back(FeatureType::kNumeric); - log_cutpoint_evaluations.push_back(no_split_log_ml); - - // Update valid cutpoint count - valid_cutpoint_count = num_cutpoints; -} - double GaussianConstantLeafModel::SplitLogMarginalLikelihood(GaussianConstantSuffStat& left_stat, GaussianConstantSuffStat& right_stat, double global_variance) { double left_log_ml = ( -0.5*std::log(1 + tau_*(left_stat.sum_w/global_variance)) + ((tau_*left_stat.sum_yw*left_stat.sum_yw)/(2.0*global_variance*(tau_*left_stat.sum_w + global_variance))) @@ -294,141 +66,6 @@ void GaussianConstantLeafModel::SetEnsembleRootPredictedValue(ForestDataset& dat } } -std::tuple GaussianUnivariateRegressionLeafModel::EvaluateProposedSplit(ForestDataset& dataset, ForestTracker& tracker, ColumnVector& residual, - TreeSplit& split, int tree_num, int leaf_num, int split_feature, double global_variance) { - // Initialize sufficient statistics - GaussianUnivariateRegressionSuffStat node_suff_stat = GaussianUnivariateRegressionSuffStat(); - GaussianUnivariateRegressionSuffStat left_suff_stat = GaussianUnivariateRegressionSuffStat(); - GaussianUnivariateRegressionSuffStat right_suff_stat = GaussianUnivariateRegressionSuffStat(); - - // Accumulate sufficient statistics - AccumulateSuffStatProposed(node_suff_stat, left_suff_stat, right_suff_stat, dataset, tracker, - residual, global_variance, split, tree_num, leaf_num, split_feature); - data_size_t left_n = left_suff_stat.n; - data_size_t right_n = right_suff_stat.n; - - // Evaluate split - double split_log_ml = SplitLogMarginalLikelihood(left_suff_stat, right_suff_stat, global_variance); - double no_split_log_ml = NoSplitLogMarginalLikelihood(node_suff_stat, global_variance); - - return std::tuple(split_log_ml, no_split_log_ml, left_n, right_n); -} - -std::tuple GaussianUnivariateRegressionLeafModel::EvaluateExistingSplit(ForestDataset& dataset, ForestTracker& tracker, ColumnVector& residual, double global_variance, - int tree_num, int split_node_id, int left_node_id, int right_node_id) { - // Initialize sufficient statistics - GaussianUnivariateRegressionSuffStat node_suff_stat = GaussianUnivariateRegressionSuffStat(); - GaussianUnivariateRegressionSuffStat left_suff_stat = GaussianUnivariateRegressionSuffStat(); - GaussianUnivariateRegressionSuffStat right_suff_stat = 
GaussianUnivariateRegressionSuffStat(); - - // Accumulate sufficient statistics - AccumulateSuffStatExisting(node_suff_stat, left_suff_stat, right_suff_stat, dataset, tracker, - residual, global_variance, tree_num, split_node_id, left_node_id, right_node_id); - data_size_t left_n = left_suff_stat.n; - data_size_t right_n = right_suff_stat.n; - - // Evaluate split - double split_log_ml = SplitLogMarginalLikelihood(left_suff_stat, right_suff_stat, global_variance); - double no_split_log_ml = NoSplitLogMarginalLikelihood(node_suff_stat, global_variance); - - return std::tuple(split_log_ml, no_split_log_ml, left_n, right_n); -} - -void GaussianUnivariateRegressionLeafModel::EvaluateAllPossibleSplits(ForestDataset& dataset, ForestTracker& tracker, ColumnVector& residual, TreePrior& tree_prior, double global_variance, int tree_num, int node_id, std::vector& log_cutpoint_evaluations, - std::vector& cutpoint_features, std::vector& cutpoint_values, std::vector& cutpoint_feature_types, data_size_t& valid_cutpoint_count, - CutpointGridContainer& cutpoint_grid_container, data_size_t node_begin, data_size_t node_end, std::vector& variable_weights, std::vector& feature_types) { - // Initialize sufficient statistics - GaussianUnivariateRegressionSuffStat node_suff_stat = GaussianUnivariateRegressionSuffStat(); - GaussianUnivariateRegressionSuffStat left_suff_stat = GaussianUnivariateRegressionSuffStat(); - GaussianUnivariateRegressionSuffStat right_suff_stat = GaussianUnivariateRegressionSuffStat(); - - // Accumulate aggregate sufficient statistic for the node to be split - AccumulateSingleNodeSuffStat(node_suff_stat, dataset, tracker, residual, tree_num, node_id); - - // Compute the "no split" log marginal likelihood - double no_split_log_ml = NoSplitLogMarginalLikelihood(node_suff_stat, global_variance); - - // Unpack data - Eigen::MatrixXd covariates = dataset.GetCovariates(); - Eigen::VectorXd outcome = residual.GetData(); - Eigen::VectorXd var_weights; - bool has_weights = dataset.HasVarWeights(); - if (has_weights) var_weights = dataset.GetVarWeights(); - - // Minimum size of newly created leaf nodes (used to rule out invalid splits) - int32_t min_samples_in_leaf = tree_prior.GetMinSamplesLeaf(); - - // Compute sufficient statistics for each possible split - data_size_t num_cutpoints = 0; - bool valid_split = false; - data_size_t node_row_iter; - data_size_t current_bin_begin, current_bin_size, next_bin_begin; - data_size_t feature_sort_idx; - data_size_t row_iter_idx; - double outcome_val, outcome_val_sq; - FeatureType feature_type; - double feature_value = 0.0; - double cutoff_value = 0.0; - double log_split_eval = 0.0; - double split_log_ml; - for (int j = 0; j < covariates.cols(); j++) { - - if (std::abs(variable_weights.at(j)) > kEpsilon) { - // Enumerate cutpoint strides - cutpoint_grid_container.CalculateStrides(covariates, outcome, tracker.GetSortedNodeSampleTracker(), node_id, node_begin, node_end, j, feature_types); - - // Reset sufficient statistics - left_suff_stat.ResetSuffStat(); - right_suff_stat.ResetSuffStat(); - - // Iterate through possible cutpoints - int32_t num_feature_cutpoints = cutpoint_grid_container.NumCutpoints(j); - feature_type = feature_types[j]; - // Since we partition an entire cutpoint bin to the left, we must stop one bin before the total number of cutpoint bins - for (data_size_t cutpoint_idx = 0; cutpoint_idx < (num_feature_cutpoints - 1); cutpoint_idx++) { - current_bin_begin = cutpoint_grid_container.BinStartIndex(cutpoint_idx, j); - current_bin_size = 
cutpoint_grid_container.BinLength(cutpoint_idx, j); - next_bin_begin = cutpoint_grid_container.BinStartIndex(cutpoint_idx + 1, j); - - // Accumulate sufficient statistics for the left node - AccumulateCutpointBinSuffStat(left_suff_stat, tracker, cutpoint_grid_container, dataset, residual, - global_variance, tree_num, node_id, j, cutpoint_idx); - - // Compute the corresponding right node sufficient statistics - right_suff_stat.SubtractSuffStat(node_suff_stat, left_suff_stat); - - // Store the bin index as the "cutpoint value" - we can use this to query the actual split - // value or the set of split categories later on once a split is chose - cutoff_value = cutpoint_idx; - - // Only include cutpoint for consideration if it defines a valid split in the training data - valid_split = (left_suff_stat.SampleGreaterThanEqual(min_samples_in_leaf) && - right_suff_stat.SampleGreaterThanEqual(min_samples_in_leaf)); - if (valid_split) { - num_cutpoints++; - // Add to split rule vector - cutpoint_feature_types.push_back(feature_type); - cutpoint_features.push_back(j); - cutpoint_values.push_back(cutoff_value); - // Add the log marginal likelihood of the split to the split eval vector - split_log_ml = SplitLogMarginalLikelihood(left_suff_stat, right_suff_stat, global_variance); - log_cutpoint_evaluations.push_back(split_log_ml); - } - } - } - - } - - // Add the log marginal likelihood of the "no-split" option (adjusted for tree prior and cutpoint size per the XBART paper) - cutpoint_features.push_back(-1); - cutpoint_values.push_back(std::numeric_limits::max()); - cutpoint_feature_types.push_back(FeatureType::kNumeric); - log_cutpoint_evaluations.push_back(no_split_log_ml); - - // Update valid cutpoint count - valid_cutpoint_count = num_cutpoints; -} - double GaussianUnivariateRegressionLeafModel::SplitLogMarginalLikelihood(GaussianUnivariateRegressionSuffStat& left_stat, GaussianUnivariateRegressionSuffStat& right_stat, double global_variance) { double left_log_ml = ( -0.5*std::log(1 + tau_*(left_stat.sum_xxw/global_variance)) + ((tau_*left_stat.sum_yxw*left_stat.sum_yxw)/(2.0*global_variance*(tau_*left_stat.sum_xxw + global_variance))) @@ -493,144 +130,6 @@ void GaussianUnivariateRegressionLeafModel::SetEnsembleRootPredictedValue(Forest } } -std::tuple GaussianMultivariateRegressionLeafModel::EvaluateProposedSplit(ForestDataset& dataset, ForestTracker& tracker, ColumnVector& residual, - TreeSplit& split, int tree_num, int leaf_num, int split_feature, double global_variance) { - // Initialize sufficient statistics - int num_basis = dataset.GetBasis().cols(); - GaussianMultivariateRegressionSuffStat node_suff_stat = GaussianMultivariateRegressionSuffStat(num_basis); - GaussianMultivariateRegressionSuffStat left_suff_stat = GaussianMultivariateRegressionSuffStat(num_basis); - GaussianMultivariateRegressionSuffStat right_suff_stat = GaussianMultivariateRegressionSuffStat(num_basis); - - // Accumulate sufficient statistics - AccumulateSuffStatProposed(node_suff_stat, left_suff_stat, right_suff_stat, dataset, tracker, - residual, global_variance, split, tree_num, leaf_num, split_feature); - data_size_t left_n = left_suff_stat.n; - data_size_t right_n = right_suff_stat.n; - - // Evaluate split - double split_log_ml = SplitLogMarginalLikelihood(left_suff_stat, right_suff_stat, global_variance); - double no_split_log_ml = NoSplitLogMarginalLikelihood(node_suff_stat, global_variance); - - return std::tuple(split_log_ml, no_split_log_ml, left_n, right_n); -} - -std::tuple 
GaussianMultivariateRegressionLeafModel::EvaluateExistingSplit(ForestDataset& dataset, ForestTracker& tracker, ColumnVector& residual, double global_variance, - int tree_num, int split_node_id, int left_node_id, int right_node_id) { - // Initialize sufficient statistics - int num_basis = dataset.GetBasis().cols(); - GaussianMultivariateRegressionSuffStat node_suff_stat = GaussianMultivariateRegressionSuffStat(num_basis); - GaussianMultivariateRegressionSuffStat left_suff_stat = GaussianMultivariateRegressionSuffStat(num_basis); - GaussianMultivariateRegressionSuffStat right_suff_stat = GaussianMultivariateRegressionSuffStat(num_basis); - - // Accumulate sufficient statistics - AccumulateSuffStatExisting(node_suff_stat, left_suff_stat, right_suff_stat, dataset, tracker, - residual, global_variance, tree_num, split_node_id, left_node_id, right_node_id); - data_size_t left_n = left_suff_stat.n; - data_size_t right_n = right_suff_stat.n; - - // Evaluate split - double split_log_ml = SplitLogMarginalLikelihood(left_suff_stat, right_suff_stat, global_variance); - double no_split_log_ml = NoSplitLogMarginalLikelihood(node_suff_stat, global_variance); - - return std::tuple(split_log_ml, no_split_log_ml, left_n, right_n); -} - -void GaussianMultivariateRegressionLeafModel::EvaluateAllPossibleSplits(ForestDataset& dataset, ForestTracker& tracker, ColumnVector& residual, TreePrior& tree_prior, double global_variance, int tree_num, int node_id, std::vector& log_cutpoint_evaluations, - std::vector& cutpoint_features, std::vector& cutpoint_values, std::vector& cutpoint_feature_types, data_size_t& valid_cutpoint_count, - CutpointGridContainer& cutpoint_grid_container, data_size_t node_begin, data_size_t node_end, std::vector& variable_weights, std::vector& feature_types) { - // Initialize sufficient statistics - int basis_dim = dataset.GetBasis().cols(); - GaussianMultivariateRegressionSuffStat node_suff_stat = GaussianMultivariateRegressionSuffStat(basis_dim); - GaussianMultivariateRegressionSuffStat left_suff_stat = GaussianMultivariateRegressionSuffStat(basis_dim); - GaussianMultivariateRegressionSuffStat right_suff_stat = GaussianMultivariateRegressionSuffStat(basis_dim); - - // Accumulate aggregate sufficient statistic for the node to be split - AccumulateSingleNodeSuffStat(node_suff_stat, dataset, tracker, residual, tree_num, node_id); - - // Compute the "no split" log marginal likelihood - double no_split_log_ml = NoSplitLogMarginalLikelihood(node_suff_stat, global_variance); - - // Unpack data - Eigen::MatrixXd covariates = dataset.GetCovariates(); - Eigen::VectorXd outcome = residual.GetData(); - Eigen::VectorXd var_weights; - bool has_weights = dataset.HasVarWeights(); - if (has_weights) var_weights = dataset.GetVarWeights(); - - // Minimum size of newly created leaf nodes (used to rule out invalid splits) - int32_t min_samples_in_leaf = tree_prior.GetMinSamplesLeaf(); - - // Compute sufficient statistics for each possible split - data_size_t num_cutpoints = 0; - bool valid_split = false; - data_size_t node_row_iter; - data_size_t current_bin_begin, current_bin_size, next_bin_begin; - data_size_t feature_sort_idx; - data_size_t row_iter_idx; - double outcome_val, outcome_val_sq; - FeatureType feature_type; - double feature_value = 0.0; - double cutoff_value = 0.0; - double log_split_eval = 0.0; - double split_log_ml; - for (int j = 0; j < covariates.cols(); j++) { - - if (std::abs(variable_weights.at(j)) > kEpsilon) { - // Enumerate cutpoint strides - 
cutpoint_grid_container.CalculateStrides(covariates, outcome, tracker.GetSortedNodeSampleTracker(), node_id, node_begin, node_end, j, feature_types); - - // Reset sufficient statistics - left_suff_stat.ResetSuffStat(); - right_suff_stat.ResetSuffStat(); - - // Iterate through possible cutpoints - int32_t num_feature_cutpoints = cutpoint_grid_container.NumCutpoints(j); - feature_type = feature_types[j]; - // Since we partition an entire cutpoint bin to the left, we must stop one bin before the total number of cutpoint bins - for (data_size_t cutpoint_idx = 0; cutpoint_idx < (num_feature_cutpoints - 1); cutpoint_idx++) { - current_bin_begin = cutpoint_grid_container.BinStartIndex(cutpoint_idx, j); - current_bin_size = cutpoint_grid_container.BinLength(cutpoint_idx, j); - next_bin_begin = cutpoint_grid_container.BinStartIndex(cutpoint_idx + 1, j); - - // Accumulate sufficient statistics for the left node - AccumulateCutpointBinSuffStat(left_suff_stat, tracker, cutpoint_grid_container, dataset, residual, - global_variance, tree_num, node_id, j, cutpoint_idx); - - // Compute the corresponding right node sufficient statistics - right_suff_stat.SubtractSuffStat(node_suff_stat, left_suff_stat); - - // Store the bin index as the "cutpoint value" - we can use this to query the actual split - // value or the set of split categories later on once a split is chose - cutoff_value = cutpoint_idx; - - // Only include cutpoint for consideration if it defines a valid split in the training data - valid_split = (left_suff_stat.SampleGreaterThanEqual(min_samples_in_leaf) && - right_suff_stat.SampleGreaterThanEqual(min_samples_in_leaf)); - if (valid_split) { - num_cutpoints++; - // Add to split rule vector - cutpoint_feature_types.push_back(feature_type); - cutpoint_features.push_back(j); - cutpoint_values.push_back(cutoff_value); - // Add the log marginal likelihood of the split to the split eval vector - split_log_ml = SplitLogMarginalLikelihood(left_suff_stat, right_suff_stat, global_variance); - log_cutpoint_evaluations.push_back(split_log_ml); - } - } - } - - } - - // Add the log marginal likelihood of the "no-split" option (adjusted for tree prior and cutpoint size per the XBART paper) - cutpoint_features.push_back(-1); - cutpoint_values.push_back(std::numeric_limits::max()); - cutpoint_feature_types.push_back(FeatureType::kNumeric); - log_cutpoint_evaluations.push_back(no_split_log_ml); - - // Update valid cutpoint count - valid_cutpoint_count = num_cutpoints; -} - double GaussianMultivariateRegressionLeafModel::SplitLogMarginalLikelihood(GaussianMultivariateRegressionSuffStat& left_stat, GaussianMultivariateRegressionSuffStat& right_stat, double global_variance) { Eigen::MatrixXd I_p = Eigen::MatrixXd::Identity(left_stat.p, left_stat.p); double left_log_ml = ( diff --git a/src/py_stochtree.cpp b/src/py_stochtree.cpp index 7025d8a9..207d1ce0 100644 --- a/src/py_stochtree.cpp +++ b/src/py_stochtree.cpp @@ -512,13 +512,13 @@ class ForestSamplerCpp { Eigen::MatrixXd& leaf_scale_matrix, double global_variance, double leaf_scale, int cutpoint_grid_size, bool pre_initialized) { if (leaf_model_enum == ForestLeafModel::kConstant) { StochTree::GaussianConstantLeafModel leaf_model = StochTree::GaussianConstantLeafModel(leaf_scale); - StochTree::GFRSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, feature_types, cutpoint_grid_size, pre_initialized); + StochTree::GFRSampleOneIter(*(tracker_.get()), forest_samples, 
leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, feature_types, cutpoint_grid_size, pre_initialized); } else if (leaf_model_enum == ForestLeafModel::kUnivariateRegression) { StochTree::GaussianUnivariateRegressionLeafModel leaf_model = StochTree::GaussianUnivariateRegressionLeafModel(leaf_scale); - StochTree::GFRSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, feature_types, cutpoint_grid_size, pre_initialized); + StochTree::GFRSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, feature_types, cutpoint_grid_size, pre_initialized); } else if (leaf_model_enum == ForestLeafModel::kMultivariateRegression) { StochTree::GaussianMultivariateRegressionLeafModel leaf_model = StochTree::GaussianMultivariateRegressionLeafModel(leaf_scale_matrix); - StochTree::GFRSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, feature_types, cutpoint_grid_size, pre_initialized); + StochTree::GFRSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, feature_types, cutpoint_grid_size, pre_initialized); } } @@ -527,13 +527,13 @@ class ForestSamplerCpp { Eigen::MatrixXd& leaf_scale_matrix, double global_variance, double leaf_scale, int cutpoint_grid_size, bool pre_initialized) { if (leaf_model_enum == ForestLeafModel::kConstant) { StochTree::GaussianConstantLeafModel leaf_model = StochTree::GaussianConstantLeafModel(leaf_scale); - StochTree::MCMCSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, pre_initialized); + StochTree::MCMCSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, pre_initialized); } else if (leaf_model_enum == ForestLeafModel::kUnivariateRegression) { StochTree::GaussianUnivariateRegressionLeafModel leaf_model = StochTree::GaussianUnivariateRegressionLeafModel(leaf_scale); - StochTree::MCMCSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, pre_initialized); + StochTree::MCMCSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, pre_initialized); } else if (leaf_model_enum == ForestLeafModel::kMultivariateRegression) { StochTree::GaussianMultivariateRegressionLeafModel leaf_model = StochTree::GaussianMultivariateRegressionLeafModel(leaf_scale_matrix); - StochTree::MCMCSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, pre_initialized); + StochTree::MCMCSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, pre_initialized); } } }; diff --git a/src/sampler.cpp b/src/sampler.cpp index 1229d6f0..7631bdd1 100644 --- a/src/sampler.cpp +++ b/src/sampler.cpp @@ -61,13 +61,13 @@ void sample_gfr_one_iteration_cpp(cpp11::external_pointer(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, 
feature_types_, cutpoint_grid_size, pre_initialized); + StochTree::GFRSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, feature_types_, cutpoint_grid_size, pre_initialized); } else if (leaf_model_enum == ForestLeafModel::kUnivariateRegression) { StochTree::GaussianUnivariateRegressionLeafModel leaf_model = StochTree::GaussianUnivariateRegressionLeafModel(leaf_scale); - StochTree::GFRSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, feature_types_, cutpoint_grid_size, pre_initialized); + StochTree::GFRSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, feature_types_, cutpoint_grid_size, pre_initialized); } else if (leaf_model_enum == ForestLeafModel::kMultivariateRegression) { StochTree::GaussianMultivariateRegressionLeafModel leaf_model = StochTree::GaussianMultivariateRegressionLeafModel(leaf_scale_matrix); - StochTree::GFRSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, feature_types_, cutpoint_grid_size, pre_initialized); + StochTree::GFRSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, feature_types_, cutpoint_grid_size, pre_initialized); } } @@ -122,13 +122,13 @@ void sample_mcmc_one_iteration_cpp(cpp11::external_pointer(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, pre_initialized); + StochTree::MCMCSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, pre_initialized); } else if (leaf_model_enum == ForestLeafModel::kUnivariateRegression) { StochTree::GaussianUnivariateRegressionLeafModel leaf_model = StochTree::GaussianUnivariateRegressionLeafModel(leaf_scale); - StochTree::MCMCSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, pre_initialized); + StochTree::MCMCSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, pre_initialized); } else if (leaf_model_enum == ForestLeafModel::kMultivariateRegression) { StochTree::GaussianMultivariateRegressionLeafModel leaf_model = StochTree::GaussianMultivariateRegressionLeafModel(leaf_scale_matrix); - StochTree::MCMCSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, pre_initialized); + StochTree::MCMCSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, pre_initialized); } } From 894deb2a09c6ee25e056eccd3843c4dec3d71d5c Mon Sep 17 00:00:00 2001 From: Drew Herren Date: Tue, 27 Aug 2024 01:31:57 -0500 Subject: [PATCH 12/41] Refactored R package C++ calls --- debug/api_debug.cpp | 106 ++++++++++++++++++++++++++++--- src/sampler.cpp | 79 +++++++++++++---------- tools/perf/bart_microbenchmark.R | 29 +++++++++ 3 files changed, 172 insertions(+), 42 deletions(-) create mode 100644 tools/perf/bart_microbenchmark.R diff --git a/debug/api_debug.cpp b/debug/api_debug.cpp index 5d84c00b..5f19af57 100644 --- a/debug/api_debug.cpp +++ b/debug/api_debug.cpp @@ -239,6 +239,86 @@ void GenerateDGP2(std::vector& covariates, std::vector& basis, s 
 }
 }
 
+void GenerateDGP3(std::vector<double>& covariates, std::vector<double>& basis, std::vector<double>& outcome, std::vector<double>& rfx_basis, std::vector<int32_t>& rfx_groups, std::vector<FeatureType>& feature_types, std::mt19937& gen, int& n, int& x_cols, int& omega_cols, int& y_cols, int& rfx_basis_cols, int& num_rfx_groups, bool rfx_included, int random_seed = -1) {
+  // Data dimensions
+  n = 1000;
+  x_cols = 2;
+  omega_cols = 2;
+  y_cols = 1;
+  if (rfx_included) {
+    num_rfx_groups = 2;
+    rfx_basis_cols = 1;
+  } else {
+    num_rfx_groups = 0;
+    rfx_basis_cols = 0;
+  }
+
+  // Resize data
+  covariates.resize(n * x_cols);
+  basis.resize(n * omega_cols);
+  rfx_basis.resize(n * rfx_basis_cols);
+  outcome.resize(n * y_cols);
+  rfx_groups.resize(n);
+  feature_types.resize(x_cols, FeatureType::kNumeric);
+
+  // Random number generation
+  std::uniform_real_distribution<double> uniform_dist{0.0,1.0};
+  std::normal_distribution<double> normal_dist(0.,1.);
+
+  // DGP parameters
+  std::vector<double> betas{-10, -5, 5, 10};
+  int num_partitions = betas.size();
+  double f_x_omega;
+  double rfx;
+  double error;
+
+  for (int i = 0; i < n; i++) {
+    for (int j = 0; j < x_cols; j++) {
+      covariates[i*x_cols + j] = uniform_dist(gen);
+    }
+
+    for (int j = 0; j < omega_cols; j++) {
+      basis[i*omega_cols + j] = uniform_dist(gen);
+    }
+
+    if (rfx_included) {
+      for (int j = 0; j < rfx_basis_cols; j++) {
+        rfx_basis[i * rfx_basis_cols + j] = 1;
+      }
+
+      if (i % 2 == 0) {
+        rfx_groups[i] = 1;
+      } else {
+        rfx_groups[i] = 2;
+      }
+    }
+
+    for (int j = 0; j < y_cols; j++) {
+      if ((covariates[i * x_cols + 0] >= 0.0) && covariates[i * x_cols + 0] < 0.25) {
+        f_x_omega = betas[0] * basis[i * omega_cols + 0];
+      } else if ((covariates[i * x_cols + 0] >= 0.25) && covariates[i * x_cols + 0] < 0.5) {
+        f_x_omega = betas[1] * basis[i * omega_cols + 0];
+      } else if ((covariates[i * x_cols + 0] >= 0.5) && covariates[i * x_cols + 0] < 0.75) {
+        f_x_omega = betas[2] * basis[i * omega_cols + 0];
+      } else {
+        f_x_omega = betas[3] * basis[i * omega_cols + 0];
+      }
+      error = 0.1 * normal_dist(gen);
+      outcome[i * y_cols + j] = f_x_omega + error;
+      if (rfx_included) {
+        if (rfx_groups[i] == 1) {
+          rfx = 5.;
+        } else {
+          rfx = -5.;
+        }
+        outcome[i * y_cols + j] += rfx;
+      }
+    }
+  }
+}
+
 void OutcomeOffsetScale(ColumnVector& residual, double& outcome_offset, double& outcome_scale) {
   data_size_t n = residual.NumRows();
   double outcome_val = 0.0;
@@ -335,14 +415,18 @@ void RunDebug(int dgp_num = 0, ModelType model_type = kConstantLeafGaussian, boo
     dataset.AddBasis(basis_raw.data(), n, omega_cols, row_major);
     output_dimension = 1;
     is_leaf_constant = false;
-  }
-  else if (dgp_num == 1) {
+  } else if (dgp_num == 1) {
     GenerateDGP2(covariates_raw, basis_raw, outcome_raw, rfx_basis_raw, rfx_groups, feature_types, gen, n, x_cols, omega_cols, y_cols, rfx_basis_cols, num_rfx_groups, rfx_included, random_seed);
     dataset.AddCovariates(covariates_raw.data(), n, x_cols, row_major);
     output_dimension = 1;
     is_leaf_constant = true;
-  }
-  else {
+  } else if (dgp_num == 2) {
+    GenerateDGP3(covariates_raw, basis_raw, outcome_raw, rfx_basis_raw, rfx_groups, feature_types, gen, n, x_cols, omega_cols, y_cols, rfx_basis_cols, num_rfx_groups, rfx_included, random_seed);
+    dataset.AddCovariates(covariates_raw.data(), n, x_cols, row_major);
+    dataset.AddBasis(basis_raw.data(), n, omega_cols, row_major);
+    output_dimension = omega_cols;
+    is_leaf_constant = false;
+  } else {
     Log::Fatal("Invalid dgp_num");
   }
@@ -413,14 +497,16 @@ void RunDebug(int dgp_num = 0, ModelType model_type = kConstantLeafGaussian, boo
   double lamb = 0.5;
 
   // Set leaf model 
parameters - double leaf_scale_init = 1.; - Eigen::MatrixXd leaf_scale_matrix, leaf_scale_matrix_init; - // leaf_scale_matrix_init << 1.0, 0.0, 0.0, 1.0; double leaf_scale; + double leaf_scale_init = 1.; + Eigen::MatrixXd leaf_scale_matrix(omega_cols, omega_cols); + Eigen::MatrixXd leaf_scale_matrix_init(omega_cols, omega_cols); + leaf_scale_matrix_init << 1.0, 0.0, 0.0, 1.0; + leaf_scale_matrix = leaf_scale_matrix_init; // Set global variance - double global_variance_init = 1.0; double global_variance; + double global_variance_init = 1.0; // Set variable weights double const_var_wt = static_cast(1. / x_cols); @@ -538,8 +624,8 @@ void RunDebug(int dgp_num = 0, ModelType model_type = kConstantLeafGaussian, boo int main(int argc, char* argv[]) { // Unpack command line arguments int dgp_num = std::stoi(argv[1]); - if ((dgp_num != 0) && (dgp_num != 1)) { - StochTree::Log::Fatal("The first command line argument must be 0 or 1"); + if ((dgp_num != 0) && (dgp_num != 1) && (dgp_num != 2)) { + StochTree::Log::Fatal("The first command line argument must be 0, 1, or 2"); } int model_type_int = static_cast(std::stoi(argv[2])); if ((model_type_int != 0) && (model_type_int != 1) && (model_type_int != 2)) { diff --git a/src/sampler.cpp b/src/sampler.cpp index 7631bdd1..e9da2c81 100644 --- a/src/sampler.cpp +++ b/src/sampler.cpp @@ -8,6 +8,7 @@ #include #include #include +#include #include [[cpp11::register]] @@ -30,18 +31,18 @@ void sample_gfr_one_iteration_cpp(cpp11::external_pointerNumBasis(); + // Run one iteration of the sampler - if (leaf_model_enum == ForestLeafModel::kConstant) { - StochTree::GaussianConstantLeafModel leaf_model = StochTree::GaussianConstantLeafModel(leaf_scale); - StochTree::GFRSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, feature_types_, cutpoint_grid_size, pre_initialized); - } else if (leaf_model_enum == ForestLeafModel::kUnivariateRegression) { - StochTree::GaussianUnivariateRegressionLeafModel leaf_model = StochTree::GaussianUnivariateRegressionLeafModel(leaf_scale); - StochTree::GFRSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, feature_types_, cutpoint_grid_size, pre_initialized); - } else if (leaf_model_enum == ForestLeafModel::kMultivariateRegression) { - StochTree::GaussianMultivariateRegressionLeafModel leaf_model = StochTree::GaussianMultivariateRegressionLeafModel(leaf_scale_matrix); - StochTree::GFRSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, feature_types_, cutpoint_grid_size, pre_initialized); + if (model_type == StochTree::ModelType::kConstantLeafGaussian) { + // StochTree::GaussianConstantLeafModel leaf_model = StochTree::GaussianConstantLeafModel(leaf_scale); + // StochTree::GFRSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, feature_types_, cutpoint_grid_size, pre_initialized); + StochTree::GFRSampleOneIter(*tracker, *forest_samples, std::get(leaf_model), *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, feature_types_, cutpoint_grid_size, pre_initialized); + } else if (model_type == StochTree::ModelType::kUnivariateRegressionLeafGaussian) { + // StochTree::GaussianUnivariateRegressionLeafModel leaf_model = StochTree::GaussianUnivariateRegressionLeafModel(leaf_scale); + // StochTree::GFRSampleOneIter(*tracker, 
*forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, feature_types_, cutpoint_grid_size, pre_initialized);
+    StochTree::GFRSampleOneIter<StochTree::GaussianUnivariateRegressionLeafModel, StochTree::GaussianUnivariateRegressionSuffStat>(*tracker, *forest_samples, std::get<StochTree::GaussianUnivariateRegressionLeafModel>(leaf_model), *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, feature_types_, cutpoint_grid_size, pre_initialized);
+  } else if (model_type == StochTree::ModelType::kMultivariateRegressionLeafGaussian) {
+    // StochTree::GaussianMultivariateRegressionLeafModel leaf_model = StochTree::GaussianMultivariateRegressionLeafModel(leaf_scale_matrix);
+    // StochTree::GFRSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, feature_types_, cutpoint_grid_size, pre_initialized);
+    StochTree::GFRSampleOneIter<StochTree::GaussianMultivariateRegressionLeafModel, StochTree::GaussianMultivariateRegressionSuffStat, int>(*tracker, *forest_samples, std::get<StochTree::GaussianMultivariateRegressionLeafModel>(leaf_model), *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, feature_types_, cutpoint_grid_size, pre_initialized, num_basis);
   }
 }
 
@@ -91,18 +99,18 @@ void sample_mcmc_one_iteration_cpp(cpp11::external_pointer
+  int num_basis = data->NumBasis();
+
   // Run one iteration of the sampler
-  if (leaf_model_enum == ForestLeafModel::kConstant) {
-    StochTree::GaussianConstantLeafModel leaf_model = StochTree::GaussianConstantLeafModel(leaf_scale);
-    StochTree::MCMCSampleOneIter<StochTree::GaussianConstantLeafModel, StochTree::GaussianConstantSuffStat>(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, pre_initialized);
-  } else if (leaf_model_enum == ForestLeafModel::kUnivariateRegression) {
-    StochTree::GaussianUnivariateRegressionLeafModel leaf_model = StochTree::GaussianUnivariateRegressionLeafModel(leaf_scale);
-    StochTree::MCMCSampleOneIter<StochTree::GaussianUnivariateRegressionLeafModel, StochTree::GaussianUnivariateRegressionSuffStat>(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, pre_initialized);
-  } else if (leaf_model_enum == ForestLeafModel::kMultivariateRegression) {
-    StochTree::GaussianMultivariateRegressionLeafModel leaf_model = StochTree::GaussianMultivariateRegressionLeafModel(leaf_scale_matrix);
-    StochTree::MCMCSampleOneIter<StochTree::GaussianMultivariateRegressionLeafModel, StochTree::GaussianMultivariateRegressionSuffStat>(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, pre_initialized);
+  if (model_type == StochTree::ModelType::kConstantLeafGaussian) {
+    // StochTree::GaussianConstantLeafModel leaf_model = StochTree::GaussianConstantLeafModel(leaf_scale);
+    // StochTree::MCMCSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, pre_initialized);
+    StochTree::MCMCSampleOneIter<StochTree::GaussianConstantLeafModel, StochTree::GaussianConstantSuffStat>(*tracker, *forest_samples, std::get<StochTree::GaussianConstantLeafModel>(leaf_model), *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, pre_initialized);
+  } else if (model_type == StochTree::ModelType::kUnivariateRegressionLeafGaussian) {
+    // StochTree::GaussianUnivariateRegressionLeafModel leaf_model = StochTree::GaussianUnivariateRegressionLeafModel(leaf_scale);
+    // StochTree::MCMCSampleOneIter(*tracker, *forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, pre_initialized);
+    StochTree::MCMCSampleOneIter<StochTree::GaussianUnivariateRegressionLeafModel, StochTree::GaussianUnivariateRegressionSuffStat>(*tracker, *forest_samples, std::get<StochTree::GaussianUnivariateRegressionLeafModel>(leaf_model), *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, pre_initialized);
+  } else if (model_type == StochTree::ModelType::kMultivariateRegressionLeafGaussian) {
+    // StochTree::GaussianMultivariateRegressionLeafModel leaf_model = StochTree::GaussianMultivariateRegressionLeafModel(leaf_scale_matrix);
+    // StochTree::MCMCSampleOneIter(*tracker, 
*forest_samples, leaf_model, *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, pre_initialized); + StochTree::MCMCSampleOneIter(*tracker, *forest_samples, std::get(leaf_model), *data, *residual, *split_prior, *rng, var_weights_vector, global_variance, pre_initialized, num_basis); } } diff --git a/tools/perf/bart_microbenchmark.R b/tools/perf/bart_microbenchmark.R new file mode 100644 index 00000000..21e5e171 --- /dev/null +++ b/tools/perf/bart_microbenchmark.R @@ -0,0 +1,29 @@ +library(microbenchmark) +library(stochtree) + +# Generate data needed to train BART model +n <- 1000 +p <- 5 +X <- matrix(runif(n*p), ncol = p) +f_XW <- ( + ((0 <= X[,1]) & (0.25 > X[,1])) * (-7.5) + + ((0.25 <= X[,1]) & (0.5 > X[,1])) * (-2.5) + + ((0.5 <= X[,1]) & (0.75 > X[,1])) * (2.5) + + ((0.75 <= X[,1]) & (1 > X[,1])) * (7.5) +) +noise_sd <- 1 +y <- f_XW + rnorm(n, 0, noise_sd) +test_set_pct <- 0.2 +n_test <- round(test_set_pct*n) +n_train <- n - n_test +test_inds <- sort(sample(1:n, n_test, replace = FALSE)) +train_inds <- (1:n)[!((1:n) %in% test_inds)] +X_test <- X[test_inds,] +X_train <- X[train_inds,] +y_test <- y[test_inds] +y_train <- y[train_inds] + +# Run microbenchmark +microbenchmark( + bart(X_train = X_train, y_train = y_train, X_test = X_test, num_gfr = 10, num_mcmc = 1000) +) From 7e2a110533db041446d5cff0fefd30d8dbec60c4 Mon Sep 17 00:00:00 2001 From: Drew Herren Date: Tue, 27 Aug 2024 02:22:57 -0500 Subject: [PATCH 13/41] Updated python library C++ code --- src/py_stochtree.cpp | 68 +++++++++++++++++--------------------------- 1 file changed, 26 insertions(+), 42 deletions(-) diff --git a/src/py_stochtree.cpp b/src/py_stochtree.cpp index 207d1ce0..b576cb2d 100644 --- a/src/py_stochtree.cpp +++ b/src/py_stochtree.cpp @@ -461,18 +461,18 @@ class ForestSamplerCpp { } // Convert leaf model type to enum - ForestLeafModel leaf_model_enum; - if (leaf_model_int == 0) leaf_model_enum = ForestLeafModel::kConstant; - else if (leaf_model_int == 1) leaf_model_enum = ForestLeafModel::kUnivariateRegression; - else if (leaf_model_int == 2) leaf_model_enum = ForestLeafModel::kMultivariateRegression; + StochTree::ModelType model_type; + if (leaf_model_int == 0) model_type = StochTree::ModelType::kConstantLeafGaussian; + else if (leaf_model_int == 1) model_type = StochTree::ModelType::kUnivariateRegressionLeafGaussian; + else if (leaf_model_int == 2) model_type = StochTree::ModelType::kMultivariateRegressionLeafGaussian; // Unpack leaf model parameters double leaf_scale; Eigen::MatrixXd leaf_scale_matrix; - if ((leaf_model_enum == ForestLeafModel::kConstant) || - (leaf_model_enum == ForestLeafModel::kUnivariateRegression)) { + if ((model_type == StochTree::ModelType::kConstantLeafGaussian) || + (model_type == StochTree::ModelType::kUnivariateRegressionLeafGaussian)) { leaf_scale = leaf_model_scale_input.at(0,0); - } else if (leaf_model_enum == ForestLeafModel::kMultivariateRegression) { + } else if (model_type == StochTree::ModelType::kMultivariateRegressionLeafGaussian) { int num_row = leaf_model_scale_input.shape(0); int num_col = leaf_model_scale_input.shape(1); leaf_scale_matrix.resize(num_row, num_col); @@ -482,60 +482,44 @@ class ForestSamplerCpp { } } } - + // Convert variable weights to std::vector std::vector var_weights_vector(variable_weights.size()); for (int i = 0; i < variable_weights.size(); i++) { var_weights_vector[i] = variable_weights.at(i); } + // Prepare the samplers + StochTree::LeafModelVariant leaf_model = StochTree::leafModelFactory(model_type, leaf_scale, 
leaf_scale_matrix); + // Run one iteration of the sampler StochTree::ForestContainer* forest_sample_ptr = forest_samples.GetContainer(); StochTree::ForestDataset* forest_data_ptr = dataset.GetDataset(); StochTree::ColumnVector* residual_data_ptr = residual.GetData(); + int num_basis = forest_data_ptr->NumBasis(); std::mt19937* rng_ptr = rng.GetRng(); if (gfr) { - InternalSampleGFR(*forest_sample_ptr, *forest_data_ptr, *residual_data_ptr, *rng_ptr, feature_types_, var_weights_vector, - leaf_model_enum, leaf_scale_matrix, global_variance, leaf_scale, cutpoint_grid_size, pre_initialized); + if (model_type == StochTree::ModelType::kConstantLeafGaussian) { + StochTree::GFRSampleOneIter(*(tracker_.get()), *forest_sample_ptr, std::get(leaf_model), *forest_data_ptr, *residual_data_ptr, *(split_prior_.get()), *rng_ptr, var_weights_vector, global_variance, feature_types_, cutpoint_grid_size, pre_initialized); + } else if (model_type == StochTree::ModelType::kUnivariateRegressionLeafGaussian) { + StochTree::GFRSampleOneIter(*(tracker_.get()), *forest_sample_ptr, std::get(leaf_model), *forest_data_ptr, *residual_data_ptr, *(split_prior_.get()), *rng_ptr, var_weights_vector, global_variance, feature_types_, cutpoint_grid_size, pre_initialized); + } else if (model_type == StochTree::ModelType::kMultivariateRegressionLeafGaussian) { + StochTree::GFRSampleOneIter(*(tracker_.get()), *forest_sample_ptr, std::get(leaf_model), *forest_data_ptr, *residual_data_ptr, *(split_prior_.get()), *rng_ptr, var_weights_vector, global_variance, feature_types_, cutpoint_grid_size, pre_initialized, num_basis); + } } else { - InternalSampleMCMC(*forest_sample_ptr, *forest_data_ptr, *residual_data_ptr, *rng_ptr, feature_types_, var_weights_vector, - leaf_model_enum, leaf_scale_matrix, global_variance, leaf_scale, cutpoint_grid_size, pre_initialized); + if (model_type == StochTree::ModelType::kConstantLeafGaussian) { + StochTree::MCMCSampleOneIter(*(tracker_.get()), *forest_sample_ptr, std::get(leaf_model), *forest_data_ptr, *residual_data_ptr, *(split_prior_.get()), *rng_ptr, var_weights_vector, global_variance, pre_initialized); + } else if (model_type == StochTree::ModelType::kUnivariateRegressionLeafGaussian) { + StochTree::MCMCSampleOneIter(*(tracker_.get()), *forest_sample_ptr, std::get(leaf_model), *forest_data_ptr, *residual_data_ptr, *(split_prior_.get()), *rng_ptr, var_weights_vector, global_variance, pre_initialized); + } else if (model_type == StochTree::ModelType::kMultivariateRegressionLeafGaussian) { + StochTree::MCMCSampleOneIter(*(tracker_.get()), *forest_sample_ptr, std::get(leaf_model), *forest_data_ptr, *residual_data_ptr, *(split_prior_.get()), *rng_ptr, var_weights_vector, global_variance, pre_initialized, num_basis); + } } } private: std::unique_ptr tracker_; std::unique_ptr split_prior_; - - void InternalSampleGFR(StochTree::ForestContainer& forest_samples, StochTree::ForestDataset& dataset, StochTree::ColumnVector& residual, std::mt19937& rng, - std::vector& feature_types, std::vector& var_weights_vector, ForestLeafModel leaf_model_enum, - Eigen::MatrixXd& leaf_scale_matrix, double global_variance, double leaf_scale, int cutpoint_grid_size, bool pre_initialized) { - if (leaf_model_enum == ForestLeafModel::kConstant) { - StochTree::GaussianConstantLeafModel leaf_model = StochTree::GaussianConstantLeafModel(leaf_scale); - StochTree::GFRSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, feature_types, 
cutpoint_grid_size, pre_initialized); - } else if (leaf_model_enum == ForestLeafModel::kUnivariateRegression) { - StochTree::GaussianUnivariateRegressionLeafModel leaf_model = StochTree::GaussianUnivariateRegressionLeafModel(leaf_scale); - StochTree::GFRSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, feature_types, cutpoint_grid_size, pre_initialized); - } else if (leaf_model_enum == ForestLeafModel::kMultivariateRegression) { - StochTree::GaussianMultivariateRegressionLeafModel leaf_model = StochTree::GaussianMultivariateRegressionLeafModel(leaf_scale_matrix); - StochTree::GFRSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, feature_types, cutpoint_grid_size, pre_initialized); - } - } - - void InternalSampleMCMC(StochTree::ForestContainer& forest_samples, StochTree::ForestDataset& dataset, StochTree::ColumnVector& residual, std::mt19937& rng, - std::vector& feature_types, std::vector& var_weights_vector, ForestLeafModel leaf_model_enum, - Eigen::MatrixXd& leaf_scale_matrix, double global_variance, double leaf_scale, int cutpoint_grid_size, bool pre_initialized) { - if (leaf_model_enum == ForestLeafModel::kConstant) { - StochTree::GaussianConstantLeafModel leaf_model = StochTree::GaussianConstantLeafModel(leaf_scale); - StochTree::MCMCSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, pre_initialized); - } else if (leaf_model_enum == ForestLeafModel::kUnivariateRegression) { - StochTree::GaussianUnivariateRegressionLeafModel leaf_model = StochTree::GaussianUnivariateRegressionLeafModel(leaf_scale); - StochTree::MCMCSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, pre_initialized); - } else if (leaf_model_enum == ForestLeafModel::kMultivariateRegression) { - StochTree::GaussianMultivariateRegressionLeafModel leaf_model = StochTree::GaussianMultivariateRegressionLeafModel(leaf_scale_matrix); - StochTree::MCMCSampleOneIter(*(tracker_.get()), forest_samples, leaf_model, dataset, residual, *(split_prior_.get()), rng, var_weights_vector, global_variance, pre_initialized); - } - } }; class GlobalVarianceModelCpp { From 64c19e8b0f4b012ee8ef02075fa0c23d4a603d37 Mon Sep 17 00:00:00 2001 From: Drew Herren Date: Tue, 27 Aug 2024 02:27:42 -0500 Subject: [PATCH 14/41] Added include --- include/stochtree/leaf_model.h | 1 + include/stochtree/tree_sampler.h | 1 + 2 files changed, 2 insertions(+) diff --git a/include/stochtree/leaf_model.h b/include/stochtree/leaf_model.h index f006566f..57ac1b69 100644 --- a/include/stochtree/leaf_model.h +++ b/include/stochtree/leaf_model.h @@ -17,6 +17,7 @@ #include #include +#include namespace StochTree { diff --git a/include/stochtree/tree_sampler.h b/include/stochtree/tree_sampler.h index b75b6b00..4aadb373 100644 --- a/include/stochtree/tree_sampler.h +++ b/include/stochtree/tree_sampler.h @@ -17,6 +17,7 @@ #include #include #include +#include #include namespace StochTree { From 06efbb5560b04f23cf4eadc3c03675de1eb5d9e1 Mon Sep 17 00:00:00 2001 From: Drew Herren Date: Tue, 27 Aug 2024 02:36:42 -0500 Subject: [PATCH 15/41] Updated unit tests --- test/cpp/test_model.cpp | 30 ++++++++++++++++++------------ 1 file changed, 18 insertions(+), 12 deletions(-) diff --git a/test/cpp/test_model.cpp 
b/test/cpp/test_model.cpp index 23e2e929..0e729bef 100644 --- a/test/cpp/test_model.cpp +++ b/test/cpp/test_model.cpp @@ -4,6 +4,7 @@ #include #include #include +#include #include #include #include @@ -49,9 +50,10 @@ TEST(LeafConstantModel, FullEnumeration) { StochTree::GaussianConstantLeafModel leaf_model = StochTree::GaussianConstantLeafModel(tau); // Evaluate all possible cutpoints - leaf_model.EvaluateAllPossibleSplits(dataset, tracker, residual, tree_prior, global_variance, 0, 0, log_cutpoint_evaluations, cutpoint_features, - cutpoint_values, cutpoint_feature_types, valid_cutpoint_count, cutpoint_grid_container, 0, n, variable_weights, - feature_types); + StochTree::EvaluateAllPossibleSplits( + dataset, tracker, residual, tree_prior, leaf_model, global_variance, 0, 0, log_cutpoint_evaluations, cutpoint_features, cutpoint_values, + cutpoint_feature_types, valid_cutpoint_count, cutpoint_grid_container, 0, n, variable_weights, feature_types + ); // Check that there are (n - 2*min_samples_leaf + 1)*p + 1 cutpoints considered ASSERT_EQ(log_cutpoint_evaluations.size(), (n - 2*min_samples_leaf + 1)*p + 1); @@ -107,9 +109,10 @@ TEST(LeafConstantModel, CutpointThinning) { StochTree::GaussianConstantLeafModel leaf_model = StochTree::GaussianConstantLeafModel(tau); // Evaluate all possible cutpoints - leaf_model.EvaluateAllPossibleSplits(dataset, tracker, residual, tree_prior, global_variance, 0, 0, log_cutpoint_evaluations, cutpoint_features, - cutpoint_values, cutpoint_feature_types, valid_cutpoint_count, cutpoint_grid_container, 0, n, variable_weights, - feature_types); + StochTree::EvaluateAllPossibleSplits( + dataset, tracker, residual, tree_prior, leaf_model, global_variance, 0, 0, log_cutpoint_evaluations, cutpoint_features, cutpoint_values, + cutpoint_feature_types, valid_cutpoint_count, cutpoint_grid_container, 0, n, variable_weights, feature_types + ); // Check that there are (n - 2*min_samples_leaf + 1)*p + 1 cutpoints considered ASSERT_EQ(log_cutpoint_evaluations.size(), (cutpoint_grid_size - 1)*p + 1); @@ -165,9 +168,10 @@ TEST(LeafUnivariateRegressionModel, FullEnumeration) { StochTree::GaussianUnivariateRegressionLeafModel leaf_model = StochTree::GaussianUnivariateRegressionLeafModel(tau); // Evaluate all possible cutpoints - leaf_model.EvaluateAllPossibleSplits(dataset, tracker, residual, tree_prior, global_variance, 0, 0, log_cutpoint_evaluations, cutpoint_features, - cutpoint_values, cutpoint_feature_types, valid_cutpoint_count, cutpoint_grid_container, 0, n, variable_weights, - feature_types); + StochTree::EvaluateAllPossibleSplits( + dataset, tracker, residual, tree_prior, leaf_model, global_variance, 0, 0, log_cutpoint_evaluations, cutpoint_features, cutpoint_values, + cutpoint_feature_types, valid_cutpoint_count, cutpoint_grid_container, 0, n, variable_weights, feature_types + ); // Check that there are (n - 2*min_samples_leaf + 1)*p + 1 cutpoints considered ASSERT_EQ(log_cutpoint_evaluations.size(), (n - 2*min_samples_leaf + 1)*p + 1); @@ -224,9 +228,11 @@ TEST(LeafUnivariateRegressionModel, CutpointThinning) { StochTree::GaussianUnivariateRegressionLeafModel leaf_model = StochTree::GaussianUnivariateRegressionLeafModel(tau); // Evaluate all possible cutpoints - leaf_model.EvaluateAllPossibleSplits(dataset, tracker, residual, tree_prior, global_variance, 0, 0, log_cutpoint_evaluations, cutpoint_features, - cutpoint_values, cutpoint_feature_types, valid_cutpoint_count, cutpoint_grid_container, 0, n, variable_weights, - feature_types); + StochTree::EvaluateAllPossibleSplits( 
+ dataset, tracker, residual, tree_prior, leaf_model, global_variance, 0, 0, log_cutpoint_evaluations, cutpoint_features, cutpoint_values, + cutpoint_feature_types, valid_cutpoint_count, cutpoint_grid_container, 0, n, variable_weights, feature_types + ); + // Check that there are (n - 2*min_samples_leaf + 1)*p + 1 cutpoints considered ASSERT_EQ(log_cutpoint_evaluations.size(), (cutpoint_grid_size - 1)*p + 1); From ad03adb3ab3dc2dc06f1e2f2a97dc9378d2de7cc Mon Sep 17 00:00:00 2001 From: Drew Herren Date: Sat, 31 Aug 2024 01:31:43 -0500 Subject: [PATCH 16/41] Initial setup for building and publishing C++ documentation --- .gitignore | 4 +- cpp_docs/Doxyfile | 2862 +++++++++++++++++++++++++++++++++++++ cpp_docs/Makefile | 20 + cpp_docs/README.md | 21 + cpp_docs/conf.py | 40 + cpp_docs/index.rst | 8 + cpp_docs/make.bat | 35 + cpp_docs/requirements.txt | 39 + python_docs/README.md | 2 +- 9 files changed, 3029 insertions(+), 2 deletions(-) create mode 100644 cpp_docs/Doxyfile create mode 100644 cpp_docs/Makefile create mode 100644 cpp_docs/README.md create mode 100644 cpp_docs/conf.py create mode 100644 cpp_docs/index.rst create mode 100644 cpp_docs/make.bat create mode 100644 cpp_docs/requirements.txt diff --git a/.gitignore b/.gitignore index 14f9b134..8d64c5b1 100644 --- a/.gitignore +++ b/.gitignore @@ -1,7 +1,6 @@ ## System and data files *.pdf *.csv -*.txt *.DS_Store lib/ build/ @@ -9,6 +8,9 @@ build/ xcode/ *.json .vs/ +cpp_docs/doxyoutput/html +cpp_docs/doxyoutput/xml +cpp_docs/doxyoutput/latex ## R gitignore diff --git a/cpp_docs/Doxyfile b/cpp_docs/Doxyfile new file mode 100644 index 00000000..2b178775 --- /dev/null +++ b/cpp_docs/Doxyfile @@ -0,0 +1,2862 @@ +# Doxyfile 1.12.0 + +# This file describes the settings to be used by the documentation system +# Doxygen (www.doxygen.org) for a project. +# +# All text after a double hash (##) is considered a comment and is placed in +# front of the TAG it is preceding. +# +# All text after a single hash (#) is considered a comment and will be ignored. +# The format is: +# TAG = value [value, ...] +# For lists, items can also be appended using: +# TAG += value [value, ...] +# Values that contain spaces should be placed between quotes (\" \"). +# +# Note: +# +# Use Doxygen to compare the used configuration file with the template +# configuration file: +# doxygen -x [configFile] +# Use Doxygen to compare the used configuration file with the template +# configuration file without replacing the environment variables or CMake type +# replacement variables: +# doxygen -x_noenv [configFile] + +#--------------------------------------------------------------------------- +# Project related configuration options +#--------------------------------------------------------------------------- + +# This tag specifies the encoding used for all characters in the configuration +# file that follow. The default is UTF-8 which is also the encoding used for all +# text before the first occurrence of this tag. Doxygen uses libiconv (or the +# iconv built into libc) for the transcoding. See +# https://www.gnu.org/software/libiconv/ for the list of possible encodings. +# The default value is: UTF-8. + +DOXYFILE_ENCODING = UTF-8 + +# The PROJECT_NAME tag is a single word (or a sequence of words surrounded by +# double-quotes, unless you are using Doxywizard) that should identify the +# project for which the documentation is generated. This name is used in the +# title of most generated pages and in a few other places. +# The default value is: My Project. 
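For reference, the tags in this Doxyfile operate on Doxygen comment blocks in the C++ headers. A minimal sketch of the comment style the generated site will extract (the function below is a hypothetical stand-in, not part of the stochtree API):

/*!
 * \brief Compute the log marginal likelihood of a proposed split.
 *
 * \param left_n Number of observations routed to the left child
 * \param right_n Number of observations routed to the right child
 * \return Log marginal likelihood of the proposed split
 */
double ExampleSplitLogMarginalLikelihood(int left_n, int right_n);

Tags such as BRIEF_MEMBER_DESC and REPEAT_BRIEF below control whether and where the \brief line of such a block is displayed.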
+
+PROJECT_NAME = "StochTree"
+
+# The PROJECT_NUMBER tag can be used to enter a project or revision number. This
+# could be handy for archiving the generated documentation or if some version
+# control system is used.
+
+PROJECT_NUMBER = 0.0.1
+
+# Using the PROJECT_BRIEF tag one can provide an optional one line description
+# for a project that appears at the top of each page and should give the viewer
+# a quick idea about the purpose of the project. Keep the description short.
+
+PROJECT_BRIEF =
+
+# With the PROJECT_LOGO tag one can specify a logo or an icon that is included
+# in the documentation. The maximum height of the logo should not exceed 55
+# pixels and the maximum width should not exceed 200 pixels. Doxygen will copy
+# the logo to the output directory.
+
+PROJECT_LOGO =
+
+# With the PROJECT_ICON tag one can specify an icon that is included in the tabs
+# when the HTML document is shown. Doxygen will copy the icon to the output
+# directory.
+
+PROJECT_ICON =
+
+# The OUTPUT_DIRECTORY tag is used to specify the (relative or absolute) path
+# into which the generated documentation will be written. If a relative path is
+# entered, it will be relative to the location where Doxygen was started. If
+# left blank the current directory will be used.
+
+OUTPUT_DIRECTORY = doxyoutput
+
+# If the CREATE_SUBDIRS tag is set to YES then Doxygen will create up to 4096
+# sub-directories (in 2 levels) under the output directory of each output format
+# and will distribute the generated files over these directories. Enabling this
+# option can be useful when feeding Doxygen a huge amount of source files, where
+# putting all generated files in the same directory would otherwise cause
+# performance problems for the file system. Adapt CREATE_SUBDIRS_LEVEL to
+# control the number of sub-directories.
+# The default value is: NO.
+
+CREATE_SUBDIRS = NO
+
+# Controls the number of sub-directories that will be created when
+# CREATE_SUBDIRS tag is set to YES. Level 0 represents 16 directories, and every
+# level increment doubles the number of directories, resulting in 4096
+# directories at level 8 which is the default and also the maximum value. The
+# sub-directories are organized in 2 levels, the first level always has a fixed
+# number of 16 directories.
+# Minimum value: 0, maximum value: 8, default value: 8.
+# This tag requires that the tag CREATE_SUBDIRS is set to YES.
+
+CREATE_SUBDIRS_LEVEL = 8
+
+# If the ALLOW_UNICODE_NAMES tag is set to YES, Doxygen will allow non-ASCII
+# characters to appear in the names of generated files. If set to NO, non-ASCII
+# characters will be escaped, for example _xE3_x81_x84 will be used for Unicode
+# U+3044.
+# The default value is: NO.
+
+ALLOW_UNICODE_NAMES = NO
+
+# The OUTPUT_LANGUAGE tag is used to specify the language in which all
+# documentation generated by Doxygen is written. Doxygen will use this
+# information to generate all constant output in the proper language.
+# Possible values are: Afrikaans, Arabic, Armenian, Brazilian, Bulgarian,
+# Catalan, Chinese, Chinese-Traditional, Croatian, Czech, Danish, Dutch, English
+# (United States), Esperanto, Farsi (Persian), Finnish, French, German, Greek,
+# Hindi, Hungarian, Indonesian, Italian, Japanese, Japanese-en (Japanese with
+# English messages), Korean, Korean-en (Korean with English messages), Latvian,
+# Lithuanian, Macedonian, Norwegian, Persian (Farsi), Polish, Portuguese,
+# Romanian, Russian, Serbian, Serbian-Cyrillic, Slovak, Slovene, Spanish,
+# Swedish, Turkish, Ukrainian and Vietnamese.
+# The default value is: English.
+
+OUTPUT_LANGUAGE = English
+
+# If the BRIEF_MEMBER_DESC tag is set to YES, Doxygen will include brief member
+# descriptions after the members that are listed in the file and class
+# documentation (similar to Javadoc). Set to NO to disable this.
+# The default value is: YES.
+
+BRIEF_MEMBER_DESC = YES
+
+# If the REPEAT_BRIEF tag is set to YES, Doxygen will prepend the brief
+# description of a member or function before the detailed description.
+#
+# Note: If both HIDE_UNDOC_MEMBERS and BRIEF_MEMBER_DESC are set to NO, the
+# brief descriptions will be completely suppressed.
+# The default value is: YES.
+
+REPEAT_BRIEF = YES
+
+# This tag implements a quasi-intelligent brief description abbreviator that is
+# used to form the text in various listings. Each string in this list, if found
+# as the leading text of the brief description, will be stripped from the text
+# and the result, after processing the whole list, is used as the annotated
+# text. Otherwise, the brief description is used as-is. If left blank, the
+# following values are used ($name is automatically replaced with the name of
+# the entity): The $name class, The $name widget, The $name file, is, provides,
+# specifies, contains, represents, a, an and the.
+
+ABBREVIATE_BRIEF = "The $name class" \
+                   "The $name widget" \
+                   "The $name file" \
+                   is \
+                   provides \
+                   specifies \
+                   contains \
+                   represents \
+                   a \
+                   an \
+                   the
+
+# If the ALWAYS_DETAILED_SEC and REPEAT_BRIEF tags are both set to YES then
+# Doxygen will generate a detailed section even if there is only a brief
+# description.
+# The default value is: NO.
+
+ALWAYS_DETAILED_SEC = NO
+
+# If the INLINE_INHERITED_MEMB tag is set to YES, Doxygen will show all
+# inherited members of a class in the documentation of that class as if those
+# members were ordinary class members. Constructors, destructors and assignment
+# operators of the base classes will not be shown.
+# The default value is: NO.
+
+INLINE_INHERITED_MEMB = NO
+
+# If the FULL_PATH_NAMES tag is set to YES, Doxygen will prepend the full path
+# before file names in the file list and in the header files. If set to NO the
+# shortest path that makes the file name unique will be used.
+# The default value is: YES.
+
+FULL_PATH_NAMES = YES
+
+# The STRIP_FROM_PATH tag can be used to strip a user-defined part of the path.
+# Stripping is only done if one of the specified strings matches the left-hand
+# part of the path. The tag can be used to show relative paths in the file list.
+# If left blank the directory from which Doxygen is run is used as the path to
+# strip.
+#
+# Note that you can specify absolute paths here, but also relative paths, which
+# will be relative from the directory where Doxygen is started.
+# This tag requires that the tag FULL_PATH_NAMES is set to YES.
+
+STRIP_FROM_PATH =
+
+# The STRIP_FROM_INC_PATH tag can be used to strip a user-defined part of the
+# path mentioned in the documentation of a class, which tells the reader which
+# header file to include in order to use a class. If left blank only the name of
+# the header file containing the class definition is used. Otherwise one should
+# specify the list of include paths that are normally passed to the compiler
+# using the -I flag.
+
+STRIP_FROM_INC_PATH =
+
+# If the SHORT_NAMES tag is set to YES, Doxygen will generate much shorter (but
+# less readable) file names. This can be useful if your file system doesn't
+# support long names like on DOS, Mac, or CD-ROM.
+# The default value is: NO.
+
+SHORT_NAMES = NO
+
+# If the JAVADOC_AUTOBRIEF tag is set to YES then Doxygen will interpret the
+# first line (until the first dot) of a Javadoc-style comment as the brief
+# description. If set to NO, the Javadoc-style will behave just like regular Qt-
+# style comments (thus requiring an explicit @brief command for a brief
+# description).
+# The default value is: NO.
+
+JAVADOC_AUTOBRIEF = NO
+
+# If the JAVADOC_BANNER tag is set to YES then Doxygen will interpret a line
+# such as
+# /***************
+# as being the beginning of a Javadoc-style comment "banner". If set to NO, the
+# Javadoc-style will behave just like regular comments and it will not be
+# interpreted by Doxygen.
+# The default value is: NO.
+
+JAVADOC_BANNER = NO
+
+# If the QT_AUTOBRIEF tag is set to YES then Doxygen will interpret the first
+# line (until the first dot) of a Qt-style comment as the brief description. If
+# set to NO, the Qt-style will behave just like regular Qt-style comments (thus
+# requiring an explicit \brief command for a brief description).
+# The default value is: NO.
+
+QT_AUTOBRIEF = NO
+
+# The MULTILINE_CPP_IS_BRIEF tag can be set to YES to make Doxygen treat a
+# multi-line C++ special comment block (i.e. a block of //! or /// comments) as
+# a brief description. This used to be the default behavior. The new default is
+# to treat a multi-line C++ comment block as a detailed description. Set this
+# tag to YES if you prefer the old behavior instead.
+#
+# Note that setting this tag to YES also means that Rational Rose comments are
+# not recognized any more.
+# The default value is: NO.
+
+MULTILINE_CPP_IS_BRIEF = NO
+
+# By default Python docstrings are displayed as preformatted text and Doxygen's
+# special commands cannot be used. By setting PYTHON_DOCSTRING to NO,
+# Doxygen's special commands can be used and the contents of the docstring
+# documentation blocks are shown as Doxygen documentation.
+# The default value is: YES.
+
+PYTHON_DOCSTRING = YES
+
+# If the INHERIT_DOCS tag is set to YES then an undocumented member inherits the
+# documentation from any documented member that it re-implements.
+# The default value is: YES.
+
+INHERIT_DOCS = YES
+
+# If the SEPARATE_MEMBER_PAGES tag is set to YES then Doxygen will produce a new
+# page for each member. If set to NO, the documentation of a member will be part
+# of the file/class/namespace that contains it.
+# The default value is: NO.
+
+SEPARATE_MEMBER_PAGES = NO
+
+# The TAB_SIZE tag can be used to set the number of spaces in a tab. Doxygen
+# uses this value to replace tabs by spaces in code fragments.
+# Minimum value: 1, maximum value: 16, default value: 4.
+
+TAB_SIZE = 4
+
+# This tag can be used to specify a number of aliases that act as commands in
+# the documentation. An alias has the form:
+# name=value
+# For example, adding
+# "sideeffect=@par Side Effects:^^"
+# will allow you to put the command \sideeffect (or @sideeffect) in the
+# documentation, which will result in a user-defined paragraph with heading
+# "Side Effects:". Note that you cannot put \n's in the value part of an alias
+# to insert newlines (in the resulting output). You can put ^^ in the value part
+# of an alias to insert a newline as if a physical newline was in the original
+# file. When you need a literal { or } or , in the value part of an alias you
+# have to escape them by means of a backslash (\); this can lead to conflicts
+# with the commands \{ and \}, for which it is advised to use the versions @{
+# and @} or a double escape (\\{ and \\}).
+
+ALIASES =
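To make the comment-style options above concrete, here is a short C++ documentation comment as Doxygen would treat it under this configuration. The function is purely illustrative, and the \sideeffect alias referenced is the hypothetical example from the ALIASES description above (this project leaves ALIASES empty):

/*!
 * \brief Compute the number of candidate cutpoints for a feature.
 *
 * Because JAVADOC_AUTOBRIEF = NO in this Doxyfile, this sentence is the brief
 * description only because it is explicitly tagged with \brief; it would not
 * be promoted automatically from the first line of the comment.
 *
 * If ALIASES contained "sideeffect=@par Side Effects:^^", writing \sideeffect
 * here would render a user-defined "Side Effects:" paragraph in the output.
 */
int NumCandidateCutpoints(int n, int min_samples_leaf);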
+
+# Set the OPTIMIZE_OUTPUT_FOR_C tag to YES if your project consists of C sources
+# only. Doxygen will then generate output that is more tailored for C. For
+# instance, some of the names that are used will be different. The list of all
+# members will be omitted, etc.
+# The default value is: NO.
+
+OPTIMIZE_OUTPUT_FOR_C = NO
+
+# Set the OPTIMIZE_OUTPUT_JAVA tag to YES if your project consists of Java or
+# Python sources only. Doxygen will then generate output that is more tailored
+# for that language. For instance, namespaces will be presented as packages,
+# qualified scopes will look different, etc.
+# The default value is: NO.
+
+OPTIMIZE_OUTPUT_JAVA = NO
+
+# Set the OPTIMIZE_FOR_FORTRAN tag to YES if your project consists of Fortran
+# sources. Doxygen will then generate output that is tailored for Fortran.
+# The default value is: NO.
+
+OPTIMIZE_FOR_FORTRAN = NO
+
+# Set the OPTIMIZE_OUTPUT_VHDL tag to YES if your project consists of VHDL
+# sources. Doxygen will then generate output that is tailored for VHDL.
+# The default value is: NO.
+
+OPTIMIZE_OUTPUT_VHDL = NO
+
+# Set the OPTIMIZE_OUTPUT_SLICE tag to YES if your project consists of Slice
+# sources only. Doxygen will then generate output that is more tailored for that
+# language. For instance, namespaces will be presented as modules, types will be
+# separated into more groups, etc.
+# The default value is: NO.
+
+OPTIMIZE_OUTPUT_SLICE = NO
+
+# Doxygen selects the parser to use depending on the extension of the files it
+# parses. With this tag you can assign which parser to use for a given
+# extension. Doxygen has a built-in mapping, but you can override or extend it
+# using this tag. The format is ext=language, where ext is a file extension, and
+# language is one of the parsers supported by Doxygen: IDL, Java, JavaScript,
+# Csharp (C#), C, C++, Lex, D, PHP, md (Markdown), Objective-C, Python, Slice,
+# VHDL, Fortran (fixed format Fortran: FortranFixed, free formatted Fortran:
+# FortranFree, unknown formatted Fortran: Fortran. In the latter case the parser
+# tries to guess whether the code is fixed or free formatted code, this is the
+# default for Fortran type files). For instance, to make Doxygen treat .inc files
+# as Fortran files (default is PHP), and .f files as C (default is Fortran),
+# use: inc=Fortran f=C.
+#
+# Note: For files without extension you can use no_extension as a placeholder.
+#
+# Note that for custom extensions you also need to set FILE_PATTERNS otherwise
+# the files are not read by Doxygen. When specifying no_extension you should add
+# * to the FILE_PATTERNS.
+#
+# Note: see also the list of default file extension mappings.
+
+EXTENSION_MAPPING =
+
+# If the MARKDOWN_SUPPORT tag is enabled then Doxygen pre-processes all comments
+# according to the Markdown format, which allows for more readable
+# documentation. See https://daringfireball.net/projects/markdown/ for details.
+# The output of markdown processing is further processed by Doxygen, so you can
+# mix Doxygen, HTML, and XML commands with Markdown formatting. Disable only in
+# case of backward compatibility issues.
+# The default value is: YES.
+
+MARKDOWN_SUPPORT = YES
+
+# When the TOC_INCLUDE_HEADINGS tag is set to a non-zero value, all headings up
+# to that level are automatically included in the table of contents, even if
+# they do not have an id attribute.
+# Note: This feature currently applies only to Markdown headings.
+# Minimum value: 0, maximum value: 99, default value: 6.
+# This tag requires that the tag MARKDOWN_SUPPORT is set to YES.
+
+TOC_INCLUDE_HEADINGS = 6
+
+# The MARKDOWN_ID_STYLE tag can be used to specify the algorithm used to
+# generate identifiers for the Markdown headings. Note: Every identifier is
+# unique.
+# Possible values are: DOXYGEN use a fixed 'autotoc_md' string followed by a
+# sequence number starting at 0 and GITHUB use the lower case version of title
+# with any whitespace replaced by '-' and punctuation characters removed.
+# The default value is: DOXYGEN.
+# This tag requires that the tag MARKDOWN_SUPPORT is set to YES.
+
+MARKDOWN_ID_STYLE = DOXYGEN
+
+# When enabled Doxygen tries to link words that correspond to documented
+# classes, or namespaces to their corresponding documentation. Such a link can
+# be prevented in individual cases by putting a % sign in front of the word or
+# globally by setting AUTOLINK_SUPPORT to NO.
+# The default value is: YES.
+
+AUTOLINK_SUPPORT = YES
+
+# If you use STL classes (i.e. std::string, std::vector, etc.) but do not want
+# to include (a tag file for) the STL sources as input, then you should set this
+# tag to YES in order to let Doxygen match function declarations and
+# definitions whose arguments contain STL classes (e.g. func(std::string);
+# versus func(std::string) {}). This also makes the inheritance and
+# collaboration diagrams that involve STL classes more complete and accurate.
+# The default value is: NO.
+
+BUILTIN_STL_SUPPORT = NO
+
+# If you use Microsoft's C++/CLI language, you should set this option to YES to
+# enable parsing support.
+# The default value is: NO.
+
+CPP_CLI_SUPPORT = NO
+
+# Set the SIP_SUPPORT tag to YES if your project consists of sip (see:
+# https://www.riverbankcomputing.com/software) sources only. Doxygen will parse
+# them like normal C++ but will assume all classes use public instead of private
+# inheritance when no explicit protection keyword is present.
+# The default value is: NO.
+
+SIP_SUPPORT = NO
+
+# For Microsoft's IDL there are propget and propput attributes to indicate
+# getter and setter methods for a property. Setting this option to YES will make
+# Doxygen replace the get and set methods by a property in the documentation.
+# This will only work if the methods are indeed getting or setting a simple
+# type. If this is not the case, or you want to show the methods anyway, you
+# should set this option to NO.
+# The default value is: YES.
+
+IDL_PROPERTY_SUPPORT = YES
+
+# If member grouping is used in the documentation and the DISTRIBUTE_GROUP_DOC
+# tag is set to YES then Doxygen will reuse the documentation of the first
+# member in the group (if any) for the other members of the group. By default
+# all members of a group must be documented explicitly.
+# The default value is: NO.
+
+DISTRIBUTE_GROUP_DOC = NO
+
+# If one adds a struct or class to a group and this option is enabled, then also
+# any nested class or struct is added to the same group. By default this option
+# is disabled and one has to add nested compounds explicitly via \ingroup.
+# The default value is: NO.
+
+GROUP_NESTED_COMPOUNDS = NO
+
+# Set the SUBGROUPING tag to YES to allow class member groups of the same type
+# (for instance a group of public functions) to be put as a subgroup of that
+# type (e.g. under the Public Functions section). Set it to NO to prevent
+# subgrouping. Alternatively, this can be done per class using the
+# \nosubgrouping command.
+# The default value is: YES.
+
+SUBGROUPING = YES
+
+# When the INLINE_GROUPED_CLASSES tag is set to YES, classes, structs and unions
+# are shown inside the group in which they are included (e.g. using \ingroup)
+# instead of on a separate page (for HTML and Man pages) or section (for LaTeX
+# and RTF).
+#
+# Note that this feature does not work in combination with
+# SEPARATE_MEMBER_PAGES.
+# The default value is: NO.
+
+INLINE_GROUPED_CLASSES = NO
+
+# When the INLINE_SIMPLE_STRUCTS tag is set to YES, structs, classes, and unions
+# with only public data fields or simple typedef fields will be shown inline in
+# the documentation of the scope in which they are defined (i.e. file,
+# namespace, or group documentation), provided this scope is documented. If set
+# to NO, structs, classes, and unions are shown on a separate page (for HTML and
+# Man pages) or section (for LaTeX and RTF).
+# The default value is: NO.
+
+INLINE_SIMPLE_STRUCTS = NO
+
+# When TYPEDEF_HIDES_STRUCT tag is enabled, a typedef of a struct, union, or
+# enum is documented as struct, union, or enum with the name of the typedef. So
+# typedef struct TypeS {} TypeT, will appear in the documentation as a struct
+# with name TypeT. When disabled the typedef will appear as a member of a file,
+# namespace, or class. And the struct will be named TypeS. This can typically be
+# useful for C code in case the coding convention dictates that all compound
+# types are typedef'ed and only the typedef is referenced, never the tag name.
+# The default value is: NO.
+
+TYPEDEF_HIDES_STRUCT = NO
+
+# The size of the symbol lookup cache can be set using LOOKUP_CACHE_SIZE. This
+# cache is used to resolve symbols given their name and scope. Since this can be
+# an expensive process and often the same symbol appears multiple times in the
+# code, Doxygen keeps a cache of pre-resolved symbols. If the cache is too small
+# Doxygen will become slower. If the cache is too large, memory is wasted. The
+# cache size is given by this formula: 2^(16+LOOKUP_CACHE_SIZE). The valid range
+# is 0..9, the default is 0, corresponding to a cache size of 2^16=65536
+# symbols. At the end of a run Doxygen will report the cache usage and suggest
+# the optimal cache size from a speed point of view.
+# Minimum value: 0, maximum value: 9, default value: 0.
+
+LOOKUP_CACHE_SIZE = 0
+
+# The NUM_PROC_THREADS specifies the number of threads Doxygen is allowed to use
+# during processing. When set to 0 Doxygen will base this on the number of
+# cores available in the system. You can set it explicitly to a value larger
+# than 0 to get more control over the balance between CPU load and processing
+# speed. At this moment only the input processing can be done using multiple
+# threads.
Since this is still an experimental feature the default is set to 1, +# which effectively disables parallel processing. Please report any issues you +# encounter. Generating dot graphs in parallel is controlled by the +# DOT_NUM_THREADS setting. +# Minimum value: 0, maximum value: 32, default value: 1. + +NUM_PROC_THREADS = 1 + +# If the TIMESTAMP tag is set different from NO then each generated page will +# contain the date or date and time when the page was generated. Setting this to +# NO can help when comparing the output of multiple runs. +# Possible values are: YES, NO, DATETIME and DATE. +# The default value is: NO. + +TIMESTAMP = NO + +#--------------------------------------------------------------------------- +# Build related configuration options +#--------------------------------------------------------------------------- + +# If the EXTRACT_ALL tag is set to YES, Doxygen will assume all entities in +# documentation are documented, even if no documentation was available. Private +# class members and static file members will be hidden unless the +# EXTRACT_PRIVATE respectively EXTRACT_STATIC tags are set to YES. +# Note: This will also disable the warnings about undocumented members that are +# normally produced when WARNINGS is set to YES. +# The default value is: NO. + +EXTRACT_ALL = NO + +# If the EXTRACT_PRIVATE tag is set to YES, all private members of a class will +# be included in the documentation. +# The default value is: NO. + +EXTRACT_PRIVATE = NO + +# If the EXTRACT_PRIV_VIRTUAL tag is set to YES, documented private virtual +# methods of a class will be included in the documentation. +# The default value is: NO. + +EXTRACT_PRIV_VIRTUAL = NO + +# If the EXTRACT_PACKAGE tag is set to YES, all members with package or internal +# scope will be included in the documentation. +# The default value is: NO. + +EXTRACT_PACKAGE = NO + +# If the EXTRACT_STATIC tag is set to YES, all static members of a file will be +# included in the documentation. +# The default value is: NO. + +EXTRACT_STATIC = NO + +# If the EXTRACT_LOCAL_CLASSES tag is set to YES, classes (and structs) defined +# locally in source files will be included in the documentation. If set to NO, +# only classes defined in header files are included. Does not have any effect +# for Java sources. +# The default value is: YES. + +EXTRACT_LOCAL_CLASSES = YES + +# This flag is only useful for Objective-C code. If set to YES, local methods, +# which are defined in the implementation section but not in the interface are +# included in the documentation. If set to NO, only methods in the interface are +# included. +# The default value is: NO. + +EXTRACT_LOCAL_METHODS = NO + +# If this flag is set to YES, the members of anonymous namespaces will be +# extracted and appear in the documentation as a namespace called +# 'anonymous_namespace{file}', where file will be replaced with the base name of +# the file that contains the anonymous namespace. By default anonymous namespace +# are hidden. +# The default value is: NO. + +EXTRACT_ANON_NSPACES = NO + +# If this flag is set to YES, the name of an unnamed parameter in a declaration +# will be determined by the corresponding definition. By default unnamed +# parameters remain unnamed in the output. +# The default value is: YES. + +RESOLVE_UNNAMED_PARAMS = YES + +# If the HIDE_UNDOC_MEMBERS tag is set to YES, Doxygen will hide all +# undocumented members inside documented classes or files. 
If set to NO these +# members will be included in the various overviews, but no documentation +# section is generated. This option has no effect if EXTRACT_ALL is enabled. +# The default value is: NO. + +HIDE_UNDOC_MEMBERS = NO + +# If the HIDE_UNDOC_CLASSES tag is set to YES, Doxygen will hide all +# undocumented classes that are normally visible in the class hierarchy. If set +# to NO, these classes will be included in the various overviews. This option +# will also hide undocumented C++ concepts if enabled. This option has no effect +# if EXTRACT_ALL is enabled. +# The default value is: NO. + +HIDE_UNDOC_CLASSES = NO + +# If the HIDE_FRIEND_COMPOUNDS tag is set to YES, Doxygen will hide all friend +# declarations. If set to NO, these declarations will be included in the +# documentation. +# The default value is: NO. + +HIDE_FRIEND_COMPOUNDS = NO + +# If the HIDE_IN_BODY_DOCS tag is set to YES, Doxygen will hide any +# documentation blocks found inside the body of a function. If set to NO, these +# blocks will be appended to the function's detailed documentation block. +# The default value is: NO. + +HIDE_IN_BODY_DOCS = NO + +# The INTERNAL_DOCS tag determines if documentation that is typed after a +# \internal command is included. If the tag is set to NO then the documentation +# will be excluded. Set it to YES to include the internal documentation. +# The default value is: NO. + +INTERNAL_DOCS = NO + +# With the correct setting of option CASE_SENSE_NAMES Doxygen will better be +# able to match the capabilities of the underlying filesystem. In case the +# filesystem is case sensitive (i.e. it supports files in the same directory +# whose names only differ in casing), the option must be set to YES to properly +# deal with such files in case they appear in the input. For filesystems that +# are not case sensitive the option should be set to NO to properly deal with +# output files written for symbols that only differ in casing, such as for two +# classes, one named CLASS and the other named Class, and to also support +# references to files without having to specify the exact matching casing. On +# Windows (including Cygwin) and macOS, users should typically set this option +# to NO, whereas on Linux or other Unix flavors it should typically be set to +# YES. +# Possible values are: SYSTEM, NO and YES. +# The default value is: SYSTEM. + +CASE_SENSE_NAMES = SYSTEM + +# If the HIDE_SCOPE_NAMES tag is set to NO then Doxygen will show members with +# their full class and namespace scopes in the documentation. If set to YES, the +# scope will be hidden. +# The default value is: NO. + +HIDE_SCOPE_NAMES = NO + +# If the HIDE_COMPOUND_REFERENCE tag is set to NO (default) then Doxygen will +# append additional text to a page's title, such as Class Reference. If set to +# YES the compound reference will be hidden. +# The default value is: NO. + +HIDE_COMPOUND_REFERENCE= NO + +# If the SHOW_HEADERFILE tag is set to YES then the documentation for a class +# will show which file needs to be included to use the class. +# The default value is: YES. + +SHOW_HEADERFILE = YES + +# If the SHOW_INCLUDE_FILES tag is set to YES then Doxygen will put a list of +# the files that are included by a file in the documentation of that file. +# The default value is: YES. + +SHOW_INCLUDE_FILES = YES + +# If the SHOW_GROUPED_MEMB_INC tag is set to YES then Doxygen will add for each +# grouped member an include statement to the documentation, telling the reader +# which file to include in order to use the member. 
+# The default value is: NO.
+
+SHOW_GROUPED_MEMB_INC = NO
+
+# If the FORCE_LOCAL_INCLUDES tag is set to YES then Doxygen will list include
+# files with double quotes in the documentation rather than with sharp brackets.
+# The default value is: NO.
+
+FORCE_LOCAL_INCLUDES = NO
+
+# If the INLINE_INFO tag is set to YES then a tag [inline] is inserted in the
+# documentation for inline members.
+# The default value is: YES.
+
+INLINE_INFO = YES
+
+# If the SORT_MEMBER_DOCS tag is set to YES then Doxygen will sort the
+# (detailed) documentation of file and class members alphabetically by member
+# name. If set to NO, the members will appear in declaration order.
+# The default value is: YES.
+
+SORT_MEMBER_DOCS = YES
+
+# If the SORT_BRIEF_DOCS tag is set to YES then Doxygen will sort the brief
+# descriptions of file, namespace and class members alphabetically by member
+# name. If set to NO, the members will appear in declaration order. Note that
+# this will also influence the order of the classes in the class list.
+# The default value is: NO.
+
+SORT_BRIEF_DOCS = NO
+
+# If the SORT_MEMBERS_CTORS_1ST tag is set to YES then Doxygen will sort the
+# (brief and detailed) documentation of class members so that constructors and
+# destructors are listed first. If set to NO the constructors will appear in the
+# respective orders defined by SORT_BRIEF_DOCS and SORT_MEMBER_DOCS.
+# Note: If SORT_BRIEF_DOCS is set to NO this option is ignored for sorting brief
+# member documentation.
+# Note: If SORT_MEMBER_DOCS is set to NO this option is ignored for sorting
+# detailed member documentation.
+# The default value is: NO.
+
+SORT_MEMBERS_CTORS_1ST = NO
+
+# If the SORT_GROUP_NAMES tag is set to YES then Doxygen will sort the hierarchy
+# of group names into alphabetical order. If set to NO the group names will
+# appear in their defined order.
+# The default value is: NO.
+
+SORT_GROUP_NAMES = NO
+
+# If the SORT_BY_SCOPE_NAME tag is set to YES, the class list will be sorted by
+# fully-qualified names, including namespaces. If set to NO, the class list will
+# be sorted only by class name, not including the namespace part.
+# Note: This option is not very useful if HIDE_SCOPE_NAMES is set to YES.
+# Note: This option applies only to the class list, not to the alphabetical
+# list.
+# The default value is: NO.
+
+SORT_BY_SCOPE_NAME = NO
+
+# If the STRICT_PROTO_MATCHING option is enabled and Doxygen fails to do proper
+# type resolution of all parameters of a function it will reject a match between
+# the prototype and the implementation of a member function even if there is
+# only one candidate or it is obvious which candidate to choose by doing a
+# simple string match. By disabling STRICT_PROTO_MATCHING Doxygen will still
+# accept a match between prototype and implementation in such cases.
+# The default value is: NO.
+
+STRICT_PROTO_MATCHING = NO
+
+# The GENERATE_TODOLIST tag can be used to enable (YES) or disable (NO) the todo
+# list. This list is created by putting \todo commands in the documentation.
+# The default value is: YES.
+
+GENERATE_TODOLIST = YES
+
+# The GENERATE_TESTLIST tag can be used to enable (YES) or disable (NO) the test
+# list. This list is created by putting \test commands in the documentation.
+# The default value is: YES.
+
+GENERATE_TESTLIST = YES
+
+# The GENERATE_BUGLIST tag can be used to enable (YES) or disable (NO) the bug
+# list. This list is created by putting \bug commands in the documentation.
+# The default value is: YES.
+
+GENERATE_BUGLIST = YES
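The todo/test/bug lists enabled above are populated from special commands placed in documentation comments. A brief illustrative C++ snippet (the function and its annotations are hypothetical, not from StochTree):

/*!
 * \brief Sample a split rule for the given tree node.
 * \todo Support categorical cutpoints in the thinned grid.   (collected into the Todo list)
 * \test Covered by LeafConstantModel.CutpointThinning in test_model.cpp.
 * \bug Ties in feature values are currently broken arbitrarily.
 */
void SampleSplitRule(int node_id);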
+
+# The GENERATE_DEPRECATEDLIST tag can be used to enable (YES) or disable (NO)
+# the deprecated list. This list is created by putting \deprecated commands in
+# the documentation.
+# The default value is: YES.
+
+GENERATE_DEPRECATEDLIST= YES
+
+# The ENABLED_SECTIONS tag can be used to enable conditional documentation
+# sections, marked by \if <section_label> ... \endif and \cond <section_label>
+# ... \endcond blocks.
+
+ENABLED_SECTIONS =
+
+# The MAX_INITIALIZER_LINES tag determines the maximum number of lines that the
+# initial value of a variable or macro / define can have for it to appear in the
+# documentation. If the initializer consists of more lines than specified here
+# it will be hidden. Use a value of 0 to hide initializers completely. The
+# appearance of the value of individual variables and macros / defines can be
+# controlled using \showinitializer or \hideinitializer command in the
+# documentation regardless of this setting.
+# Minimum value: 0, maximum value: 10000, default value: 30.
+
+MAX_INITIALIZER_LINES = 30
+
+# Set the SHOW_USED_FILES tag to NO to disable the list of files generated at
+# the bottom of the documentation of classes and structs. If set to YES, the
+# list will mention the files that were used to generate the documentation.
+# The default value is: YES.
+
+SHOW_USED_FILES = YES
+
+# Set the SHOW_FILES tag to NO to disable the generation of the Files page. This
+# will remove the Files entry from the Quick Index and from the Folder Tree View
+# (if specified).
+# The default value is: YES.
+
+SHOW_FILES = YES
+
+# Set the SHOW_NAMESPACES tag to NO to disable the generation of the Namespaces
+# page. This will remove the Namespaces entry from the Quick Index and from the
+# Folder Tree View (if specified).
+# The default value is: YES.
+
+SHOW_NAMESPACES = YES
+
+# The FILE_VERSION_FILTER tag can be used to specify a program or script that
+# Doxygen should invoke to get the current version for each file (typically from
+# the version control system). Doxygen will invoke the program by executing (via
+# popen()) the command <command> <input-file>, where <command> is the value of
+# the FILE_VERSION_FILTER tag, and <input-file> is the name of an input file
+# provided by Doxygen. Whatever the program writes to standard output is used as
+# the file version. For an example see the documentation.
+
+FILE_VERSION_FILTER =
+
+# The LAYOUT_FILE tag can be used to specify a layout file which will be parsed
+# by Doxygen. The layout file controls the global structure of the generated
+# output files in an output format independent way. To create the layout file
+# that represents Doxygen's defaults, run Doxygen with the -l option. You can
+# optionally specify a file name after the option, if omitted DoxygenLayout.xml
+# will be used as the name of the layout file. See also section "Changing the
+# layout of pages" for information.
+#
+# Note that if you run Doxygen from a directory containing a file called
+# DoxygenLayout.xml, Doxygen will parse it automatically even if the LAYOUT_FILE
+# tag is left empty.
+
+LAYOUT_FILE =
+
+# The CITE_BIB_FILES tag can be used to specify one or more bib files containing
+# the reference definitions. This must be a list of .bib files. The .bib
+# extension is automatically appended if omitted. This requires the bibtex tool
+# to be installed. See also https://en.wikipedia.org/wiki/BibTeX for more info.
+# For LaTeX the style of the bibliography can be controlled using
+# LATEX_BIB_STYLE.
To use this feature you need bibtex and perl available in the +# search path. See also \cite for info how to create references. + +CITE_BIB_FILES = + +# The EXTERNAL_TOOL_PATH tag can be used to extend the search path (PATH +# environment variable) so that external tools such as latex and gs can be +# found. +# Note: Directories specified with EXTERNAL_TOOL_PATH are added in front of the +# path already specified by the PATH variable, and are added in the order +# specified. +# Note: This option is particularly useful for macOS version 14 (Sonoma) and +# higher, when running Doxygen from Doxywizard, because in this case any user- +# defined changes to the PATH are ignored. A typical example on macOS is to set +# EXTERNAL_TOOL_PATH = /Library/TeX/texbin /usr/local/bin +# together with the standard path, the full search path used by doxygen when +# launching external tools will then become +# PATH=/Library/TeX/texbin:/usr/local/bin:/usr/bin:/bin:/usr/sbin:/sbin + +EXTERNAL_TOOL_PATH = + +#--------------------------------------------------------------------------- +# Configuration options related to warning and progress messages +#--------------------------------------------------------------------------- + +# The QUIET tag can be used to turn on/off the messages that are generated to +# standard output by Doxygen. If QUIET is set to YES this implies that the +# messages are off. +# The default value is: NO. + +QUIET = NO + +# The WARNINGS tag can be used to turn on/off the warning messages that are +# generated to standard error (stderr) by Doxygen. If WARNINGS is set to YES +# this implies that the warnings are on. +# +# Tip: Turn warnings on while writing the documentation. +# The default value is: YES. + +WARNINGS = YES + +# If the WARN_IF_UNDOCUMENTED tag is set to YES then Doxygen will generate +# warnings for undocumented members. If EXTRACT_ALL is set to YES then this flag +# will automatically be disabled. +# The default value is: YES. + +WARN_IF_UNDOCUMENTED = YES + +# If the WARN_IF_DOC_ERROR tag is set to YES, Doxygen will generate warnings for +# potential errors in the documentation, such as documenting some parameters in +# a documented function twice, or documenting parameters that don't exist or +# using markup commands wrongly. +# The default value is: YES. + +WARN_IF_DOC_ERROR = YES + +# If WARN_IF_INCOMPLETE_DOC is set to YES, Doxygen will warn about incomplete +# function parameter documentation. If set to NO, Doxygen will accept that some +# parameters have no documentation without warning. +# The default value is: YES. + +WARN_IF_INCOMPLETE_DOC = YES + +# This WARN_NO_PARAMDOC option can be enabled to get warnings for functions that +# are documented, but have no documentation for their parameters or return +# value. If set to NO, Doxygen will only warn about wrong parameter +# documentation, but not about the absence of documentation. If EXTRACT_ALL is +# set to YES then this flag will automatically be disabled. See also +# WARN_IF_INCOMPLETE_DOC +# The default value is: NO. + +WARN_NO_PARAMDOC = NO + +# If WARN_IF_UNDOC_ENUM_VAL option is set to YES, Doxygen will warn about +# undocumented enumeration values. If set to NO, Doxygen will accept +# undocumented enumeration values. If EXTRACT_ALL is set to YES then this flag +# will automatically be disabled. +# The default value is: NO. + +WARN_IF_UNDOC_ENUM_VAL = NO + +# If the WARN_AS_ERROR tag is set to YES then Doxygen will immediately stop when +# a warning is encountered. 
If the WARN_AS_ERROR tag is set to FAIL_ON_WARNINGS
+# then Doxygen will continue running as if the WARN_AS_ERROR tag is set to NO, but
+# at the end of the Doxygen process Doxygen will return with a non-zero status.
+# If the WARN_AS_ERROR tag is set to FAIL_ON_WARNINGS_PRINT then Doxygen behaves
+# like FAIL_ON_WARNINGS, but in case no WARN_LOGFILE is defined Doxygen will not
+# write the warning messages in between other messages but write them at the end
+# of a run; in case a WARN_LOGFILE is defined, the warning messages will, besides
+# being written to the defined file, also be shown at the end of a run, unless
+# the WARN_LOGFILE is defined as - (i.e. standard output (stdout)), in which case
+# the behavior will remain as with the setting FAIL_ON_WARNINGS.
+# Possible values are: NO, YES, FAIL_ON_WARNINGS and FAIL_ON_WARNINGS_PRINT.
+# The default value is: NO.
+
+WARN_AS_ERROR = NO
+
+# The WARN_FORMAT tag determines the format of the warning messages that Doxygen
+# can produce. The string should contain the $file, $line, and $text tags, which
+# will be replaced by the file and line number from which the warning originated
+# and the warning text. Optionally the format may contain $version, which will
+# be replaced by the version of the file (if it could be obtained via
+# FILE_VERSION_FILTER).
+# See also: WARN_LINE_FORMAT
+# The default value is: $file:$line: $text.
+
+WARN_FORMAT = "$file:$line: $text"
+
+# In the $text part of the WARN_FORMAT command it is possible that a reference
+# to a more specific place is given. To make it easier to jump to this place
+# (outside of Doxygen) the user can define a custom "cut" / "paste" string.
+# Example:
+# WARN_LINE_FORMAT = "'vi $file +$line'"
+# See also: WARN_FORMAT
+# The default value is: at line $line of file $file.
+
+WARN_LINE_FORMAT = "at line $line of file $file"
+
+# The WARN_LOGFILE tag can be used to specify a file to which warning and error
+# messages should be written. If left blank the output is written to standard
+# error (stderr). In case the file specified cannot be opened for writing the
+# warning and error messages are written to standard error. When - is specified
+# as the file, the warning and error messages are written to standard output
+# (stdout).
+
+WARN_LOGFILE =
+
+#---------------------------------------------------------------------------
+# Configuration options related to the input files
+#---------------------------------------------------------------------------
+
+# The INPUT tag is used to specify the files and/or directories that contain
+# documented source files. You may enter file names like myfile.cpp or
+# directories like /usr/src/myproject. Separate the files or directories with
+# spaces. See also FILE_PATTERNS and EXTENSION_MAPPING.
+# Note: If this tag is empty the current directory is searched.
+
+INPUT = ../
+
+# This tag can be used to specify the character encoding of the source files
+# that Doxygen parses. Internally Doxygen uses the UTF-8 encoding. Doxygen uses
+# libiconv (or the iconv built into libc) for the transcoding. See the libiconv
+# documentation (see:
+# https://www.gnu.org/software/libiconv/) for the list of possible encodings.
+# See also: INPUT_FILE_ENCODING
+# The default value is: UTF-8.
+
+INPUT_ENCODING = UTF-8
+
+# This tag can be used to specify the character encoding of the source files
+# that Doxygen parses. The INPUT_FILE_ENCODING tag can be used to specify
+# character encoding on a per file pattern basis.
Doxygen will compare the file
+# name with each pattern and apply the encoding (instead of the default
+# INPUT_ENCODING) if there is a match. The character encodings are a list of the
+# form: pattern=encoding (like *.php=ISO-8859-1).
+# See also: INPUT_ENCODING for further information on supported encodings.
+
+INPUT_FILE_ENCODING =
+
+# If the value of the INPUT tag contains directories, you can use the
+# FILE_PATTERNS tag to specify one or more wildcard patterns (like *.cpp and
+# *.h) to filter out the source-files in the directories.
+#
+# Note that for custom extensions or not directly supported extensions you also
+# need to set EXTENSION_MAPPING for the extension otherwise the files are not
+# read by Doxygen.
+#
+# Note the list of default checked file patterns might differ from the list of
+# default file extension mappings.
+#
+# If left blank the following patterns are tested: *.c, *.cc, *.cxx, *.cxxm,
+# *.cpp, *.cppm, *.ccm, *.c++, *.c++m, *.java, *.ii, *.ixx, *.ipp, *.i++, *.inl,
+# *.idl, *.ddl, *.odl, *.h, *.hh, *.hxx, *.hpp, *.h++, *.ixx, *.l, *.cs, *.d,
+# *.php, *.php4, *.php5, *.phtml, *.inc, *.m, *.markdown, *.md, *.mm, *.dox (to
+# be provided as Doxygen C comment), *.py, *.pyw, *.f90, *.f95, *.f03, *.f08,
+# *.f18, *.f, *.for, *.vhd, *.vhdl, *.ucf, *.qsf and *.ice.
+
+FILE_PATTERNS = *.c \
+                *.cc \
+                *.cxx \
+                *.cxxm \
+                *.cpp \
+                *.cppm \
+                *.ccm \
+                *.c++ \
+                *.c++m \
+                *.h \
+                *.hh \
+                *.hxx \
+                *.hpp \
+                *.h++
+
+# The RECURSIVE tag can be used to specify whether or not subdirectories should
+# be searched for input files as well.
+# The default value is: NO.
+
+RECURSIVE = YES
+
+# The EXCLUDE tag can be used to specify files and/or directories that should be
+# excluded from the INPUT source files. This way you can easily exclude a
+# subdirectory from a directory tree whose root is specified with the INPUT tag.
+#
+# Note that relative paths are relative to the directory from which Doxygen is
+# run.
+
+EXCLUDE = ../src/cpp11.cpp \
+          ../src/py_stochtree.cpp \
+          ../src/R_data.cpp \
+          ../src/R_random_effects.cpp \
+          ../src/sampler.cpp \
+          ../src/serialization.cpp \
+          ../src/stochtree_types.h
+
+# The EXCLUDE_SYMLINKS tag can be used to select whether or not files or
+# directories that are symbolic links (a Unix file system feature) are excluded
+# from the input.
+# The default value is: NO.
+
+EXCLUDE_SYMLINKS = NO
+
+# If the value of the INPUT tag contains directories, you can use the
+# EXCLUDE_PATTERNS tag to specify one or more wildcard patterns to exclude
+# certain files from those directories.
+#
+# Note that the wildcards are matched against the file with absolute path, so to
+# exclude all test directories for example use the pattern */test/*
+
+EXCLUDE_PATTERNS = */test/* \
+                   */tools/* \
+                   */vignettes/* \
+                   */R/* \
+                   */nlohmann/* \
+                   */debug/* \
+                   */demo/* \
+                   */deps/* \
+                   */venv/* \
+                   */xcode/*
+
+# The EXCLUDE_SYMBOLS tag can be used to specify one or more symbol names
+# (namespaces, classes, functions, etc.) that should be excluded from the
+# output. The symbol name can be a fully qualified name, a word, or if the
+# wildcard * is used, a substring. Examples: ANamespace, AClass,
+# ANamespace::AClass, ANamespace::*Test
+
+EXCLUDE_SYMBOLS =
+
+# The EXAMPLE_PATH tag can be used to specify one or more files or directories
+# that contain example code fragments that are included (see the \include
+# command).
+
+EXAMPLE_PATH =
+
+# If the value of the EXAMPLE_PATH tag contains directories, you can use the
+# EXAMPLE_PATTERNS tag to specify one or more wildcard pattern (like *.cpp and
+# *.h) to filter out the source-files in the directories. If left blank all
+# files are included.
+
+EXAMPLE_PATTERNS = *
+
+# If the EXAMPLE_RECURSIVE tag is set to YES then subdirectories will be
+# searched for input files to be used with the \include or \dontinclude commands
+# irrespective of the value of the RECURSIVE tag.
+# The default value is: NO.
+
+EXAMPLE_RECURSIVE = NO
+
+# The IMAGE_PATH tag can be used to specify one or more files or directories
+# that contain images that are to be included in the documentation (see the
+# \image command).
+
+IMAGE_PATH =
+
+# The INPUT_FILTER tag can be used to specify a program that Doxygen should
+# invoke to filter for each input file. Doxygen will invoke the filter program
+# by executing (via popen()) the command:
+#
+# <filter> <input-file>
+#
+# where <filter> is the value of the INPUT_FILTER tag, and <input-file> is the
+# name of an input file. Doxygen will then use the output that the filter
+# program writes to standard output. If FILTER_PATTERNS is specified, this tag
+# will be ignored.
+#
+# Note that the filter must not add or remove lines; it is applied before the
+# code is scanned, but not when the output code is generated. If lines are added
+# or removed, the anchors will not be placed correctly.
+#
+# Note that Doxygen will use the data processed and written to standard output
+# for further processing, therefore nothing else, like debug statements or used
+# commands (so in case of a Windows batch file always use @echo OFF), should be
+# written to standard output.
+#
+# Note that for custom extensions or not directly supported extensions you also
+# need to set EXTENSION_MAPPING for the extension otherwise the files are not
+# properly processed by Doxygen.
+
+INPUT_FILTER =
+
+# The FILTER_PATTERNS tag can be used to specify filters on a per file pattern
+# basis. Doxygen will compare the file name with each pattern and apply the
+# filter if there is a match. The filters are a list of the form: pattern=filter
+# (like *.cpp=my_cpp_filter). See INPUT_FILTER for further information on how
+# filters are used. If the FILTER_PATTERNS tag is empty or if none of the
+# patterns match the file name, INPUT_FILTER is applied.
+#
+# Note that for custom extensions or not directly supported extensions you also
+# need to set EXTENSION_MAPPING for the extension otherwise the files are not
+# properly processed by Doxygen.
+
+FILTER_PATTERNS =
+
+# If the FILTER_SOURCE_FILES tag is set to YES, the input filter (if set using
+# INPUT_FILTER) will also be used to filter the input files that are used for
+# producing the source files to browse (i.e. when SOURCE_BROWSER is set to YES).
+# The default value is: NO.
+
+FILTER_SOURCE_FILES = NO
+
+# The FILTER_SOURCE_PATTERNS tag can be used to specify source filters per file
+# pattern. A pattern will override the setting for FILTER_PATTERN (if any) and
+# it is also possible to disable source filtering for a specific pattern using
+# *.ext= (so without naming a filter).
+# This tag requires that the tag FILTER_SOURCE_FILES is set to YES.
+
+FILTER_SOURCE_PATTERNS =
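The INPUT_FILTER contract described above (read one source file, write the transformed text to stdout, add or remove nothing else) is easy to get wrong, so here is a minimal sketch of a conforming filter program. It is purely illustrative and not part of this patch, which leaves INPUT_FILTER empty:

// Minimal INPUT_FILTER sketch: echo the file to stdout line by line, without
// adding or removing lines (which would misplace Doxygen's anchors).
#include <fstream>
#include <iostream>
#include <string>

int main(int argc, char** argv) {
  if (argc < 2) return 1;        // Doxygen passes the input file path as argv[1]
  std::ifstream input(argv[1]);
  if (!input) return 1;
  std::string line;
  while (std::getline(input, line)) {
    // A real filter would rewrite `line` here (same number of lines out as in);
    // only the filtered source may go to stdout, never debug output.
    std::cout << line << '\n';
  }
  return 0;
}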
+
+# If the USE_MDFILE_AS_MAINPAGE tag refers to the name of a markdown file that
+# is part of the input, its contents will be placed on the main page
+# (index.html). This can be useful if you have a project on, for instance,
+# GitHub and want to reuse the introduction page also for the Doxygen output.
+
+USE_MDFILE_AS_MAINPAGE =
+
+# The Fortran standard specifies that for fixed formatted Fortran code all
+# characters from position 72 are to be considered as comment. A common
+# extension is to allow longer lines before the automatic comment starts. The
+# setting FORTRAN_COMMENT_AFTER will also make it possible that longer lines can
+# be processed before the automatic comment starts.
+# Minimum value: 7, maximum value: 10000, default value: 72.
+
+FORTRAN_COMMENT_AFTER = 72
+
+#---------------------------------------------------------------------------
+# Configuration options related to source browsing
+#---------------------------------------------------------------------------
+
+# If the SOURCE_BROWSER tag is set to YES then a list of source files will be
+# generated. Documented entities will be cross-referenced with these sources.
+#
+# Note: To get rid of all source code in the generated output, make sure that
+# also VERBATIM_HEADERS is set to NO.
+# The default value is: NO.
+
+SOURCE_BROWSER = NO
+
+# Setting the INLINE_SOURCES tag to YES will include the body of functions,
+# multi-line macros, enums or list initialized variables directly into the
+# documentation.
+# The default value is: NO.
+
+INLINE_SOURCES = NO
+
+# Setting the STRIP_CODE_COMMENTS tag to YES will instruct Doxygen to hide any
+# special comment blocks from generated source code fragments. Normal C, C++ and
+# Fortran comments will always remain visible.
+# The default value is: YES.
+
+STRIP_CODE_COMMENTS = YES
+
+# If the REFERENCED_BY_RELATION tag is set to YES then for each documented
+# entity all documented functions referencing it will be listed.
+# The default value is: NO.
+
+REFERENCED_BY_RELATION = NO
+
+# If the REFERENCES_RELATION tag is set to YES then for each documented function
+# all documented entities called/used by that function will be listed.
+# The default value is: NO.
+
+REFERENCES_RELATION = NO
+
+# If the REFERENCES_LINK_SOURCE tag is set to YES and SOURCE_BROWSER tag is set
+# to YES then the hyperlinks from functions in REFERENCES_RELATION and
+# REFERENCED_BY_RELATION lists will link to the source code. Otherwise they will
+# link to the documentation.
+# The default value is: YES.
+
+REFERENCES_LINK_SOURCE = YES
+
+# If SOURCE_TOOLTIPS is enabled (the default) then hovering a hyperlink in the
+# source code will show a tooltip with additional information such as prototype,
+# brief description and links to the definition and documentation. Since this
+# will make the HTML file larger and loading of large files a bit slower, you
+# can opt to disable this feature.
+# The default value is: YES.
+# This tag requires that the tag SOURCE_BROWSER is set to YES.
+
+SOURCE_TOOLTIPS = YES
+
+# If the USE_HTAGS tag is set to YES then the references to source code will
+# point to the HTML generated by the htags(1) tool instead of Doxygen built-in
+# source browser. The htags tool is part of GNU's global source tagging system
+# (see https://www.gnu.org/software/global/global.html). You will need version
+# 4.8.6 or higher.
+#
+# To use it do the following:
+# - Install the latest version of global
+# - Enable SOURCE_BROWSER and USE_HTAGS in the configuration file
+# - Make sure the INPUT points to the root of the source tree
+# - Run doxygen as normal
+#
+# Doxygen will invoke htags (and that will in turn invoke gtags), so these
+# tools must be available from the command line (i.e. in the search path).
+#
+# The result: instead of the source browser generated by Doxygen, the links to
+# source code will now point to the output of htags.
+# The default value is: NO.
+# This tag requires that the tag SOURCE_BROWSER is set to YES.
+
+USE_HTAGS = NO
+
+# If the VERBATIM_HEADERS tag is set to YES then Doxygen will generate a
+# verbatim copy of the header file for each class for which an include is
+# specified. Set to NO to disable this.
+# See also: Section \class.
+# The default value is: YES.
+
+VERBATIM_HEADERS = YES
+
+#---------------------------------------------------------------------------
+# Configuration options related to the alphabetical class index
+#---------------------------------------------------------------------------
+
+# If the ALPHABETICAL_INDEX tag is set to YES, an alphabetical index of all
+# compounds will be generated. Enable this if the project contains a lot of
+# classes, structs, unions or interfaces.
+# The default value is: YES.
+
+ALPHABETICAL_INDEX = YES
+
+# The IGNORE_PREFIX tag can be used to specify a prefix (or a list of prefixes)
+# that should be ignored while generating the index headers. The IGNORE_PREFIX
+# tag works for classes, function and member names. The entity will be placed in
+# the alphabetical list under the first letter of the entity name that remains
+# after removing the prefix.
+# This tag requires that the tag ALPHABETICAL_INDEX is set to YES.
+
+IGNORE_PREFIX =
+
+#---------------------------------------------------------------------------
+# Configuration options related to the HTML output
+#---------------------------------------------------------------------------
+
+# If the GENERATE_HTML tag is set to YES, Doxygen will generate HTML output
+# The default value is: YES.
+
+GENERATE_HTML = NO
+
+# The HTML_OUTPUT tag is used to specify where the HTML docs will be put. If a
+# relative path is entered the value of OUTPUT_DIRECTORY will be put in front of
+# it.
+# The default directory is: html.
+# This tag requires that the tag GENERATE_HTML is set to YES.
+
+HTML_OUTPUT = html
+
+# The HTML_FILE_EXTENSION tag can be used to specify the file extension for each
+# generated HTML page (for example: .htm, .php, .asp).
+# The default value is: .html.
+# This tag requires that the tag GENERATE_HTML is set to YES.
+
+HTML_FILE_EXTENSION = .html
+
+# The HTML_HEADER tag can be used to specify a user-defined HTML header file for
+# each generated HTML page. If the tag is left blank Doxygen will generate a
+# standard header.
+#
+# To get valid HTML, the header file must include any scripts and style sheets
+# that Doxygen needs, which depend on the configuration options used (e.g. the
+# setting GENERATE_TREEVIEW). It is highly recommended to start with a
+# default header using
+# doxygen -w html new_header.html new_footer.html new_stylesheet.css
+# YourConfigFile
+# and then modify the file new_header.html. See also section "Doxygen usage"
+# for information on how to generate the default header that Doxygen normally
+# uses.
+# Note: The header is subject to change so you typically have to regenerate the +# default header when upgrading to a newer version of Doxygen. For a description +# of the possible markers and block names see the documentation. +# This tag requires that the tag GENERATE_HTML is set to YES. + +HTML_HEADER = + +# The HTML_FOOTER tag can be used to specify a user-defined HTML footer for each +# generated HTML page. If the tag is left blank Doxygen will generate a standard +# footer. See HTML_HEADER for more information on how to generate a default +# footer and what special commands can be used inside the footer. See also +# section "Doxygen usage" for information on how to generate the default footer +# that Doxygen normally uses. +# This tag requires that the tag GENERATE_HTML is set to YES. + +HTML_FOOTER = + +# The HTML_STYLESHEET tag can be used to specify a user-defined cascading style +# sheet that is used by each HTML page. It can be used to fine-tune the look of +# the HTML output. If left blank Doxygen will generate a default style sheet. +# See also section "Doxygen usage" for information on how to generate the style +# sheet that Doxygen normally uses. +# Note: It is recommended to use HTML_EXTRA_STYLESHEET instead of this tag, as +# it is more robust and this tag (HTML_STYLESHEET) will in the future become +# obsolete. +# This tag requires that the tag GENERATE_HTML is set to YES. + +HTML_STYLESHEET = + +# The HTML_EXTRA_STYLESHEET tag can be used to specify additional user-defined +# cascading style sheets that are included after the standard style sheets +# created by Doxygen. Using this option one can overrule certain style aspects. +# This is preferred over using HTML_STYLESHEET since it does not replace the +# standard style sheet and is therefore more robust against future updates. +# Doxygen will copy the style sheet files to the output directory. +# Note: The order of the extra style sheet files is of importance (e.g. the last +# style sheet in the list overrules the setting of the previous ones in the +# list). +# Note: Since the styling of scrollbars can currently not be overruled in +# Webkit/Chromium, the styling will be left out of the default doxygen.css if +# one or more extra stylesheets have been specified. So if scrollbar +# customization is desired it has to be added explicitly. For an example see the +# documentation. +# This tag requires that the tag GENERATE_HTML is set to YES. + +HTML_EXTRA_STYLESHEET = + +# The HTML_EXTRA_FILES tag can be used to specify one or more extra images or +# other source files which should be copied to the HTML output directory. Note +# that these files will be copied to the base HTML output directory. Use the +# $relpath^ marker in the HTML_HEADER and/or HTML_FOOTER files to load these +# files. In the HTML_STYLESHEET file, use the file name only. Also note that the +# files will be copied as-is; there are no commands or markers available. +# This tag requires that the tag GENERATE_HTML is set to YES. + +HTML_EXTRA_FILES = + +# The HTML_COLORSTYLE tag can be used to specify if the generated HTML output +# should be rendered with a dark or light theme. 
+# Possible values are: LIGHT always generates light mode output, DARK always
+# generates dark mode output, AUTO_LIGHT automatically sets the mode according
+# to the user preference, uses light mode if no preference is set (the default),
+# AUTO_DARK automatically sets the mode according to the user preference, uses
+# dark mode if no preference is set, and TOGGLE allows a user to switch between
+# light and dark mode via a button.
+# The default value is: AUTO_LIGHT.
+# This tag requires that the tag GENERATE_HTML is set to YES.
+
+HTML_COLORSTYLE = AUTO_LIGHT
+
+# The HTML_COLORSTYLE_HUE tag controls the color of the HTML output. Doxygen
+# will adjust the colors in the style sheet and background images according to
+# this color. Hue is specified as an angle on a color-wheel, see
+# https://en.wikipedia.org/wiki/Hue for more information. For instance the value
+# 0 represents red, 60 is yellow, 120 is green, 180 is cyan, 240 is blue, 300
+# purple, and 360 is red again.
+# Minimum value: 0, maximum value: 359, default value: 220.
+# This tag requires that the tag GENERATE_HTML is set to YES.
+
+HTML_COLORSTYLE_HUE = 220
+
+# The HTML_COLORSTYLE_SAT tag controls the purity (or saturation) of the colors
+# in the HTML output. For a value of 0 the output will use gray-scales only. A
+# value of 255 will produce the most vivid colors.
+# Minimum value: 0, maximum value: 255, default value: 100.
+# This tag requires that the tag GENERATE_HTML is set to YES.
+
+HTML_COLORSTYLE_SAT = 100
+
+# The HTML_COLORSTYLE_GAMMA tag controls the gamma correction applied to the
+# luminance component of the colors in the HTML output. Values below 100
+# gradually make the output lighter, whereas values above 100 make the output
+# darker. The value divided by 100 is the actual gamma applied, so 80 represents
+# a gamma of 0.8, the value 220 represents a gamma of 2.2, and 100 does not
+# change the gamma.
+# Minimum value: 40, maximum value: 240, default value: 80.
+# This tag requires that the tag GENERATE_HTML is set to YES.
+
+HTML_COLORSTYLE_GAMMA = 80
+
+# If the HTML_DYNAMIC_MENUS tag is set to YES then the generated HTML
+# documentation will contain a main index with vertical navigation menus that
+# are dynamically created via JavaScript. If disabled, the navigation index will
+# consist of multiple levels of tabs that are statically embedded in every HTML
+# page. Disable this option to support browsers that do not have JavaScript,
+# like the Qt help browser.
+# The default value is: YES.
+# This tag requires that the tag GENERATE_HTML is set to YES.
+
+HTML_DYNAMIC_MENUS = YES
+
+# If the HTML_DYNAMIC_SECTIONS tag is set to YES then the generated HTML
+# documentation will contain sections that can be hidden and shown after the
+# page has loaded.
+# The default value is: NO.
+# This tag requires that the tag GENERATE_HTML is set to YES.
+
+HTML_DYNAMIC_SECTIONS = NO
+
+# If the HTML_CODE_FOLDING tag is set to YES then classes and functions can be
+# dynamically folded and expanded in the generated HTML source code.
+# The default value is: YES.
+# This tag requires that the tag GENERATE_HTML is set to YES.
+
+HTML_CODE_FOLDING = YES
+
+# If the HTML_COPY_CLIPBOARD tag is set to YES then Doxygen will show an icon in
+# the top right corner of code and text fragments that allows the user to copy
+# its content to the clipboard. Note this only works if supported by the browser
+# and the web page is served via a secure context (see:
+# https://www.w3.org/TR/secure-contexts/), i.e.
using the https: or file:
+# protocol.
+# The default value is: YES.
+# This tag requires that the tag GENERATE_HTML is set to YES.
+
+HTML_COPY_CLIPBOARD = YES
+
+# Doxygen stores a couple of settings persistently in the browser (via e.g.
+# cookies). By default these settings apply to all HTML pages generated by
+# Doxygen across all projects. The HTML_PROJECT_COOKIE tag can be used to store
+# the settings under a project specific key, such that the user preferences will
+# be stored separately.
+# This tag requires that the tag GENERATE_HTML is set to YES.
+
+HTML_PROJECT_COOKIE =
+
+# With HTML_INDEX_NUM_ENTRIES one can control the preferred number of entries
+# shown in the various tree structured indices initially; the user can expand
+# and collapse entries dynamically later on. Doxygen will expand the tree to
+# such a level that at most the specified number of entries are visible (unless
+# a fully collapsed tree already exceeds this amount). So setting the number of
+# entries to 1 will produce a fully collapsed tree by default; 0 is a special
+# value representing an infinite number of entries and will result in a fully
+# expanded tree by default.
+# Minimum value: 0, maximum value: 9999, default value: 100.
+# This tag requires that the tag GENERATE_HTML is set to YES.
+
+HTML_INDEX_NUM_ENTRIES = 100
+
+# If the GENERATE_DOCSET tag is set to YES, additional index files will be
+# generated that can be used as input for Apple's Xcode 3 integrated development
+# environment (see:
+# https://developer.apple.com/xcode/), introduced with OSX 10.5 (Leopard). To
+# create a documentation set, Doxygen will generate a Makefile in the HTML
+# output directory. Running make will produce the docset in that directory and
+# running make install will install the docset in
+# ~/Library/Developer/Shared/Documentation/DocSets so that Xcode will find it at
+# startup. See https://developer.apple.com/library/archive/featuredarticles/Doxy
+# genXcode/_index.html for more information.
+# The default value is: NO.
+# This tag requires that the tag GENERATE_HTML is set to YES.
+
+GENERATE_DOCSET = NO
+
+# This tag determines the name of the docset feed. A documentation feed provides
+# an umbrella under which multiple documentation sets from a single provider
+# (such as a company or product suite) can be grouped.
+# The default value is: Doxygen generated docs.
+# This tag requires that the tag GENERATE_DOCSET is set to YES.
+
+DOCSET_FEEDNAME = "Doxygen generated docs"
+
+# This tag determines the URL of the docset feed. A documentation feed provides
+# an umbrella under which multiple documentation sets from a single provider
+# (such as a company or product suite) can be grouped.
+# This tag requires that the tag GENERATE_DOCSET is set to YES.
+
+DOCSET_FEEDURL =
+
+# This tag specifies a string that should uniquely identify the documentation
+# set bundle. This should be a reverse domain-name style string, e.g.
+# com.mycompany.MyDocSet. Doxygen will append .docset to the name.
+# The default value is: org.doxygen.Project.
+# This tag requires that the tag GENERATE_DOCSET is set to YES.
+
+DOCSET_BUNDLE_ID = org.doxygen.Project
+
+# The DOCSET_PUBLISHER_ID tag specifies a string that should uniquely identify
+# the documentation publisher. This should be a reverse domain-name style
+# string, e.g. com.mycompany.MyDocSet.documentation.
+# The default value is: org.doxygen.Publisher.
+# This tag requires that the tag GENERATE_DOCSET is set to YES.
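+# For example, a hypothetical publisher ID for a project like this one might
+# be com.example.project.documentation; the Doxygen default is kept below.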
+
+DOCSET_PUBLISHER_ID = org.doxygen.Publisher
+
+# The DOCSET_PUBLISHER_NAME tag identifies the documentation publisher.
+# The default value is: Publisher.
+# This tag requires that the tag GENERATE_DOCSET is set to YES.
+
+DOCSET_PUBLISHER_NAME = Publisher
+
+# If the GENERATE_HTMLHELP tag is set to YES then Doxygen generates three
+# additional HTML index files: index.hhp, index.hhc, and index.hhk. The
+# index.hhp is a project file that can be read by Microsoft's HTML Help Workshop
+# on Windows. In the beginning of 2021 Microsoft took the original page, with
+# among others the download links, offline (the HTML help workshop was already
+# many years in maintenance mode). You can download the HTML help workshop from
+# the web archives at Installation executable (see:
+# http://web.archive.org/web/20160201063255/http://download.microsoft.com/downlo
+# ad/0/A/9/0A939EF6-E31C-430F-A3DF-DFAE7960D564/htmlhelp.exe).
+#
+# The HTML Help Workshop contains a compiler that can convert all HTML output
+# generated by Doxygen into a single compiled HTML file (.chm). Compiled HTML
+# files are now used as the Windows 98 help format, and will replace the old
+# Windows help format (.hlp) on all Windows platforms in the future. Compressed
+# HTML files also contain an index, a table of contents, and you can search for
+# words in the documentation. The HTML workshop also contains a viewer for
+# compressed HTML files.
+# The default value is: NO.
+# This tag requires that the tag GENERATE_HTML is set to YES.
+
+GENERATE_HTMLHELP = NO
+
+# The CHM_FILE tag can be used to specify the file name of the resulting .chm
+# file. You can add a path in front of the file if the result should not be
+# written to the html output directory.
+# This tag requires that the tag GENERATE_HTMLHELP is set to YES.
+
+CHM_FILE =
+
+# The HHC_LOCATION tag can be used to specify the location (absolute path
+# including file name) of the HTML help compiler (hhc.exe). If non-empty,
+# Doxygen will try to run the HTML help compiler on the generated index.hhp.
+# The file has to be specified with full path.
+# This tag requires that the tag GENERATE_HTMLHELP is set to YES.
+
+HHC_LOCATION =
+
+# The GENERATE_CHI flag controls whether a separate .chi index file is generated
+# (YES) or included in the main .chm file (NO).
+# The default value is: NO.
+# This tag requires that the tag GENERATE_HTMLHELP is set to YES.
+
+GENERATE_CHI = NO
+
+# The CHM_INDEX_ENCODING is used to encode HtmlHelp index (hhk), content (hhc)
+# and project file content.
+# This tag requires that the tag GENERATE_HTMLHELP is set to YES.
+
+CHM_INDEX_ENCODING =
+
+# The BINARY_TOC flag controls whether a binary table of contents is generated
+# (YES) or a normal table of contents (NO) in the .chm file. Furthermore it
+# enables the Previous and Next buttons.
+# The default value is: NO.
+# This tag requires that the tag GENERATE_HTMLHELP is set to YES.
+
+BINARY_TOC = NO
+
+# The TOC_EXPAND flag can be set to YES to add extra items for group members to
+# the table of contents of the HTML help documentation and to the tree view.
+# The default value is: NO.
+# This tag requires that the tag GENERATE_HTMLHELP is set to YES.
+
+TOC_EXPAND = NO
+
+# The SITEMAP_URL tag is used to specify the full URL of the place where the
+# generated documentation will be placed on the server by the user during the
+# deployment of the documentation. The generated sitemap is called sitemap.xml
+# and placed in the directory specified by HTML_OUTPUT.
In case no SITEMAP_URL
+# is specified, no sitemap is generated. For information about the sitemap
+# protocol see https://www.sitemaps.org
+# This tag requires that the tag GENERATE_HTML is set to YES.
+
+SITEMAP_URL =
+
+# If the GENERATE_QHP tag is set to YES and both QHP_NAMESPACE and
+# QHP_VIRTUAL_FOLDER are set, an additional index file will be generated that
+# can be used as input for Qt's qhelpgenerator to generate a Qt Compressed Help
+# (.qch) of the generated HTML documentation.
+# The default value is: NO.
+# This tag requires that the tag GENERATE_HTML is set to YES.
+
+GENERATE_QHP = NO
+
+# If the QHG_LOCATION tag is specified, the QCH_FILE tag can be used to specify
+# the file name of the resulting .qch file. The path specified is relative to
+# the HTML output folder.
+# This tag requires that the tag GENERATE_QHP is set to YES.
+
+QCH_FILE =
+
+# The QHP_NAMESPACE tag specifies the namespace to use when generating Qt Help
+# Project output. For more information please see Qt Help Project / Namespace
+# (see:
+# https://doc.qt.io/archives/qt-4.8/qthelpproject.html#namespace).
+# The default value is: org.doxygen.Project.
+# This tag requires that the tag GENERATE_QHP is set to YES.
+
+QHP_NAMESPACE = org.doxygen.Project
+
+# The QHP_VIRTUAL_FOLDER tag specifies the virtual folder to use when
+# generating Qt Help Project output. For more information please see Qt Help
+# Project / Virtual Folders (see:
+# https://doc.qt.io/archives/qt-4.8/qthelpproject.html#virtual-folders).
+# The default value is: doc.
+# This tag requires that the tag GENERATE_QHP is set to YES.
+
+QHP_VIRTUAL_FOLDER = doc
+
+# If the QHP_CUST_FILTER_NAME tag is set, it specifies the name of a custom
+# filter to add. For more information please see Qt Help Project / Custom
+# Filters (see:
+# https://doc.qt.io/archives/qt-4.8/qthelpproject.html#custom-filters).
+# This tag requires that the tag GENERATE_QHP is set to YES.
+
+QHP_CUST_FILTER_NAME =
+
+# The QHP_CUST_FILTER_ATTRS tag specifies the list of the attributes of the
+# custom filter to add. For more information please see Qt Help Project / Custom
+# Filters (see:
+# https://doc.qt.io/archives/qt-4.8/qthelpproject.html#custom-filters).
+# This tag requires that the tag GENERATE_QHP is set to YES.
+
+QHP_CUST_FILTER_ATTRS =
+
+# The QHP_SECT_FILTER_ATTRS tag specifies the list of the attributes this
+# project's filter section matches. For more information please see Qt Help
+# Project / Filter Attributes (see:
+# https://doc.qt.io/archives/qt-4.8/qthelpproject.html#filter-attributes).
+# This tag requires that the tag GENERATE_QHP is set to YES.
+
+QHP_SECT_FILTER_ATTRS =
+
+# The QHG_LOCATION tag can be used to specify the location (absolute path
+# including file name) of Qt's qhelpgenerator. If non-empty Doxygen will try to
+# run qhelpgenerator on the generated .qhp file.
+# This tag requires that the tag GENERATE_QHP is set to YES.
+
+QHG_LOCATION =
+
+# If the GENERATE_ECLIPSEHELP tag is set to YES, additional index files will be
+# generated that, together with the HTML files, form an Eclipse help plugin. To
+# install this plugin and make it available under the help contents menu in
+# Eclipse, the contents of the directory containing the HTML and XML files need
+# to be copied into the plugins directory of Eclipse. The name of the directory
+# within the plugins directory should be the same as the ECLIPSE_DOC_ID value.
+# After copying, Eclipse needs to be restarted before the help appears.
+# The default value is: NO.
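+# (A hypothetical setup would flip this to YES and give the plugin its own
+# identifier via the ECLIPSE_DOC_ID tag below, e.g. com.example.project.)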
+# This tag requires that the tag GENERATE_HTML is set to YES.
+
+GENERATE_ECLIPSEHELP = NO
+
+# A unique identifier for the Eclipse help plugin. When installing the plugin
+# the directory name containing the HTML and XML files should also have this
+# name. Each documentation set should have its own identifier.
+# The default value is: org.doxygen.Project.
+# This tag requires that the tag GENERATE_ECLIPSEHELP is set to YES.
+
+ECLIPSE_DOC_ID = org.doxygen.Project
+
+# If you want full control over the layout of the generated HTML pages it might
+# be necessary to disable the index and replace it with your own. The
+# DISABLE_INDEX tag can be used to turn on/off the condensed index (tabs) at top
+# of each HTML page. A value of NO enables the index and the value YES disables
+# it. Since the tabs in the index contain the same information as the navigation
+# tree, you can set this option to YES if you also set GENERATE_TREEVIEW to YES.
+# The default value is: NO.
+# This tag requires that the tag GENERATE_HTML is set to YES.
+
+DISABLE_INDEX = NO
+
+# The GENERATE_TREEVIEW tag is used to specify whether a tree-like index
+# structure should be generated to display hierarchical information. If the tag
+# value is set to YES, a side panel will be generated containing a tree-like
+# index structure (just like the one that is generated for HTML Help). For this
+# to work a browser that supports JavaScript, DHTML, CSS and frames is required
+# (i.e. any modern browser). Windows users are probably better off using the
+# HTML help feature. Via custom style sheets (see HTML_EXTRA_STYLESHEET) one can
+# further fine-tune the look of the index (see "Fine-tuning the output"). As an
+# example, the default style sheet generated by Doxygen has an example that
+# shows how to put an image at the root of the tree instead of the PROJECT_NAME.
+# Since the tree basically has the same information as the tab index, you could
+# consider setting DISABLE_INDEX to YES when enabling this option.
+# The default value is: NO.
+# This tag requires that the tag GENERATE_HTML is set to YES.
+
+GENERATE_TREEVIEW = NO
+
+# When both GENERATE_TREEVIEW and DISABLE_INDEX are set to YES, then the
+# FULL_SIDEBAR option determines if the side bar is limited to only the treeview
+# area (value NO) or if it should extend to the full height of the window (value
+# YES). Setting this to YES gives a layout similar to
+# https://docs.readthedocs.io with more room for contents, but less room for the
+# project logo, title, and description. If either GENERATE_TREEVIEW or
+# DISABLE_INDEX is set to NO, this option has no effect.
+# The default value is: NO.
+# This tag requires that the tag GENERATE_HTML is set to YES.
+
+FULL_SIDEBAR = NO
+
+# The ENUM_VALUES_PER_LINE tag can be used to set the number of enum values that
+# Doxygen will group on one line in the generated HTML documentation.
+#
+# Note that a value of 0 will completely suppress the enum values from appearing
+# in the overview section.
+# Minimum value: 0, maximum value: 20, default value: 4.
+# This tag requires that the tag GENERATE_HTML is set to YES.
+
+ENUM_VALUES_PER_LINE = 4
+
+# When the SHOW_ENUM_VALUES tag is set to YES, Doxygen will show the specified
+# enumeration values beside the enumeration mnemonics.
+# The default value is: NO.
+
+SHOW_ENUM_VALUES = NO
+
+# If the treeview is enabled (see GENERATE_TREEVIEW) then this tag can be used
+# to set the initial width (in pixels) of the frame in which the tree is shown.
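+# (For example, a hypothetical wider panel would combine GENERATE_TREEVIEW =
+# YES with TREEVIEW_WIDTH = 350; the valid range is given below.)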
+# Minimum value: 0, maximum value: 1500, default value: 250.
+# This tag requires that the tag GENERATE_HTML is set to YES.
+
+TREEVIEW_WIDTH = 250
+
+# If the EXT_LINKS_IN_WINDOW option is set to YES, Doxygen will open links to
+# external symbols imported via tag files in a separate window.
+# The default value is: NO.
+# This tag requires that the tag GENERATE_HTML is set to YES.
+
+EXT_LINKS_IN_WINDOW = NO
+
+# If the OBFUSCATE_EMAILS tag is set to YES, Doxygen will obfuscate email
+# addresses.
+# The default value is: YES.
+# This tag requires that the tag GENERATE_HTML is set to YES.
+
+OBFUSCATE_EMAILS = YES
+
+# If the HTML_FORMULA_FORMAT option is set to svg, Doxygen will use the pdf2svg
+# tool (see https://github.com/dawbarton/pdf2svg) or inkscape (see
+# https://inkscape.org) to generate formulas as SVG images instead of PNGs for
+# the HTML output. These images will generally look nicer at scaled resolutions.
+# Possible values are: png (the default) and svg (looks nicer but requires the
+# pdf2svg or inkscape tool).
+# The default value is: png.
+# This tag requires that the tag GENERATE_HTML is set to YES.
+
+HTML_FORMULA_FORMAT = png
+
+# Use this tag to change the font size of LaTeX formulas included as images in
+# the HTML documentation. When you change the font size after a successful
+# Doxygen run you need to manually remove any form_*.png images from the HTML
+# output directory to force them to be regenerated.
+# Minimum value: 8, maximum value: 50, default value: 10.
+# This tag requires that the tag GENERATE_HTML is set to YES.
+
+FORMULA_FONTSIZE = 10
+
+# The FORMULA_MACROFILE can contain LaTeX \newcommand and \renewcommand commands
+# to create new LaTeX commands to be used in formulas as building blocks. See
+# the section "Including formulas" for details.
+
+FORMULA_MACROFILE =
+
+# Enable the USE_MATHJAX option to render LaTeX formulas using MathJax (see
+# https://www.mathjax.org) which uses client-side JavaScript for the rendering
+# instead of using pre-rendered bitmaps. Use this if you do not have LaTeX
+# installed or if you want the formulas to look prettier in the HTML output.
+# When enabled you may also need to install MathJax separately and configure
+# the path to it using the MATHJAX_RELPATH option.
+# The default value is: NO.
+# This tag requires that the tag GENERATE_HTML is set to YES.
+
+USE_MATHJAX = NO
+
+# With MATHJAX_VERSION it is possible to specify the MathJax version to be used.
+# Note that the different versions of MathJax have different requirements with
+# regard to the different settings, so it is possible that other MathJax
+# settings also have to be changed when switching between the different MathJax
+# versions.
+# Possible values are: MathJax_2 and MathJax_3.
+# The default value is: MathJax_2.
+# This tag requires that the tag USE_MATHJAX is set to YES.
+
+MATHJAX_VERSION = MathJax_2
+
+# When MathJax is enabled you can set the default output format to be used for
+# the MathJax output. For more details about the output format see MathJax
+# version 2 (see:
+# http://docs.mathjax.org/en/v2.7-latest/output.html) and MathJax version 3
+# (see:
+# http://docs.mathjax.org/en/latest/web/components/output.html).
+# Possible values are: HTML-CSS (which is slower, but has the best
+# compatibility. This is the name for MathJax version 2, for MathJax version 3
+# this will be translated into chtml), NativeMML (i.e. MathML. Only supported
+# for MathJax 2.
For MathJax version 3 chtml will be used instead.), chtml (This
+# is the name for MathJax version 3, for MathJax version 2 this will be
+# translated into HTML-CSS) and SVG.
+# The default value is: HTML-CSS.
+# This tag requires that the tag USE_MATHJAX is set to YES.
+
+MATHJAX_FORMAT = HTML-CSS
+
+# When MathJax is enabled you need to specify the location relative to the HTML
+# output directory using the MATHJAX_RELPATH option. The destination directory
+# should contain the MathJax.js script. For instance, if the mathjax directory
+# is located at the same level as the HTML output directory, then
+# MATHJAX_RELPATH should be ../mathjax. The default value points to the MathJax
+# Content Delivery Network so you can quickly see the result without installing
+# MathJax. However, it is strongly recommended to install a local copy of
+# MathJax from https://www.mathjax.org before deployment. The default value is:
+# - in case of MathJax version 2: https://cdn.jsdelivr.net/npm/mathjax@2
+# - in case of MathJax version 3: https://cdn.jsdelivr.net/npm/mathjax@3
+# This tag requires that the tag USE_MATHJAX is set to YES.
+
+MATHJAX_RELPATH =
+
+# The MATHJAX_EXTENSIONS tag can be used to specify one or more MathJax
+# extension names that should be enabled during MathJax rendering. For example
+# for MathJax version 2 (see
+# https://docs.mathjax.org/en/v2.7-latest/tex.html#tex-and-latex-extensions):
+# MATHJAX_EXTENSIONS = TeX/AMSmath TeX/AMSsymbols
+# For example for MathJax version 3 (see
+# http://docs.mathjax.org/en/latest/input/tex/extensions/index.html):
+# MATHJAX_EXTENSIONS = ams
+# This tag requires that the tag USE_MATHJAX is set to YES.
+
+MATHJAX_EXTENSIONS =
+
+# The MATHJAX_CODEFILE tag can be used to specify a file with JavaScript pieces
+# of code that will be used on startup of the MathJax code. See the MathJax site
+# (see:
+# http://docs.mathjax.org/en/v2.7-latest/output.html) for more details. For an
+# example see the documentation.
+# This tag requires that the tag USE_MATHJAX is set to YES.
+
+MATHJAX_CODEFILE =
+
+# When the SEARCHENGINE tag is enabled Doxygen will generate a search box for
+# the HTML output. The underlying search engine uses JavaScript and DHTML and
+# should work on any modern browser. Note that when using HTML help
+# (GENERATE_HTMLHELP), Qt help (GENERATE_QHP), or docsets (GENERATE_DOCSET)
+# there is already a search function so this one should typically be disabled.
+# For large projects the JavaScript-based search engine can be slow; in that
+# case enabling SERVER_BASED_SEARCH may provide a better solution. It is
+# possible to search using the keyboard; to jump to the search box use
+# <access key> + S (what the <access key> is depends on the OS and browser,
+# but it is typically <CTRL>, <ALT>/