diff --git a/.github/workflows/R-CMD-check.yml b/.github/workflows/R-CMD-check.yml index 5f2d726f..1c413f21 100644 --- a/.github/workflows/R-CMD-check.yml +++ b/.github/workflows/R-CMD-check.yml @@ -32,7 +32,7 @@ jobs: uses: actions/checkout@v2 - name: Setup R - uses: r-lib/actions/setup-r@master + uses: r-lib/actions/setup-r@v2 with: r-version: ${{ matrix.config.r }} diff --git a/DESCRIPTION b/DESCRIPTION index 63c65a99..a6621fb2 100644 --- a/DESCRIPTION +++ b/DESCRIPTION @@ -68,5 +68,5 @@ LinkingTo: Rcpp, RcppEigen VignetteBuilder: knitr -RoxygenNote: 7.1.2 +RoxygenNote: 7.2.0 Roxygen: list(markdown = TRUE) diff --git a/NAMESPACE b/NAMESPACE index 4976c069..495ea7e5 100644 --- a/NAMESPACE +++ b/NAMESPACE @@ -16,7 +16,6 @@ export(make_copy_map) export(make_design_matrix) export(make_reduced_basis_map) export(squash_hal_fit) -import(Rcpp) importFrom(Matrix,tcrossprod) importFrom(Rcpp,sourceCpp) importFrom(assertthat,assert_that) @@ -27,13 +26,9 @@ importFrom(data.table,setorder) importFrom(glmnet,cv.glmnet) importFrom(glmnet,glmnet) importFrom(methods,is) -importFrom(methods,new) importFrom(origami,cross_validate) -importFrom(origami,fold_index) importFrom(origami,folds2foldvec) importFrom(origami,make_folds) -importFrom(origami,training) -importFrom(origami,validation) importFrom(stats,aggregate) importFrom(stats,as.formula) importFrom(stats,coef) diff --git a/R/RcppExports.R b/R/RcppExports.R index bd17cee2..aaedb7ca 100644 --- a/R/RcppExports.R +++ b/R/RcppExports.R @@ -51,16 +51,6 @@ apply_copy_map <- function(X, copy_map) { .Call('_hal9001_apply_copy_map', PACKAGE = 'hal9001', X, copy_map) } -#' Prediction from a Lassi Model -#' -#' @param X A sparse matrix of HAL basis functions. -#' @param beta A vector of coefficient values for the HAL basis functions. -#' @param intercept A numeric value giving the intercept of the HAL model. -#' -lassi_predict <- function(X, beta, intercept) { - .Call('_hal9001_lassi_predict', PACKAGE = 'hal9001', X, beta, intercept) -} - #' Sort Basis Functions #' #' Build a sorted list of unique basis functions based on columns, where each diff --git a/R/cv_lasso.R b/R/cv_lasso.R index 44233825..a7fece86 100644 --- a/R/cv_lasso.R +++ b/R/cv_lasso.R @@ -1,55 +1,3 @@ -#' Single Lasso estimation for cross-validation with Origami -#' -#' Fits Lasso regression over a single fold of a cross-validated data set. This -#' is meant to be called using \code{\link[origami]{cross_validate}}, which is -#' done through \code{\link{cv_lasso}}. Note that this procedure is NOT meant -#' to be invoked by itself. INTERNAL USE ONLY. -#' -#' @param fold A \code{fold} object produced by a call to \code{make_folds} -#' from the \pkg{origami}. -#' @param data A \code{dgCMatrix} object containing the outcome values (Y) in -#' its first column and vectors corresponding to the basis functions of HAL in -#' all other columns. Consult the description of HAL regression for details. -#' @param lambdas A \code{numeric} vector corresponding to a sequence of lambda -#' values obtained by fitting the Lasso on the full data. -#' @param center binary. If \code{TRUE}, covariates are centered. This is much -#' slower, but matches the \code{glmnet} implementation. Default \code{FALSE}. 
-#' -#' @importFrom origami training validation fold_index -lassi_origami <- function(fold, data, lambdas, center = FALSE) { - # make sure data is an (augmented) sparse matrix of basis functions - stopifnot(class(data) == "dgCMatrix") - - # split data for V-fold cross-validation - train_data <- origami::training(data) - valid_data <- origami::validation(data) - - # wrangle objects to clearer forms - train_x_basis <- train_data[, -1] - valid_x_basis <- valid_data[, -1] - train_y <- train_data[, 1] - valid_y <- valid_data[, 1] - - # compute the predicted betas for the given training and validation sets - lassi_fit <- lassi( - x = train_x_basis, y = train_y, lambdas = lambdas, - center = center - ) - pred_mat <- predict(lassi_fit, valid_x_basis) - - # compute the MSE for the given training and validation sets - mses <- apply(pred_mat, 2, function(preds) { - mean((preds - valid_y)^2) - }) - - # the only output needed is the lambda-wise MSE over each fold - mses_out <- matrix(mses, nrow = 1) - out <- list(mses = mses_out) - return(out) -} - -############################################################################### - #' Cross-validated Lasso on Indicator Bases #' #' Fits Lasso regression using a customized procedure, with cross-validation diff --git a/R/cv_lasso_early_stopping.R b/R/cv_lasso_early_stopping.R deleted file mode 100644 index a8423f63..00000000 --- a/R/cv_lasso_early_stopping.R +++ /dev/null @@ -1,97 +0,0 @@ -#' Cross-validated LASSO on Indicator Bases -#' -#' Fits the LASSO regression using a customized procedure with cross-validation -#' based on \pkg{origami} -#' -#' @param x_basis A \code{dgCMatrix} object corresponding to a sparse matrix of -#' the basis functions generated for the HAL algorithm. -#' @param y A \code{numeric} vector of the observed outcome variable values. -#' @param n_lambda A \code{numeric} scalar indicating the number of values of -#' the L1 regularization parameter (lambda) to be obtained from fitting the -#' LASSO to the full data. Cross-validation is used to select an optimal -#' lambda (that minimizes the risk) from among these. -#' @param n_folds A \code{numeric} scalar for the number of folds to be used in -#' the cross-validation procedure to select an optimal value of lambda. 
-#' -#' @importFrom origami make_folds cross_validate -#' @importFrom stats sd -cv_lasso_early_stopping <- function(x_basis, y, n_lambda = 100, n_folds = 10) { - # first, need to run lasso on the full data to get a sequence of lambdas - lasso_init <- lassi(y = y, x = x_basis, nlambda = n_lambda, center = FALSE) - lambdas_init <- lasso_init$lambdas - - # next, set up a cross-validated lasso using the sequence of lambdas - folds <- origami::make_folds(x_basis, V = n_folds) - - # track separately for folds = xscale, beta, resid, intercept - fold <- folds[[1]] - setup_fold_data <- function(fold, x_basis, y) { - x_train <- training(x_basis) - y_train <- training(y) - x_valid <- validation(x_basis) - y_valid <- validation(y) - - intercept <- mean(y_train) - resid <- y_train - intercept - xcenter <- rep(0, ncol(x_basis)) - xscale <- calc_xscale(x_train, xcenter) - beta <- rep(0, ncol(x_basis)) - - fold_data <- list( - x_train = x_train, x_valid = x_valid, y_valid = y_valid, - intercept = intercept, resid = resid, xscale = xscale, xcenter = xcenter, - beta = beta - ) - - return(list(fold_data = fold_data)) - } - - all_fold_data <- cross_validate(setup_fold_data, folds, x_basis, y, - .combine = FALSE - )$fold_data - - cv_lassi_step <- function(fold, all_fold_data, lambda) { - fold_data <- fold_index(all_fold_data)[[1]] - n_updates <- with(fold_data, fit_lassi_step( - x_train, resid, beta, lambda, - xscale, xcenter, intercept, - FALSE - )) - preds <- with(fold_data, as.vector(x_valid %*% (beta / xscale)) + - intercept) - mse <- with(fold_data, mean((preds - y_valid)^2)) - return(list(fold_data = fold_data, mse = mse)) - } - - null_mse <- NULL - min_mse <- Inf - step_mses <- rep(Inf, n_lambda) - for (lambda_step in seq_along(lambdas_init)) { - lambda <- lambdas_init[lambda_step] - step_results <- lapply(folds, cv_lassi_step, all_fold_data, lambda) - all_fold_data <- lapply(step_results, `[[`, "fold_data") - step_mse <- mean(sapply(step_results, `[[`, "mse")) - # step_results <- cross_validate(cv_lassi_step, folds, all_fold_data, - # lambda, .combine = FALSE) - # all_fold_data <- step_results$fold_data - - if (is.null(null_mse)) { - # null_mse is the first mse (i.e. for the null model) - null_mse <- step_mse - } - - if (step_mse < min_mse) { - min_mse <- step_mse - } - - # compute increase above minimum as percentage of total range - ratio <- (step_mse - min_mse) / (null_mse - min_mse) - - # cat(sprintf("lambda: %f, mse: %f, ratio: %f\n", lambda, step_mse, ratio)) - if (is.finite(ratio) && (ratio > 0.1)) { - break - } - step_mses[lambda_step] <- step_mse - } - return(step_mses) -} diff --git a/R/lassi.R b/R/lassi.R deleted file mode 100644 index 6fa3986d..00000000 --- a/R/lassi.R +++ /dev/null @@ -1,97 +0,0 @@ -#' Rcpp module: lassi_fit_module -#' @import Rcpp -#' @name lassi_fit_module -NULL -loadModule("lassi_module", TRUE) - -#' Custom Lasso implementation for matrices of indicator functions -#' -#' @param x The covariate matrix -#' @param y The outcome vector -#' @param lambdas A sequence of values for the L1 regularization parameter -#' (lambda) to be used in fitting the LASSO. Defaults to \code{NULL}. -#' @param nlambda number of lambdas to fit. -#' @param lambda_min_ratio ratio of largest to smallest lambda to fit. -#' @param center ... 
-#' -#' @importFrom methods new -#' -#' @keywords internal -lassi <- function(x, y, lambdas = NULL, nlambda = 100, - lambda_min_ratio = 0.01, center = FALSE) { - if (!is.null(lambdas)) { - nlambda <- length(lambdas) - } - - # initialize object - lassi_object <- methods::new(Lassi, x, y, nlambda, lambda_min_ratio, center) - - if (!is.null(lambdas)) { - lassi_object$lambdas <- lambdas - } - - # initialize step counter - step_counts <- rep(0, nlambda) - - # iterative procedure for active step convergence - for (i in (seq_len(nlambda) - 1)) { - full_steps <- lassi_object$lassi_fit_cd(i, FALSE, 1) - if (full_steps > 0) { - active_steps <- lassi_object$lassi_fit_cd(i, TRUE, 1000) - } else { - active_steps <- 0 - } - step_counts[i + 1] <- active_steps - } - - beta_mat <- as.matrix(lassi_object$beta_mat) - intercepts <- lassi_object$intercepts - beta_mat <- beta_mat / lassi_object$xscale - if (center) { - intercepts <- intercepts - crossprod(lassi_object$xcenter, beta_mat) - } - - chichignoud_criterion <- NULL - - # create output object - out <- list(beta_mat, intercepts, - lambdas = lassi_object$lambdas, - step_counts, chichignoud_criterion - ) - names(out) <- c( - "beta_mat", "intercepts", "lambdas", "steps", - "chichignoud_criterion" - ) - class(out) <- "lassi" - return(out) -} - -#' Predict Method for Lasso on Indicator Bases -#' -#' @param fit ... -#' @param new_x_basis ... -#' @param lambdas ... -#' -#' @keywords internal -predict.lassi <- function(fit, new_x_basis, lambdas = NULL) { - if (is.null(lambdas)) { - lambdas <- fit$lambdas - } - - if (!all(lambdas %in% fit$lambdas)) { - stop("Attempting to predict for a lambda that was not fit.") - } - - preds <- matrix(0, nrow = nrow(new_x_basis), ncol = length(lambdas)) - - for (i in seq_along(lambdas)) { - lambda <- lambdas[i] - beta_col <- which(lambda == fit$lambdas) - beta <- fit$beta_mat[, beta_col] - intercept <- fit$intercepts[beta_col] - pred_col <- lassi_predict(new_x_basis, beta, intercept) - preds[, i] <- pred_col - # find corresponding betas - } - return(preds) -} diff --git a/README.md b/README.md index cb168d68..e8ed0d6a 100644 --- a/README.md +++ b/README.md @@ -27,7 +27,7 @@ Phillips](https://github.com/rachaelvp), [Lars van der Laan](https://github.com/Larsvanderlaan), and [Mark van der Laan](https://vanderlaan-lab.org/) ------ +------------------------------------------------------------------------ ## What’s `hal9001`? @@ -49,7 +49,7 @@ variations of HAL regression are used to estimate nuisance parameters (e.g., van der Laan, Benkeser, and Cai 2019; Ertefaie, Hejazi, and van der Laan 2020). ------ +------------------------------------------------------------------------ ## Installation @@ -67,14 +67,14 @@ GitHub via [`remotes`](https://CRAN.R-project.org/package=remotes): remotes::install_github("tlverse/hal9001") ``` ------ +------------------------------------------------------------------------ ## Issues If you encounter any bugs or have any specific feature requests, please [file an issue](https://github.com/tlverse/hal9001/issues). ------ +------------------------------------------------------------------------ ## Example @@ -85,7 +85,7 @@ predictions via Highly Adaptive Lasso regression: # load the package and set a seed library(hal9001) #> Loading required package: Rcpp -#> hal9001 v0.4.3: The Scalable Highly Adaptive Lasso +#> hal9001 v0.4.5: The Scalable Highly Adaptive Lasso #> note: fit_hal defaults have changed. 
See ?fit_hal for details set.seed(385971) @@ -100,20 +100,20 @@ hal_fit <- fit_hal(X = x, Y = y, yolo = TRUE) #> [1] "I'm sorry, Dave. I'm afraid I can't do that." hal_fit$times #> user.self sys.self elapsed user.child sys.child -#> enumerate_basis 0.008 0.00 0.008 0 0 -#> design_matrix 0.003 0.00 0.003 0 0 -#> reduce_basis 0.000 0.00 0.000 0 0 -#> remove_duplicates 0.000 0.00 0.000 0 0 -#> lasso 3.012 0.01 3.023 0 0 -#> total 3.024 0.01 3.035 0 0 +#> enumerate_basis 0.008 0.001 0.009 0 0 +#> design_matrix 0.003 0.000 0.003 0 0 +#> reduce_basis 0.000 0.000 0.000 0 0 +#> remove_duplicates 0.000 0.000 0.001 0 0 +#> lasso 1.690 0.036 1.764 0 0 +#> total 1.702 0.037 1.778 0 0 # training sample prediction preds <- predict(hal_fit, new_data = x) mean(hal_mse <- (preds - y)^2) -#> [1] 0.03754093 +#> [1] 0.03667466 ``` ------ +------------------------------------------------------------------------ ## Contributions @@ -122,37 +122,35 @@ our [contribution guidelines](https://github.com/tlverse/hal9001/blob/master/CONTRIBUTING.md) prior to submitting a pull request. ------ +------------------------------------------------------------------------ ## Citation After using the `hal9001` R package, please cite both of the following: -``` - @software{coyle2022hal9001-rpkg, - author = {Coyle, Jeremy R and Hejazi, Nima S and Phillips, Rachael V - and {van der Laan}, Lars and {van der Laan}, Mark J}, - title = {{hal9001}: The scalable highly adaptive lasso}, - year = {2022}, - url = {https://doi.org/10.5281/zenodo.3558313}, - doi = {10.5281/zenodo.3558313} - note = {{R} package version 0.4.2} - } - - @article{hejazi2020hal9001-joss, - author = {Hejazi, Nima S and Coyle, Jeremy R and {van der Laan}, Mark - J}, - title = {{hal9001}: Scalable highly adaptive lasso regression in - {R}}, - year = {2020}, - url = {https://doi.org/10.21105/joss.02526}, - doi = {10.21105/joss.02526}, - journal = {Journal of Open Source Software}, - publisher = {The Open Journal} - } -``` - ------ + @software{coyle2022hal9001-rpkg, + author = {Coyle, Jeremy R and Hejazi, Nima S and Phillips, Rachael V + and {van der Laan}, Lars and {van der Laan}, Mark J}, + title = {{hal9001}: The scalable highly adaptive lasso}, + year = {2022}, + url = {https://doi.org/10.5281/zenodo.3558313}, + doi = {10.5281/zenodo.3558313} + note = {{R} package version 0.4.2} + } + + @article{hejazi2020hal9001-joss, + author = {Hejazi, Nima S and Coyle, Jeremy R and {van der Laan}, Mark + J}, + title = {{hal9001}: Scalable highly adaptive lasso regression in + {R}}, + year = {2020}, + url = {https://doi.org/10.21105/joss.02526}, + doi = {10.21105/joss.02526}, + journal = {Journal of Open Source Software}, + publisher = {The Open Journal} + } + +------------------------------------------------------------------------ ## License @@ -162,13 +160,13 @@ Hejazi](https://nimahejazi.org) The contents of this repository are distributed under the GPL-3 license. See file `LICENSE` for details. ------ +------------------------------------------------------------------------ ## References -
Site built with pkgdown 2.0.2.
+Site built with pkgdown 2.0.3.
hal9001
+ hal9001
vignettes/intro_hal9001.Rmd
intro_hal9001.Rmd
The highly adaptive Lasso (HAL) is a flexible machine learning algorithm that nonparametrically estimates a function based on available data by embedding a set of input observations and covariates in an extremely high-dimensional space (i.e., generating basis functions from the available data). For an input data matrix of \(n\) observations and \(d\) covariates, the maximum number of zero-order basis functions generated is approximately \(n \cdot 2^{d - 1}\). To select a set of basis functions from among the (possibly reduced/screener) set that’s generated, the lasso is employed. The hal9001
R package (Hejazi, Coyle, and van der Laan 2020; Coyle, Hejazi, and van der Laan, n.d.) provides an efficient implementation of this routine, relying on the glmnet
R package (Friedman, Hastie, and Tibshirani 2010) for compatibility with the canonical Lasso implementation and using lasso regression with an input matrix composed of basis functions. Consult Benkeser and van der Laan (2016), (???), van der Laan (2017) for detailed theoretical descriptions of HAL and its various optimality properties.
The highly adaptive Lasso (HAL) is a flexible machine
+learning algorithm that nonparametrically estimates a function based on
+available data by embedding a set of input observations and covariates
+in an extremely high-dimensional space (i.e., generating basis functions
+from the available data). For an input data matrix of \(n\) observations and \(d\) covariates, the maximum number of
+zero-order basis functions generated is approximately \(n \cdot 2^{d - 1}\). To select a set of
+basis functions from among the (possibly reduced/screened) set that’s
+generated, the lasso is employed. The hal9001
R package
+(Hejazi, Coyle, and van der Laan 2020; Coyle,
+Hejazi, and van der Laan, n.d.) provides an efficient
+implementation of this routine, relying on the glmnet
R
+package (Friedman, Hastie, and Tibshirani
+2010) for compatibility with the canonical Lasso implementation
+and using lasso regression with an input matrix composed of basis
+functions. Consult Benkeser and van der Laan
+(2016), (vdl2015generally?), van der Laan (2017) for detailed theoretical
+descriptions of HAL and its various optimality properties.
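As a rough sense of scale, the bound above can be evaluated directly for a small toy problem (the numbers below are arbitrary and only illustrate the arithmetic, before any duplicate removal or screening):

```r
# Back-of-the-envelope count of zero-order basis functions
n <- 100 # observations
d <- 3   # covariates
n * 2^(d - 1)
#> [1] 400
```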
HAL uses the popular glmnet
R package for the lasso step:
HAL uses the popular glmnet
R package for the lasso
+step:
hal_fit <- fit_hal(X = x, Y = y)
hal_fit$times
## user.self sys.self elapsed user.child sys.child
-## enumerate_basis 0.017 0.000 0.017 0 0
-## design_matrix 0.090 0.000 0.091 0 0
+## enumerate_basis 0.017 0.000 0.018 0 0
+## design_matrix 0.082 0.003 0.086 0 0
## reduce_basis 0.000 0.000 0.000 0 0
## remove_duplicates 0.000 0.000 0.000 0 0
-## lasso 3.832 0.008 3.840 0 0
-## total 3.940 0.008 3.948 0 0
+## lasso 2.284 0.072 2.399 0 0
+## total 2.384 0.075 2.503 0 0
While the raw output object may be examined, it has (usually large) slots that make quick examination challenging. The summary
method provides an interpretable table of basis functions with non-zero coefficients. All terms (i.e., including the terms with zero coefficient) can be included by setting only_nonzero_coefs
to FALSE
when calling summary
on a hal9001
model object.
While the raw output object may be examined, it has (usually large)
+slots that make quick examination challenging. The summary
+method provides an interpretable table of basis functions with non-zero
+coefficients. All terms (i.e., including the terms with zero
+coefficient) can be included by setting only_nonzero_coefs
+to FALSE
when calling summary
on a
+hal9001
model object.
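For instance, a minimal sketch (assuming a fitted object such as `hal_fit` from the README example) that pulls the full coefficient table, zero coefficients included:

```r
# Show every basis function, including those with zero coefficients;
# this table can be very long even for moderately sized problems.
full_tbl <- summary(hal_fit, only_nonzero_coefs = FALSE)$table
head(full_tbl)
```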
##
@@ -237,7 +262,11 @@ Summarizing the model## [ I(x1 >= 0.594)*(x1 - 0.594)^1 ] * [ I(x3 >= -3.289)*(x3 - -3.289)^1 ]
## [ I(x1 >= -0.685)*(x1 - -0.685)^1 ] * [ I(x3 >= -3.289)*(x3 - -3.289)^1 ]
## term
-Note the length and width of these tables! The R environment might not be the optimal location to view the summary. Tip: Tables can be exported from R to LaTeX with the xtable
R package. Here’s an example: print(xtable(summary(fit)$table, type = "latex"), file = "haltbl_meow.tex")
.
Note the length and width of these tables! The R environment might
+not be the optimal location to view the summary. Tip: Tables can be
+exported from R to LaTeX with the xtable
R package. Here’s
+an example: print(xtable(summary(fit)$table, type = "latex"), file
+= "haltbl_meow.tex")
.
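Spelled out as a short, runnable sketch (the fit object and output file name are placeholders from the tip above; this assumes the xtable package is installed):

```r
# Export the summary table of a fitted HAL model to a LaTeX file
library(xtable)
hal_tbl <- summary(fit)$table
print(xtable(hal_tbl), type = "latex", file = "haltbl_meow.tex")
```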
As described in Benkeser and van der Laan (2016), the HAL algorithm operates by first constructing a set of basis functions and subsequently fitting a Lasso model with this set of basis functions as the design matrix. Several approaches are considered for reducing this set of basis functions: 1. Removing duplicated basis functions (done by default in the fit_hal
function), 2. Removing basis functions that correspond to only a small set of observations; a good rule of thumb is to scale with \(\frac{1}{\sqrt{n}}\), and that is the default.
The second of these two options may be modified by specifying the reduce_basis
argument to the fit_hal
function:
As described in Benkeser and van der Laan
+(2016), the HAL algorithm operates by first constructing a set of
+basis functions and subsequently fitting a Lasso model with this set of
+basis functions as the design matrix. Several approaches are considered
+for reducing this set of basis functions: 1. Removing duplicated basis
+functions (done by default in the fit_hal
function), 2.
+Removing basis functions that correspond to only a small set of
+observations; a good rule of thumb is to scale with \(\frac{1}{\sqrt{n}}\), and that is the
+default.
The second of these two options may be modified by specifying the
+reduce_basis
argument to the fit_hal
+function:
hal_fit_reduced <- fit_hal(X = x, Y = y, reduce_basis = 0.1)
hal_fit_reduced$times
## user.self sys.self elapsed user.child sys.child
-## enumerate_basis 0.013 0.000 0.014 0 0
-## design_matrix 0.084 0.000 0.084 0 0
+## enumerate_basis 0.026 0.005 0.031 0 0
+## design_matrix 0.080 0.002 0.082 0 0
## reduce_basis 0.000 0.000 0.000 0 0
## remove_duplicates 0.000 0.000 0.000 0 0
-## lasso 3.763 0.008 3.771 0 0
-## total 3.860 0.008 3.869 0 0
-In the above, all basis functions with fewer than 10% of observations meeting the criterion imposed are automatically removed prior to the Lasso step of fitting the HAL regression. The results appear below
+## lasso 1.951 0.063 2.030 0 0
+## total 2.057 0.070 2.143 0 0
+In the above, all basis functions with fewer than 10% of observations
+meeting the criterion imposed are automatically removed prior to the
+Lasso step of fitting the HAL regression. The results appear below
summary(hal_fit_reduced)$table
## coef
@@ -350,12 +391,42 @@ Reducing basis functions## 34: [ I(x3 >= -3.289)*(x3 - -3.289)^1 ]
## 35: [ I(x1 >= -3.224)*(x1 - -3.224)^1 ] * [ I(x2 >= -3.038)*(x2 - -3.038)^1 ] * [ I(x3 >= 1.202)*(x3 - 1.202)^1 ]
## term
-Other approaches exist for reducing the set of basis functions before they are actually created, which is essential for most real-world applications with HAL. Currently, we provide this “pre-screening” via num_knots
argument in hal_fit
. The num_knots
argument is akin to binning: it increases the coarseness of the approximation. num_knots
allows one to specify the number of knot points used to generate the basis functions for each/all interaction degree(s). This reduces the total number of basis functions generated, and thus the size of the optimization problem, and it can dramatically decrease runtime. One can pass in a vector of length max_degree
to num_knots
, specifying the number of knot points to use by interaction degree for each basis function. Thus, one can specify if interactions of higher degrees (e.g., two- or three- way interactions) should be more coarse. Increasing the coarseness of more complex basis functions helps prevent a combinatorial explosion of basis functions, which can easily occur when basis functions are generated for all possible knot points. We will show an example with num_knots
in the section that follows.
Other approaches exist for reducing the set of basis functions
+before they are actually created, which is essential for most
+real-world applications with HAL. Currently, we provide this
+“pre-screening” via num_knots
argument in
+hal_fit
. The num_knots
argument is akin to
+binning: it increases the coarseness of the approximation.
+num_knots
allows one to specify the number of knot points
+used to generate the basis functions for each/all interaction degree(s).
+This reduces the total number of basis functions generated, and thus the
+size of the optimization problem, and it can dramatically decrease
+runtime. One can pass in a vector of length max_degree
to
+num_knots
, specifying the number of knot points to use by
+interaction degree for each basis function. Thus, one can specify if
+interactions of higher degrees (e.g., two- or three- way interactions)
+should be more coarse. Increasing the coarseness of more complex basis
+functions helps prevent a combinatorial explosion of basis functions,
+which can easily occur when basis functions are generated for all
+possible knot points. We will show an example with
+num_knots
in the section that follows.
One might wish to enforce smoothness on the functional form of the HAL fit. This can be done using the smoothness_orders
argument. Setting smoothness_orders = 0
gives a piece-wise constant fit (via zero-order basis functions), allowing for discontinuous jumps in the function. This is useful if one does not want to assume any smoothness or continuity of the “true” function. Setting smoothness_orders = 1
gives a piece-wise linear fit (via first-order basis functions), which is continuous and mostly differentiable. In general, smoothness_orders = k
corresponds to a piece-wise polynomial fit of degree \(k\). Mathematically, smoothness_orders = k
corresponds with finding the best fit under the constraint that the total variation of the function’s \(k^{\text{th}}\) derivative is bounded by some constant, which is selected with cross-validation.
One might wish to enforce smoothness on the functional form of the
+HAL fit. This can be done using the smoothness_orders
+argument. Setting smoothness_orders = 0
gives a piece-wise
+constant fit (via zero-order basis functions), allowing for
+discontinuous jumps in the function. This is useful if one does not want
+to assume any smoothness or continuity of the “true” function. Setting
+smoothness_orders = 1
gives a piece-wise linear fit (via
+first-order basis functions), which is continuous and mostly
+differentiable. In general, smoothness_orders = k
+corresponds to a piece-wise polynomial fit of degree \(k\). Mathematically,
+smoothness_orders = k
corresponds with finding the best fit
+under the constraint that the total variation of the function’s \(k^{\text{th}}\) derivative is bounded by
+some constant, which is selected with cross-validation.
Let’s see this in action.
set.seed(98109)
@@ -393,7 +464,16 @@ Specifying smoothness of the HAL
long <- melt(dt, id = "x")
ggplot(long, aes(x = x, y = value, group = variable)) + geom_line()
Comparing the mean squared error (MSE) between the predictions and the true (denoised) outcome, the first- and second- order smoothed HAL is able to recover from the coarseness of the basis functions caused by the small num_knots
argument. Also, the HAL with second-order smoothness is able to fit the true function very well (as expected, since sin(x) is a very smooth function). The main benefit of imposing higher-order smoothness is that fewer knot points are required for a near-optimal fit. Therefore, one can safely pass a smaller value to num_knots
for a big decrease in runtime without sacrificing performance.
Comparing the mean squared error (MSE) between the predictions and
+the true (denoised) outcome, the first- and second- order smoothed HAL
+is able to recover from the coarseness of the basis functions caused by
+the small num_knots
argument. Also, the HAL with
+second-order smoothness is able to fit the true function very well (as
+expected, since sin(x) is a very smooth function). The main benefit of
+imposing higher-order smoothness is that fewer knot points are required
+for a near-optimal fit. Therefore, one can safely pass a smaller value
+to num_knots
for a big decrease in runtime without
+sacrificing performance.
mean((pred_0 - ytrue)^2)
## [1] 0.00732315
@@ -422,7 +502,17 @@
plot(x, pred_smooth_2, main = "Second order smoothness fit")
In general, if the basis functions are not coarse, then the performance for different smoothness orders is similar. Notice how the runtime is a fair bit slower when more knot points are considered. In general, we recommend either zero- or first- order smoothness. Second-order smoothness tends to be less robust and suffers from extrapolation on new data. One can also use cross-validation to data-adaptively choose the optimal smoothness (invoked in fit_hal
by setting adaptive_smoothing = TRUE
). Comparing the following simulation and the previous one, the HAL with second-order smoothness performed better when there were fewer knot points.
In general, if the basis functions are not coarse, then the
+performance for different smoothness orders is similar. Notice how the
+runtime is a fair bit slower when more knot points are considered. In
+general, we recommend either zero- or first- order smoothness.
+Second-order smoothness tends to be less robust and suffers from
+extrapolation on new data. One can also use cross-validation to
+data-adaptively choose the optimal smoothness (invoked in
+fit_hal
by setting adaptive_smoothing = TRUE
).
+Comparing the following simulation and the previous one, the HAL with
+second-order smoothness performed better when there were fewer knot
+points.
set.seed(98109)
n_covars <- 1
@@ -467,7 +557,19 @@ Specifying smoothness of the HAL
Formula interface
-One might wish to specify the functional form of the HAL fit further. This can be done using the formula interface. Specifically, the formula interface allows one to specify monotonicity constraints on components of the HAL fit. It also allows one to specify exactly which basis functions (e.g., interactions) one wishes to model. The formula_hal
function generates a formula
object from a user-supplied character string, and this formula
object contains the necessary specification information for fit_hal
and glmnet
. The formula_hal
function is intended for use within fit_hal
, and the user-supplied character string is inputted into fit_hal
. Here, we call formula_hal
directly for illustrative purposes.
+One might wish to specify the functional form of the HAL fit further.
+This can be done using the formula interface. Specifically, the formula
+interface allows one to specify monotonicity constraints on components
+of the HAL fit. It also allows one to specify exactly which basis
+functions (e.g., interactions) one wishes to model. The
+formula_hal
function generates a formula
+object from a user-supplied character string, and this
+formula
object contains the necessary specification
+information for fit_hal
and glmnet
. The
+formula_hal
function is intended for use within
+fit_hal
, and the user-supplied character string is inputted
+into fit_hal
. Here, we call formula_hal
+directly for illustrative purposes.
set.seed(98109)
num_knots <- 100
@@ -479,7 +581,13 @@ Formula interfaceX <- data.frame(x1 = x1, x2 = x2, A = A)
Y <- rowMeans(sin(X)) + rnorm(n_obs, mean = 0, sd = 0.2)
We can specify an additive model in a number of ways.
-The formula below includes the outcome, but formula_hal
doesn’t fit a HAL model, and doesn’t need the outcome (actually everything before “\(\tilde\)” is ignored in formula_hal
). This is why formula_hal
takes the input X
matrix of covariates, and not X
and Y
. In what follows, we include formulas with and without “y” in the character string.
+The formula below includes the outcome, but formula_hal
+doesn’t fit a HAL model, and doesn’t need the outcome (actually
+everything before the “~” is
+ignored in formula_hal
). This is why
+formula_hal
takes the input X
matrix of
+covariates, and not X
and Y
. In what follows,
+we include formulas with and without “y” in the character string.
# The `h` function is used to specify the basis functions for a given term
# h(x1) generates one-way basis functions for the variable x1
@@ -519,7 +627,12 @@ Formula interfaceformula <- formula_hal(
Y ~ h(x1, k=1) + h(x2, k=1) + h(A, k=1), X = X, smoothness_orders = 1, num_knots = 10
)
-The .
argument. We can generate an additive model for all or a subset of variables using the .
variable and .
argument of h
. By default, .
in h(.)
is treated as a wildcard and basis functions are generated by replacing the .
with all variables in X
.
+The .
argument. We can generate an additive model for
+all or a subset of variables using the .
variable and
+.
argument of h
. By default, .
in
+h(.)
is treated as a wildcard and basis functions are
+generated by replacing the .
with all variables in
+X
.
smoothness_orders <- 1
num_knots <- 5
@@ -560,7 +673,10 @@ Formula interfaceformula2 <- h(.) + h(., .)+ h(.,.,.)
length(formula1$basis_list ) == length(formula2$basis_list)
## [1] TRUE
-Sometimes, one might want to build an additive model, but include all two-way interactions with one variable (e.g., treatment “A”). This can be done in a variety of ways. The .
argument allows you to specify a subset of variables.
+Sometimes, one might want to build an additive model, but include all
+two-way interactions with one variable (e.g., treatment “A”). This can
+be done in a variety of ways. The .
argument allows you to
+specify a subset of variables.
# Write it all out
formula <- h(x1) + h(x2) + h(A) + h(A, x1) + h(A,x2)
@@ -581,7 +697,15 @@ Formula interfaceformula2 <- h(A,., . = c("x1"))
length(formula1$basis_list) == length(formula2$basis_list)
## [1] FALSE
-A key feature of the HAL formula is monotonicity constraints. Specifying these constraints is achieved by specifying the monotone
argument of h
. Note if smoothness_orders = 0 then this is a monotonicity constrain on the function, but if if smoothness_orders = 1 then this is a monotonicity constraint on the function’s derivative (e.g. a convexity constraint). We can also specify that certain terms are not penalized in the LASSO/glmnet using the pf
argument of h
(stands for penalty factor).
+A key feature of the HAL formula is monotonicity
+constraints. Specifying these constraints is achieved by
+specifying the monotone
argument of h
. Note if
+smoothness_orders = 0 then this is a monotonicity constraint on the
+function, but if smoothness_orders = 1 then this is a monotonicity
+constraint on the function’s derivative (e.g. a convexity constraint).
+We can also specify that certain terms are not penalized in the
+LASSO/glmnet using the pf
argument of h
+(stands for penalty factor).
# An additive monotone increasing model
formula <- formula_hal(
@@ -614,7 +738,9 @@ Formula interface# interaction glm
formula <- h(., ., s = 1, k = 1, pf = 0) + h(., s = 1, k = 1, pf = 0)
# Running HAL with this formula will be equivalent to running glm with the formula Y ~ .^2
-Now, that we’ve illustrated the options with formula_hal
, let’s show how to fit a HAL model with the specified formula.
+Now, that we’ve illustrated the options with
+formula_hal
, let’s show how to fit a HAL model with the
+specified formula.
# get formula object
fit <- fit_hal(
@@ -641,23 +767,34 @@ Formula interface
-References
+References
-
-
-Benkeser, David, and Mark J van der Laan. 2016. “The Highly Adaptive Lasso Estimator.” In 2016 IEEE International Conference on Data Science and Advanced Analytics (DSAA). IEEE. https://doi.org/10.1109/dsaa.2016.93.
+
+
+Benkeser, David, and Mark J van der Laan. 2016. “The Highly
+Adaptive Lasso Estimator.” In 2016 IEEE
+International Conference on Data Science and Advanced Analytics
+(DSAA). IEEE. https://doi.org/10.1109/dsaa.2016.93.
-
-Coyle, Jeremy R, Nima S Hejazi, and Mark J van der Laan. n.d. hal9001
: The Scalable Highly Adaptive Lasso (version 0.2.7). https://doi.org/10.5281/zenodo.3558313.
+
+Coyle, Jeremy R, Nima S Hejazi, and Mark J van der Laan. n.d.
+hal9001
: The Scalable Highly Adaptive
+Lasso (version 0.2.7). https://doi.org/10.5281/zenodo.3558313.
-
-Friedman, Jerome, Trevor Hastie, and Rob Tibshirani. 2010. “Regularization Paths for Generalized Linear Models via Coordinate Descent.” Journal of Statistical Software 33 (1): 1.
+
+Friedman, Jerome, Trevor Hastie, and Rob Tibshirani. 2010.
+“Regularization Paths for Generalized Linear Models via Coordinate
+Descent.” Journal of Statistical Software 33 (1): 1.
-
-Hejazi, Nima S, Jeremy R Coyle, and Mark J van der Laan. 2020. “hal9001: Scalable Highly Adaptive Lasso Regression in R.” Journal of Open Source Software 5 (53): 2526. https://doi.org/10.21105/joss.02526.
+
+Hejazi, Nima S, Jeremy R Coyle, and Mark J van der Laan. 2020.
+“hal9001: Scalable Highly Adaptive
+Lasso Regression in R.” Journal of Open Source
+Software 5 (53): 2526. https://doi.org/10.21105/joss.02526.
-
-van der Laan, Mark J. 2017. “Finite Sample Inference for Targeted Learning.” https://arxiv.org/abs/1708.09502.
+
+van der Laan, Mark J. 2017. “Finite Sample Inference for
+Targeted Learning.” https://arxiv.org/abs/1708.09502.
@@ -680,7 +817,7 @@ References
-Site built with pkgdown 2.0.2.
+Site built with pkgdown 2.0.3.
diff --git a/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-13-1.png b/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-13-1.png
index 66b130d2..32553fc6 100644
Binary files a/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-13-1.png and b/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-13-1.png differ
diff --git a/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-2-1.png b/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-2-1.png
index 3a44677f..7df64e57 100644
Binary files a/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-2-1.png and b/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-2-1.png differ
diff --git a/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-3-1.png b/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-3-1.png
index 31549fde..d12920ac 100644
Binary files a/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-3-1.png and b/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-3-1.png differ
diff --git a/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-3-2.png b/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-3-2.png
index ca8b1175..8f6da37c 100644
Binary files a/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-3-2.png and b/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-3-2.png differ
diff --git a/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-3-3.png b/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-3-3.png
index a4695e82..6b1c3032 100644
Binary files a/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-3-3.png and b/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-3-3.png differ
diff --git a/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-3-4.png b/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-3-4.png
index e359a501..957b9b53 100644
Binary files a/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-3-4.png and b/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-3-4.png differ
diff --git a/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-5-1.png b/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-5-1.png
index ca8b1175..8f6da37c 100644
Binary files a/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-5-1.png and b/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-5-1.png differ
diff --git a/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-5-2.png b/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-5-2.png
index a4695e82..6b1c3032 100644
Binary files a/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-5-2.png and b/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-5-2.png differ
diff --git a/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-5-3.png b/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-5-3.png
index 0c6c2172..f2a89afe 100644
Binary files a/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-5-3.png and b/docs/articles/intro_hal9001_files/figure-html/unnamed-chunk-5-3.png differ
diff --git a/docs/authors.html b/docs/authors.html
index 22290116..b4c87ab8 100644
--- a/docs/authors.html
+++ b/docs/authors.html
@@ -103,7 +103,7 @@ Citation
Coyle J, Hejazi N, Phillips R, van der Laan L, van der Laan M (2022).
hal9001: The scalable highly adaptive lasso.
-doi: 10.5281/zenodo.3558313, R package version 0.4.3, https://github.com/tlverse/hal9001.
+doi:10.5281/zenodo.3558313, R package version 0.4.3, https://github.com/tlverse/hal9001.
@Manual{,
title = {{hal9001}: The scalable highly adaptive lasso},
@@ -116,7 +116,7 @@ Citation
Hejazi N, Coyle J, van der Laan M (2020).
“hal9001: Scalable highly adaptive lasso regression in R.”
Journal of Open Source Software.
-doi: 10.21105/joss.02526, https://doi.org/10.21105/joss.02526.
+doi:10.21105/joss.02526, https://doi.org/10.21105/joss.02526.
@Article{,
title = {{hal9001}: Scalable highly adaptive lasso regression in {R}},
@@ -139,7 +139,7 @@ Citation
diff --git a/docs/index.html b/docs/index.html
index 8e7e4609..4faf8401 100644
--- a/docs/index.html
+++ b/docs/index.html
@@ -128,7 +128,7 @@ Example
# load the package and set a seed
library(hal9001)
#> Loading required package: Rcpp
-#> hal9001 v0.4.3: The Scalable Highly Adaptive Lasso
+#> hal9001 v0.4.5: The Scalable Highly Adaptive Lasso
#> note: fit_hal defaults have changed. See ?fit_hal for details
set.seed(385971)
@@ -143,17 +143,17 @@ Example
#> [1] "I'm sorry, Dave. I'm afraid I can't do that."
hal_fit$times
#> user.self sys.self elapsed user.child sys.child
-#> enumerate_basis 0.008 0.00 0.008 0 0
-#> design_matrix 0.003 0.00 0.003 0 0
-#> reduce_basis 0.000 0.00 0.000 0 0
-#> remove_duplicates 0.000 0.00 0.000 0 0
-#> lasso 3.012 0.01 3.023 0 0
-#> total 3.024 0.01 3.035 0 0
+#> enumerate_basis 0.008 0.001 0.009 0 0
+#> design_matrix 0.003 0.000 0.003 0 0
+#> reduce_basis 0.000 0.000 0.000 0 0
+#> remove_duplicates 0.000 0.000 0.001 0 0
+#> lasso 1.690 0.036 1.764 0 0
+#> total 1.702 0.037 1.778 0 0
# training sample prediction
preds <- predict(hal_fit, new_data = x)
mean(hal_mse <- (preds - y)^2)
-#> [1] 0.03754093
+#> [1] 0.03667466
@@ -166,27 +166,27 @@ ContributionsCitation
After using the hal9001
R package, please cite both of the following:
- @software{coyle2022hal9001-rpkg,
- author = {Coyle, Jeremy R and Hejazi, Nima S and Phillips, Rachael V
- and {van der Laan}, Lars and {van der Laan}, Mark J},
- title = {{hal9001}: The scalable highly adaptive lasso},
- year = {2022},
- url = {https://doi.org/10.5281/zenodo.3558313},
- doi = {10.5281/zenodo.3558313}
- note = {{R} package version 0.4.2}
- }
-
- @article{hejazi2020hal9001-joss,
- author = {Hejazi, Nima S and Coyle, Jeremy R and {van der Laan}, Mark
- J},
- title = {{hal9001}: Scalable highly adaptive lasso regression in
- {R}},
- year = {2020},
- url = {https://doi.org/10.21105/joss.02526},
- doi = {10.21105/joss.02526},
- journal = {Journal of Open Source Software},
- publisher = {The Open Journal}
- }
+@software{coyle2022hal9001-rpkg,
+  author = {Coyle, Jeremy R and Hejazi, Nima S and Phillips, Rachael V
+            and {van der Laan}, Lars and {van der Laan}, Mark J},
+  title = {{hal9001}: The scalable highly adaptive lasso},
+  year = {2022},
+  url = {https://doi.org/10.5281/zenodo.3558313},
+  doi = {10.5281/zenodo.3558313},
+  note = {{R} package version 0.4.2}
+}
+@article{hejazi2020hal9001-joss,
+  author = {Hejazi, Nima S and Coyle, Jeremy R and {van der Laan}, Mark J},
+  title = {{hal9001}: Scalable highly adaptive lasso regression in {R}},
+  year = {2020},
+  url = {https://doi.org/10.21105/joss.02526},
+  doi = {10.21105/joss.02526},
+  journal = {Journal of Open Source Software},
+  publisher = {The Open Journal}
+}
@@ -199,27 +199,27 @@ License
References
-
-
-Benkeser, David, and Mark J van der Laan. 2016. “The Highly Adaptive Lasso Estimator.” In 2016 IEEE International Conference on Data Science and Advanced Analytics (DSAA). IEEE. https://doi.org/10.1109/dsaa.2016.93.
+
+
+Benkeser, David, and Mark J van der Laan. 2016. “The Highly Adaptive Lasso Estimator.” In 2016 IEEE International Conference on Data Science and Advanced Analytics (DSAA). IEEE. https://doi.org/10.1109/dsaa.2016.93.
-
-Bibaut, Aurélien F, and Mark J van der Laan. 2019. “Fast Rates for Empirical Risk Minimization over Càdlàg Functions with Bounded Sectional Variation Norm.” https://arxiv.org/abs/1907.09244.
+
+Bibaut, Aurélien F, and Mark J van der Laan. 2019. “Fast Rates for Empirical Risk Minimization over Càdlàg Functions with Bounded Sectional Variation Norm.” https://arxiv.org/abs/1907.09244.
-
-Ertefaie, Ashkan, Nima S Hejazi, and Mark J van der Laan. 2020. “Nonparametric Inverse Probability Weighted Estimators Based on the Highly Adaptive Lasso.” https://arxiv.org/abs/2005.11303.
+
+Ertefaie, Ashkan, Nima S Hejazi, and Mark J van der Laan. 2020. “Nonparametric Inverse Probability Weighted Estimators Based on the Highly Adaptive Lasso.” https://arxiv.org/abs/2005.11303.
-
-van der Laan, Mark J. 2017a. “A Generally Efficient Targeted Minimum Loss Based Estimator Based on the Highly Adaptive Lasso.” The International Journal of Biostatistics. https://doi.org/10.1515/ijb-2015-0097.
+
+van der Laan, Mark J. 2017a. “A Generally Efficient Targeted Minimum Loss Based Estimator Based on the Highly Adaptive Lasso.” The International Journal of Biostatistics. https://doi.org/10.1515/ijb-2015-0097.
-
-———. 2017b. “Finite Sample Inference for Targeted Learning.” https://arxiv.org/abs/1708.09502.
+
+———. 2017b. “Finite Sample Inference for Targeted Learning.” https://arxiv.org/abs/1708.09502.
-
-van der Laan, Mark J, David Benkeser, and Weixin Cai. 2019. “Efficient Estimation of Pathwise Differentiable Target Parameters with the Undersmoothed Highly Adaptive Lasso.” https://arxiv.org/abs/1908.05607.
+
+van der Laan, Mark J, David Benkeser, and Weixin Cai. 2019. “Efficient Estimation of Pathwise Differentiable Target Parameters with the Undersmoothed Highly Adaptive Lasso.” https://arxiv.org/abs/1908.05607.
-
-van der Laan, Mark J, and Aurélien F Bibaut. 2017. “Uniform Consistency of the Highly Adaptive Lasso Estimator of Infinite-Dimensional Parameters.” https://arxiv.org/abs/1709.06256.
+
+van der Laan, Mark J, and Aurélien F Bibaut. 2017. “Uniform Consistency of the Highly Adaptive Lasso Estimator of Infinite-Dimensional Parameters.” https://arxiv.org/abs/1709.06256.
@@ -295,7 +295,7 @@ Dev status
diff --git a/docs/news/index.html b/docs/news/index.html
index f0ccb7cd..880a8638 100644
--- a/docs/news/index.html
+++ b/docs/news/index.html
@@ -107,7 +107,7 @@ hal9001 0.2.5
diff --git a/docs/pkgdown.yml b/docs/pkgdown.yml
index 264ee722..ce08e0d7 100644
--- a/docs/pkgdown.yml
+++ b/docs/pkgdown.yml
@@ -1,9 +1,9 @@
-pandoc: '2.5'
-pkgdown: 2.0.2
+pandoc: 2.17.0.1
+pkgdown: 2.0.3
pkgdown_sha: ~
articles:
intro_hal9001: intro_hal9001.html
-last_built: 2022-02-09T21:19Z
+last_built: 2022-11-04T20:06Z
urls:
reference: https://tlverse.org/hal9001/reference
article: https://tlverse.org/hal9001/articles
diff --git a/docs/reference/SL.hal9001.html b/docs/reference/SL.hal9001.html
index d0527f27..d10342df 100644
--- a/docs/reference/SL.hal9001.html
+++ b/docs/reference/SL.hal9001.html
@@ -144,7 +144,7 @@ Value
diff --git a/docs/reference/apply_copy_map.html b/docs/reference/apply_copy_map.html
index 17e5a645..609faab4 100644
--- a/docs/reference/apply_copy_map.html
+++ b/docs/reference/apply_copy_map.html
@@ -120,7 +120,7 @@ Examples
diff --git a/docs/reference/as_dgCMatrix.html b/docs/reference/as_dgCMatrix.html
index 1f6afbb7..19770364 100644
--- a/docs/reference/as_dgCMatrix.html
+++ b/docs/reference/as_dgCMatrix.html
@@ -95,7 +95,7 @@ Value
diff --git a/docs/reference/basis_list_cols.html b/docs/reference/basis_list_cols.html
index bbd64ea6..25e30700 100644
--- a/docs/reference/basis_list_cols.html
+++ b/docs/reference/basis_list_cols.html
@@ -122,7 +122,7 @@ Value
diff --git a/docs/reference/basis_of_degree.html b/docs/reference/basis_of_degree.html
index 5c4e015f..9e6d0da5 100644
--- a/docs/reference/basis_of_degree.html
+++ b/docs/reference/basis_of_degree.html
@@ -121,7 +121,7 @@ Value
cv_lasso()
Cross-validated Lasso on Indicator Bases
Cross-validated LASSO on Indicator Bases
index_first_copy()
Find Copies of Columns
Rcpp module: lassi_fit_module
Single Lasso estimation for cross-validation with Origami
Prediction from a Lassi Model
1e-7) {
-
- update_resid(j, beta_diff);
- beta[j] = new_beta;
- updates++;
- }
-
- double something = beta_diff * beta_diff;
- if(something>max_update){
- max_update=something;
- }
-
- if(std::abs(update) > lambda){
- if(step_num<2){
- // if not already, put in active set
- variable_state[j]=2;
- }
-
- } else {
- //put in strong if not currently and criteria met
- if(step_num==0){
-
- //update strong
- if(std::abs(update) > strong_criterion){
- variable_state[j]=1;
- }
-
- //update safe
- //we need to start checking this predictor again
- //when lambda gets smaller than safe_lambda
- double rnorm=std::sqrt(rss)/n;
- safe_lambda[j]=lambda*((rnorm+std::abs(update))/(rnorm+lambda));
- // Rcout << "rnorm: " << rnorm << " update: " << update << " current: "
- // << lambda << " next_safe: "<< safe_lambda[j] << std::endl;
- }
- }
- }
- }
-
- if(max_update