From 2e915c6e8bab9b31036ba9045cf3302cdef9d3dc Mon Sep 17 00:00:00 2001
From: Julien Chiquet <julien.chiquet@inrae.fr>
Date: Wed, 20 Nov 2024 18:13:29 +0100
Subject: [PATCH 1/7] putting sandwich back to business

---
 R/PLNfit-S3methods.R                 |  10 ++-
 R/PLNfit-class.R                     | 108 +++++++++------------------
 R/utils-zipln.R                      |   2 +-
 R/utils.R                            |   9 ++-
 inst/check/variance_estimates.R      |  13 ++--
 man/PLNfit.Rd                        |   2 +-
 man/PLNfit_fixedcov.Rd               |  50 +------------
 man/PLNnetworkfit.Rd                 |   2 +-
 man/standard_error.Rd                |   4 +-
 tests/testthat/test-standard-error.R |  13 +++-
 10 files changed, 70 insertions(+), 143 deletions(-)

diff --git a/R/PLNfit-S3methods.R b/R/PLNfit-S3methods.R
index 8fd95053..7dfe0dfd 100644
--- a/R/PLNfit-S3methods.R
+++ b/R/PLNfit-S3methods.R
@@ -175,7 +175,7 @@ standard_error <- function(object, type = c("variational", "jackknife", "sandwic
 
 #' @describeIn standard_error Component-wise standard errors of B in [`PLNfit`]
 #' @export
-standard_error.PLNfit <- function(object, type = c("variational", "jackknife", "bootstrap", "sandwich"), parameter = c("B", "Omega")) {
+standard_error.PLNfit <- function(object, type = c("variational", "sandwich", "jackknife", "bootstrap"), parameter = c("B", "Omega")) {
   type <- match.arg(type)
   par  <- match.arg(parameter)
   if (type == "variational" & is.null(attr(object$model_par$B, "variance_variational")))
@@ -184,14 +184,14 @@ standard_error.PLNfit <- function(object, type = c("variational", "jackknife", "
     stop("Jackknife estimation not available: rerun by setting `jackknife = TRUE` in the control list.")
   if (type == "bootstrap" & is.null(attr(object$model_par$B, "variance_bootstrap")))
     stop("Bootstrap estimation not available: rerun by setting `bootstrap > 0` in the control list.")
-  if (type == "sandwich")
-    stop("Sandwich estimator is only available for fixed covariance / precision matrix.")
+  if (type == "sandwich" & is.null(attr(object$model_par$B, "variance_sandwich")))
+    stop("Sandwich estimator not available: rerun by setting `sandwich_var = TRUE` in the control list.")
   attr(object$model_par[[par]], paste0("variance_", type)) %>% sqrt()
 }
 
 #' @describeIn standard_error Component-wise standard errors of B in [`PLNfit_fixedcov`]
 #' @export
-standard_error.PLNfit_fixedcov <- function(object, type = c("variational", "jackknife", "bootstrap", "sandwich"), parameter = c("B", "Omega")) {
+standard_error.PLNfit_fixedcov <- function(object, type = c("variational", "sandwich", "jackknife", "bootstrap"), parameter = c("B", "Omega")) {
   type <- match.arg(type)
   par  <- match.arg(parameter)
   if (par == "Omega")
@@ -202,5 +202,7 @@ standard_error.PLNfit_fixedcov <- function(object, type = c("variational", "jack
     stop("Jackknife estimation not available: rerun by setting `jackknife = TRUE` in the control list.")
   if (type == "bootstrap" & is.null(attr(object$model_par$B, "variance_bootstrap")))
     stop("Bootstrap estimation not available: rerun by setting `bootstrap > 0` in the control list.")
+  if (type == "sandwich" & is.null(attr(object$model_par$B, "variance_sandwich")))
+    stop("Sandwich estimator not available: rerun by setting `sandwich_var = TRUE` in the control list.")
   attr(object$model_par[[par]], paste0("variance_", type)) %>% sqrt()
 }
diff --git a/R/PLNfit-class.R b/R/PLNfit-class.R
index b964cab5..66e61b85 100644
--- a/R/PLNfit-class.R
+++ b/R/PLNfit-class.R
@@ -191,7 +191,7 @@ PLNfit <- R6Class(
     variance_variational = function(X, config = config_default_nlopt) {
     ## Variance of B for n data points
       fisher <- Matrix::bdiag(lapply(1:self$p, function(j) {
-        crossprod(X, private$A[, j] * X) # t(X) %*% diag(A[, i]) %*% X
+        crossprod(X, private$A[, j] * X) # t(X) %*% diag(A[, j]) %*% X
       }))
       vcov_B <- tryCatch(Matrix::solve(fisher), error = function(e) {e})
       if (is(vcov_B, "error")) {
@@ -220,22 +220,11 @@ PLNfit <- R6Class(
 
     compute_vcov_from_resamples = function(resamples){
       B_list = resamples %>% map("B")
-      #print (B_list)
       vcov_B = lapply(seq(1, ncol(private$B)), function(B_col){
         param_ests_for_col = B_list %>% map(~.x[, B_col])
         param_ests_for_col = do.call(rbind, param_ests_for_col)
-        #print (param_ests_for_col)
         row_vcov = cov(param_ests_for_col)
       })
-      #print ("vcov blocks")
-      #print (vcov_B)
-
-      #B_vcov <- resamples %>% map("B") %>% map(~( . )) %>% reduce(cov)
-
-      #var_jack   <- jacks %>% map("B") %>% map(~( (. - B_jack)^2)) %>% reduce(`+`) %>%
-      #  `dimnames<-`(dimnames(private$B))
-      #B_hat  <- private$B[,] ## strips attributes while preserving names
-
       vcov_B = Matrix::bdiag(vcov_B) %>% as.matrix()
 
       rownames(vcov_B) <- colnames(vcov_B) <-
@@ -244,18 +233,35 @@ PLNfit <- R6Class(
         ## Hack to make sure that species is first and varies slowest
         apply(1, paste0, collapse = "_")
 
-      #print (pheatmap::pheatmap(vcov_B, cluster_rows=FALSE, cluster_cols=FALSE))
-
-
-      #names = lapply(bootstrapped_df$cov_mat, function(m){ colnames(m)}) %>% unlist()
-      #rownames(bootstrapped_vhat) = names
-      #colnames(bootstrapped_vhat) = names
-
       vcov_B = methods::as(vcov_B, "dgCMatrix")
 
       return(vcov_B)
     },
 
+    vcov_sandwich_B = function(Y, X) {
+      getMat_iCnB <- function(i) {
+        a_i   <- as.numeric(private$A[i, ])
+        s2_i  <- as.numeric(private$S[i, ]**2)
+        omega <- as.numeric(diag(private$Omega))
+        diag_mat_i <- diag(1/a_i + s2_i^2 / (1 + s2_i * (a_i + omega)))
+        solve(private$Sigma + diag_mat_i)
+      }
+      YmA <- Y - private$A
+      Dn <- matrix(0, self$d*self$p, self$d*self$p)
+      Cn <- matrix(0, self$d*self$p, self$d*self$p)
+      for (i in 1:self$n) {
+        xxt_i <- tcrossprod(X[i, ])
+        Cn <- Cn - kronecker(getMat_iCnB(i) , xxt_i) / self$n
+        Dn <- Dn + kronecker(tcrossprod(YmA[i,]), xxt_i) / self$n
+      }
+      Cn_inv <- solve(Cn)
+      dim_names <- dimnames(attr(private$B, "vcov_variational"))
+      vcov_sand <- ((Cn_inv %*% Dn %*% Cn_inv) / self$n) %>% `dimnames<-`(dim_names)
+      attr(private$B, "vcov_sandwich") <- vcov_sand
+      attr(private$B, "variance_sandwich") <- matrix(diag(vcov_sand), nrow = self$d, ncol = self$p,
+                                                     dimnames = dimnames(private$B))
+    },
+
     variance_jackknife = function(Y, X, O, w, config = config_default_nlopt) {
       jacks <- future.apply::future_lapply(seq_len(self$n), function(i) {
         data <- list(Y = Y[-i, , drop = FALSE],
@@ -263,14 +269,11 @@ PLNfit <- R6Class(
                      O = O[-i, , drop = FALSE],
                      w = w[-i])
         args <- list(data = data,
-                     # params = list(B = private$B,
-                     #               M = matrix(0, self$n-1, self$p),
-                     #               S = private$S[-i, , drop = FALSE]),
                      params = do.call(compute_PLN_starting_point, data),
                      config = config)
         optim_out <- do.call(private$optimizer$main, args)
         optim_out[c("B", "Omega")]
-      })
+      }, future.seed = TRUE, future.scheduling = structure(TRUE, ordering = "random"))
 
       B_jack <- jacks %>% map("B") %>% reduce(`+`) / self$n
       var_jack   <- jacks %>% map("B") %>% map(~( (. - B_jack)^2)) %>% reduce(`+`) %>%
@@ -300,19 +303,15 @@ PLNfit <- R6Class(
         if (config$backend == "torch") # Convert data to torch tensors
           data   <- lapply(data, torch_tensor, device = config$device)                         # list with Y, X, O, w
 
-        #print (data$Y$device)
-
         args <- list(data = data,
-                     # params = list(B = private$B, M = matrix(0,self$n,self$p), S = private$S[resample, ]),
                      params = do.call(compute_PLN_starting_point, data),
                      config = config)
         if (config$backend == "torch") # Convert data to torch tensors
           args$params <- lapply(args$params, torch_tensor, requires_grad = TRUE, device = config$device) # list with B, M, S
 
         optim_out <- do.call(private$optimizer$main, args)
-        #print (optim_out)
         optim_out[c("B", "Omega", "monitoring")]
-      })
+      }, future.seed = TRUE, future.scheduling = structure(TRUE, ordering = "random"))
 
       B_boots <- boots %>% map("B") %>% reduce(`+`) / n_resamples
       attr(private$B, "variance_bootstrap") <-
@@ -455,7 +454,7 @@ PLNfit <- R6Class(
     #' * jackknife boolean indicating whether jackknife should be performed to evaluate bias and variance of the model parameters. Default is FALSE.
     #' * bootstrap integer indicating the number of bootstrap resamples generated to evaluate the variance of the model parameters. Default is 0 (inactivated).
     #' * variational_var boolean indicating whether variational Fisher information matrix should be computed to estimate the variance of the model parameters (highly underestimated). Default is FALSE.
-    #' * rsquared boolean indicating whether approximation of R2 based on deviance should be computed. Default is TRUE
+    #' * sandwich_var boolean indicating whether sandwich estimator should be computed to estimate the variance of the model parameters (highly underestimated). Default is FALSE.
     #' * trace integer for verbosity. should be > 1 to see output in post-treatments
     postTreatment = function(responses, covariates, offsets, weights = rep(1, nrow(responses)), config_post, config_optim, nullModel = NULL) {
       ## PARAMATERS DIMNAMES
@@ -496,6 +495,11 @@ PLNfit <- R6Class(
         }
         private$variance_bootstrap(responses, covariates, offsets, weights, n_resamples=config_post$bootstrap, config = config_optim)
       }
+      ## 5. compute and store matrix of standard variances for B with sandwich correction approximation
+      if (config_post$sandwich_var) {
+        if(config_post$trace > 1) cat("\n\tComputing sandwich estimator of the variance...")
+        private$vcov_sandwich_B(responses, covariates)
+      }
     },
 
     #' @description Predict position, scores or observations of new data.
@@ -920,25 +924,8 @@ PLNfit_fixedcov <- R6Class(
       optim_out <- do.call(private$optimizer$main, args)
       do.call(self$update, optim_out)
       private$Sigma <- solve(optim_out$Omega)
-    },
-
-    #' @description Update R2, fisher and std_err fields after optimization
-    #' @param config_post a list for controlling the post-treatments (optional bootstrap, jackknife, R2, etc.). See details
-    #' @param config_optim a list for controlling the optimization parameter. See details
-    #' @details The list of parameters `config` controls the post-treatment processing, with the following entries:
-    #' * trace integer for verbosity. should be > 1 to see output in post-treatments
-    #' * jackknife boolean indicating whether jackknife should be performed to evaluate bias and variance of the model parameters. Default is FALSE.
-    #' * bootstrap integer indicating the number of bootstrap resamples generated to evaluate the variance of the model parameters. Default is 0 (inactivated).
-    #' * variational_var boolean indicating whether variational Fisher information matrix should be computed to estimate the variance of the model parameters (highly underestimated). Default is FALSE.
-    #' * rsquared boolean indicating whether approximation of R2 based on deviance should be computed. Default is TRUE
-    postTreatment = function(responses, covariates, offsets, weights = rep(1, nrow(responses)), config_post, config_optim, nullModel = NULL) {
-      super$postTreatment(responses, covariates, offsets, weights, config_post, config_optim, nullModel)
-      ## 6. compute and store matrix of standard variances for B with sandwich correction approximation
-      if (config_post$sandwich_var) {
-        if(config_post$trace > 1) cat("\n\tComputing sandwich estimator of the variance...")
-        private$vcov_sandwich_B(responses, covariates)
-      }
     }
+
   ),
   private = list(
     ## %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
@@ -976,7 +963,7 @@ PLNfit_fixedcov <- R6Class(
                      config = config)
         optim_out <- do.call(private$optimizer$main, args)
         optim_out[c("B", "Omega")]
-      }, future.seed = TRUE)
+      }, future.seed = TRUE, future.scheduling = structure(TRUE, ordering = "random"))
 
       B_jack <- jacks %>% map("B") %>% reduce(`+`) / self$n
       var_jack   <- jacks %>% map("B") %>% map(~( (. - B_jack)^2)) %>% reduce(`+`) %>%
@@ -984,31 +971,6 @@ PLNfit_fixedcov <- R6Class(
       B_hat  <- private$B[,] ## strips attributes while preserving names
       attr(private$B, "bias") <- (self$n - 1) * (B_jack - B_hat)
       attr(private$B, "variance_jackknife") <- (self$n - 1) / self$n * var_jack
-    },
-
-    vcov_sandwich_B = function(Y, X) {
-      getMat_iCnB <- function(i) {
-        a_i   <- as.numeric(private$A[i, ])
-        s2_i  <- as.numeric(private$S[i, ]**2)
-        # omega <- as.numeric(1/diag(private$Sigma))
-        # diag_mat_i <- diag(1/a_i + s2_i^2 / (1 + s2_i * (a_i + omega)))
-        diag_mat_i <- diag(1/a_i + .5 * s2_i^2)
-        solve(private$Sigma + diag_mat_i)
-      }
-      YmA <- Y - private$A
-      Dn <- matrix(0, self$d*self$p, self$d*self$p)
-      Cn <- matrix(0, self$d*self$p, self$d*self$p)
-      for (i in 1:self$n) {
-        xxt_i <- tcrossprod(X[i, ])
-        Cn <- Cn - kronecker(getMat_iCnB(i) , xxt_i) / (self$n)
-        Dn <- Dn + kronecker(tcrossprod(YmA[i,]), xxt_i) / (self$n)
-      }
-      Cn_inv <- solve(Cn)
-      dim_names <- dimnames(attr(private$B, "vcov_variational"))
-      vcov_sand <- ((Cn_inv %*% Dn %*% Cn_inv) / self$n) %>% `dimnames<-`(dim_names)
-      attr(private$B, "vcov_sandwich") <- vcov_sand
-      attr(private$B, "variance_sandwich") <- matrix(diag(vcov_sand), nrow = self$d, ncol = self$p,
-                                                         dimnames = dimnames(private$B))
     }
   ),
   active = list(
diff --git a/R/utils-zipln.R b/R/utils-zipln.R
index 59e9233a..f62cdc0f 100644
--- a/R/utils-zipln.R
+++ b/R/utils-zipln.R
@@ -27,7 +27,7 @@ extract_model_zi <- function(call, envir) {
   call_args <- c(as.list(call_args), list(xlev = attr(call$formula, "xlevels"), na.action = NULL))
 
   ## Extract terms for ZI and PLN components
-  terms <- .extract_terms_zi(as.formula(eval(call$formula, env = envir)))
+  terms <- .extract_terms_zi(as.formula(eval(call$formula, envir = envir)))
   ## eval the call in the parent environment with adjustement due to ZI terms
   call_args$formula <- terms$formula
   frame <- do.call(stats::model.frame, call_args, envir = envir)
diff --git a/R/utils.R b/R/utils.R
index 2ccba19c..204861b8 100644
--- a/R/utils.R
+++ b/R/utils.R
@@ -55,7 +55,8 @@ config_post_default_PLNLDA <-
     jackknife       = FALSE,
     bootstrap       = 0L,
     rsquared        = TRUE,
-    variational_var = FALSE
+    variational_var = FALSE,
+    sandwich_var    = FALSE
   )
 
 config_post_default_PLNPCA <-
@@ -63,7 +64,8 @@ config_post_default_PLNPCA <-
     jackknife       = FALSE,
     bootstrap       = 0L,
     rsquared        = TRUE,
-    variational_var = FALSE
+    variational_var = FALSE,
+    sandwich_var    = FALSE
   )
 
 config_post_default_PLNmixture <-
@@ -71,7 +73,8 @@ config_post_default_PLNmixture <-
     jackknife       = FALSE,
     bootstrap       = 0L,
     rsquared        = TRUE,
-    variational_var = FALSE
+    variational_var = FALSE,
+    sandwich_var    = FALSE
   )
 
 status_to_message <- function(status) {
diff --git a/inst/check/variance_estimates.R b/inst/check/variance_estimates.R
index 65cafab7..8eebc43c 100644
--- a/inst/check/variance_estimates.R
+++ b/inst/check/variance_estimates.R
@@ -13,7 +13,7 @@ Y <- rPLN(n = nrow(X), mu = X %*% B, Sigma = params$Sigma, depths = params$depth
 data <- prepare_data(Y, X, offset = "none")
 logO <- attr(Y, "offsets")
 
-conf <- list(variational_var = TRUE, jackknife = TRUE, bootstrap = nrow(Y))
+conf <- list(variational_var = TRUE, jackknife = TRUE, bootstrap = nrow(Y), sandwich_var = TRUE)
 future::plan("multicore", workers = nb_cores)
 model <- PLN(Abundance ~ 0 + . + offset(logO), data = data, control = PLN_param(config_post = conf))
 future::plan("sequential")
@@ -22,12 +22,15 @@ B_hat <- coef(model)
 B_se_var <- standard_error(model, "variational")
 B_se_jk  <- standard_error(model, "jackknife")
 B_se_bt  <- standard_error(model, "bootstrap")
+B_se_var <- standard_error(model, "variational")
+B_se_jk  <- standard_error(model, "jackknife")
+B_se_sw  <- standard_error(model, "sandwich")
 
 data.frame(
-  B = rep(c(B), 3),
-  B_hat = rep(c(B_hat), 3),
-  se = c(B_se_var, B_se_jk, B_se_bt),
-  method = rep(c("variational", "jackknife", "bootstrap"), each = length(c(B))) ) %>%
+  B = rep(c(B), 4),
+  B_hat = rep(c(B_hat), 4),
+  se = c(B_se_var, B_se_jk, B_se_bt, B_se_sw),
+  method = rep(c("variational", "jackknife", "bootstrap", "sandwich"), each = length(c(B))) ) %>%
   ggplot(aes(x = B, y = B_hat)) +
   geom_errorbar(aes(ymin = B_hat - 2 * se,
                     ymax = B_hat + 2 * se), color = "blue") + facet_wrap(~ method) +
diff --git a/man/PLNfit.Rd b/man/PLNfit.Rd
index 303c21cb..f99471c0 100644
--- a/man/PLNfit.Rd
+++ b/man/PLNfit.Rd
@@ -273,7 +273,7 @@ The list of parameters \code{config} controls the post-treatment processing, wit
 \item jackknife boolean indicating whether jackknife should be performed to evaluate bias and variance of the model parameters. Default is FALSE.
 \item bootstrap integer indicating the number of bootstrap resamples generated to evaluate the variance of the model parameters. Default is 0 (inactivated).
 \item variational_var boolean indicating whether variational Fisher information matrix should be computed to estimate the variance of the model parameters (highly underestimated). Default is FALSE.
-\item rsquared boolean indicating whether approximation of R2 based on deviance should be computed. Default is TRUE
+\item sandwich_var boolean indicating whether sandwich estimator should be computed to estimate the variance of the model parameters (highly underestimated). Default is FALSE.
 \item trace integer for verbosity. should be > 1 to see output in post-treatments
 }
 }
diff --git a/man/PLNfit_fixedcov.Rd b/man/PLNfit_fixedcov.Rd
index 52e75903..d0e39325 100644
--- a/man/PLNfit_fixedcov.Rd
+++ b/man/PLNfit_fixedcov.Rd
@@ -36,7 +36,6 @@ print(myPLN)
 \itemize{
 \item \href{#method-PLNfit_fixedcov-new}{\code{PLNfit_fixedcov$new()}}
 \item \href{#method-PLNfit_fixedcov-optimize}{\code{PLNfit_fixedcov$optimize()}}
-\item \href{#method-PLNfit_fixedcov-postTreatment}{\code{PLNfit_fixedcov$postTreatment()}}
 \item \href{#method-PLNfit_fixedcov-clone}{\code{PLNfit_fixedcov$clone()}}
 }
 }
@@ -44,6 +43,7 @@ print(myPLN)
 <details><summary>Inherited methods</summary>
 <ul>
 <li><span class="pkg-link" data-pkg="PLNmodels" data-topic="PLNfit" data-id="optimize_vestep"><a href='../../PLNmodels/html/PLNfit.html#method-PLNfit-optimize_vestep'><code>PLNmodels::PLNfit$optimize_vestep()</code></a></span></li>
+<li><span class="pkg-link" data-pkg="PLNmodels" data-topic="PLNfit" data-id="postTreatment"><a href='../../PLNmodels/html/PLNfit.html#method-PLNfit-postTreatment'><code>PLNmodels::PLNfit$postTreatment()</code></a></span></li>
 <li><span class="pkg-link" data-pkg="PLNmodels" data-topic="PLNfit" data-id="predict"><a href='../../PLNmodels/html/PLNfit.html#method-PLNfit-predict'><code>PLNmodels::PLNfit$predict()</code></a></span></li>
 <li><span class="pkg-link" data-pkg="PLNmodels" data-topic="PLNfit" data-id="predict_cond"><a href='../../PLNmodels/html/PLNfit.html#method-PLNfit-predict_cond'><code>PLNmodels::PLNfit$predict_cond()</code></a></span></li>
 <li><span class="pkg-link" data-pkg="PLNmodels" data-topic="PLNfit" data-id="print"><a href='../../PLNmodels/html/PLNfit.html#method-PLNfit-print'><code>PLNmodels::PLNfit$print()</code></a></span></li>
@@ -103,54 +103,6 @@ Call to the NLopt or TORCH optimizer and update of the relevant fields
 }
 \if{html}{\out{</div>}}
 }
-}
-\if{html}{\out{<hr>}}
-\if{html}{\out{<a id="method-PLNfit_fixedcov-postTreatment"></a>}}
-\if{latex}{\out{\hypertarget{method-PLNfit_fixedcov-postTreatment}{}}}
-\subsection{Method \code{postTreatment()}}{
-Update R2, fisher and std_err fields after optimization
-\subsection{Usage}{
-\if{html}{\out{<div class="r">}}\preformatted{PLNfit_fixedcov$postTreatment(
-  responses,
-  covariates,
-  offsets,
-  weights = rep(1, nrow(responses)),
-  config_post,
-  config_optim,
-  nullModel = NULL
-)}\if{html}{\out{</div>}}
-}
-
-\subsection{Arguments}{
-\if{html}{\out{<div class="arguments">}}
-\describe{
-\item{\code{responses}}{the matrix of responses (called Y in the model). Will usually be extracted from the corresponding field in PLNfamily-class}
-
-\item{\code{covariates}}{design matrix (called X in the model). Will usually be extracted from the corresponding field in PLNfamily-class}
-
-\item{\code{offsets}}{offset matrix (called O in the model). Will usually be extracted from the corresponding field in PLNfamily-class}
-
-\item{\code{weights}}{an optional vector of observation weights to be used in the fitting process.}
-
-\item{\code{config_post}}{a list for controlling the post-treatments (optional bootstrap, jackknife, R2, etc.). See details}
-
-\item{\code{config_optim}}{a list for controlling the optimization parameter. See details}
-
-\item{\code{nullModel}}{null model used for approximate R2 computations. Defaults to a GLM model with same design matrix but not latent variable.}
-}
-\if{html}{\out{</div>}}
-}
-\subsection{Details}{
-The list of parameters \code{config} controls the post-treatment processing, with the following entries:
-\itemize{
-\item trace integer for verbosity. should be > 1 to see output in post-treatments
-\item jackknife boolean indicating whether jackknife should be performed to evaluate bias and variance of the model parameters. Default is FALSE.
-\item bootstrap integer indicating the number of bootstrap resamples generated to evaluate the variance of the model parameters. Default is 0 (inactivated).
-\item variational_var boolean indicating whether variational Fisher information matrix should be computed to estimate the variance of the model parameters (highly underestimated). Default is FALSE.
-\item rsquared boolean indicating whether approximation of R2 based on deviance should be computed. Default is TRUE
-}
-}
-
 }
 \if{html}{\out{<hr>}}
 \if{html}{\out{<a id="method-PLNfit_fixedcov-clone"></a>}}
diff --git a/man/PLNnetworkfit.Rd b/man/PLNnetworkfit.Rd
index 7e531d24..5dad7d68 100644
--- a/man/PLNnetworkfit.Rd
+++ b/man/PLNnetworkfit.Rd
@@ -62,11 +62,11 @@ The function \code{\link[=PLNnetwork]{PLNnetwork()}}, the class \code{\link{PLNn
 <details><summary>Inherited methods</summary>
 <ul>
 <li><span class="pkg-link" data-pkg="PLNmodels" data-topic="PLNfit" data-id="optimize_vestep"><a href='../../PLNmodels/html/PLNfit.html#method-PLNfit-optimize_vestep'><code>PLNmodels::PLNfit$optimize_vestep()</code></a></span></li>
+<li><span class="pkg-link" data-pkg="PLNmodels" data-topic="PLNfit" data-id="postTreatment"><a href='../../PLNmodels/html/PLNfit.html#method-PLNfit-postTreatment'><code>PLNmodels::PLNfit$postTreatment()</code></a></span></li>
 <li><span class="pkg-link" data-pkg="PLNmodels" data-topic="PLNfit" data-id="predict"><a href='../../PLNmodels/html/PLNfit.html#method-PLNfit-predict'><code>PLNmodels::PLNfit$predict()</code></a></span></li>
 <li><span class="pkg-link" data-pkg="PLNmodels" data-topic="PLNfit" data-id="predict_cond"><a href='../../PLNmodels/html/PLNfit.html#method-PLNfit-predict_cond'><code>PLNmodels::PLNfit$predict_cond()</code></a></span></li>
 <li><span class="pkg-link" data-pkg="PLNmodels" data-topic="PLNfit" data-id="print"><a href='../../PLNmodels/html/PLNfit.html#method-PLNfit-print'><code>PLNmodels::PLNfit$print()</code></a></span></li>
 <li><span class="pkg-link" data-pkg="PLNmodels" data-topic="PLNfit" data-id="update"><a href='../../PLNmodels/html/PLNfit.html#method-PLNfit-update'><code>PLNmodels::PLNfit$update()</code></a></span></li>
-<li><span class="pkg-link" data-pkg="PLNmodels" data-topic="PLNfit_fixedcov" data-id="postTreatment"><a href='../../PLNmodels/html/PLNfit_fixedcov.html#method-PLNfit_fixedcov-postTreatment'><code>PLNmodels::PLNfit_fixedcov$postTreatment()</code></a></span></li>
 </ul>
 </details>
 }}
diff --git a/man/standard_error.Rd b/man/standard_error.Rd
index 37b81b1e..bfbc38df 100644
--- a/man/standard_error.Rd
+++ b/man/standard_error.Rd
@@ -24,13 +24,13 @@ standard_error(
 
 \method{standard_error}{PLNfit}(
   object,
-  type = c("variational", "jackknife", "bootstrap", "sandwich"),
+  type = c("variational", "sandwich", "jackknife", "bootstrap"),
   parameter = c("B", "Omega")
 )
 
 \method{standard_error}{PLNfit_fixedcov}(
   object,
-  type = c("variational", "jackknife", "bootstrap", "sandwich"),
+  type = c("variational", "sandwich", "jackknife", "bootstrap"),
   parameter = c("B", "Omega")
 )
 
diff --git a/tests/testthat/test-standard-error.R b/tests/testthat/test-standard-error.R
index e7136cea..d8b54a57 100644
--- a/tests/testthat/test-standard-error.R
+++ b/tests/testthat/test-standard-error.R
@@ -12,7 +12,7 @@ test_that("Check that fisher and standard_error return objects with proper dimen
   d <- myPLN_cov$d
 
 
-  sem <- standard_error(myPLN_cov)
+  sem <- standard_error(myPLN_cov, "variational")
   ## Dimensions
   expect_equal(dim(sem), c(d, p))
 
@@ -50,7 +50,7 @@ test_that("Check temporal consistency of Fisher matrix for PLN models with no co
 
   n <- nrow(myPLN$fitted)
   ## Consistency of the diagonal of the fisher matrix
-  fim.diag <- 1/(n * standard_error(myPLN)^2)
+  fim.diag <- 1/(n * standard_error(myPLN, "variational")^2)
   ## Values computed on the 2018/12/11 with PLNmodels version 0.5.9601)
   expected.fim.diag <- c(0.0612123698810698, 0.0612384161054906, 3.73462487824109, 0.122467107738817,
                          122.19280897578, 2.2230572191967, 0.285741065637069, 0.285687659219944,
@@ -59,7 +59,7 @@ test_that("Check temporal consistency of Fisher matrix for PLN models with no co
                          5.93888146445577)
 
   ## Consistency of the standard error matrix
-  sem <- standard_error(myPLN) %>% as.numeric()
+  sem <- standard_error(myPLN, "variational") %>% as.numeric()
   ## Values computed on the 2018/12/11 with PLNmodels version 0.5.9601)
   expected.sem <-
     c(0.577407423403546, 0.577284617461014, 0.0739228099688871, 0.40821807394677,
@@ -91,21 +91,24 @@ test_that("Check that variance estimation are coherent in PLNfit",  {
       jackknife       = TRUE,
       bootstrap       = 50L,
       variational_var = TRUE,
+      sandwich_var    = TRUE,
       rsquared        = FALSE,
       trace           = 2
     )
 
-  config_optim <- config_default_nlopt
+  config_optim <- PLNmodels:::config_default_nlopt
   myPLN$postTreatment(Y, X, log_O, config_post = config_post, config_optim = config_optim)
 
 
   tr_variational <- sum(standard_error(myPLN, "variational")^2)
   tr_bootstrap   <- sum(standard_error(myPLN, "bootstrap")^2)
   tr_jackknife   <- sum(standard_error(myPLN, "jackknife")^2)
+  tr_sandwich    <- sum(standard_error(myPLN, "sandwich")^2)
 
   expect_gt(tr_variational, 0)
   expect_gt(tr_jackknife  , 0)
   expect_gt(tr_bootstrap  , 0)
+  expect_gt(tr_sandwich   , 0)
 
   ## using control parameters
   myPLN_prime <- PLN(Abundance ~ Var_1 + 0 + offset(log(Offset)), data = data, control = PLN_param(config_post = config_post))
@@ -113,10 +116,12 @@ test_that("Check that variance estimation are coherent in PLNfit",  {
   tr_variational <- sum(standard_error(myPLN_prime, "variational")^2)
   tr_bootstrap   <- sum(standard_error(myPLN_prime, "bootstrap")^2)
   tr_jackknife   <- sum(standard_error(myPLN_prime, "jackknife")^2)
+  tr_sandwich    <- sum(standard_error(myPLN_prime, "sandwich")^2)
 
   expect_gt(tr_variational, 0)
   expect_gt(tr_jackknife  , 0)
   expect_gt(tr_bootstrap  , 0)
+  expect_gt(tr_sandwich  , 0)
 })
 
 test_that("Check that variance estimation are coherent in PLNnetwork",  {

From bee4365bbc0bc6876781b6226760a41c04e1877d Mon Sep 17 00:00:00 2001
From: Julien Chiquet <julien.chiquet@inrae.fr>
Date: Thu, 21 Nov 2024 10:42:04 +0100
Subject: [PATCH 2/7] cosmetics.

---
 R/PLNfit-class.R                | 8 ++++----
 inst/check/variance_estimates.R | 7 -------
 2 files changed, 4 insertions(+), 11 deletions(-)

diff --git a/R/PLNfit-class.R b/R/PLNfit-class.R
index 66e61b85..218ff1e7 100644
--- a/R/PLNfit-class.R
+++ b/R/PLNfit-class.R
@@ -240,10 +240,10 @@ PLNfit <- R6Class(
 
     vcov_sandwich_B = function(Y, X) {
       getMat_iCnB <- function(i) {
-        a_i   <- as.numeric(private$A[i, ])
-        s2_i  <- as.numeric(private$S[i, ]**2)
+        a_i <- as.numeric(private$A[i, ])
+        s_i <- as.numeric(private$S[i, ])
         omega <- as.numeric(diag(private$Omega))
-        diag_mat_i <- diag(1/a_i + s2_i^2 / (1 + s2_i * (a_i + omega)))
+        diag_mat_i <- diag(1/a_i + s_i^4 / (1 + s_i^2 * (a_i + omega)), nrow = length(a_i)) # explicit nrow: stays 1x1 when p = 1
         solve(private$Sigma + diag_mat_i)
       }
       YmA <- Y - private$A
@@ -301,7 +301,7 @@ PLNfit <- R6Class(
                      O = O[resample, , drop = FALSE],
                      w = w[resample])
         if (config$backend == "torch") # Convert data to torch tensors
-          data   <- lapply(data, torch_tensor, device = config$device)                         # list with Y, X, O, w
+          data   <- lapply(data, torch_tensor, device = config$device)
 
         args <- list(data = data,
                      params = do.call(compute_PLN_starting_point, data),
diff --git a/inst/check/variance_estimates.R b/inst/check/variance_estimates.R
index 8eebc43c..ff8624a5 100644
--- a/inst/check/variance_estimates.R
+++ b/inst/check/variance_estimates.R
@@ -2,9 +2,6 @@ library(tidyverse)
 library(PLNmodels)
 set.seed(1234)
 
-nb_cores <- 10
-options(future.fork.enable = TRUE)
-
 params <- PLNmodels:::create_parameters(n = 50, p = 10, d = 1, depths = 1e3)
 X <- params$X
 B <- params$B
@@ -14,16 +11,12 @@ data <- prepare_data(Y, X, offset = "none")
 logO <- attr(Y, "offsets")
 
 conf <- list(variational_var = TRUE, jackknife = TRUE, bootstrap = nrow(Y), sandwich_var = TRUE)
-future::plan("multicore", workers = nb_cores)
 model <- PLN(Abundance ~ 0 + . + offset(logO), data = data, control = PLN_param(config_post = conf))
-future::plan("sequential")
 
 B_hat <- coef(model)
 B_se_var <- standard_error(model, "variational")
 B_se_jk  <- standard_error(model, "jackknife")
 B_se_bt  <- standard_error(model, "bootstrap")
-B_se_var <- standard_error(model, "variational")
-B_se_jk  <- standard_error(model, "jackknife")
 B_se_sw  <- standard_error(model, "sandwich")
 
 data.frame(

From 46fd6c3f4cd50df29b67a96a99685235e4424bb5 Mon Sep 17 00:00:00 2001
From: Julien Chiquet <julien.chiquet@inrae.fr>
Date: Thu, 21 Nov 2024 16:51:33 +0100
Subject: [PATCH 3/7] creating file for cpp imp of sandwich

---
 src/utils-R.cpp | 50 +++++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 50 insertions(+)
 create mode 100644 src/utils-R.cpp

diff --git a/src/utils-R.cpp b/src/utils-R.cpp
new file mode 100644
index 00000000..470772b9
--- /dev/null
+++ b/src/utils-R.cpp
@@ -0,0 +1,50 @@
+#include "RcppArmadillo.h"
+
+// [[Rcpp::depends(RcppArmadillo)]]
+
+#include "utils.h"
+
+// [[Rcpp::export]]
+arma::mat get_sandwich_variance_B(
+  const arma::mat & Y,
+  const arma::mat & X,
+  const arma::mat & A,
+  const arma::mat & S,
+  const arma::mat & Sigma,
+  const arma::vec & Diag_Omega
+) {
+
+
+  arma::mat get_iCnB = [&A, &S, &D_omega, &Sigma](
+      ) {
+
+
+    return ;
+  }
+
+
+
+  return ;
+}
+
+// vcov_sandwich_B = function(Y, X) {
+//  getMat_iCnB <- function(i) {
+//     a_i <- as.numeric(private$A[i, ])
+//     s_i <- as.numeric(private$S[i, ])
+//     omega <- as.numeric(diag(private$Omega))
+//     diag_mat_i <- diag(1/a_i + s_i^4 / (1 + s_i^2 * (a_i + omega)))
+//     solve(private$Sigma + diag_mat_i)
+//  }
+//
+//  YmA <- Y - private$A
+//    Dn <- matrix(0, self$d*self$p, self$d*self$p)
+//    Cn <- matrix(0, self$d*self$p, self$d*self$p)
+//    for (i in 1:self$n) {
+//    xxt_i <- tcrossprod(X[i, ])
+//    Cn <- Cn - kronecker(getMat_iCnB(i) , xxt_i) / self$n
+//    Dn <- Dn + kronecker(tcrossprod(YmA[i,]), xxt_i) / self$n
+//  }
+//   Cn_inv <- solve(Cn)
+//     dim_names <- dimnames(attr(private$B, "vcov_variational"))
+//     vcov_sand <- ((Cn_inv %*% Dn %*% Cn_inv) / self$n) %>% `dimnames<-`(dim_names)
+//

From e7f78d4a5042b851d6f8833bec4c42cdd7ee8e55 Mon Sep 17 00:00:00 2001
From: Julien Chiquet <julien.chiquet@inrae.fr>
Date: Thu, 21 Nov 2024 17:26:04 +0100
Subject: [PATCH 4/7] some advances in cpp version of sandwich

---
 R/RcppExports.R     |  4 ++++
 src/RcppExports.cpp | 17 +++++++++++++++++
 src/utils-R.cpp     | 24 +++++++++++++++++++-----
 3 files changed, 40 insertions(+), 5 deletions(-)

diff --git a/R/RcppExports.R b/R/RcppExports.R
index d1053c03..6213a68b 100644
--- a/R/RcppExports.R
+++ b/R/RcppExports.R
@@ -89,3 +89,7 @@ cpp_test_packing <- function() {
     .Call('_PLNmodels_cpp_test_packing', PACKAGE = 'PLNmodels')
 }
 
+get_sandwich_variance_B <- function(Y, X, A, S, Sigma, Diag_Omega) {
+    .Call('_PLNmodels_get_sandwich_variance_B', PACKAGE = 'PLNmodels', Y, X, A, S, Sigma, Diag_Omega)
+}
+
diff --git a/src/RcppExports.cpp b/src/RcppExports.cpp
index 01f8105d..07502dfa 100644
--- a/src/RcppExports.cpp
+++ b/src/RcppExports.cpp
@@ -330,6 +330,22 @@ BEGIN_RCPP
     return rcpp_result_gen;
 END_RCPP
 }
+// get_sandwich_variance_B
+arma::mat get_sandwich_variance_B(const arma::mat& Y, const arma::mat& X, const arma::mat& A, const arma::mat& S, const arma::mat& Sigma, const arma::vec& Diag_Omega);
+RcppExport SEXP _PLNmodels_get_sandwich_variance_B(SEXP YSEXP, SEXP XSEXP, SEXP ASEXP, SEXP SSEXP, SEXP SigmaSEXP, SEXP Diag_OmegaSEXP) {
+BEGIN_RCPP
+    Rcpp::RObject rcpp_result_gen;
+    Rcpp::RNGScope rcpp_rngScope_gen;
+    Rcpp::traits::input_parameter< const arma::mat& >::type Y(YSEXP);
+    Rcpp::traits::input_parameter< const arma::mat& >::type X(XSEXP);
+    Rcpp::traits::input_parameter< const arma::mat& >::type A(ASEXP);
+    Rcpp::traits::input_parameter< const arma::mat& >::type S(SSEXP);
+    Rcpp::traits::input_parameter< const arma::mat& >::type Sigma(SigmaSEXP);
+    Rcpp::traits::input_parameter< const arma::vec& >::type Diag_Omega(Diag_OmegaSEXP);
+    rcpp_result_gen = Rcpp::wrap(get_sandwich_variance_B(Y, X, A, S, Sigma, Diag_Omega));
+    return rcpp_result_gen;
+END_RCPP
+}
 
 static const R_CallMethodDef CallEntries[] = {
     {"_PLNmodels_cpp_test_nlopt", (DL_FUNC) &_PLNmodels_cpp_test_nlopt, 0},
@@ -354,6 +370,7 @@ static const R_CallMethodDef CallEntries[] = {
     {"_PLNmodels_optim_zipln_M", (DL_FUNC) &_PLNmodels_optim_zipln_M, 9},
     {"_PLNmodels_optim_zipln_S", (DL_FUNC) &_PLNmodels_optim_zipln_S, 7},
     {"_PLNmodels_cpp_test_packing", (DL_FUNC) &_PLNmodels_cpp_test_packing, 0},
+    {"_PLNmodels_get_sandwich_variance_B", (DL_FUNC) &_PLNmodels_get_sandwich_variance_B, 6},
     {NULL, NULL, 0}
 };
 
diff --git a/src/utils-R.cpp b/src/utils-R.cpp
index 470772b9..9af462d8 100644
--- a/src/utils-R.cpp
+++ b/src/utils-R.cpp
@@ -14,17 +14,31 @@ arma::mat get_sandwich_variance_B(
   const arma::vec & Diag_Omega
 ) {
 
+  arma::uword n = Y.n_rows ;
+  arma::uword p = Y.n_cols ;
+  arma::uword d = X.n_cols ;
 
-  arma::mat get_iCnB = [&A, &S, &D_omega, &Sigma](
-      ) {
+  auto get_iCnB = [&A, &S, &Diag_Omega, &Sigma](arma::uword i) {
+    arma::vec a = A.row(i) ;
+    arma::vec s = S.row(i) ;
+    arma::mat D = diagmat(pow(a, -1) + pow(s, 4) / (1 + pow(s,2) * (a + Diag_Omega))) ;
 
+    return arma::inv_sympd(Sigma + D);
+  };
 
-    return ;
+  arma::mat YmA = Y - A ;
+  arma::mat Cn = arma::zeros(d*p, d*p) ;
+  arma::mat Dn = arma::zeros(d*p, d*p) ;
+  for (int i=0; i<n; i++) {
+    arma::mat xxt_i = X.col(i) * X.col(i).t() ;
+    arma::mat yyt_i = YmA.col(i) * YmA.col(i).t() ;
+    Cn = Cn - arma::kron(get_iCnB(i), xxt_i) / n ;
+    Dn = Dn + arma::kron(yyt_i, xxt_i) / n ;
   }
 
+  arma::mat Cn_inv = arma::inv_sympd(Cn) ;
 
-
-  return ;
+  return (Cn_inv * Dn * Cn_inv) / n ;
 }
 
 // vcov_sandwich_B = function(Y, X) {

From 5d82dff7c7b1b4fbb3a04d0c66f445487d8f606a Mon Sep 17 00:00:00 2001
From: Julien Chiquet <julien.chiquet@inrae.fr>
Date: Fri, 22 Nov 2024 12:23:43 +0100
Subject: [PATCH 5/7] C++ working version of sandwich

---
 R/PLNfit-class.R | 21 +++---------------
 src/utils-R.cpp  | 55 +++++++++++++-----------------------------------
 2 files changed, 18 insertions(+), 58 deletions(-)

diff --git a/R/PLNfit-class.R b/R/PLNfit-class.R
index 218ff1e7..f7cd47aa 100644
--- a/R/PLNfit-class.R
+++ b/R/PLNfit-class.R
@@ -239,24 +239,9 @@ PLNfit <- R6Class(
     },
 
     vcov_sandwich_B = function(Y, X) {
-      getMat_iCnB <- function(i) {
-        a_i <- as.numeric(private$A[i, ])
-        s_i <- as.numeric(private$S[i, ])
-        omega <- as.numeric(diag(private$Omega))
-        diag_mat_i <- diag(1/a_i + s_i^4 / (1 + s_i^2 * (a_i + omega)))
-        solve(private$Sigma + diag_mat_i)
-      }
-      YmA <- Y - private$A
-      Dn <- matrix(0, self$d*self$p, self$d*self$p)
-      Cn <- matrix(0, self$d*self$p, self$d*self$p)
-      for (i in 1:self$n) {
-        xxt_i <- tcrossprod(X[i, ])
-        Cn <- Cn - kronecker(getMat_iCnB(i) , xxt_i) / self$n
-        Dn <- Dn + kronecker(tcrossprod(YmA[i,]), xxt_i) / self$n
-      }
-      Cn_inv <- solve(Cn)
-      dim_names <- dimnames(attr(private$B, "vcov_variational"))
-      vcov_sand <- ((Cn_inv %*% Dn %*% Cn_inv) / self$n) %>% `dimnames<-`(dim_names)
+      vcov_sand <- get_sandwich_variance_B(Y, X, private$A,
+                                           private$S, private$Sigma, diag(private$Omega)
+      )
       attr(private$B, "vcov_sandwich") <- vcov_sand
       attr(private$B, "variance_sandwich") <- matrix(diag(vcov_sand), nrow = self$d, ncol = self$p,
                                                      dimnames = dimnames(private$B))
diff --git a/src/utils-R.cpp b/src/utils-R.cpp
index 9af462d8..8af160da 100644
--- a/src/utils-R.cpp
+++ b/src/utils-R.cpp
@@ -4,6 +4,8 @@
 
 #include "utils.h"
 
+using namespace arma ;
+
 // [[Rcpp::export]]
 arma::mat get_sandwich_variance_B(
   const arma::mat & Y,
@@ -14,51 +16,24 @@ arma::mat get_sandwich_variance_B(
   const arma::vec & Diag_Omega
 ) {
 
-  arma::uword n = Y.n_rows ;
-  arma::uword p = Y.n_cols ;
-  arma::uword d = X.n_cols ;
+  const uword n = Y.n_rows ;
+  const uword p = Y.n_cols ;
+  const uword d = X.n_cols ;
 
-  auto get_iCnB = [&A, &S, &Diag_Omega, &Sigma](arma::uword i) {
-    arma::vec a = A.row(i) ;
-    arma::vec s = S.row(i) ;
-    arma::mat D = diagmat(pow(a, -1) + pow(s, 4) / (1 + pow(s,2) * (a + Diag_Omega))) ;
+  mat Cn(d*p, d*p, fill::zeros) ;
+  mat Dn(d*p, d*p, fill::zeros) ;
 
-    return arma::inv_sympd(Sigma + D);
-  };
+  mat D = pow(A, -1) + pow(S, 4) / (1 + square(S) % (A + ones(n) * Diag_Omega.t())) ;
+  mat YmA = Y - A ;
 
-  arma::mat YmA = Y - A ;
-  arma::mat Cn = arma::zeros(d*p, d*p) ;
-  arma::mat Dn = arma::zeros(d*p, d*p) ;
-  for (int i=0; i<n; i++) {
-    arma::mat xxt_i = X.col(i) * X.col(i).t() ;
-    arma::mat yyt_i = YmA.col(i) * YmA.col(i).t() ;
-    Cn = Cn - arma::kron(get_iCnB(i), xxt_i) / n ;
-    Dn = Dn + arma::kron(yyt_i, xxt_i) / n ;
+  for (uword i=0; i<n; i++) {
+    mat xxt_i = X.row(i).t() * X.row(i) ;
+    mat yyt_i = YmA.row(i).t() * YmA.row(i) ;
+    Cn -= kron(inv_sympd(Sigma + diagmat(D.row(i))), xxt_i) / n ;
+    Dn += kron(yyt_i, xxt_i) / n ;
   }
 
-  arma::mat Cn_inv = arma::inv_sympd(Cn) ;
+  mat Cn_inv = inv(Cn) ;
 
   return (Cn_inv * Dn * Cn_inv) / n ;
 }
-
-// vcov_sandwich_B = function(Y, X) {
-//  getMat_iCnB <- function(i) {
-//     a_i <- as.numeric(private$A[i, ])
-//     s_i <- as.numeric(private$S[i, ])
-//     omega <- as.numeric(diag(private$Omega))
-//     diag_mat_i <- diag(1/a_i + s_i^4 / (1 + s_i^2 * (a_i + omega)))
-//     solve(private$Sigma + diag_mat_i)
-//  }
-//
-//  YmA <- Y - private$A
-//    Dn <- matrix(0, self$d*self$p, self$d*self$p)
-//    Cn <- matrix(0, self$d*self$p, self$d*self$p)
-//    for (i in 1:self$n) {
-//    xxt_i <- tcrossprod(X[i, ])
-//    Cn <- Cn - kronecker(getMat_iCnB(i) , xxt_i) / self$n
-//    Dn <- Dn + kronecker(tcrossprod(YmA[i,]), xxt_i) / self$n
-//  }
-//   Cn_inv <- solve(Cn)
-//     dim_names <- dimnames(attr(private$B, "vcov_variational"))
-//     vcov_sand <- ((Cn_inv %*% Dn %*% Cn_inv) / self$n) %>% `dimnames<-`(dim_names)
-//

From 72e2c13fefc8bbd11301aa492e2956d6538bd850 Mon Sep 17 00:00:00 2001
From: Julien Chiquet <julien.chiquet@inrae.fr>
Date: Fri, 22 Nov 2024 14:17:25 +0100
Subject: [PATCH 6/7] removing old release for Mac OS in R check

---
 .github/workflows/R-CMD-check.yaml | 1 -
 1 file changed, 1 deletion(-)

diff --git a/.github/workflows/R-CMD-check.yaml b/.github/workflows/R-CMD-check.yaml
index ade15537..7f390862 100644
--- a/.github/workflows/R-CMD-check.yaml
+++ b/.github/workflows/R-CMD-check.yaml
@@ -19,7 +19,6 @@ jobs:
       matrix:
         config:
           - {os: macOS-latest,   r: 'release'}
-          - {os: macOS-latest,   r: 'oldrel-1'}
           - {os: windows-latest, r: 'release'}
           - {os: windows-latest, r: 'oldrel-1'}
           - {os: ubuntu-latest,  r: 'release'}

From 18c1fdd6fd0869507fcc6f06de2583637f4c7136 Mon Sep 17 00:00:00 2001
From: Julien Chiquet <julien.chiquet@inrae.fr>
Date: Fri, 22 Nov 2024 16:12:01 +0100
Subject: [PATCH 7/7] toward more comprehensive tests for sandwich estimator of
 the variance

---
 inst/check/variance_estimates.R | 51 +++++++++++++++++++++++++--------
 1 file changed, 39 insertions(+), 12 deletions(-)

diff --git a/inst/check/variance_estimates.R b/inst/check/variance_estimates.R
index ff8624a5..331d1792 100644
--- a/inst/check/variance_estimates.R
+++ b/inst/check/variance_estimates.R
@@ -2,28 +2,55 @@ library(tidyverse)
 library(PLNmodels)
 set.seed(1234)
 
-params <- PLNmodels:::create_parameters(n = 50, p = 10, d = 1, depths = 1e3)
+rmse <- function(theta_hat, theta_star) {
+  sqrt(mean((theta_hat - theta_star)^2))  # root mean squared error over all entries
+}
+
+params <- PLNmodels:::create_parameters(n = 100, p = 10, d = 1, depths = 1e3)
 X <- params$X
 B <- params$B
-Y <- rPLN(n = nrow(X), mu = X %*% B, Sigma = params$Sigma, depths = params$depths)
+conf <- list(variational_var = TRUE, jackknife = TRUE, bootstrap = FALSE, sandwich_var = TRUE)
 
-data <- prepare_data(Y, X, offset = "none")
-logO <- attr(Y, "offsets")
 
-conf <- list(variational_var = TRUE, jackknife = TRUE, bootstrap = nrow(Y), sandwich_var = TRUE)
-model <- PLN(Abundance ~ 0 + . + offset(logO), data = data, control = PLN_param(config_post = conf))
+one_simu <- function(s) {
+  # Simulate one data set, fit PLN, return RMSE and per-estimator coverage (s = replicate id)
+  Y <- rPLN(n = nrow(X), mu = X %*% B, Sigma = params$Sigma, depths = params$depths)
+  data <- prepare_data(Y, X, offset = "none")
+  logO <- attr(Y, "offsets")
+  model <- PLN(Abundance ~ 0 + . + offset(logO), data = data, control = PLN_param(trace = FALSE, config_post = conf))
+  # Jackknife: diagonal covariance rebuilt from its own standard errors (was a copy of the sandwich)
+  B_hat <- coef(model)
+  vcov_sandwich    <- attr(coef(model), "vcov_sandwich")
+  vcov_jackknife   <- diag(c(standard_error(model, "jackknife"))^2, nrow = length(B))
+  vcov_variational <- attr(coef(model), "vcov_variational")
+  # Whiten B_hat - B with the inverse Cholesky factor; coverage = share of entries within +/- 1.96
+  data.frame(rmse = rmse(B_hat, B),
+       cover_sandwich    = mean(abs(as.numeric(B_hat - B) %*% solve(chol(vcov_sandwich))) < 1.96),
+       cover_jackknife   = mean(abs(as.numeric(B_hat - B) %*% solve(chol(vcov_jackknife))) < 1.96),
+       cover_variational = mean(abs(as.numeric(B_hat - B) %*% solve(chol(vcov_variational))) < 1.96),
+       simu = s)
+}
+
+res <- do.call(rbind, lapply(1:50, one_simu))
+
+boxplot(res$cover_sandwich, res$cover_jackknife, res$cover_variational)
+
+### Single test: simulate and fit first, so that `model` and `B_hat` exist for the code below
+Y <- rPLN(n = nrow(X), mu = X %*% B, Sigma = params$Sigma, depths = params$depths)
+data <- prepare_data(Y, X, offset = "none")
+logO <- attr(Y, "offsets")
+model <- PLN(Abundance ~ 0 + . + offset(logO), data = data, control = PLN_param(config_post = conf))
 
-B_hat <- coef(model)
+B_hat <- coef(model)
 B_se_var <- standard_error(model, "variational")
 B_se_jk  <- standard_error(model, "jackknife")
-B_se_bt  <- standard_error(model, "bootstrap")
 B_se_sw  <- standard_error(model, "sandwich")
 
 data.frame(
-  B = rep(c(B), 4),
-  B_hat = rep(c(B_hat), 4),
-  se = c(B_se_var, B_se_jk, B_se_bt, B_se_sw),
-  method = rep(c("variational", "jackknife", "bootstrap", "sandwich"), each = length(c(B))) ) %>%
+  B = rep(c(B), 3),
+  B_hat = rep(c(B_hat), 3),
+  se = c(B_se_var, B_se_jk, B_se_sw),
+  method = rep(c("variational", "jackknife", "sandwich"), each = length(c(B))) ) %>%
   ggplot(aes(x = B, y = B_hat)) +
   geom_errorbar(aes(ymin = B_hat - 2 * se,
                     ymax = B_hat + 2 * se), color = "blue") + facet_wrap(~ method) +