From 48bda128f3956131a7cc0dba698a93454f852af0 Mon Sep 17 00:00:00 2001
From: Daniel Sabanes Bove <daniel.sabanesbove@gmx.net>
Date: Mon, 20 Jan 2025 20:17:20 +0800
Subject: [PATCH 1/5] add design doc to align on approach

---
 misc/design_mcmc_improve.qmd | 205 +++++++++++++++++++++++++++++++++++
 1 file changed, 205 insertions(+)
 create mode 100644 misc/design_mcmc_improve.qmd

diff --git a/misc/design_mcmc_improve.qmd b/misc/design_mcmc_improve.qmd
new file mode 100644
index 00000000..a1719006
--- /dev/null
+++ b/misc/design_mcmc_improve.qmd
@@ -0,0 +1,205 @@
+# Design doc for improving MCMC sampling
+
+This design doc proposes several updates to the `rbmi` package to improve the options for MCMC sampling. The main goal is to provide more flexibility to the user in terms of the sampling behavior, while still keeping the package easy to use.
+
+## Wish list
+
+1. Stan sampling argument as input parameters (`rstan::sampling` control should be controllable)
+1. Keep current option (single chain; MMRM output as initial value as default)
+1. Add option to have multiple chains with random initial values
+1. Always have default prior and don't make prior the input parameter
+
+## Sampling controls
+
+Currently the `rstan` sampling is controlled by a hard coded list in [`fit_mcmc`](https://github.com/insightsengineering/rbmi/blob/main/R/mcmc.R#L94). 
+
+The `sampling()` function is described [here](https://mc-stan.org/rstan/reference/stanmodel-method-sampling.html). In particular, the `control` argument allows to further specify the sampling behavior, which is documented [here](https://mc-stan.org/rstan/reference/stan.html).
+
+Idea:
+
+- Provide a `control_bayes()` function that returns a list of control parameters for `rstan::stan()`
+  - This function should have a default behavior that is the same as the current behavior
+  - The user can override the default behavior by providing a list of control parameters
+  - Takes additional arguments which are then included in the returned list
+  - In order to simplify the user interface, the previous `method` parts `burn_in`, `burn_between`, `n_samples` are moved to the `control_bayes()` function, and will properly be deprecated from `method_bayes()`.
+- The `fit_mcmc` function should take the `control_bayes()` output as an additional argument and passes it internally to `rstan::sampling()`  
+
+## Multiple chains
+
+Currently just a single chain is used. 
+
+Idea: 
+
+- As part of the `control_bayes()` function, we could add an argument to specify the number of chains. 
+- If the number of chains is greater than 1, then the `init` argument of `rstan::sampling()` should be set to `random` (see [here](https://mc-stan.org/rstan/reference/stanmodel-method-sampling.html)).
+- We can make some experiments to ensure that chains converge to the stationary distribution within reasonable time frame if started from random values. If the Stan random initial values are not good enough, we could later have the option to use initial values sampled from the MLE distribution as the initial values for the chains.
+
+We note that due to the definition of the prior distribution for the covariance matrix, we still need to fit the frequentist MMRM model in any case to get the required prior parameter.
+
+Question: What do we need to adapt downstream when using multiple chains?
+
+## Default prior
+
+We would want to keep using a default prior, as it is currently implemented for the unstructured covariance structure already.
+
+That implies that we will need to come up with such default priors for the other covariance structures. This will be handled in the separate design doc.
+
+## Prototype
+
+This is how it could look like:
+
+```r
+control_bayes <- function( 
+    burn_in = 200,
+    burn_between = 50,
+    n_samples = 20,
+    chains = 1,
+    init = ife(chains > 1, "random", "mmrm"),
+    quiet = FALSE,
+    refresh = ife(
+      quiet,
+      0,
+      iter / 10
+    ),
+    seed = sample.int(.Machine$integer.max, 1),
+    ...
+) {
+    list(
+        warmup = burn_in,
+        thin = burn_between,
+        iter = burn_in + burn_between * n_samples,
+        chains = chains,
+        warmup = warmup,
+        thin = thin,
+        iter = iter,
+        quiet = quiet,
+        refresh = refresh,
+        init = init,
+        seed = seed,
+        additional = list(...)
+    )  
+}
+```
+
+This function's output `control` can then be used in `fit_mcmc()` like this (copied and adapted function code):
+
+```r
+fit_mcmc <- function(
+    designmat,
+    outcome,
+    group,
+    subjid,
+    visit,
+    method,
+    control) {
+
+    # Fit MMRM (needed for Sigma prior parameter and possibly initial values).
+    mmrm_initial <- fit_mmrm(
+        designmat = designmat,
+        outcome = outcome,
+        subjid = subjid,
+        visit = visit,
+        group = group,
+        cov_struct = "us",
+        REML = TRUE,
+        same_cov = method$same_cov
+    )
+
+    if (mmrm_initial$failed) {
+        stop("Fitting MMRM to original dataset failed")
+    }
+
+    stan_data <- prepare_stan_data(
+        ddat = designmat,
+        subjid = subjid,
+        visit = visit,
+        outcome = outcome,
+        group = ife(method$same_cov == TRUE, rep(1, length(group)), group)
+    )
+
+    stan_data$Sigma_init <- ife(
+        same_cov == TRUE,
+        list(mmrm_initial$sigma[[1]]),
+        mmrm_initial$sigma
+    )
+
+    sampling_args <- c(
+      list(
+        object = get_stan_model(),
+        data = stan_data,
+        pars = c("beta", "Sigma"),
+        chains = control$chains,
+        warmup = control$warmup,
+        thin = control$thin,
+        iter = control$iter,
+        init = ife(
+          control$init == "mmrm", 
+          list(list(
+            theta = as.vector(stan_data$R %*% mmrm_initial$beta),
+            sigma = mmrm_initial$sigma
+          )),
+          control$init
+        ),
+        refresh = control$refresh,
+        seed = control$seed
+      ),
+      control$additional
+    )
+
+    stan_fit <- record({
+        do.call(rstan::sampling, sampling_args)
+    })
+
+    if (!is.null(stan_fit$errors)) {
+        stop(stan_fit$errors)
+    }
+
+    ignorable_warnings <- c(
+        "Bulk Effective Samples Size (ESS) is too low, indicating posterior means and medians may be unreliable.\nRunning the chains for more iterations may help. See\nhttps://mc-stan.org/misc/warnings.html#bulk-ess",
+        "Tail Effective Samples Size (ESS) is too low, indicating posterior variances and tail quantiles may be unreliable.\nRunning the chains for more iterations may help. See\nhttps://mc-stan.org/misc/warnings.html#tail-ess"
+    )
+
+    # handle warning: display only warnings if
+    # 1) the warning is not in ignorable_warnings
+    warnings <- stan_fit$warnings
+    warnings_not_allowed <- warnings[!warnings %in% ignorable_warnings]
+    for (i in warnings_not_allowed) warning(warnings_not_allowed)
+
+    fit <- stan_fit$results
+    check_mcmc(fit, n_imputations)
+
+    draws <- extract_draws(fit)
+
+    ret_obj <- list(
+        "samples" = draws,
+        "fit" = fit
+    )
+
+    return(ret_obj)
+}
+```
+
+Finally, the user can call the `draws()` method now including the new `control` argument. This then also comprises the `quiet` argument. The method signature changes to:
+
+```{r}
+draws.bayes <- function(data, 
+                        data_ice = NULL, 
+                        vars, 
+                        method, 
+                        ncores = 1,  
+                        control = control_bayes()) 
+```
+
+and internally the `control` argument is just forwarded to `fit_mcmc()`.
+
+Note that it is important for easy usability that we just rely on all default arguments in the `control_bayes()` function. The user can then just override the defaults they need to override by
+specifying the corresponding arguments. In addition, we can still pass the Stan `control` argument inside `control_bayes()`, and it is not a problem that this argument has the same name as the `draws()` argument.
+
+So a call could e.g. just be:
+
+```r
+draws(
+    data = data, vars = c("beta", "Sigma"), method = method, chains = 4, 
+    control = control_bayes(seed = 123, control = list(adapt_delta = 0.99))
+)
+```
\ No newline at end of file

From 3d65bc595db0e9bab9558562f1aaa75a9a5c885d Mon Sep 17 00:00:00 2001
From: Daniel Sabanes Bove <daniel.sabanesbove@gmx.net>
Date: Thu, 23 Jan 2025 18:43:24 +0800
Subject: [PATCH 2/5] address comments

---
 misc/design_mcmc_improve.qmd | 29 +++++++++++++++++++++--------
 1 file changed, 21 insertions(+), 8 deletions(-)

diff --git a/misc/design_mcmc_improve.qmd b/misc/design_mcmc_improve.qmd
index a1719006..c68617e2 100644
--- a/misc/design_mcmc_improve.qmd
+++ b/misc/design_mcmc_improve.qmd
@@ -7,7 +7,7 @@ This design doc proposes several updates to the `rbmi` package to improve the op
 1. Stan sampling argument as input parameters (`rstan::sampling` control should be controllable)
 1. Keep current option (single chain; MMRM output as initial value as default)
 1. Add option to have multiple chains with random initial values
-1. Always have default prior and don't make prior the input parameter
+1. Always have default prior and don't make prior the input parameter.
 
 ## Sampling controls
 
@@ -22,8 +22,15 @@ Idea:
   - The user can override the default behavior by providing a list of control parameters
   - Takes additional arguments which are then included in the returned list
   - In order to simplify the user interface, the previous `method` parts `burn_in`, `burn_between`, `n_samples` are moved to the `control_bayes()` function, and will properly be deprecated from `method_bayes()`.
+  - Arguments of the new control function will be briefly documented (not just copied from the `rstan` documentation, but rather explained in the context of the `rbmi` package). The user will be referred to the `rstan` documentation for more details for additionally passed arguments.
 - The `fit_mcmc` function should take the `control_bayes()` output as an additional argument and passes it internally to `rstan::sampling()`  
 
+License considerations:
+
+- The `rstan` package is licensed under GPL-3.0, while `rbmi` is licensed under the MIT license.
+- Only using the `rstan::sampling()` function and specifying reasonable default values for some of its control arguments should not require to change the license of the `rbmi` package. This is because this does not constitute a derivative work. Instead, the `rbmi` package would continue to be "linking" to the GPL package.
+- Importantly, the `rbmi` package only has the `rstan` package in the `Suggests` field of the `DESCRIPTION` file, not in the `Imports` field. This means that the `rstan` package is not required to be installed to use the `rbmi` package. 
+
 ## Multiple chains
 
 Currently just a single chain is used. 
@@ -36,13 +43,14 @@ Idea:
 
 We note that due to the definition of the prior distribution for the covariance matrix, we still need to fit the frequentist MMRM model in any case to get the required prior parameter.
 
-Question: What do we need to adapt downstream when using multiple chains?
+Question: What do we need to adapt downstream when using multiple chains? 
+Answer: We will be able to test this in detail and address it, once we have implemented the possibility to use multiple chains in the development version. To avoid possible confusion, we can add a warning in the development version, which informs the user that multiple chains are not yet fully supported, while we are still working on it.
 
 ## Default prior
 
-We would want to keep using a default prior, as it is currently implemented for the unstructured covariance structure already.
+We would want to keep using a default prior, as it is currently implemented for the unstructured covariance structure already. The user should never have to specify the priors actively, because there should always be a reasonable default prior implemented by `rbmi`.
 
-That implies that we will need to come up with such default priors for the other covariance structures. This will be handled in the separate design doc.
+That implies that we will need to come up with such default priors for the other covariance structures. This will be handled in a separate, forthcoming design doc.
 
 ## Prototype
 
@@ -69,10 +77,6 @@ control_bayes <- function(
         thin = burn_between,
         iter = burn_in + burn_between * n_samples,
         chains = chains,
-        warmup = warmup,
-        thin = thin,
-        iter = iter,
-        quiet = quiet,
         refresh = refresh,
         init = init,
         seed = seed,
@@ -81,6 +85,15 @@ control_bayes <- function(
 }
 ```
 
+The rationale for using this control function approach is:
+
+- We provide sensible defaults to the user, however they can now override them if they want to.
+- The user can now also pass additional arguments to the `rstan::sampling()` function, but they are not required to do so.
+- If the `rstan` API changes, we can adapt the `control_bayes()` function accordingly, and the user does not have to change their code. We would be notified by CRAN reverse dependencies checks if the `rstan` API changes because we will include tests for the actual use of the `rstan` package in the `rbmi` package.
+- We have checked the stability of the `rstan` API over the past, by having a look at the GitHub repository ([link](https://github.com/stan-dev/rstan/blob/develop/rstan/rstan/R/stanmodel-class.R#L507)). It seems stable over the last 6 years:
+  - Via the [blame view](https://github.com/stan-dev/rstan/blame/develop/rstan/rstan/R/stanmodel-class.R#L507) we can see that the signature of the `sampling` method has not changed during the last 6 years. The signature explicitly includes all of our arguments, except for the `refresh` argument.
+  - The `refresh` argument is passed via `...`. We can see that the arguments provided via `...` are checked by `is_arg_deprecated()`, which only lists an argument `enable_random_init` as deprecated, and this has not changed in the last 9 years. Further we can see that in the `stan()` function's [blame view](https://github.com/stan-dev/rstan/blame/develop/rstan/rstan/R/rstan.R#L280) the `refresh` argument has been recognized for 11 years.
+
 This function's output `control` can then be used in `fit_mcmc()` like this (copied and adapted function code):
 
 ```r

From 16fa0e19aad350e5ae9e8184ca39ff2471c7c811 Mon Sep 17 00:00:00 2001
From: Daniel Sabanes Bove <daniel.sabanesbove@gmx.net>
Date: Mon, 27 Jan 2025 21:33:47 +0800
Subject: [PATCH 3/5] address review comments

---
 misc/design_mcmc_improve.qmd | 109 +++++++++++++++++++++++++----------
 1 file changed, 79 insertions(+), 30 deletions(-)

diff --git a/misc/design_mcmc_improve.qmd b/misc/design_mcmc_improve.qmd
index c68617e2..f6dae6f4 100644
--- a/misc/design_mcmc_improve.qmd
+++ b/misc/design_mcmc_improve.qmd
@@ -4,14 +4,14 @@ This design doc proposes several updates to the `rbmi` package to improve the op
 
 ## Wish list
 
-1. Stan sampling argument as input parameters (`rstan::sampling` control should be controllable)
+1. Allow more detailed Stan sampling arguments as input parameters (`rstan::sampling` control should be controllable)
 1. Keep current option (single chain; MMRM output as initial value as default)
 1. Add option to have multiple chains with random initial values
 1. Always have default prior and don't make prior the input parameter.
 
 ## Sampling controls
 
-Currently the `rstan` sampling is controlled by a hard coded list in [`fit_mcmc`](https://github.com/insightsengineering/rbmi/blob/main/R/mcmc.R#L94). 
+Currently the `rstan` sampling details are controlled by a hard coded list in [`fit_mcmc`](https://github.com/insightsengineering/rbmi/blob/main/R/mcmc.R#L94). A few of the parameters are exposed in `method_bayes()` to the user.
 
 The `sampling()` function is described [here](https://mc-stan.org/rstan/reference/stanmodel-method-sampling.html). In particular, the `control` argument allows to further specify the sampling behavior, which is documented [here](https://mc-stan.org/rstan/reference/stan.html).
 
@@ -21,9 +21,11 @@ Idea:
   - This function should have a default behavior that is the same as the current behavior
   - The user can override the default behavior by providing a list of control parameters
   - Takes additional arguments which are then included in the returned list
-  - In order to simplify the user interface, the previous `method` parts `burn_in`, `burn_between`, `n_samples` are moved to the `control_bayes()` function, and will properly be deprecated from `method_bayes()`.
+  - In order to simplify the user interface, the previous `method` parts `burn_in` and `burn_between`, are moved to the `control_bayes()` function, and will properly be deprecated from `method_bayes()`.
+  - In order to keep the pattern with the other `method_*()` functions, the `n_samples` argument remains in the `method_bayes()` function. The `method_bayes()` function gains an additional argument `control` where the `control_bayes()` function result is passed.
   - Arguments of the new control function will be briefly documented (not just copied from the `rstan` documentation, but rather explained in the context of the `rbmi` package). The user will be referred to the `rstan` documentation for more details for additionally passed arguments.
-- The `fit_mcmc` function should take the `control_bayes()` output as an additional argument and passes it internally to `rstan::sampling()`  
+- The `draws()` method keeps its current signature, but internally sets the `iter` and `refresh` arguments in the `method$control` list, based on the `method$n_samples` and the `quiet` arguments.
+- The `fit_mcmc` function processes the additional `control` output instead of the currently hard coded settings, and passes it internally to `rstan::sampling()`  
 
 License considerations:
 
@@ -43,8 +45,8 @@ Idea:
 
 We note that due to the definition of the prior distribution for the covariance matrix, we still need to fit the frequentist MMRM model in any case to get the required prior parameter.
 
-Question: What do we need to adapt downstream when using multiple chains? 
-Answer: We will be able to test this in detail and address it, once we have implemented the possibility to use multiple chains in the development version. To avoid possible confusion, we can add a warning in the development version, which informs the user that multiple chains are not yet fully supported, while we are still working on it.
+- *Question*: What do we need to adapt downstream when using multiple chains? 
+- *Answer*: We will be able to test this in detail and address it, once we have implemented the possibility to use multiple chains in the development version. To avoid possible confusion, we can add a warning in the development version, which informs the user that multiple chains are not yet fully supported, while we are still working on it.
 
 ## Default prior
 
@@ -54,28 +56,31 @@ That implies that we will need to come up with such default priors for the other
 
 ## Prototype
 
-This is how it could look like:
+### Control function
+
+This is how the control function could look like:
 
 ```r
 control_bayes <- function( 
     burn_in = 200,
     burn_between = 50,
-    n_samples = 20,
     chains = 1,
     init = ife(chains > 1, "random", "mmrm"),
-    quiet = FALSE,
-    refresh = ife(
-      quiet,
-      0,
-      iter / 10
-    ),
     seed = sample.int(.Machine$integer.max, 1),
+    n_samples = NULL,
+    iter = NULL,
+    refresh = NULL,
     ...
 ) {
+    if (!is.null(n_samples) || !is.null(iter)) {
+        stop("Please provide the number of samples directly via the `n_samples` argument of `method_bayes()`")
+    }
+    is (!is.null(refresh)) {
+        stop("Instead of the `refresh` argument here, please provide the `quiet` argument directly to `draws()`")
+    }
     list(
         warmup = burn_in,
         thin = burn_between,
-        iter = burn_in + burn_between * n_samples,
         chains = chains,
         refresh = refresh,
         init = init,
@@ -91,10 +96,38 @@ The rationale for using this control function approach is:
 - The user can now also pass additional arguments to the `rstan::sampling()` function, but they are not required to do so.
 - If the `rstan` API changes, we can adapt the `control_bayes()` function accordingly, and the user does not have to change their code. We would be notified by CRAN reverse dependencies checks if the `rstan` API changes because we will include tests for the actual use of the `rstan` package in the `rbmi` package.
 - We have checked the stability of the `rstan` API over the past, by having a look at the GitHub repository ([link](https://github.com/stan-dev/rstan/blob/develop/rstan/rstan/R/stanmodel-class.R#L507)). It seems stable over the last 6 years:
-  - Via the [blame view](https://github.com/stan-dev/rstan/blame/develop/rstan/rstan/R/stanmodel-class.R#L507) we can see that the signature of the `sampling` method has not changed during the last 6 years. The signature explicitly includes all of our arguments, except for the `refresh` argument.
-  - The `refresh` argument is passed via `...`. We can see that the arguments provided via `...` are checked by `is_arg_deprecated()`, which only lists an argument `enable_random_init` as deprecated, and this has not changed in the last 9 years. Further we can see that in the `stan()` function's [blame view](https://github.com/stan-dev/rstan/blame/develop/rstan/rstan/R/rstan.R#L280) the `refresh` argument has been recognized for 11 years.
+  - Via the [blame view](https://github.com/stan-dev/rstan/blame/develop/rstan/rstan/R/stanmodel-class.R#L507) we can see that the signature of the `sampling` method has not changed during the last 6 years. The signature explicitly includes all of our arguments.
+  - The `refresh` argument is not directly accessible, because we want to keep the `quiet` interface of the `draws()` method. Internally, it will still be used (as now as well). The `refresh` argument is passed via `...`. We can see that the arguments provided via `...` are checked by `is_arg_deprecated()`, which only lists an argument `enable_random_init` as deprecated, and this has not changed in the last 9 years. Further we can see that in the `stan()` function's [blame view](https://github.com/stan-dev/rstan/blame/develop/rstan/rstan/R/rstan.R#L280) the `refresh` argument has been recognized for 11 years.
+
+### Method function
+
+This is how the method function could look like:
+
+```r
+method_bayes <- function(
+    same_cov = TRUE,
+    n_samples = 500,
+    control = control_bayes(),
+    burn_in = NULL,
+    burn_between = NULL
+) {
+   assertthat::assert_that(
+      is.null(burn_in), msg = paste("The `burn_in` argument to `method_bayes()` has been deprecated;",
+        "please specify this inside `control = control_bayes()` instead.", collapse = " "))
+   assertthat::assert_that(
+      is.null(burn_between), msg = paste("The `burn_between` argument to `method_bayes()` has been deprecated;",
+        "please specify this inside `control = control_bayes()` instead.", collapse = " "))
+    x <- list(same_cov = same_cov, n_samples = n_samples, control = control)
+    return(as_class(x, c("method", "bayes")))
+}
+```
+
+- The `seed` argument has been deprecated in a previous release and can therefore be removed here.
+- We deprecate here the `burn_in` and `burn_between` arguments, and refer the user to the `control_bayes()` function instead. We will remove these arguments in a future release.
+
+### Fit function
 
-This function's output `control` can then be used in `fit_mcmc()` like this (copied and adapted function code):
+This function's output `control` inside the `method` list can then be used in `fit_mcmc()` like this (copied and adapted function code):
 
 ```r
 fit_mcmc <- function(
@@ -104,7 +137,7 @@ fit_mcmc <- function(
     subjid,
     visit,
     method,
-    control) {
+    quiet = FALSE) {
 
     # Fit MMRM (needed for Sigma prior parameter and possibly initial values).
     mmrm_initial <- fit_mmrm(
@@ -136,6 +169,7 @@ fit_mcmc <- function(
         mmrm_initial$sigma
     )
 
+    control <- method$control
     sampling_args <- c(
       list(
         object = get_stan_model(),
@@ -192,18 +226,23 @@ fit_mcmc <- function(
 }
 ```
 
-Finally, the user can call the `draws()` method now including the new `control` argument. This then also comprises the `quiet` argument. The method signature changes to:
+### Draws method
 
-```{r}
-draws.bayes <- function(data, 
-                        data_ice = NULL, 
-                        vars, 
-                        method, 
-                        ncores = 1,  
-                        control = control_bayes()) 
+Finally, the user can call the `draws()` method as before. The only differences are:
+
+- The `method` argument called by `method_bayes()` now also comprises the `control` argument.
+- Internally in the `draws()` method, additional elements are inserted in the `control` list:
+
+```r
+method$control$iter <- method$control$warmup + method$control$thin * method$n_samples
+method$control$refresh <- ife(
+    quiet,
+    0,
+    method$control$iter / 10
+)
 ```
 
-and internally the `control` argument is just forwarded to `fit_mcmc()`.
+This is to keep the pattern of having the `quiet` argument of the `draws` method. See above the corresponding checks we make in the `control_bayes()` function call to avoid problems if the user passes `refresh`, `iter` or `n_samples` to the `control_bayes()` function.
 
 Note that it is important for easy usability that we just rely on all default arguments in the `control_bayes()` function. The user can then just override the defaults they need to override by
 specifying the corresponding arguments. In addition, we can still pass the Stan `control` argument inside `control_bayes()`, and it is not a problem that this argument has the same name as the `draws()` argument.
@@ -212,7 +251,17 @@ So a call could e.g. just be:
 
 ```r
 draws(
-    data = data, vars = c("beta", "Sigma"), method = method, chains = 4, 
-    control = control_bayes(seed = 123, control = list(adapt_delta = 0.99))
+    data = data, 
+    vars = c("beta", "Sigma"), 
+    method = method_bayes(
+        n_samples = 500,
+        control = control_bayes(
+            chains = 4,
+            burn_in = 1000,
+            burn_between = 100,
+            seed = 123
+        )
+    ), 
+    ncores = 4    
 )
 ```
\ No newline at end of file

From e4d8152afa00a1d121bc6ea375099b142bb61034 Mon Sep 17 00:00:00 2001
From: Daniel Sabanes Bove <danielinteractive@users.noreply.github.com>
Date: Fri, 31 Jan 2025 22:30:29 +0800
Subject: [PATCH 4/5] Apply suggestions from code review

Co-authored-by: Craig Gower-Page <craiggower@gmail.com>
Signed-off-by: Daniel Sabanes Bove <danielinteractive@users.noreply.github.com>
---
 misc/design_mcmc_improve.qmd | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/misc/design_mcmc_improve.qmd b/misc/design_mcmc_improve.qmd
index f6dae6f4..e110a798 100644
--- a/misc/design_mcmc_improve.qmd
+++ b/misc/design_mcmc_improve.qmd
@@ -29,7 +29,7 @@ Idea:
 
 License considerations:
 
-- The `rstan` package is licensed under GPL-3.0, while `rbmi` is licensed under the MIT license.
+- The `rstan` package is licensed under GPL-3.0, while `rbmi` is licensed under the Apache 2.0 license.
 - Only using the `rstan::sampling()` function and specifying reasonable default values for some of its control arguments should not require to change the license of the `rbmi` package. This is because this does not constitute a derivative work. Instead, the `rbmi` package would continue to be "linking" to the GPL package.
 - Importantly, the `rbmi` package only has the `rstan` package in the `Suggests` field of the `DESCRIPTION` file, not in the `Imports` field. This means that the `rstan` package is not required to be installed to use the `rbmi` package. 
 
@@ -65,7 +65,7 @@ control_bayes <- function(
     burn_in = 200,
     burn_between = 50,
     chains = 1,
-    init = ife(chains > 1, "random", "mmrm"),
+    init = ifelse(chains > 1, "random", "mmrm"),
     seed = sample.int(.Machine$integer.max, 1),
     n_samples = NULL,
     iter = NULL,

From 946e0a7c927d3ee8a677ad6b134c06dbbb7e54f4 Mon Sep 17 00:00:00 2001
From: Daniel Sabanes Bove <daniel.sabanesbove@gmx.net>
Date: Fri, 31 Jan 2025 22:39:40 +0800
Subject: [PATCH 5/5] address review comments

---
 misc/design_mcmc_improve.qmd | 23 +++++++++++++----------
 1 file changed, 13 insertions(+), 10 deletions(-)

diff --git a/misc/design_mcmc_improve.qmd b/misc/design_mcmc_improve.qmd
index e110a798..a7866292 100644
--- a/misc/design_mcmc_improve.qmd
+++ b/misc/design_mcmc_improve.qmd
@@ -22,6 +22,7 @@ Idea:
   - The user can override the default behavior by providing a list of control parameters
   - Takes additional arguments which are then included in the returned list
   - In order to simplify the user interface, the previous `method` parts `burn_in` and `burn_between`, are moved to the `control_bayes()` function, and will properly be deprecated from `method_bayes()`.
+  - As we are creating these as new arguments we also rename them to `warmup` and `thin` to be consistent with Stan's nomenclature.
   - In order to keep the pattern with the other `method_*()` functions, the `n_samples` argument remains in the `method_bayes()` function. The `method_bayes()` function gains an additional argument `control` where the `control_bayes()` function result is passed.
   - Arguments of the new control function will be briefly documented (not just copied from the `rstan` documentation, but rather explained in the context of the `rbmi` package). The user will be referred to the `rstan` documentation for more details for additionally passed arguments.
 - The `draws()` method keeps its current signature, but internally sets the `iter` and `refresh` arguments in the `method$control` list, based on the `method$n_samples` and the `quiet` arguments.
@@ -42,6 +43,8 @@ Idea:
 - As part of the `control_bayes()` function, we could add an argument to specify the number of chains. 
 - If the number of chains is greater than 1, then the `init` argument of `rstan::sampling()` should be set to `random` (see [here](https://mc-stan.org/rstan/reference/stanmodel-method-sampling.html)).
 - We can make some experiments to ensure that chains converge to the stationary distribution within reasonable time frame if started from random values. If the Stan random initial values are not good enough, we could later have the option to use initial values sampled from the MLE distribution as the initial values for the chains.
+- In general it is the user's responsibility to ensure the convergence of the Markov chains. Since we expose the underlying Stan object, the user can always check the chains and the convergence diagnostics themselves. We can also provide some guidance in the documentation on how to check the convergence of the chains.
+
 
 We note that due to the definition of the prior distribution for the covariance matrix, we still need to fit the frequentist MMRM model in any case to get the required prior parameter.
 
@@ -62,25 +65,25 @@ This is how the control function could look like:
 
 ```r
 control_bayes <- function( 
-    burn_in = 200,
-    burn_between = 50,
+    warmup = 200,
+    thin = 50,
     chains = 1,
     init = ifelse(chains > 1, "random", "mmrm"),
     seed = sample.int(.Machine$integer.max, 1),
-    n_samples = NULL,
-    iter = NULL,
-    refresh = NULL,
     ...
 ) {
-    if (!is.null(n_samples) || !is.null(iter)) {
+    additional <- list(...)
+    additional_pars <- names(additional)
+    
+    if (any(c("n_samples", "iter") %in% additional_pars)) {
         stop("Please provide the number of samples directly via the `n_samples` argument of `method_bayes()`")
     }
-    is (!is.null(refresh)) {
+    is ("refresh" %in% additional_pars) {
         stop("Instead of the `refresh` argument here, please provide the `quiet` argument directly to `draws()`")
     }
     list(
-        warmup = burn_in,
-        thin = burn_between,
+        warmup = warmup,
+        thin = thin,
         chains = chains,
         refresh = refresh,
         init = init,
@@ -122,7 +125,7 @@ method_bayes <- function(
 }
 ```
 
-- The `seed` argument has been deprecated in a previous release and can therefore be removed here.
+- The `seed` argument has been deprecated in a previous release and can therefore be removed here. Note that it is now available in the `control_bayes()` function though, which replaces the hardcoded seed in the `fit_mcmc()` function.
 - We deprecate here the `burn_in` and `burn_between` arguments, and refer the user to the `control_bayes()` function instead. We will remove these arguments in a future release.
 
 ### Fit function