stan-dev
diff --git a/‎.github/workflows/cmdstan-tarball-check.yaml
Lines changed: 1 addition & 1 deletion b/‎.github/workflows/cmdstan-tarball-check.yaml
Lines changed: 1 addition & 1 deletion
diff --git a/‎DESCRIPTION
Lines changed: 2 additions & 2 deletions b/‎DESCRIPTION
Lines changed: 2 additions & 2 deletions
diff --git a/‎NAMESPACE
Lines changed: 1 addition & 0 deletions b/‎NAMESPACE
Lines changed: 1 addition & 0 deletions
diff --git a/‎R/csv.R
Lines changed: 1 addition & 0 deletions b/‎R/csv.R
Lines changed: 1 addition & 0 deletions
diff --git a/‎R/data.R
Lines changed: 75 additions & 20 deletions b/‎R/data.R
Lines changed: 75 additions & 20 deletions
diff --git a/‎R/model.R
Lines changed: 11 additions & 2 deletions b/‎R/model.R
Lines changed: 11 additions & 2 deletions
diff --git a/‎_pkgdown.yml
Lines changed: 1 addition & 0 deletions b/‎_pkgdown.yml
Lines changed: 1 addition & 0 deletions
diff --git a/‎inst/logistic.stan
Lines changed: 4 additions & 2 deletions b/‎inst/logistic.stan
Lines changed: 4 additions & 2 deletions
diff --git a/‎man/draws_to_csv.Rd
Lines changed: 61 additions & 0 deletions b/‎man/draws_to_csv.Rd
Lines changed: 61 additions & 0 deletions
diff --git a/‎man/model-method-generate-quantities.Rd
Lines changed: 8 additions & 1 deletion b/‎man/model-method-generate-quantities.Rd
Lines changed: 8 additions & 1 deletion
diff --git a/‎tests/testthat/answers/model-code-output.rds
12 Bytes b/‎tests/testthat/answers/model-code-output.rds
12 Bytes
diff --git a/‎tests/testthat/answers/model-print-output.stan
Lines changed: 3 additions & 3 deletions b/‎tests/testthat/answers/model-print-output.stan
Lines changed: 3 additions & 3 deletions
diff --git a/‎tests/testthat/resources/stan/bernoulli.stan
Lines changed: 3 additions & 3 deletions b/‎tests/testthat/resources/stan/bernoulli.stan
Lines changed: 3 additions & 3 deletions
diff --git a/‎tests/testthat/resources/stan/bernoulli_fp.stan
Lines changed: 4 additions & 3 deletions b/‎tests/testthat/resources/stan/bernoulli_fp.stan
Lines changed: 4 additions & 3 deletions
diff --git a/‎tests/testthat/resources/stan/bernoulli_include.stan
Lines changed: 5 additions & 4 deletions b/‎tests/testthat/resources/stan/bernoulli_include.stan
Lines changed: 5 additions & 4 deletions
diff --git a/‎tests/testthat/resources/stan/bernoulli_log_lik.stan
Lines changed: 6 additions & 4 deletions b/‎tests/testthat/resources/stan/bernoulli_log_lik.stan
Lines changed: 6 additions & 4 deletions
@@ -19,7 +19,7 @@ jobs:
     name: ${{ matrix.config.os }} (${{ matrix.config.r }})
 
     strategy:
-      fail-fast: true
+      fail-fast: false
       matrix:
         config:
           - {os: macOS-latest, r: 'release'}
 
@@ -1,6 +1,6 @@
 Package: cmdstanr
 Title: R Interface to 'CmdStan'
-Version: 0.4.0.9000
+Version: 0.4.0.9001
 Date: 2021-04-15
 Authors@R: 
     c(person(given = "Jonah", family = "Gabry", role = c("aut", "cre"),
@@ -36,7 +36,7 @@ Imports:
     R6 (>= 2.4.0)
 Suggests: 
     bayesplot,
-    knitr,
+    knitr (>= 1.37),
     loo (>= 2.0.0),
     rlang (>= 0.4.7),
     rmarkdown,
 
@@ -15,6 +15,7 @@ export(cmdstan_model)
 export(cmdstan_path)
 export(cmdstan_version)
 export(cmdstanr_example)
+export(draws_to_csv)
 export(eng_cmdstan)
 export(install_cmdstan)
 export(num_threads)
 
@@ -179,6 +179,7 @@ read_cmdstan_csv <- function(files,
   if (length(uniq_seed) == 1) {
     metadata$seed <- uniq_seed
   }
+  metadata$time <- time
   if (metadata$method == "diagnose") {
     gradients <- metadata$gradients
     metadata$gradients <- NULL
 
@@ -204,27 +204,77 @@ any_zero_dims <- function(data) {
   any(has_zero_dims)
 }
 
-#' Write posterior draws objects to csv files
-#' @noRd
-#' @param draws A `draws_array` from posterior pkg
-#' @param sampler_diagnostics Either `NULL` or a `draws_array` of sampler diagnostics
+#' Write posterior draws objects to CSV files suitable for running standalone generated
+#' quantities with CmdStan.
+#'
+#' @export
+#' @param draws A `posterior::draws_*` object.
+#' @param sampler_diagnostics Either `NULL` or a `posterior::draws_*` object
+#'  of sampler diagnostics.
+#' @param dir (string) An optional path to the directory where the CSV files will be
+#'   written. If not set, the [temporary directory][base::tempdir] is used.
+#' @param basename (string) If `dir` is specified, `basename` is used for naming
+#' the output CSV files. If not specified, the file names are randomly generated.
+#'
 #' @return Paths to CSV files (one per chain).
 #'
-draws_to_csv <- function(draws, sampler_diagnostics = NULL) {
+#' @details
+#' `draws_to_csv()` generates a CSV suitable for running standalone generated
+#' quantities with CmdStan. The CSV file contains a single comment `#num_samples`,
+#' which equals the number of iterations in the supplied draws object.
+#'
+#' The comment is followed by the column names. The first column is the `lp__` value,
+#' followed by sampler diagnostics and finally other variables of the draws object.
+#' If the draws object does not contain the `lp__` or sampler diagnostics variables,
+#' columns with zeros are created in order to conform with the requirements of the
+#' standalone generated quantities method of CmdStan.
+#'
+#' The column names line is finally followed by the values of the draws in the same
+#' order as the column names.
+#'
+#' @examples
+#' \dontrun{
+#' draws <- posterior::example_draws()
+#'
+#' draws_csv_files <- draws_to_csv(draws)
+#' print(draws_csv_files)
+#'
+#' # draws_csv_files <- draws_to_csv(draws,
+#' #                                 sampler_diagnostics = sampler_diagnostics,
+#' #                                 dir = "~/my_folder",
+#' #                                 basename = "my-samples")
+#' }
+#'
+draws_to_csv <- function(draws,
+                         sampler_diagnostics = NULL,
+                         dir = tempdir(),
+                         basename = "fittedParams") {
+  sampler_diagnostics_names <- c(
+    "accept_stat__", "stepsize__", "treedepth__",
+    "n_leapfrog__", "divergent__", "energy__"
+  )
   n <- posterior::niterations(draws)
   n_chains <- posterior::nchains(draws)
+  draws_variables <- posterior::variables(draws)
+  sampler_diagnostics_variables <- posterior::variables(sampler_diagnostics)
+
+  # create dummy sampler diagnostics due to CmdStan requirement for all columns in GQ if needed
   zeros <- rep(0, n * n_chains) # filler for creating dummy sampler diagnostics and lp__ if necessary
   if (is.null(sampler_diagnostics)) {
-    # create dummy sampler diagnostics due to CmdStan requirement for all columns in GQ
-    sampler_diagnostics <- posterior::draws_array(
-      accept_stat__ = zeros,
-      stepsize__ = zeros,
-      treedepth__ = zeros,
-      n_leapfrog__ = zeros,
-      divergent__ = zeros,
-      energy__ = zeros,
-      .nchains = n_chains
-    )
+    missing_sampler_diagnostics <- sampler_diagnostics_names[!(sampler_diagnostics_names %in% draws_variables)]
+
+  } else {
+    missing_sampler_diagnostics <- sampler_diagnostics_names[!(sampler_diagnostics_names %in% draws_variables)]
+    missing_sampler_diagnostics <- missing_sampler_diagnostics[!(missing_sampler_diagnostics %in% sampler_diagnostics_variables)]
+  }
+  if (length(missing_sampler_diagnostics) > 0) {
+    additional_sampler_diagnostics <- list()
+    for (name in missing_sampler_diagnostics) {
+      additional_sampler_diagnostics[[name]] <- zeros
+    }
+    additional_sampler_diagnostics[[".nchains"]] <- n_chains
+    additional_sampler_diagnostics <- do.call(posterior::draws_array, additional_sampler_diagnostics)
+    sampler_diagnostics <- posterior::bind_draws(sampler_diagnostics, additional_sampler_diagnostics)
   }
 
   # the columns must be in order "lp__, sampler_diagnostics, parameters"
@@ -236,26 +286,31 @@ draws_to_csv <- function(draws, sampler_diagnostics = NULL) {
   }
   all_variables <- c(
     "lp__",
-    posterior::variables(sampler_diagnostics),
-    draws_variables[!(draws_variables %in% c("lp__", "lp_approx__"))]
+    sampler_diagnostics_names,
+    draws_variables[!(draws_variables %in% c("lp__", "lp_approx__", sampler_diagnostics_names))]
   )
   draws <- posterior::subset_draws(
     posterior::bind_draws(draws, sampler_diagnostics, lp__, along = "variable"),
     variable = all_variables
   )
 
   chains <- posterior::chain_ids(draws)
-  paths <- generate_file_names(basename = "fittedParams", ids = chains)
-  paths <- file.path(tempdir(), paths)
+  paths <- generate_file_names(basename = basename, ids = chains)
+  paths <- file.path(dir, paths)
   chain <- 1
   for (path in paths) {
     write(
       paste0("# num_samples = ", n, "\n", paste0(unrepair_variable_names(all_variables), collapse = ",")),
       file = path,
       append = FALSE
     )
+    data <- posterior::as_draws_df(posterior::subset_draws(draws, chain = chain))
+    class(data) <- "data.frame"
+    data$.chain <- NULL
+    data$.iteration <- NULL
+    data$.draw <- NULL
     data.table::fwrite(
-      posterior::as_draws_df(posterior::subset_draws(draws, chain = chain)),
+      data,
       sep = ",",
       file = path,
       col.names = FALSE,
 
@@ -587,7 +587,9 @@ compile <- function(quiet = TRUE,
     stop("An error occured during compilation! See the message above for more information.",
          call. = FALSE)
   }
-
+  if (file.exists(exe)) {
+    file.remove(exe)
+  }
   file.copy(tmp_exe, exe, overwrite = TRUE)
   private$exe_file_ <- exe
   private$cpp_options_ <- cpp_options
@@ -1311,6 +1313,13 @@ CmdStanModel$set("public", name = "variational", value = variational)
 #'  VB) object returned by CmdStanR's [`$draws()`][fit-method-draws] method.
 #'  * A character vector of paths to CmdStan CSV output files.
 #'
+#' NOTE: if you plan on making many calls to `$generate_quantities()` then the
+#' most efficient option is to pass the paths of the CmdStan CSV output files
+#' (this avoids CmdStanR having to rewrite the draws contained in the fitted
+#' model object to CSV each time). If you no longer have the CSV files you can
+#' use [draws_to_csv()] once to write them and then pass the resulting file
+#' paths to `$generate_quantities()` as many times as needed.
+#'
 #' @return A [`CmdStanGQ`] object.
 #'
 #' @template seealso-docs
@@ -1534,7 +1543,7 @@ cpp_options_to_compile_flags <- function(cpp_options) {
   for (i in seq_along(cpp_options)) {
     option_name <- names(cpp_options)[i]
     if (is.null(option_name) || !nzchar(option_name)) {
-      cpp_built_options <- c(cpp_built_options, toupper(cpp_options[[i]]))
+      cpp_built_options <- c(cpp_built_options, cpp_options[[i]])
     } else {
       cpp_built_options <- c(cpp_built_options, paste0(toupper(option_name), "=", cpp_options[[i]]))
     }
 
@@ -107,6 +107,7 @@ reference:
       - read_cmdstan_csv
       - write_stan_json
       - write_stan_file
+      - draws_to_csv
   - title: "Using CmdStanR with knitr and R Markdown"
     contents:
       - register_knitr_engine
 
@@ -1,7 +1,7 @@
 data {
   int<lower=0> N;
   int<lower=0> K;
-  int<lower=0,upper=1> y[N];
+  array[N] int<lower=0, upper=1> y;
   matrix[N, K] X;
 }
 parameters {
@@ -15,5 +15,7 @@ model {
 }
 generated quantities {
   vector[N] log_lik;
-  for (n in 1:N) log_lik[n] = bernoulli_logit_lpmf(y[n] | alpha + X[n] * beta);
+  for (n in 1 : N) {
+    log_lik[n] = bernoulli_logit_lpmf(y[n] | alpha + X[n] * beta);
+  }
 }
@@ -1,11 +1,11 @@
 data {
   int<lower=0> N;
-  int<lower=0,upper=1> y[N];
+  array[N] int<lower=0, upper=1> y;
 }
 parameters {
-  real<lower=0,upper=1> theta;
+  real<lower=0, upper=1> theta;
 }
 model {
-  theta ~ beta(1,1);  // uniform prior on interval 0,1
+  theta ~ beta(1, 1); // uniform prior on interval 0,1
   y ~ bernoulli(theta);
 }
@@ -1,11 +1,11 @@
 data {
   int<lower=0> N;
-  int<lower=0,upper=1> y[N];
+  array[N] int<lower=0, upper=1> y;
 }
 parameters {
-  real<lower=0,upper=1> theta;
+  real<lower=0, upper=1> theta;
 }
 model {
-  theta ~ beta(1,1);  // uniform prior on interval 0,1
+  theta ~ beta(1, 1); // uniform prior on interval 0,1
   y ~ bernoulli(theta);
 }
@@ -1,9 +1,10 @@
 transformed data {
   int<lower=0> N = 10;
-  real<lower=0,upper=1> theta = 0.35;
+  real<lower=0, upper=1> theta = 0.35;
 }
 generated quantities {
-  int y_sim[N];
-  for (n in 1:N)
+  array[N] int y_sim;
+  for (n in 1 : N) {
     y_sim[n] = bernoulli_rng(theta);
+  }
 }
@@ -3,13 +3,14 @@ functions {
 }
 data {
   int<lower=0> N;
-  int<lower=0,upper=1> y[N];
+  array[N] int<lower=0, upper=1> y;
 }
 parameters {
-  real<lower=0,upper=1> theta;
+  real<lower=0, upper=1> theta;
 }
 model {
-  theta ~ beta(divide_real_by_two(2.0),1);
-  for (n in 1:N)
+  theta ~ beta(divide_real_by_two(2.0), 1);
+  for (n in 1 : N) {
     y[n] ~ bernoulli(theta);
+  }
 }
@@ -1,15 +1,17 @@
 data {
   int<lower=0> N;
-  int<lower=0,upper=1> y[N];
+  array[N] int<lower=0, upper=1> y;
 }
 parameters {
-  real<lower=0,upper=1> theta;
+  real<lower=0, upper=1> theta;
 }
 model {
-  theta ~ beta(1,1);  // uniform prior on interval 0,1
+  theta ~ beta(1, 1); // uniform prior on interval 0,1
   y ~ bernoulli(theta);
 }
 generated quantities {
   vector[N] log_lik;
-  for (n in 1:N) log_lik[n] = bernoulli_lpmf(y | theta);
+  for (n in 1 : N) {
+    log_lik[n] = bernoulli_lpmf(y | theta);
+  }
 }
Original file line number	Diff line number	Diff line change
`@@ -179,6 +179,7 @@ read_cmdstan_csv <- function(files,`
`179`	`179`	`if (length(uniq_seed) == 1) {`
`180`	`180`	`metadata$seed <- uniq_seed`
`181`	`181`	`}`
	`182`	`+ metadata$time <- time`
`182`	`183`	`if (metadata$method == "diagnose") {`
`183`	`184`	`gradients <- metadata$gradients`
`184`	`185`	`metadata$gradients <- NULL`
Original file line number	Diff line number	Diff line change
`@@ -1,7 +1,7 @@`
`1`	`1`	`data {`
`2`	`2`	`int<lower=0> N;`
`3`	`3`	`int<lower=0> K;`
`4`		`- int<lower=0,upper=1> y[N];`
	`4`	`+ array[N] int<lower=0, upper=1> y;`
`5`	`5`	`matrix[N, K] X;`
`6`	`6`	`}`
`7`	`7`	`parameters {`
`@@ -15,5 +15,7 @@ model {`
`15`	`15`	`}`
`16`	`16`	`generated quantities {`
`17`	`17`	`vector[N] log_lik;`
`18`		`- for (n in 1:N) log_lik[n] = bernoulli_logit_lpmf(y[n] \| alpha + X[n] * beta);`
	`18`	`+ for (n in 1 : N) {`
	`19`	`+ log_lik[n] = bernoulli_logit_lpmf(y[n] \| alpha + X[n] * beta);`
	`20`	`+ }`
`19`	`21`	`}`
Original file line number	Diff line number	Diff line change
`@@ -1,11 +1,11 @@`
`1`	`1`	`data {`
`2`	`2`	`int<lower=0> N;`
`3`		`- int<lower=0,upper=1> y[N];`
	`3`	`+ array[N] int<lower=0, upper=1> y;`
`4`	`4`	`}`
`5`	`5`	`parameters {`
`6`		`- real<lower=0,upper=1> theta;`
	`6`	`+ real<lower=0, upper=1> theta;`
`7`	`7`	`}`
`8`	`8`	`model {`
`9`		`- theta ~ beta(1,1); // uniform prior on interval 0,1`
	`9`	`+ theta ~ beta(1, 1); // uniform prior on interval 0,1`
`10`	`10`	`y ~ bernoulli(theta);`
`11`	`11`	`}`
Original file line number	Diff line number	Diff line change
`@@ -1,9 +1,10 @@`
`1`	`1`	`transformed data {`
`2`	`2`	`int<lower=0> N = 10;`
`3`		`- real<lower=0,upper=1> theta = 0.35;`
	`3`	`+ real<lower=0, upper=1> theta = 0.35;`
`4`	`4`	`}`
`5`	`5`	`generated quantities {`
`6`		`- int y_sim[N];`
`7`		`- for (n in 1:N)`
	`6`	`+ array[N] int y_sim;`
	`7`	`+ for (n in 1 : N) {`
`8`	`8`	`y_sim[n] = bernoulli_rng(theta);`
	`9`	`+ }`
`9`	`10`	`}`
Original file line number	Diff line number	Diff line change
`@@ -3,13 +3,14 @@ functions {`
`3`	`3`	`}`
`4`	`4`	`data {`
`5`	`5`	`int<lower=0> N;`
`6`		`- int<lower=0,upper=1> y[N];`
	`6`	`+ array[N] int<lower=0, upper=1> y;`
`7`	`7`	`}`
`8`	`8`	`parameters {`
`9`		`- real<lower=0,upper=1> theta;`
	`9`	`+ real<lower=0, upper=1> theta;`
`10`	`10`	`}`
`11`	`11`	`model {`
`12`		`- theta ~ beta(divide_real_by_two(2.0),1);`
`13`		`- for (n in 1:N)`
	`12`	`+ theta ~ beta(divide_real_by_two(2.0), 1);`
	`13`	`+ for (n in 1 : N) {`
`14`	`14`	`y[n] ~ bernoulli(theta);`
	`15`	`+ }`
`15`	`16`	`}`
Original file line number	Diff line number	Diff line change
`@@ -1,15 +1,17 @@`
`1`	`1`	`data {`
`2`	`2`	`int<lower=0> N;`
`3`		`- int<lower=0,upper=1> y[N];`
	`3`	`+ array[N] int<lower=0, upper=1> y;`
`4`	`4`	`}`
`5`	`5`	`parameters {`
`6`		`- real<lower=0,upper=1> theta;`
	`6`	`+ real<lower=0, upper=1> theta;`
`7`	`7`	`}`
`8`	`8`	`model {`
`9`		`- theta ~ beta(1,1); // uniform prior on interval 0,1`
	`9`	`+ theta ~ beta(1, 1); // uniform prior on interval 0,1`
`10`	`10`	`y ~ bernoulli(theta);`
`11`	`11`	`}`
`12`	`12`	`generated quantities {`
`13`	`13`	`vector[N] log_lik;`
`14`		`- for (n in 1:N) log_lik[n] = bernoulli_lpmf(y \| theta);`
	`14`	`+ for (n in 1 : N) {`
	`15`	`+ log_lik[n] = bernoulli_lpmf(y \| theta);`
	`16`	`+ }`
`15`	`17`	`}`