Updates for Regression and Other Stories #432

Merged
27 commits merged into master from new-default-prior on Jul 8, 2020
Commits (the file diffs below show changes from 5 of the 27 commits)
8d43c7f
prior scale for intercept now 2.5 instead of 10
jgabry Apr 27, 2020
8bfe1d2
change autoscale usage
jgabry Apr 27, 2020
0973436
add default_prior_intercept, default_prior_coef
jgabry Apr 27, 2020
dd800ab
Update priors.R
jgabry Apr 27, 2020
76a3806
Update NAMESPACE
jgabry Apr 27, 2020
fa19d13
introduce posterior_epred
bgoodri May 3, 2020
7add53f
predict.R: remove error message for RAOS
bgoodri May 3, 2020
90d49bc
add (currently unused) family argument to default_prior_*
jgabry May 14, 2020
b469f1e
update posterior_linpred/epred doc
jgabry May 14, 2020
92d10a6
import posterior_epred generic from rstantools
jgabry May 14, 2020
fef4102
use posterior_epred instead of posterior_linpred in *_R2() functions
jgabry May 15, 2020
dfd7d33
use posterior_epred instead of linpred with transform
jgabry May 15, 2020
6ebfa90
logit and invlogit convenience functions
jgabry May 18, 2020
cc050a0
Update DESCRIPTION
jgabry Jun 3, 2020
64126fc
Merge branch 'master' into new-default-prior
jgabry Jun 10, 2020
c5b67a4
Update posterior_linpred.R
jgabry Jun 21, 2020
f97753c
always divide by sd(x) (unless x is constant)
jgabry Jun 26, 2020
eb5cbd4
Update priors.Rmd
jgabry Jun 26, 2020
4c3b8e2
Merge branch 'new-default-prior' of https://github.com/stan-dev/rstan…
jgabry Jun 26, 2020
dcf587a
more doc updates after updating default priors
jgabry Jun 26, 2020
5a43cad
Add note at top of priors vignette about changes
jgabry Jun 26, 2020
27e9988
remove autoscale=FALSE from vignettes
jgabry Jun 26, 2020
efc6d16
Update zzz.R
jgabry Jun 27, 2020
781a131
mention version number in vignette
jgabry Jun 29, 2020
3a412a9
averages -> expectations in posterior_epred doc
jgabry Jun 29, 2020
8708832
update message and doc for posterior_linpred(transform=TRUE)
jgabry Jul 1, 2020
5e8f452
Merge branch 'master' into new-default-prior
bgoodri Jul 8, 2020
2 changes: 2 additions & 0 deletions NAMESPACE
@@ -95,6 +95,8 @@ export(bayes_R2)
export(cauchy)
export(compare_models)
export(decov)
export(default_prior_coef)
export(default_prior_intercept)
export(dirichlet)
export(exponential)
export(fixef)
40 changes: 27 additions & 13 deletions R/priors.R
@@ -72,7 +72,7 @@
#' or equal to two, the mode of this Beta distribution does not exist
#' and an error will prompt the user to specify another choice for
#' \code{what}.
#' @param autoscale A logical scalar, defaulting to \code{TRUE}. If \code{TRUE}
#' @param autoscale If \code{TRUE}
#' then the scales of the priors on the intercept and regression coefficients
#' may be additionally modified internally by \pkg{rstanarm} in the following
#' cases. First, for Gaussian models only, the prior scales for the intercept,
@@ -104,12 +104,11 @@
#' approaches the normal distribution and if the degrees of freedom are one,
#' then the Student t distribution is the Cauchy distribution.
#'
#' If \code{scale} is not specified it will default to \eqn{10} for the
#' intercept and \eqn{2.5} for the other coefficients, unless the probit link
#' function is used, in which case these defaults are scaled by a factor of
#' \code{dnorm(0)/dlogis(0)}, which is roughly \eqn{1.6}.
#' If \code{scale} is not specified it will default to \eqn{2.5}, unless the
#' probit link function is used, in which case these defaults are scaled by a
#' factor of \code{dnorm(0)/dlogis(0)}, which is roughly \eqn{1.6}.
#'
#' If the \code{autoscale} argument is \code{TRUE} (the default), then the
#' If the \code{autoscale} argument is \code{TRUE}, then the
#' scales will be further adjusted as described above in the documentation of
#' the \code{autoscale} argument in the \strong{Arguments} section.
#' }
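
As a quick check of the probit adjustment described above, the rescaling factor can be computed directly in R (an illustration, not part of the diff):

# standard normal density at 0 divided by standard logistic density at 0
dnorm(0) / dlogis(0)
#> [1] 1.595769  # roughly 1.6, matching the documentation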
@@ -174,7 +173,7 @@
#'
#' It is also common in supervised learning to standardize the predictors
#' before training the model. We do not recommend doing so. Instead, it is
#' better to specify \code{autoscale = TRUE} (the default value), which
#' better to specify \code{autoscale = TRUE}, which
#' will adjust the scales of the priors according to the dispersion in the
#' variables. See the documentation of the \code{autoscale} argument above
#' and also the \code{\link{prior_summary}} page for more information.
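
As a brief illustration of this recommendation (a hypothetical call on the built-in mtcars data, not part of the diff), prior_summary() reports both the specified priors and the scales after autoscaling:

fit <- stan_glm(mpg ~ wt + am, data = mtcars,
                prior = normal(0, 2.5, autoscale = TRUE),
                prior_intercept = normal(0, 2.5, autoscale = TRUE),
                refresh = 0)
prior_summary(fit)  # shows specified and adjusted prior scales (adjusted using the sd of each variable)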
@@ -436,22 +435,22 @@ NULL

#' @rdname priors
#' @export
normal <- function(location = 0, scale = NULL, autoscale = TRUE) {
normal <- function(location = 0, scale = NULL, autoscale = FALSE) {
validate_parameter_value(scale)
nlist(dist = "normal", df = NA, location, scale, autoscale)
}

#' @rdname priors
#' @export
student_t <- function(df = 1, location = 0, scale = NULL, autoscale = TRUE) {
student_t <- function(df = 1, location = 0, scale = NULL, autoscale = FALSE) {
validate_parameter_value(scale)
validate_parameter_value(df)
nlist(dist = "t", df, location, scale, autoscale)
}

#' @rdname priors
#' @export
cauchy <- function(location = 0, scale = NULL, autoscale = TRUE) {
cauchy <- function(location = 0, scale = NULL, autoscale = FALSE) {
student_t(df = 1, location = location, scale = scale, autoscale)
}

@@ -485,13 +484,13 @@ hs_plus <- function(df1 = 1, df2 = 1, global_df = 1, global_scale = 0.01,

#' @rdname priors
#' @export
laplace <- function(location = 0, scale = NULL, autoscale = TRUE) {
laplace <- function(location = 0, scale = NULL, autoscale = FALSE) {
nlist(dist = "laplace", df = NA, location, scale, autoscale)
}

#' @rdname priors
#' @export
lasso <- function(df = 1, location = 0, scale = NULL, autoscale = TRUE) {
lasso <- function(df = 1, location = 0, scale = NULL, autoscale = FALSE) {
nlist(dist = "lasso", df, location, scale, autoscale)
}

@@ -510,7 +509,7 @@ product_normal <- function(df = 2, location = 0, scale = 1) {
#' \code{1}. For the exponential distribution, the rate parameter is the
#' \emph{reciprocal} of the mean.
#'
exponential <- function(rate = 1, autoscale = TRUE) {
exponential <- function(rate = 1, autoscale = FALSE) {
stopifnot(length(rate) == 1)
validate_parameter_value(rate)
nlist(dist = "exponential",
@@ -562,7 +561,22 @@ R2 <- function(location = NULL, what = c("mode", "mean", "median", "log")) {
list(dist = "R2", location = location, what = what, df = 0, scale = 0)
}

#' @rdname priors
#' @export
default_prior_intercept = function() {
Review comment (Contributor):
I think default_prior_* should take a family argument and then stan_glm, etc. should default to default_prior(family). This will give us more flexibility to change things in the future.

Reply (Member Author):
Ok. What about for functions like stan_lmer(), stan_glm.nb(), stan_glmer.nb(), where there's no family argument?

That is, for stan_glmer() we can have

stan_glmer(..., prior_intercept = default_prior_intercept(family))

but for stan_lmer() and others should we just fill in the family like this?

stan_lmer(..., prior_intercept = default_prior_intercept(family=gaussian()))
stan_glmer.nb(..., prior_intercept = default_prior_intercept(family=neg_binomial_2()))
stan_glm.nb(..., prior_intercept = default_prior_intercept(family=neg_binomial_2()))

Or some other option?

out <- normal(0, 2.5, autoscale=TRUE)
out$location <- NULL # not determined yet
out$default <- TRUE
out
}

#' @rdname priors
#' @export
default_prior_coef = function() {
out <- normal(0, 2.5, autoscale=TRUE)
out$default <- TRUE
out
}
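
A rough sketch of the family-aware variant proposed in the review thread above (hypothetical at this point in the branch; commit 90d49bc later adds a family argument that is accepted but not yet used):

default_prior_intercept = function(family) {
  # 'family' is accepted so the default can eventually depend on the model family,
  # but for now it does not change the returned prior
  out <- normal(0, 2.5, autoscale = TRUE)
  out$location <- NULL  # filled in later, e.g. mean(y) for Gaussian identity models
  out$default <- TRUE
  out
}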


# internal ----------------------------------------------------------------
10 changes: 5 additions & 5 deletions R/stan_betareg.R
@@ -117,11 +117,11 @@ stan_betareg <-
y = TRUE,
x = FALSE,
...,
prior = normal(),
prior_intercept = normal(),
prior_z = normal(),
prior_intercept_z = normal(),
prior_phi = exponential(),
prior = normal(autoscale=TRUE),
prior_intercept = normal(autoscale=TRUE),
prior_z = normal(autoscale=TRUE),
prior_intercept_z = normal(autoscale=TRUE),
prior_phi = exponential(autoscale=TRUE),
prior_PD = FALSE,
algorithm = c("sampling", "optimizing", "meanfield", "fullrank"),
adapt_delta = NULL,
14 changes: 7 additions & 7 deletions R/stan_betareg.fit.R
@@ -26,11 +26,11 @@ stan_betareg.fit <-
offset = rep(0, NROW(x)),
link = c("logit", "probit", "cloglog", "cauchit", "log", "loglog"),
link.phi = NULL, ...,
prior = normal(),
prior_intercept = normal(),
prior_z = normal(),
prior_intercept_z = normal(),
prior_phi = exponential(),
prior = normal(autoscale=TRUE),
prior_intercept = normal(autoscale=TRUE),
prior_z = normal(autoscale=TRUE),
prior_intercept_z = normal(autoscale=TRUE),
prior_phi = exponential(autoscale=TRUE),
prior_PD = FALSE,
algorithm = c("sampling", "optimizing", "meanfield", "fullrank"),
adapt_delta = NULL,
@@ -101,7 +101,7 @@ stan_betareg.fit <-
assign(i, prior_stuff[[i]])

prior_intercept_stuff <- handle_glm_prior(prior_intercept, nvars = 1,
default_scale = 10, link = link,
default_scale = 2.5, link = link,
ok_dists = ok_intercept_dists)
names(prior_intercept_stuff) <- paste0(names(prior_intercept_stuff),
"_for_intercept")
@@ -115,7 +115,7 @@
assign(paste0(i,"_z"), prior_stuff_z[[i]])

prior_intercept_stuff_z <- handle_glm_prior(prior_intercept_z, nvars = 1,
link = link.phi, default_scale = 10,
link = link.phi, default_scale = 2.5,
ok_dists = ok_intercept_dists)
names(prior_intercept_stuff_z) <- paste0(names(prior_intercept_stuff_z),
"_for_intercept")
2 changes: 1 addition & 1 deletion R/stan_clogit.R
@@ -91,7 +91,7 @@
#'
#' @importFrom lme4 findbars
stan_clogit <- function(formula, data, subset, na.action = NULL, ...,
strata, prior = normal(),
strata, prior = normal(autoscale=TRUE),
prior_covariance = decov(), prior_PD = FALSE,
algorithm = c("sampling", "optimizing",
"meanfield", "fullrank"),
6 changes: 3 additions & 3 deletions R/stan_gamm4.R
@@ -127,10 +127,10 @@ stan_gamm4 <-
knots = NULL,
drop.unused.levels = TRUE,
...,
prior = normal(),
prior_intercept = normal(),
prior = default_prior_coef(),
prior_intercept = default_prior_intercept(),
prior_smooth = exponential(autoscale = FALSE),
prior_aux = exponential(),
prior_aux = exponential(autoscale=TRUE),
prior_covariance = decov(),
prior_PD = FALSE,
algorithm = c("sampling", "meanfield", "fullrank"),
14 changes: 7 additions & 7 deletions R/stan_glm.R
@@ -138,7 +138,7 @@
#' counts ~ outcome + treatment,
#' data = count_data,
#' family = poisson(link="log"),
#' prior = normal(0, 2, autoscale = FALSE),
#' prior = normal(0, 2),
#' refresh = 0,
#' # for speed of example only
#' chains = 2, iter = 250
@@ -207,9 +207,9 @@ stan_glm <-
y = TRUE,
contrasts = NULL,
...,
prior = normal(),
prior_intercept = normal(),
prior_aux = exponential(),
prior = default_prior_coef(),
prior_intercept = default_prior_intercept(),
prior_aux = exponential(autoscale=TRUE),
prior_PD = FALSE,
algorithm = c("sampling", "optimizing", "meanfield", "fullrank"),
mean_PPD = algorithm != "optimizing",
@@ -319,9 +319,9 @@ stan_glm.nb <-
contrasts = NULL,
link = "log",
...,
prior = normal(),
prior_intercept = normal(),
prior_aux = exponential(),
prior = default_prior_coef(),
prior_intercept = default_prior_intercept(),
prior_aux = exponential(autoscale=TRUE),
prior_PD = FALSE,
algorithm = c("sampling", "optimizing", "meanfield", "fullrank"),
mean_PPD = algorithm != "optimizing",
16 changes: 12 additions & 4 deletions R/stan_glm.fit.R
@@ -41,9 +41,9 @@ stan_glm.fit <-
offset = rep(0, NROW(y)),
family = gaussian(),
...,
prior = normal(),
prior_intercept = normal(),
prior_aux = exponential(),
prior = default_prior_coef(),
prior_intercept = default_prior_intercept(),
prior_aux = exponential(autoscale=TRUE),
prior_smooth = exponential(autoscale = FALSE),
prior_ops = NULL,
group = list(),
@@ -132,6 +132,14 @@ stan_glm.fit <-
ok_aux_dists <- c(ok_dists[1:3], exponential = "exponential")

# prior distributions
if (isTRUE(prior_intercept$default)) {
m_y <- 0
if (family$family == "gaussian" && family$link == "identity") {
if (!is.null(y)) m_y <- mean(y) # y can be NULL if prior_PD=TRUE
}
prior_intercept$location <- m_y
}

prior_stuff <- handle_glm_prior(
prior,
nvars,
@@ -147,7 +155,7 @@
prior_intercept_stuff <- handle_glm_prior(
prior_intercept,
nvars = 1,
default_scale = 10,
default_scale = 2.5,
link = family$link,
ok_dists = ok_intercept_dists
)
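
A small sketch of what the default-intercept handling above implies (hypothetical fit on the built-in mtcars data, not part of the diff): for a Gaussian model with identity link and the default prior_intercept, the intercept prior ends up centered at the sample mean of the outcome.

fit <- stan_glm(mpg ~ wt, data = mtcars, refresh = 0)  # uses default_prior_intercept()
prior_summary(fit)  # intercept prior location should be about mean(mtcars$mpg)
mean(mtcars$mpg)
#> [1] 20.09062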
18 changes: 9 additions & 9 deletions R/stan_glmer.R
@@ -103,9 +103,9 @@ stan_glmer <-
offset,
contrasts = NULL,
...,
prior = normal(),
prior_intercept = normal(),
prior_aux = exponential(),
prior = default_prior_coef(),
prior_intercept = default_prior_intercept(),
prior_aux = exponential(autoscale=TRUE),
prior_covariance = decov(),
prior_PD = FALSE,
algorithm = c("sampling", "meanfield", "fullrank"),
@@ -202,9 +202,9 @@ stan_lmer <-
offset,
contrasts = NULL,
...,
prior = normal(),
prior_intercept = normal(),
prior_aux = exponential(),
prior = default_prior_coef(),
prior_intercept = default_prior_intercept(),
prior_aux = exponential(autoscale=TRUE),
prior_covariance = decov(),
prior_PD = FALSE,
algorithm = c("sampling", "meanfield", "fullrank"),
@@ -244,9 +244,9 @@ stan_glmer.nb <-
contrasts = NULL,
link = "log",
...,
prior = normal(),
prior_intercept = normal(),
prior_aux = exponential(),
prior = default_prior_coef(),
prior_intercept = default_prior_intercept(),
prior_aux = exponential(autoscale=TRUE),
prior_covariance = decov(),
prior_PD = FALSE,
algorithm = c("sampling", "meanfield", "fullrank"),
8 changes: 4 additions & 4 deletions R/stan_jm.R
@@ -523,10 +523,10 @@ stan_jm <- function(formulaLong, dataLong, formulaEvent, dataEvent, time_var,
lag_assoc = 0, grp_assoc, epsilon = 1E-5,
basehaz = c("bs", "weibull", "piecewise"), basehaz_ops,
qnodes = 15, init = "prefit", weights,
priorLong = normal(), priorLong_intercept = normal(),
priorLong_aux = cauchy(0, 5), priorEvent = normal(),
priorEvent_intercept = normal(), priorEvent_aux = cauchy(),
priorEvent_assoc = normal(), prior_covariance = lkj(),
priorLong = normal(autoscale=TRUE), priorLong_intercept = normal(autoscale=TRUE),
priorLong_aux = cauchy(0, 5, autoscale=TRUE), priorEvent = normal(autoscale=TRUE),
priorEvent_intercept = normal(autoscale=TRUE), priorEvent_aux = cauchy(autoscale=TRUE),
priorEvent_assoc = normal(autoscale=TRUE), prior_covariance = lkj(autoscale=TRUE),
prior_PD = FALSE, algorithm = c("sampling", "meanfield", "fullrank"),
adapt_delta = NULL, max_treedepth = 10L, QR = FALSE,
sparse = FALSE, ...) {
8 changes: 4 additions & 4 deletions R/stan_jm.fit.R
@@ -27,10 +27,10 @@ stan_jm.fit <- function(formulaLong = NULL, dataLong = NULL, formulaEvent = NULL
assoc = "etavalue", lag_assoc = 0, grp_assoc,
epsilon = 1E-5, basehaz = c("bs", "weibull", "piecewise"),
basehaz_ops, qnodes = 15, init = "prefit", weights,
priorLong = normal(), priorLong_intercept = normal(),
priorLong_aux = cauchy(0, 5), priorEvent = normal(),
priorEvent_intercept = normal(), priorEvent_aux = cauchy(),
priorEvent_assoc = normal(), prior_covariance = lkj(), prior_PD = FALSE,
priorLong = normal(autoscale=TRUE), priorLong_intercept = normal(autoscale=TRUE),
priorLong_aux = cauchy(0, 5, autoscale=TRUE), priorEvent = normal(autoscale=TRUE),
priorEvent_intercept = normal(autoscale=TRUE), priorEvent_aux = cauchy(autoscale=TRUE),
priorEvent_assoc = normal(autoscale=TRUE), prior_covariance = lkj(autoscale=TRUE), prior_PD = FALSE,
algorithm = c("sampling", "meanfield", "fullrank"),
adapt_delta = NULL, max_treedepth = 10L,
QR = FALSE, sparse = FALSE, ...) {
6 changes: 3 additions & 3 deletions R/stan_mvmer.R
@@ -129,9 +129,9 @@
#' }
#'
stan_mvmer <- function(formula, data, family = gaussian, weights,
prior = normal(), prior_intercept = normal(),
prior_aux = cauchy(0, 5),
prior_covariance = lkj(), prior_PD = FALSE,
prior = normal(autoscale=TRUE), prior_intercept = normal(autoscale=TRUE),
prior_aux = cauchy(0, 5, autoscale=TRUE),
prior_covariance = lkj(autoscale=TRUE), prior_PD = FALSE,
algorithm = c("sampling", "meanfield", "fullrank"),
adapt_delta = NULL, max_treedepth = 10L,
init = "random", QR = FALSE, sparse = FALSE, ...) {
4 changes: 2 additions & 2 deletions R/stan_nlmer.R
@@ -95,8 +95,8 @@ stan_nlmer <-
offset,
contrasts = NULL,
...,
prior = normal(),
prior_aux = exponential(),
prior = normal(autoscale=TRUE),
prior_aux = exponential(autoscale=TRUE),
prior_covariance = decov(),
prior_PD = FALSE,
algorithm = c("sampling", "meanfield", "fullrank"),