tidymodels · alexpghayes · Apr 8, 2019 · Apr 4, 2019 · Apr 5, 2019 · Apr 5, 2019
diff --git a/DESCRIPTION b/DESCRIPTION
@@ -199,7 +199,17 @@ Authors@R:
              family = "Krauska",
              role = "ctb",
              email = "krauskae@gmail.com",
-             comment = c(ORCID = "0000-0002-1466-5850")))
+             comment = c(ORCID = "0000-0002-1466-5850")),
+      person(given = "Malcolm",
+             family = "Barrett",
+             role = "ctb",
+             email = "malcolmbarrett@gmail.com", 
+             comment = c(ORCID = "0000-0003-0299-5825")),
+      person(given = "Charles",
+             family = "Gray",
+             role = "ctb",
+             email = "charlestigray@gmail.com",
+             comment = c(ORCID = "0000-0002-9978-011X")))
 Description: Summarizes key information about statistical
     objects in tidy tibbles. This makes it easy to report results, create
     plots and consistently work with large numbers of models at once.
@@ -304,7 +314,8 @@ Suggests:
     testthat,
     tseries,
     xergm,
-    zoo
+    zoo,
+    metafor
 VignetteBuilder: 
     knitr
 Remotes: 
@@ -378,6 +389,7 @@ Collate:
     'quantreg-nlrq-tidiers.R'
     'quantreg-rq-tidiers.R'
     'quantreg-rqs-tidiers.R'
+    'rma-tidiers.R'
     'robust-glmrob-tidiers.R'
     'robust-lmrob-tidiers.R'
     'sp-tidiers.R'

diff --git a/NAMESPACE b/NAMESPACE
@@ -26,6 +26,7 @@ S3method(augment,poLCA)
 S3method(augment,polr)
 S3method(augment,prcomp)
 S3method(augment,rlm)
+S3method(augment,rma)
 S3method(augment,rq)
 S3method(augment,rqs)
 S3method(augment,smooth.spline)
@@ -81,6 +82,7 @@ S3method(glance,polr)
 S3method(glance,pyears)
 S3method(glance,ridgelm)
 S3method(glance,rlm)
+S3method(glance,rma)
 S3method(glance,rq)
 S3method(glance,rqs)
 S3method(glance,smooth.spline)
@@ -178,6 +180,7 @@ S3method(tidy,ref.grid)
 S3method(tidy,regsubsets)
 S3method(tidy,ridgelm)
 S3method(tidy,rlm)
+S3method(tidy,rma)
 S3method(tidy,roc)
 S3method(tidy,rq)
 S3method(tidy,rqs)

diff --git a/NEWS.md b/NEWS.md
@@ -67,9 +67,9 @@ TODO: sort out what happens to `glance.aov()`
 - `tidy.lsmobj()` gained a `conf.int` argument
 
 ## New tidiers, features and bugfixes
-
+
+- Added tidiers for `rma` objects from the `metafor` package (#674, @malcolmbarrett, @softloud)
 - `ordinal` tidier rewrite
-
 - Added tidiers for `pam` objects from the `cluster` package. (#637)
 - Previously, F-statistics for weak instruments were returned through `glance.ivreg()`. F-statistics are now returned through `tidy.ivreg(instruments = TRUE)`. Default is `tidy.ivreg(instruments = FALSE)`. `glance.ivreg()` still returns Wu-Hausman and Sargan test statistics.
 - Added `tidy.regsubsets()` for best subsets linear regression from the `leaps` package

diff --git a/R/rma-tidiers.R b/R/rma-tidiers.R
@@ -0,0 +1,222 @@
+#' Tidying methods for meta-analysis objects
+#'
+#' These methods tidy the results of meta-analysis objects from the metafor package.
+#'
+#' @param x An `rma` created by the `metafor` package.
+#' @inheritParams tidy.lm
+#' @param include_studies Logical. Should individual studies be included in the
+#'    output?
+#' @param ... Additional arguments
+#' @param measure Measure type. See [metafor::rma()]
+#'
+#' @return A `tibble`
+#' @export
+#'
+#' @examples
+#' 
+#' library(metafor)
+#' 
+#' df <-
+#'   escalc(
+#'     measure = "RR",
+#'     ai = tpos,
+#'     bi = tneg,
+#'     ci = cpos,
+#'     di = cneg,
+#'     data = dat.bcg
+#'   )
+#' 
+#' meta_analysis <- rma(yi, vi, data = df, method = "EB")
+#'
+#' tidy(meta_analysis)
+#'
+#' @rdname metafor_tidiers
+#' 
+tidy.rma <- function(x, conf.int = FALSE, conf.level = 0.95, exponentiate = FALSE,
+                     include_studies = TRUE, measure = "GEN", ...) {
+
+  # Per-study rows: rebuild an escalc object from the stored effect sizes
+  # (`yi.f`) and sampling variances (`vi.f`); its summary() provides the
+  # `sei`, `zi`, `ci.lb` and `ci.ub` columns used below.
+  estimates <- metafor::escalc(yi = x$yi.f, vi = x$vi.f, measure = measure) %>%
+    summary(level = conf.level * 100) %>% 
+    as.data.frame(stringsAsFactors = FALSE)
+
+  # The bare NA fills the `p.value` column: no per-study p-value is reported.
+  estimates <- cbind(x$slab, "study", estimates[, c("yi", "sei", "zi")], NA,
+                     estimates[, c("ci.lb", "ci.ub")], stringsAsFactors = FALSE)
+  names(estimates) <- c("study", "type", "estimate", "std.error", "statistic",
+                        "p.value", "conf.low", "conf.high")
+  estimates <- tibble::as_tibble(estimates)
+
+  # Summary rows: one per model coefficient when `beta` has several rows,
+  # otherwise a single row labelled "overall".
+  betas <- x$beta
+  if (!is.null(nrow(betas)) && nrow(betas) > 1) {
+    # get estimate type and fix spelling
+    study <- rownames(betas)
+    swap <- grepl("intrcpt", study)
+    study[swap] <- "intercept"
+    betas <- as.double(betas)
+  } else {
+    study <- "overall"
+    betas <- betas[1]
+  }
+
+  results <- tibble::tibble(study = study, type = "summary",
+                            estimate = betas, std.error = x$se,
+                            statistic = x$zval, p.value = x$pval,
+                            conf.low = x$ci.lb, conf.high = x$ci.ub)
+  .data <- if (include_studies) rbind(estimates, results) else results
+
+  # Only the estimate and its interval are exponentiated; std.error and
+  # statistic are left as computed.
+  if (exponentiate) {
+    .data$estimate <- exp(.data$estimate)
+    .data$conf.low <- exp(.data$conf.low)
+    .data$conf.high <- exp(.data$conf.high)
+  }
+
+  if (!conf.int) {
+    # Drop the interval columns with a logical mask. Negating which() would
+    # select *no* columns at all if it ever matched nothing.
+    .data <- .data[!names(.data) %in% c("conf.low", "conf.high")]
+  }
+
+  # Strip any attributes carried over from `x$slab` so `study` is a plain
+  # vector.
+  attributes(.data$study) <- NULL
+
+  tibble::remove_rownames(.data)
+}
+
+#' Construct a one-row summary of meta-analysis model fit statistics.
+#'
+#' `glance()` computes a one-row summary of meta-analysis objects,
+#'  including estimates of heterogeneity and model fit.
+#'
+#' @param x An `rma` created by the `metafor` package.
+#' @param ... Additional arguments
+#'
+#' @return a `tibble`
+#' @export
+#'
+#' @examples
+#'
+#' library(metafor)
+#' 
+#' df <-
+#'   escalc(
+#'     measure = "RR",
+#'     ai = tpos,
+#'     bi = tneg,
+#'     ci = cpos,
+#'     di = cneg,
+#'     data = dat.bcg
+#'   )
+#' 
+#' meta_analysis <- rma(yi, vi, data = df, method = "EB")
+#'
+#' glance(meta_analysis)
+#'
+glance.rma <- function(x, ...) {
+  # Transpose the fitstats() result into a data frame and drop the first ":"
+  # from each column name.
+  fit_stats <- metafor::fitstats(x)
+  fit_stats <- fit_stats %>%
+    t() %>%
+    as.data.frame()
+  names(fit_stats) <-
+    stringr::str_replace(names(fit_stats), "\\:", "")
+
+  # Different models populate different components of `x`, so collect the
+  # candidates in a list and keep only the ones that are present and scalar.
+  model_stats <- list(
+    nobs = x$k,
+    measure = x$measure,
+    method = x$method,
+    i.squared = x$I2,
+    h.squared = x$H2,
+    tau.squared = x$tau2,
+    tau.squared.se = x$se.tau2,
+    qe = x$QE,
+    p.value.qe = x$QEp,
+    qm = x$QM,
+    p.value.qm = x$QMp
+  ) %>%
+    # get rid of null values
+    purrr::discard(is.null) %>%
+    # don't include multivariate model stats
+    purrr::discard(~length(.x) >= 2) %>%
+    as.data.frame()
+
+  # Bind the fit statistics only after the length filter. The length of a
+  # data frame is its number of columns, so passing `fit_stats` through the
+  # filter above would discard it whenever it has two or more columns.
+  cbind(model_stats, fit_stats) %>%
+    # change to tibble with correct column and row names
+    tibble::as_tibble() %>%
+    tibble::remove_rownames()
+}
+
+#' Augment data with values from a meta-analysis model
+#'
+#' Augment the original data with model residuals, fitted values, and influence
+#' statistics.
+#'
+#' @param x An `rma` created by the `metafor` package.
+#' @param ... additional arguments
+#'
+#' @return a `tibble`
+#' @export
+#'
+#' @examples
+#'
+#' library(metafor)
+#' 
+#' df <-
+#'   escalc(
+#'     measure = "RR",
+#'     ai = tpos,
+#'     bi = tneg,
+#'     ci = cpos,
+#'     di = cneg,
+#'     data = dat.bcg
+#'   )
+#' 
+#' meta_analysis <- rma(yi, vi, data = df, method = "EB")
+#'
+#' augment(meta_analysis)
+#'
+#' @rdname augmenters
+augment.rma <- function(x, ...) {
+  # possibly() makes each helper return NULL instead of raising an error.
+  blup0 <- purrr::possibly(metafor::blup, NULL)
+  residuals0 <- purrr::possibly(stats::residuals, NULL)
+  influence0 <- purrr::possibly(stats::influence, NULL)
+
+  y <- x$yi
+  pred <- blup0(x)
+  # Fall back to predict() when blup() fails for this model.
+  if (is.null(pred)) pred <- predict(x)
+  pred <- as.data.frame(pred)
+
+  # fix names
+  names(pred)[1:4] <- c(".fitted", ".se.fit", ".conf.low", ".conf.high")
+  credible_intervals <- names(pred) %in% c("cr.lb", "cr.ub")
+  names(pred)[credible_intervals] <- c(".cred.low", ".cred.high")
+  moderator <- names(pred) == "X"
+  names(pred)[moderator] <- ".moderator"
+
+  res <- residuals0(x)
+  inf <- influence0(x)
+  if (!is.null(inf)) {
+    inf <- cbind(as.data.frame(inf$inf), dfbetas = inf$dfbs$intrcpt)
+    # Map output names to source column names. Only columns that are actually
+    # present are kept, so a missing `intrcpt` DFBETAS column is skipped
+    # instead of raising an error.
+    influence_cols <- c(
+      .hat = "hat",
+      .cooksd = "cook.d",
+      .std.resid = "rstudent",
+      .dffits = "dffits",
+      .cov.ratio = "cov.r",
+      .tau.squared.del = "tau2.del",
+      .qe.del = "QE.del",
+      .weight = "weight",
+      .dfbetas = "dfbetas"
+    )
+    influence_cols <- influence_cols[influence_cols %in% names(inf)]
+    inf <- inf[unname(influence_cols)]
+    names(inf) <- names(influence_cols)
+  }
+
+  ret <- cbind(
+    .rownames = x$slab,
+    y,
+    pred,
+    .resid = res
+  )
+
+  # Attach the influence statistics, which were previously computed but never
+  # added to the result. Bind only when the row counts agree so a mismatch
+  # cannot turn a working call into an error.
+  if (!is.null(inf) && nrow(inf) == nrow(ret)) {
+    ret <- cbind(ret, inf)
+  }
+
+  ret <- tibble::as_tibble(ret) %>%
+    tibble::remove_rownames()
+
+  # Drop the label column when it is just the row index. isTRUE() guards
+  # against an NA comparison result, which would make `if` fail.
+  if (isTRUE(all(ret$.rownames == seq_along(ret$.rownames)))) {
+    ret$.rownames <- NULL
+  }
+
+  ret
+}
diff --git a/R/utilities.R b/R/utilities.R
@@ -458,8 +458,12 @@ globalVariables(
     "comparison",
     "conf.high",
     "conf.low", 
+    "cook.d",
+    "cov.r",
     "cutoffs",
     "data",
+    "dffits",
+    "dfbetas",
     "df.residual",
     "distance",
     "effect",
@@ -470,6 +474,7 @@ globalVariables(
     "GCV",
     "group1",
     "group2",
+    "hat",
     "index",
     "Intercept",
     "item1", 
@@ -490,11 +495,14 @@ globalVariables(
     "p.value", 
     "PC",
     "percent",
+    "P-perm (1-tailed)",
     "pvalue",
+    "QE.del",
     "rd_roclet",
     "rhs", 
     "rmsea.ci.upper",
     "rowname", 
+    "rstudent",
     "se", 
     "series",
     "Slope",
@@ -504,13 +512,15 @@ globalVariables(
     "step",
     "stratum",
     "surv",
+    "tau2.del",
     "term",
     "type",
     "value",
     "Var1",
     "Var2", 
     "variable",
     "wald.test",
+    "weight",
     "y",
     "z"
   )

diff --git a/man/augmenters.Rd b/man/augmenters.Rd
diff --git a/man/broom.Rd b/man/broom.Rd