R/apply.R

# Functions ------------------------------------------------------------------

.na.if.different <- function(x) {
  if (length(unique(x)) > 1) NA else x[1]
}

# ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
.apply_workhorse <- function(data, MARGIN, FUN, ...) {
  if (length(data$spc) == 0) {
    stop("empty spectra matrix.")
  }

  spc <- apply(data[, "spc", drop = FALSE], MARGIN, FUN, ...)

  if (MARGIN == 1) {
    if (is.null(spc)) {
      spc <- matrix(ncol = 0, nrow = nrow(data))
    } else if (is.vector(spc)) {
      dim(spc) <- c(length(spc), 1)
    } else if (is.matrix(spc)) {
      spc <- t(spc)
    }

    data$spc <- I(spc)
  } else if (MARGIN == 2) {
    if (is.null(spc)) {
      return(data[0, ])
    }
    if (is.null(dim(spc))) {
      dim(spc) <- c(1, ncol(data$spc))
    }

    if (all(dim(spc) == dim(data$spc))) {
      data$spc <- spc
    } else {
      nrow <- nrow(spc)

      cols <- colnames(data)
      cols <- which(cols != "spc")
      if (length(cols) > 0) {
        data[1, cols] <- lapply(data[, cols, drop = FALSE], .na.if.different)
      }

      data <- data[rep(1, nrow), , drop = FALSE]

      data$spc <- I(spc)
      rownames(data) <- rownames(spc)
    }
  }

  data$spc <- unclass(data$spc)
  data
}

# ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
.apply <- function(X, MARGIN, FUN, ..., label.wl = NULL,
                   label.spc = NULL, new.wavelength = NULL, simplify) {
  validObject(X)

  if (missing(MARGIN)) { # apply for functions that the complete spectra matrix
    ## is easier: tmp <- apply (x, , FUN, ...)
    ## does:
    ## tmp <- x
    ## tmp[[]] <- FUN (x[[]], ...)

    X@data$spc <- do.call(FUN, list(X@data$spc, ...))
  } else if (all(MARGIN == 1:2)) { # apply for functions that take scalar arguments.

    tmp <- apply(X@data$spc, MARGIN = MARGIN, FUN, ...)
    tmp <- as.numeric(tmp) # otherwise surprises will be waiting

    dim(tmp) <- dim(X@data$spc)

    X@data$spc <- tmp
  } else {
    ## the usual: for each row / for each column

    X@data <- .apply_workhorse(X@data, MARGIN = MARGIN, FUN = FUN, ...)

    if (all(MARGIN == 1)) {
      ## if the number of data points per spectrum is changed, the wavelength
      ## vector needs to be adapted, too

      if (ncol(X@data$spc) != length(X@wavelength)) {
        ## only internal functions here: the validation will fail until the wavelength axis is
        ## adjusted

        if (!is.null(new.wavelength)) { # vector with new wavelength is given
          if (is.numeric(new.wavelength)) { # either directly,
            .wl(X) <- new.wavelength
          } else {
            dots <- list(...)
            .wl(X) <- dots[[new.wavelength]] # or as name of the argument that becomes the new
            # wavelength vector
          }
        } else if (ncol(X@data$spc) != length(X@wavelength)) {
          wl <- as.numeric(colnames(X@data$spc)) # if not given, try to make from colnames of the
          # spectra matrix

          if (length(wl) != ncol(X@data$spc) || any(is.na(wl))) {
            wl <- seq_len(ncol(X@data$spc))
          } # or just number sequentially

          .wl(X) <- wl
        }
      }
    }
  }

  if (!is.null(label.wl)) {
    X@label$.wavelength <- label.wl
  }

  if (!is.null(label.spc)) {
    X@label$spc <- label.spc
  }

  validObject(X)

  X
}

#' Compute summary statistics for the spectra of a `hyperSpec` object
#'
#' [apply()] gives the functionality of [base::apply()] for `hyperSpec` objects.
#'
#' The generic functions of group [methods::Math()] are not defined
#' for `hyperSpec` objects. Instead, `apply` can be used. For
#' functions like `log()` that work on scalars, `MARGIN = 1:2` gives
#' the appropriate behavior.
#'
#' `spcapply` does the same as `apply` with `MARGIN = 1`, but
#' additionally allows to set a new wavelength axis and adjust the labels.
#'
#' `wlapply` does the same as `apply` with `MARGIN = 2`, but
#' additionally allows to set a new wavelength axis and adjust the labels.
#'
#' @name apply
#' @rdname apply
#' @aliases apply
#'          apply,hyperSpec-method
#' @docType methods
#'
#' @param X,spc a `hyperSpec` object
#' @param MARGIN The subscript which the function will be applied over.
#'
#' - `1` indicates rows (`FUN` is applied to each spectrum),
#' - `2` indicates columns (`FUN` is applied to each wavelength),
#' - `1:2` indicates that `FUN` should be applied to each single
#'   element of the spectra matrix. Note that many basic mathematical
#'   functions are already defined for hyperSpec objects (see
#'   [Math()]).
#'
#' If `MARGIN` is missing, the whole spectra matrix is handed to
#'   `FUN`, see also the examples.
#' @param FUN function to compute the summary statistics
#' @param ... further arguments passed to `FUN`
#' @param simplify ignored: apply for hyperSpec results are always simplified
#' @param label.wl,label.spc new labels for wavelength and spectral intensity
#'   axes
#' @param new.wavelength for `MARGIN = 2`: numeric vector or name of the
#'   argument in \dots{} that is to be used (character) as wavelength axis of
#'   the resulting object.
#'
#' @return A `hyperSpec` object
#'
#'
#' @seealso [base::apply()], for applying `FUN` to subgroups of
#'   the `hyperSpec` object: [hyperSpec::aggregate()].
#'
#'
#' @author C. Beleites
#'
#'
#' @keywords methods iteration
#' @concept manipulation
#' @concept stats
#'
#' @export
#'
#' @examples
#'
#'
#' plot_spc(apply(faux_cell, 2, range))
#'
#' avg_flu <- apply(flu, 1, mean,
#'   label.spc = expression(bar(I)),
#'   new.wavelength = mean(wl(flu))
#' )
#' avg_flu
#'
#' flu[[, , 405:407]]
#' apply(flu, 1:2, "*", -1)[[, , 405:407]]
#'
#' ## without MARGIN the whole matrix is handed to FUN
#' apply(flu[, , 405:407], , print)[[]]
#'
#' ## whereas MARGIN = 1 : 2 leads to FUN being called
#' ## for each element separately
#' apply(flu[, , 405:407], 1:2, print)[[]]
setMethod("apply", signature = signature(X = "hyperSpec"), .apply)


# Unit tests -----------------------------------------------------------------

hySpc.testthat::test(.apply) <- function() {
  context("apply")

  test_that("check whether .na.if.different is working correctly", {
    flu$equal <- 1
    tmp <- apply(flu, 2, mean)$..
    expect_equal(
      is.na(tmp),
      structure(c(TRUE, TRUE, FALSE),
        .Dim = c(1L, 3L),
        .Dimnames = list(NULL, c("filename", "c", "equal"))
      )
    )
    expect_equal(tmp$equal, 1)
  })

  test_that("POSIXct", {
    flu$ct <- as.POSIXct(Sys.time())
    expect_equal(apply(flu, 2, mean)$ct, flu$ct[1])
  })

  test_that("POSIXlt", {
    flu$lt <- as.POSIXlt(Sys.time())
    expect_equal(apply(flu, 2, mean)$lt, flu$lt[1])
  })
}