Apply.R 12.7 KB
Newer Older
Alasdair Hunter's avatar
Alasdair Hunter committed
#' Wrapper for Applying Atomic Functions to Arrays.
Alasdair Hunter's avatar
Alasdair Hunter committed
#'
Alasdair Hunter's avatar
Alasdair Hunter committed
#' The Apply function is an extension of the mapply function, which instead of taking lists of unidimensional objects as input, takes lists of multidimensional objects as input, which may have different numbers of dimensions and dimension lengths. The user can specify which dimensions of each array (or matrix) the function is to be applied over with the margins option. 
#' @param data A single object (vector, matrix or array) or a list of objects. They must be in the same order as expected by AtomicFun.
#' @param target_dims List of vectors containing the dimensions to be input into AtomicFun for each of the objects in the data. These vectors can contain either integers specifying the dimension position, or characters corresponding to the dimension names. If both margins and target_dims are specified, margins takes priority over target_dims.
Alasdair Hunter's avatar
Alasdair Hunter committed
#' @param AtomicFun Function to be applied to the arrays.
#' @param ... Additional arguments to be used in the AtomicFun.
#' @param margins List of vectors containing the margins for the input objects to be split by. Or, if there is a single vector of margins specified and a list of objects in data, then the single set of margins is applied over all objects. These vectors can contain either integers specifying the dimension position, or characters corresponding to the dimension names. If both margins and target_dims are specified, margins takes priority over target_dims.
Alasdair Hunter's avatar
Alasdair Hunter committed
#' @param parallel Logical, should the function be applied in parallel.
#' @param ncores The number of cores to use for parallel computation.
Alasdair Hunter's avatar
Alasdair Hunter committed
#' @details When using a single object as input, Apply is almost identical to the apply function. For multiple input objects, the output array will have dimensions equal to the dimensions specified in 'margins'.
Alasdair Hunter's avatar
Alasdair Hunter committed
#' @return Array or matrix or vector resulting from AtomicFun.
Alasdair Hunter's avatar
Alasdair Hunter committed
#' @references Wickham, H (2011), The Split-Apply-Combine Strategy for Data Analysis, Journal of Statistical Software.
#' @export
#' @examples
Alasdair Hunter's avatar
Alasdair Hunter committed
#' #Change in the rate of exceedance for two arrays, with different 
#' #dimensions, for some matrix of exceedances.
#' data = list(array(rnorm(2000), c(10,10,20)), array(rnorm(1000), c(10,10,10)), 
#'             array(rnorm(100), c(10, 10)))
#' test_fun <- function(x, y, z) {((sum(x > z) / (length(x))) / 
#'                                (sum(y > z) / (length(y)))) * 100}
#' margins = list(c(1, 2), c(1, 2), c(1,2))
#' test <- Apply(data, margins, AtomicFun = "test_fun")
Apply <- function(data, target_dims = NULL, AtomicFun, ..., margins = NULL, parallel = FALSE, ncores = NULL) {
  # Check data
Alasdair Hunter's avatar
Alasdair Hunter committed
  if (!is.list(data)) {
    data <- list(data)
  }
  if (any(!sapply(data, is.numeric))) {
    stop("Parameter 'data' must be one or a list of numeric objects.")
  }
Nicolau Manubens's avatar
Nicolau Manubens committed
  is_vector <- rep(FALSE, length(data))
  for (i in 1 : length(data)) {
    if (is.null(dim(data[[i]]))) {
      is_vector[i] <- TRUE
      dim(data[[i]]) <- length(data[[i]])
    }
  }
  # Check target_dims and margins
  if (is.null(margins) && is.null(target_dims)) {
    stop("One of 'margins' or 'target_dims' must be specified.")
  }
Alasdair Hunter's avatar
Alasdair Hunter committed
  if (!is.null(margins)) {
    target_dims <- NULL
Alasdair Hunter's avatar
Alasdair Hunter committed
  }
Nicolau Manubens's avatar
Nicolau Manubens committed
  margins_names <- vector('list', length(data))
  target_dims_names <- vector('list', length(data))
  if (!is.null(margins)) {
  # Check margins and build target_dims accordingly
    if (!is.list(margins)) {
      margins <- rep(list(margins), length(data))
    }
    if (any(!sapply(margins, 
Nicolau Manubens's avatar
Nicolau Manubens committed
                    function(x) is.character(x) || is.numeric(x) || is.null(x)))) {
      stop("Parameter 'margins' must be one or a list of numeric or ",
           "character vectors.")
    }
    duplicate_dim_specs <- sapply(margins, 
      function(x) {
        length(unique(x)) != length(x)
      })
    if (any(duplicate_dim_specs)) {
      stop("Parameter 'margins' must not contain duplicated dimension ",
           "specifications.")
    }
    target_dims <- vector('list', length(data))
    for (i in 1 : length(data)) {
Nicolau Manubens's avatar
Nicolau Manubens committed
      if (length(margins[[i]]) > 0) {
        if (is.character(unlist(margins[i]))) {
          if (is.null(names(dim(data[[i]])))) {
            stop("Parameter 'margins' contains dimension names, but ",
                 "some of the corresponding objects in 'data' do not have ",
                 "dimension names.")
          }
          margins_new <- margins[[i]]
          for (j in 1 : length(margins_new)) {
            matches <- which(names(dim(data[[i]])) == margins_new[j])
            if (length(matches) < 1) {
              stop("Could not find dimension '", margins_new[j], "' in ", i, 
                   "th object provided in 'data'.")
            }
            margins_new[j] <- matches[1]
          }
          margins_names[[i]] <- margins[[i]]
          margins[[i]] <- margins_new
        }
        if (!is.null(names(dim(data[[i]])))) {
          target_dims_names[[i]] <- names(dim(data[[i]]))[- margins[[i]]]
        }
        target_dims[[i]] <- c(1 : length(dim(data[[i]])))[- margins[[i]]]
      } else {
        target_dims[[i]] <- 1 : length(dim(data[[i]]))
        if (!is.null(names(dim(data[[i]])))) {
          target_dims_names[[i]] <- names(dim(data[[i]]))
    }
  } else {
  # Check target_dims and build margins accordingly
    if (!is.list(target_dims)) {
      target_dims <- rep(list(target_dims), length(data))
    }
    if (any(!sapply(target_dims, 
                    function(x) is.character(x) || is.numeric(x)))) {
      stop("Parameter 'target_dims' must be one or a list of numeric or ",
           "character vectors.")
    }
    if (any(sapply(target_dims, length) == 0)) {
      stop("Parameter 'target_dims' must not contain length-0 vectors.")
    duplicate_dim_specs <- sapply(target_dims, 
      function(x) {
        length(unique(x)) != length(x)
      })
    if (any(duplicate_dim_specs)) {
      stop("Parameter 'target_dims' must not contain duplicated dimension ",
           "specifications.")
    }
    margins <- vector('list', length(data))
      if (is.character(unlist(target_dims[i]))) {
Nicolau Manubens's avatar
Nicolau Manubens committed
        if (is.null(names(dim(data[[i]])))) {
          stop("Parameter 'target_dims' contains dimension names, but ",
               "some of the corresponding objects in 'data' do not have ",
               "dimension names.")
        }
        margins2_new <- target_dims[[i]]
        for (j in 1 : length(margins2_new)) {
          matches <- which(names(dim(data[[i]])) == margins2_new[j])
          if (length(matches) < 1) {
            stop("Could not find dimension '", margins2_new[j], "' in ", i, 
                 "th object provided in 'data'.")
          }
          margins2_new[j] <- matches[1]
Nicolau Manubens's avatar
Nicolau Manubens committed
        target_dims_names[[i]] <- target_dims[[i]]
        target_dims[[i]] <- margins2_new
Nicolau Manubens's avatar
Nicolau Manubens committed
      if (!is.null(names(dim(data[[i]])))) {
        margins_names[[i]] <- names(dim(data[[i]]))[- target_dims[[i]]]
      }
      margins[[i]] <- c(1 : length(dim(data[[i]]))[- target_dims[[i]]])
      
Alasdair Hunter's avatar
Alasdair Hunter committed
    }
  # Reorder dimensions of input data for target dims to be left-most
Nicolau Manubens's avatar
Nicolau Manubens committed
  # and in the required order.
  for (i in 1 : length(data)) {
    if (is.unsorted(target_dims[[i]]) || 
        (max(target_dims[[i]]) > length(target_dims[[i]]))) {
      marg_dims <- (1 : length(dim(data[[i]])))[- target_dims[[i]]]
Nicolau Manubens's avatar
Nicolau Manubens committed
      data[[i]] <- .aperm2(data[[i]], c(target_dims[[i]], marg_dims))
      target_dims[[i]] <- 1 : length(target_dims[[i]])
      margins[[i]] <- (length(target_dims[[i]]) + 1) : length(dim(data[[i]]))
Alasdair Hunter's avatar
Alasdair Hunter committed
    }
  }
  # Check AtomicFun
  if (is.character(AtomicFun)) {
    try({AtomicFun <- get(AtomicFun)}, silent = TRUE)
    if (!is.function(AtomicFun)) {
      stop("Could not find the function '", AtomicFun, "'.")
  if (!is.function(AtomicFun)) {
    stop("Parameter 'AtomicFun' must be a function or a character string ",
         "with the name of a function.")
  }
  # Check parallel
Alasdair Hunter's avatar
Alasdair Hunter committed
  if (!is.logical(parallel)) {
    stop("Parameter 'parallel' must be logical.")
Alasdair Hunter's avatar
Alasdair Hunter committed
  }
  # Check ncores
  if (parallel) {
    if (is.null(ncores)) {
      ncores <- availableCores() - 1
    }
    if (!is.numeric(ncores)) {
      stop("Parameter 'ncores' must be numeric.")
    }
    ncores <- round(ncores)
    ncores <- min(availableCores() - 1, ncores)
  }

Nicolau Manubens Gil's avatar
Nicolau Manubens Gil committed
  # Consistency checks of margins of all arrays
#  accumulated_found_margins <- list()
#  steps: 
#  for each data array, add its margins to the list if not present.
#                               if there are unnamed margins in the list, check their size matches the margins being added 
#                                                                         and simply assing them a name
#                       those margins present, check that they match
#                       if unnamed margins, check consistency with found margins
#                                           if more mrgins than found, add numbers to the list, without names
#  with this we end up with a named list of margin sizes
#  for data arrays with unnamed margins, we can assume their margins names are those of the first entries in the resulting list
#  then need to check which margins are common for all the data arrays. Those will be used by llply.
#  For the margins that are not common, we will need to iterate manually across them, and use data arrays repeatedly as needed
#  Extra: take into account in this process that there can be empty margin vectors
#
#  for (i in 1 : length(data)) {
#    if (!is.null(names(dim(data[[i]])))) {
#      matches <- which(names(dim(data[[i]])) %in% names(accumulated_found_sizes))
#      no_match_names <- names(dim(data[[i]]))
#      if (length(matches) > 0) {
#        match_names <- names(dim(data[[i]]))[matches]
#        if (any(unlist(accumulated_found_sizes[match_names]) != dim(data[[i]])[match_names])) {
#          stop("Found dimensions with the same name and different size in 'data'.")
#        }
#        no_match_names <- no_match_names[- matches]
#      }
#      accumulated_found_sizes <- c(accumulated_found_sizes, as.list(dim(data[[i]])[no_match_names]))
#    }
#        

Alasdair Hunter's avatar
Alasdair Hunter committed
  names <- names(dim(data[[1]]))[margins[[1]]]
Alasdair Hunter's avatar
Alasdair Hunter committed
  input <- list()

  splatted_f <- splat(AtomicFun)

Nicolau Manubens's avatar
Nicolau Manubens committed
  if (any(!sapply(margins, is.null))) {
    #Check margins match for input objects
Nicolau Manubens's avatar
Nicolau Manubens committed
    all_dims <- c(sapply(1 : length(data), 
                         function(x) sum(dim(data[[x]])[margins[[x]]])))
    print(all_dims)
Nicolau Manubens's avatar
Nicolau Manubens committed
    pos_dim <-  which.max(all_dims)[1]
    dim_template <- dim(data[[pos_dim]])[margins[[pos_dim]]]
    print(pos_dim)
    print(dim_template)
    for (i in 1 : length(data)) {
      if (identical(dim(data[[i]])[margins[[i]]], dim_template) == FALSE) {
        for (j in 1 : (length(dim(data[[i]])[margins[[i]]]))) {
          print("OK")
          print(c(dim(data[[i]])[margins[[i]]])[j] != dim_template[j])
          if (c(dim(data[[i]])[margins[[i]]])[j] != dim_template[j]) {
            print(class(data[[i]]))
            data[[i]] <- InsertDim(data[[i]], posdim = margins[[i]][j], lendim = dim_template[j])
            data[[i]] <- adrop(data[[i]], drop = (margins[[i]][j] + 1))
            print(class(data[[i]]))
           }
         }
       }
    }
    print(dim(data)[[2]])
    .isolate <- function(data, margin_length, drop = TRUE) {
      eval(dim(environment()$data))
      structure(list(env = environment(), index = margin_length, subs = as.name("[")), 
                class = c("indexed_array"))
    }
Alasdair Hunter's avatar
Alasdair Hunter committed
    for (i in 1 : length(data)) {
      margin_length <- lapply(dim(data[[i]]), function(x) 1 : x)
      margin_length[-margins[[i]]] <- ""
      margin_length <- expand.grid(margin_length, KEEP.OUT.ATTRS = FALSE, 
                                   stringsAsFactors = FALSE)
      input[[i]] <- .isolate(data[[i]], margin_length)
Alasdair Hunter's avatar
Alasdair Hunter committed
    }
Alasdair Hunter's avatar
Alasdair Hunter committed
    dims <- dim(data[[1]])[margins[[1]]]
    i_max <- length(input[[1]])[1] / dims[[1]]
Alasdair Hunter's avatar
Alasdair Hunter committed
    k <- length(input[[1]]) / i_max
    if (parallel == TRUE) {
Alasdair Hunter's avatar
Alasdair Hunter committed
      registerDoParallel(ncores)  
Alasdair Hunter's avatar
Alasdair Hunter committed
    }
    WrapperFun <- llply(1 : i_max, function(i)
Alasdair Hunter's avatar
Alasdair Hunter committed
      sapply((k * i - (k - 1)) : (k * i), function(x) splatted_f(lapply(input, `[[`, x),...), simplify = FALSE),
Alasdair Hunter's avatar
Alasdair Hunter committed
      .parallel = parallel)
Alasdair Hunter's avatar
Alasdair Hunter committed
    if (parallel == TRUE) {
      registerDoSEQ()
    }
Alasdair Hunter's avatar
Alasdair Hunter committed
    if (is.null(dim(WrapperFun[[1]][[1]]))) {
      WrapperFun <- array(as.numeric(unlist(WrapperFun)), dim=c(c(length((WrapperFun[[1]])[[1]])),
Alasdair Hunter's avatar
Alasdair Hunter committed
                                                                dim(data[[1]])[margins[[1]]]))
    } else {
      WrapperFun <- array(as.numeric(unlist(WrapperFun)), dim=c(c(dim(WrapperFun[[1]][[1]])),
                                                                dim(data[[1]])[margins[[1]]]))
    }
  } else {
Alasdair Hunter's avatar
Alasdair Hunter committed
    WrapperFun <- splatted_f(data, ...)
  }
  if (!is.null(dim(WrapperFun))) {
    names(dim(WrapperFun))[(length(dim(WrapperFun)) - length(names) + 1) : length(dim(WrapperFun))] <- c(names)
Alasdair Hunter's avatar
Alasdair Hunter committed
  }
Nicolau Manubens's avatar
Nicolau Manubens committed

Alasdair Hunter's avatar
Alasdair Hunter committed
  out <- WrapperFun
}