#' @include MultiAssayExperiment-class.R ExperimentList-class.R
#'
#' @import BiocGenerics S4Vectors methods
#' @importFrom BiocGenerics duplicated anyDuplicated
#' @importFrom utils .DollarNames
#' @importFrom stats reshape
#' @importFrom GenomicRanges GRanges
#' @importFrom IRanges IRanges findOverlaps subsetByOverlaps overlapsAny
#' @importFrom IRanges splitAsList SplitDataFrameList
#' @importFrom IRanges IntegerList CharacterList LogicalList
#' @importFrom S4Vectors endoapply mendoapply
#' @importFrom SummarizedExperiment findOverlaps assays
NULL
.checkOverlapsAny <- function(obj_cl) {
return(
any(hasMethod("overlapsAny", signature(obj_cl, "GRanges"),
getNamespace("GenomicRanges")),
hasMethod("overlapsAny", signature(obj_cl, "GRanges"),
getNamespace("SummarizedExperiment")),
hasMethod("overlapsAny", signature(obj_cl, "GRanges"),
getNamespace("IRanges")))
)
}
.rowIdx <- function(x) {
IntegerList(lapply(x, function(exper) seq_len(dim(exper)[[1L]])))
}
.getHits <- function(expList, i, ...) {
IntegerList(lapply(expList, function(element) {
if (is(i, "Vector")) {
if (is(element, "RangedSummarizedExperiment"))
element <- rowRanges(element)
if (is(element, "VcfStack"))
i <- which(rownames(element) %in% as.character(seqnames(i)))
if (.checkOverlapsAny(class(element)) &&
!is(element, "SummarizedExperiment"))
i <- which(overlapsAny(element, i, ...))
else
i <- match(intersect(as.character(i), rownames(element)),
rownames(element))
# i <- na.omit(match(rownames(element), as.character(i)))
} else if (is.character(i)) {
i <- match(intersect(i, rownames(element)), rownames(element))
# i <- na.omit(match(rownames(element), i))
} else {
i <- as.integer(i)
}
i
}))
}
.matchReorderSub <- function(assayMap, identifiers) {
positions <- unlist(
lapply(identifiers,
function(ident) {
which(!is.na(match(assayMap[["primary"]], ident)))
}))
assayMap[positions, ]
}
#' @name subsetBy
#' @title Subsetting a MultiAssayExperiment object
#' @description A set of functions for extracting and dividing a
#' \code{MultiAssayExperiment}
#'
#' @param x A \code{MultiAssayExperiment} or \code{ExperimentList}
#' @param i Either a \code{character}, \code{integer}, \code{logical} or
#' \code{GRanges} object for subsetting by rows
#' @param j Either a \code{character}, \code{logical}, or \code{numeric} vector
#' for subsetting by \code{colData} rows. See details for more information.
#' @param k Either a \code{character}, \code{logical}, or \code{numeric} vector
#' for subsetting by assays
#' @param ... Additional arguments passed on to lower level functions.
#' @param drop logical (default TRUE) whether to drop empty assay elements
#' in the \code{ExperimentList}
#'
#' @aliases [,MultiAssayExperiment,ANY-method subsetByColData subsetByRow
#' subsetByColumn subsetByAssay subset subsetBy
#'
#' @details
#' Subsetting a MultiAssayExperiment by the \strong{j} index can yield a call
#' to either \code{subsetByColData} or \code{subsetByColumn}. For vector inputs,
#' the subset will be applied to the \code{colData} rows. For \code{List}-type
#' inputs, the List will be applied to each of the elements in the
#' \code{ExperimentList}.
#' The order of the subsetting elements in the
#' \code{List} must match that of the \code{ExperimentList} in the
#' \code{MultiAssayExperiment}.
#'
#' \itemize{
#' \item subsetBycolData: Select biological units by vector input types
#' \item subsetByColumn: Select observations by assay or for each assay
#' \item subsetByRow: Select rows by assay or for each assay
#' \item subsetByAssay: Select experiments
#' }
#'
#' @examples
#' ## Load the example MultiAssayExperiment
#' example("MultiAssayExperiment")
#'
#' ## Using experiment names
#' subsetByAssay(myMultiAssayExperiment, "Affy")
#'
#' ## Using numeric indices
#' subsetByAssay(myMultiAssayExperiment, 1:2)
#'
#' ## Using a logical vector
#' subsetByAssay(myMultiAssayExperiment, c(TRUE, FALSE, TRUE))
#'
#' ## Subset by character vector (Jack)
#' subsetByColData(myMultiAssayExperiment, "Jack")
#'
#' ## Subset by numeric index of colData rows (Jack and Bob)
#' subsetByColData(myMultiAssayExperiment, c(1, 3))
#'
#' ## Subset by logical indicator of colData rows (Jack and Jill)
#' subsetByColData(myMultiAssayExperiment, c(TRUE, TRUE, FALSE, FALSE))
#'
#' subsetByColumn(myMultiAssayExperiment, list(Affy = 1:2,
#' Methyl450k = c(3,5,2), RNASeqGene = 2:4, GISTIC = 1))
#'
#' subsetWith <- S4Vectors::mendoapply(`[`, colnames(myMultiAssayExperiment),
#' MoreArgs = list(1:2))
#' subsetByColumn(myMultiAssayExperiment, subsetWith)
#'
#' ## Use a GRanges object to subset rows where ranged data present
#' egr <- GenomicRanges::GRanges(seqnames = "chr2",
#' IRanges::IRanges(start = 11, end = 13), strand = "-")
#' subsetByRow(myMultiAssayExperiment, egr)
#'
#' ## Use a logical vector (recycling used)
#' subsetByRow(myMultiAssayExperiment, c(TRUE, FALSE))
#'
#' ## Use a character vector
#' subsetByRow(myMultiAssayExperiment, "ENST00000355076")
#'
NULL
# subsetBy Generics -------------------------------------------------------
#' @rdname subsetBy
#' @export subsetByRow
setGeneric("subsetByRow", function(x, y, ...) standardGeneric("subsetByRow"))
#' @rdname subsetBy
#' @export subsetByColData
setGeneric("subsetByColData", function(x, y) standardGeneric("subsetByColData"))
#' @rdname subsetBy
#' @export subsetByColumn
setGeneric("subsetByColumn", function(x, y) standardGeneric("subsetByColumn"))
#' @rdname subsetBy
#' @export subsetByAssay
#' @param y Any argument used for subsetting, can be a \code{character},
#' \code{logical}, \code{integer}, \code{list} or \code{List} vector
setGeneric("subsetByAssay", function(x, y) standardGeneric("subsetByAssay"))
.subsetCOLS <- function(object, cutter) {
mendoapply(function(x, j) {
x[, j, drop = FALSE]
}, x = object, j = cutter)
}
.subsetROWS <- function(object, cutter) {
mendoapply(function(x, i) {
x[i, , drop = FALSE]
}, x = object, i = cutter)
}
# subsetByRow,ExperimentList-methods -----------------------------------------
#' @rdname subsetBy
setMethod("subsetByRow", c("ExperimentList", "ANY"), function(x, y, ...) {
rowIds <- .rowIdx(x)
if (is.integer(y)) {
lowerLimit <- min(max(rowIds))
if (max(y) > lowerLimit)
stop("subscript contains out-of-bounds indices,\n",
" use an ", sQuote("IntegerList"), " index for finer control")
}
subsetor <- .getHits(x, y, ...)
Y <- rowIds[subsetor]
subsetByRow(x, Y)
})
#' @rdname subsetBy
setMethod("subsetByRow", c("ExperimentList", "list"), function(x, y) {
if (!all(names(y) %in% names(x)))
stop("list-like subscript has names not in list-like object to subset")
inNames <- names(x) %in% names(y)
x[inNames] <- x[y]
x
})
#' @rdname subsetBy
setMethod("subsetByRow", c("ExperimentList", "List"), function(x, y) {
if (!all(names(y) %in% names(x)))
stop("list-like subscript has names not in list-like object to subset")
if (is(y, "DataFrame"))
stop("Provide a list of indices for subsetting")
inNames <- names(x) %in% names(y)
x[inNames] <- x[y]
x
})
#' @rdname subsetBy
setMethod("subsetByRow", c("ExperimentList", "logical"), function(x, y) {
logi <- LogicalList(rep(list(y), length(x)))
x[logi]
})
# subsetByColumn,ExperimentList-methods -----------------------------------
#' @rdname subsetBy
setMethod("subsetByColumn", c("ExperimentList", "list"), function(x, y) {
y <- y[names(x)]
ExperimentList(mapply(function(exps, j) {
exps[, j, drop = FALSE]
}, exps = x, j = y, SIMPLIFY = FALSE))
})
#' @rdname subsetBy
setMethod("subsetByColumn", c("ExperimentList", "List"), function(x, y) {
Y <- as.list(y)
subsetByColumn(x, Y)
})
#' @rdname subsetBy
setMethod("subsetByColumn", c("ExperimentList", "logical"), function(x, y) {
Y <- endoapply(colnames(x), `[`, y)
.subsetCOLS(x, Y)
})
# subsetByAssay,ExperimentList-methods ------------------------------------
#' @rdname subsetBy
setMethod("subsetByAssay", c("ExperimentList", "ANY"), function(x, y) {
x[y]
})
# subsetByColData,MultiAssayExperiment-methods -----------------------------------------
#' @rdname subsetBy
setMethod("subsetByColData", c("MultiAssayExperiment", "ANY"), function(x, y) {
if (is.logical(y) || is.numeric(y))
y <- unique(rownames(colData(x))[y])
selectors <- y[y %in% rownames(colData(x))]
newcolData <- colData(x)[
match(selectors, rownames(colData(x))), , drop = FALSE]
listMap <- mapToList(sampleMap(x), "assay")
listMap <- lapply(listMap, function(elementMap, keepers) {
.matchReorderSub(elementMap, keepers)
}, keepers = selectors)
newMap <- listToMap(listMap)
columns <- lapply(listMap, function(mapChunk) {
mapChunk[, "colname", drop = TRUE]
})
newSubset <- mapply(function(x, j) {x[, j, drop = FALSE]},
x = experiments(x), j = columns, SIMPLIFY = FALSE)
newSubset <- ExperimentList(newSubset)
experiments(x) <- newSubset
sampleMap(x) <- newMap
colData(x) <- newcolData
return(x)
})
#' @rdname subsetBy
setMethod("subsetByColData", c("MultiAssayExperiment", "character"),
function(x, y) {
y <- unique(y)
if (!any(rownames(colData(x)) %in% y))
stop("No matching identifiers found")
if (!all(y %in% rownames(colData(x))))
warning("Not all identifiers found in data")
callNextMethod(x = x, y = y)
})
# subsetByRow,MultiAssayExperiment-method ---------------------------------
#' @rdname subsetBy
setMethod("subsetByRow", c("MultiAssayExperiment", "ANY"), function(x, y, ...) {
experiments(x) <- subsetByRow(experiments(x), y)
return(x)
})
# subsetByColumn,MultiAssayExperiment-method ------------------------------
#' @rdname subsetBy
setMethod("subsetByColumn", c("MultiAssayExperiment", "ANY"), function(x, y) {
if (is.character(y) || is.logical(y) || is.numeric(y))
subsetByColData(x, y)
else {
experiments(x) <- subsetByColumn(experiments(x), y)
newSamps <- as.list(colnames(x))
listMap <- mapToList(sampleMap(x), "assay")
newMap <- mapply(function(lMap, nSamps) {
lMap[na.omit(match(nSamps, as.character(lMap[["colname"]]))), ]
}, lMap = listMap, nSamps = newSamps, SIMPLIFY = FALSE)
newMap <- listToMap(newMap)
selectors <- unique(as.character(newMap[["primary"]]))
colData(x) <- colData(x)[rownames(colData(x)) %in% selectors, , drop = FALSE]
sampleMap(x) <- newMap
return(x)
}
})
# subsetByAssay,MultiAssayExperiment-method -------------------------------
#' @rdname subsetBy
setMethod("subsetByAssay", c("MultiAssayExperiment", "ANY"), function(x, y) {
expers <- experiments(x)[y]
listMap <- mapToList(sampleMap(x), "assay")
## TODO: Add sensible error message here
newMap <- listMap[y]
newMap <- listToMap(newMap)
sampleMap(x) <- newMap
experiments(x) <- expers
x
})
Add the following code to your website.
For more information on customizing the embed code, read Embedding Snippets.