#' Shuffle motifs by column.
#'
#' Given a set of motifs, shuffle the columns to create new motifs. Currently does not
#' support keeping the 'multifreq' slot. Only the 'bkg', 'nsites', 'strand',
#' and 'bkgsites' slots will be preserved. Uses the same shuffling methods
#' as [shuffle_sequences()]. When shuffling more than one motif, all motif
#' columns are merged into a single pool and shuffled together, finally returning
#' them as motifs of identical lengths as the input motifs.
#' To instead shuffle motifs individually, call [shuffle_motifs()]
#' using `lapply()`.
#'
#' @param motifs See [convert_motifs()] for acceptable formats.
#' @param k `numeric(1)` K-let size.
#' @param method `character(1)` Currently only 'linear' is accepted.
#'
#' @return Motifs. See [convert_motifs()] for available output
#' formats.
#'
#' @author Benjamin Jean-Marie Tremblay, \email{benjamin.tremblay@@uwaterloo.ca}
#' @seealso [shuffle_sequences()]
#' @export
shuffle_motifs <- function(motifs, k = 2, method = "linear") {
# TODO: implement euler by instead shuffling the consensus sequences and
# keeping track of the indices.
# param check --------------------------------------------
args <- as.list(environment())
all_checks <- character(0)
if (!method %in% c("linear", "random")) {
method_check <- paste0(" * Incorrect 'shuffle.method': expected `linear`;",
" got `", method, "`")
method_check <- wmsg2(method_check, 4, 2)
all_checks <- c(all_checks, method_check)
}
char_check <- check_fun_params(list(method = args$method),
numeric(), logical(), TYPE_CHAR)
num_check <- check_fun_params(list(k = args$k), 1, FALSE, TYPE_NUM)
all_checks <- c(all_checks, char_check, num_check)
if (length(all_checks) > 0) stop(all_checks_collapse(all_checks))
#---------------------------------------------------------
if (is(motifs, "universalmotif")) undo.list <- TRUE else undo.list <- FALSE
if (is.list(motifs)) CLASS_IN <- vapply(motifs, .internal_convert, character(1))
else CLASS_IN <- .internal_convert(motifs)
motifs <- convert_motifs(motifs)
if (!is.list(motifs)) motifs <- list(motifs)
motifs <- convert_type_internal(motifs, "PPM")
mot.alphs <- vapply(motifs, function(x) x@alphabet, character(1))
if (length(unique(mot.alphs)) > 1)
stop("all motifs must share the same alphabet")
mot.lens <- vapply(motifs, function(x) ncol(x@motif), numeric(1))
mot.mats <- lapply(motifs, function(x) x@motif)
mot.cols <- do.call(cbind, mot.mats)
col.order <- seq_len(ncol(mot.cols))
if (k == 1) {
new.order <- sample(col.order, ncol(mot.cols))
} else {
switch(method,
"linear" = {
new.order <- shuffle_linear(col.order, k, mode = 2)
new.order <- as.numeric(new.order)
},
stop("only 'linear' is currently supported")
)
}
mot.cols <- mot.cols[, new.order]
mot.offsets <- cumsum(c(0, mot.lens[-length(mot.lens)]))
new.mats <- lapply(seq_along(mot.mats),
function(x) mot.cols[, (1 + mot.offsets[x]):(mot.lens[x] + mot.offsets[x])])
new.motifs <- mapply(shuffle_new_mot, new.mats, motifs,
SIMPLIFY = FALSE)
new.motifs <- .internal_convert(new.motifs, unique(CLASS_IN))
if (undo.list && is.list(new.motifs)) new.motifs <- new.motifs[[1]]
new.motifs
}
shuffle_new_mot <- function(new.mat, motif) {
mot <- universalmotif_cpp(motif = new.mat, alphabet = motif@alphabet,
bkg = motif@bkg, bkgsites = motif@bkgsites,
nsites = motif@nsites, strand = motif@strand,
name = collapse_cpp(c(motif@name, " [shuffled]")))
validObject_universalmotif(mot)
mot
}
Add the following code to your website.
For more information on customizing the embed code, read Embedding Snippets.