tests/testthat/test-3subset.R

context("Subsetting SequenceData")
test_that("Subsetting SequenceData:",{
  skip_on_bioc()
  data(msi,package = "RNAmodR")
  data(psd,package = "RNAmodR")
  # arguments
  expect_error(RNAmodR:::.norm_subset_args(),'argument "x" is missing')
  expect_error(RNAmodR:::.norm_subset_args(list()),'argument "x" is missing')
  actual <- RNAmodR:::.norm_subset_args(list(),msi)
  expect_error(RNAmodR:::.norm_subset_args(list(name = 1),msi),
               "'name' must be a character with a width > 0L")
  expect_error(RNAmodR:::.norm_subset_args(list(type = 1),msi),
               "'type' must be a character with a width > 0L")
  expect_error(RNAmodR:::.norm_subset_args(list(type = "meep"),msi),
               "'type' must be one or more elements of 'shortName")
  expect_error(RNAmodR:::.norm_subset_args(list(flanking = 1),msi),
        "'flanking' must be a single integer value equal or higher than 0L")
  expect_error(RNAmodR:::.norm_subset_args(list(rawData = 1),msi),
               "'rawData' must be a single logical value")
  expect_error(RNAmodR:::.norm_subset_args(list(perTranscript = 1),msi),
               "'perTranscript' must be a single logical value")
  expect_error(RNAmodR:::.norm_subset_args(list(sequenceData = 1),msi),
               "'sequenceData' must be a single logical value")
  expect_type(actual,"list")
  expect_named(actual,c("name","type","merge","flanking","perTranscript",
                        "sequenceData","rawData"))
  actual <- RNAmodR:::.norm_subset_args(list(),psd)
  expect_type(actual,"list")
  expect_named(actual,c("name","type","merge","flanking","perTranscript",
                        "sequenceData","rawData"))
  expect_equal(RNAmodR:::.norm_subset_args(list(name = "abc"),msi)$name,"abc")
  expect_equal(RNAmodR:::.norm_subset_args(list(type = "I"),msi)$type,"I")
  expect_equal(RNAmodR:::.norm_subset_args(list(flanking = 1L),msi)$flanking,1L)
  expect_equal(RNAmodR:::.norm_subset_args(list(rawData = TRUE),msi)$rawData,
               TRUE)
  expect_equal(RNAmodR:::.norm_subset_args(list(rawData = FALSE),msi)$rawData,
               FALSE)
  expect_equal(RNAmodR:::.norm_subset_args(list(perTranscript = TRUE),msi)$perTranscript,
               TRUE)
  expect_equal(RNAmodR:::.norm_subset_args(list(perTranscript = FALSE),msi)$perTranscript,
               FALSE)
  expect_equal(RNAmodR:::.norm_subset_args(list(sequenceData = TRUE),msi)$sequenceData,
               TRUE)
  expect_equal(RNAmodR:::.norm_subset_args(list(sequenceData = FALSE),msi)$sequenceData,
               FALSE)
  # coords
  coord <- modifications(msi)[[1]]
  expect_error(RNAmodR:::.norm_coord(coord),'argument "type" is missing')
  expect_error(actual <- RNAmodR:::.norm_coord(DataFrame(),NA))
  coord2 <- coord
  width(coord2) <- 2
  expect_error(RNAmodR:::.norm_coord(coord2,NA),
               "Elements with a width != 1L are not supported")
  coord2 <- coord
  coord2$Parent <- c("a","b","c","d","e","f")
  actual <- RNAmodR:::.norm_coord(coord,NA)
  expect_s4_class(actual, "GRangesList")
  expect_equal(length(coord),length(actual))
  actual2 <- RNAmodR:::.norm_coord(coord,"I")
  expect_equal(actual,actual2)
  expect_equal(actual,RNAmodR:::.norm_coord(actual,NA))
  expect_error(RNAmodR:::.norm_coord(coord,"Ix"),
               "No modifications of type 'Ix'")
  coord3 <- coord
  coord3$Parent <- NULL
  expect_error(RNAmodR:::.norm_coord(coord3,NA),"Parent column must be present")
  #
  coord <- actual
  # subsetting
  actual <- subsetByCoord(sequenceData(msi[[1]]),coord)
  expect_s4_class(actual,"CompressedSplitDataFrameList")
  expect_equal(actual,
               subsetByCoord(sequenceData(msi[[1]]),unlist(coord)))
  expect_equal(colnames(actual@unlistData),
               colnames(aggregate(sequenceData(msi[[1]]))@unlistData))
  expect_error(subsetByCoord(sequenceData(msi[[1]]),coord2),
               "No intersection between names in data of 'x' and Parent")
  # flanking
  actual <- subsetByCoord(sequenceData(msi[[1]]),coord,flanking = 3L)
  expect_equal(nrow(actual[[1]]),7L)
  # perTranscript
  expect_equal(subsetByCoord(sequenceData(msi[[1]]),coord),
               subsetByCoord(sequenceData(msi[[1]]),coord,perTranscript = TRUE))
  expect_equal(subsetByCoord(msi[[1]],coord),
               subsetByCoord(msi[[1]],coord,perTranscript = TRUE))
  expect_equal(subsetByCoord(msi,coord),
               subsetByCoord(msi,coord,perTranscript = TRUE))
  # labelling
  actual <- labelByCoord(sequenceData(msi[[1]]), coord)
  expect_s4_class(actual,"CompressedSplitDataFrameList")
  expect_equal(colnames(actual@unlistData),
               c(colnames(aggregate(sequenceData(msi[[1]]))@unlistData),
                 "labels"))
  expect_type(actual@unlistData$labels,"logical")
  # SequenceDataSet specific
  coord <- GenomicRanges::GRanges(seqnames = "chr1",
                            ranges = IRanges::IRanges(start = 50L, width=1L),
                            strand = "+",
                            DataFrame(mod = "I",
                                      Parent = "1"))
  coord <- split(coord,factor(coord$Parent, levels = unique(coord$Parent)))
  data(e5sd,package = "RNAmodR")
  sds <- SequenceDataSet(e5sd,psd)
  actual <- subsetByCoord(sds,coord)
  expect_s4_class(actual,"CompressedSplitDataFrameList")
  expect_equal(actual,subsetByCoord(sds,unlist(coord)))
  actual <- labelByCoord(sds,coord)
  expect_s4_class(actual,"CompressedSplitDataFrameList")
  expect_type(actual@unlistData$labels,"logical")
  # SequenceDataList specific
  data(e5sd,package = "RNAmodR")
  sdl <- SequenceDataList(sds,e5sd,psd)
  actual <- subsetByCoord(sdl,coord)
  expect_s4_class(actual,"CompressedSplitDataFrameList")
  expect_equal(actual,subsetByCoord(sdl,unlist(coord)))
  actual <- labelByCoord(sdl,coord)
  expect_s4_class(actual,"CompressedSplitDataFrameList")
  expect_type(actual@unlistData$labels,"logical")
  # raw data
  expect_error(subsetByCoord(sequenceData(msi[[1]]),coord, rawData = 1),
               "'rawData' must be a single logical value")
  expect_error(subsetByCoord(sequenceData(msi[[1]]),coord, rawData = c(TRUE,TRUE)),
               "'rawData' must be a single logical value")
  actual <- subsetByCoord(sequenceData(msi[[1]]),coord, rawData = TRUE)
  expect_s4_class(actual,"CompressedSplitDataFrameList")
  expect_equal(unique(ncols(actual)),15)
  actual <- subsetByCoord(sds,coord, rawData = TRUE)
  expect_s4_class(actual,"CompressedSplitDataFrameList")
  expect_equal(unique(ncols(actual)),18)
  expect_equivalent(cbind(subsetByCoord(sds[[1]],coord, rawData = TRUE),
                     subsetByCoord(sds[[2]],coord, rawData = TRUE)),
                    subsetByCoord(sds,coord, rawData = TRUE))
  actual <- labelByCoord(sds[[1]],coord)
  expect_s4_class(actual,"CompressedSplitDataFrameList")
  expect_type(actual@unlistData$labels,"logical")
  expect_true(all(c("means.treated","sds.treated") %in% 
                    colnames(actual@unlistData)))
  actual <- labelByCoord(sds[[1]],coord,
                                                         rawData = TRUE)
  expect_s4_class(actual,"CompressedSplitDataFrameList")
  expect_type(actual@unlistData$labels,"logical")
  expect_true(all(c("end5.treated.1","end5.treated.2","end5.treated.3") %in% 
                    colnames(actual@unlistData)))
  actual <- labelByCoord(sds, coord)
  expect_s4_class(actual,"CompressedSplitDataFrameList")
  expect_type(actual@unlistData$labels,"logical")
  expect_true(all(c("End5SequenceData.means.treated",
                    "End5SequenceData.sds.treated") %in% 
                    colnames(actual@unlistData)))
  actual <- labelByCoord(sds, coord, rawData = TRUE)
  expect_s4_class(actual,"CompressedSplitDataFrameList")
  expect_type(actual@unlistData$labels,"logical")
  expect_true(all(c("End5SequenceData.end5.treated.1",
                    "End5SequenceData.end5.treated.2",
                    "End5SequenceData.end5.treated.3") %in% 
                    colnames(actual@unlistData)))
  actual <- labelByCoord(sdl, coord)
  expect_s4_class(actual,"CompressedSplitDataFrameList")
  expect_type(actual@unlistData$labels,"logical")
  expect_true(all(c("End5SequenceData_PileupSequenceData.End5SequenceData.means.treated",
                    "End5SequenceData.means.treated",
                    "End5SequenceData.sds.treated") %in% 
                    colnames(actual@unlistData)))
  actual <- labelByCoord(sdl, coord, rawData = TRUE)
  expect_s4_class(actual,"CompressedSplitDataFrameList")
  expect_type(actual@unlistData$labels,"logical")
  expect_true(all(c("End5SequenceData_PileupSequenceData.End5SequenceData.end5.treated.1",
                    "End5SequenceData_PileupSequenceData.End5SequenceData.end5.treated.2",
                    "End5SequenceData_PileupSequenceData.End5SequenceData.end5.treated.3",
                    "End5SequenceData.end5.treated.1",
                    "End5SequenceData.end5.treated.2",
                    "End5SequenceData.end5.treated.3") %in% 
                    colnames(actual@unlistData)))
  # other errors
  coord <- unlist(coord)
  end(coord) <- end(coord) + 100
  start(coord) <- start(coord) + 100
  expect_error(subsetByCoord(psd,coord),
               "'coord' for the following modifications")
  expect_error(subsetByCoord(psd,c(coord,coord)),
               "'coord' for the following modifications")
})

context("Subsetting Modifier/ModifierSet")
test_that("Subsetting Modifier/ModifierSet:",{
  data(msi,package = "RNAmodR")
  # element names
  coord <- RNAmodR:::.norm_coord(modifications(msi)[[1]],NA)
  expect_error(RNAmodR:::.get_element_names(getAggregateData(msi[[1]]),coord),
               'argument "type" is missing')
  expect_error(RNAmodR:::.get_element_names(getAggregateData(msi[[1]]),coord,NA),
               'argument "type" is missing')
  actual <- RNAmodR:::.get_element_names(getAggregateData(msi[[1]]),coord,NA,NA)
  expect_type(actual,"character")
  actual <- RNAmodR:::.get_element_names(getAggregateData(msi[[1]]),coord,"2",NA)
  expect_equal(actual,"2")
  # subsetting
  actual <- subsetByCoord(msi[[1]],coord)
  expect_s4_class(actual,"CompressedSplitDataFrameList")
  expect_equal(colnames(actual@unlistData),mainScore(msi[[1]]))
  expect_equal(actual,subsetByCoord(msi[[1]],unlist(coord)))
  expect_equal(subsetByCoord(sequenceData(msi[[1]]),coord),
               subsetByCoord(msi[[1]],coord,sequenceData = TRUE))
  actual2 <- subsetByCoord(msi,coord)
  expect_named(actual2,names(msi))
  expect_equal(actual2[[1]],actual)
  expect_equal(actual2,subsetByCoord(msi,unlist(coord)))
  actual3 <- subsetByCoord(msi,coord,sequenceData = TRUE)
  expect_type(actual3,"list")
  actual4 <- lapply(msi,subsetByCoord,coord,sequenceData = TRUE)
  expect_equal(actual3,actual4)
  # labelling
  actual <- labelByCoord(msi[[1]],coord)
  expect_s4_class(actual,"CompressedSplitDataFrameList")
  expect_equal(colnames(actual@unlistData),c(mainScore(msi[[1]]),"labels"))
  expect_type(actual@unlistData$labels,"logical")
  
})

context("Combining SequenceData")
test_that("Combining SequenceData:",{
  data(psd,package = "RNAmodR")
  expect_error(c(psd[1],psd[1]),
               "Input must have unique names.")
  expect_error(cbind(psd[1],psd[2]),
               "Inputs must have the same lengths.")
  expect_error(cbind(psd[1],psd),
               "Inputs must have the same lengths.")
  expect_error(rbind(psd[1],psd[,1:2]),
               "Inputs must have the same width.")
  expect_s4_class(c(psd[1],psd[2]),
                  "PileupSequenceData")
  expect_true(all(all(c(psd[1],psd[2]) == psd)))
  expect_s4_class(cbind(psd[1],psd[1]),
                  "PileupSequenceData")
  expect_s4_class(rbind(psd[1],psd),
                  "PileupSequenceData")
  expect_equal(relist(unlist(psd),psd),psd)
  expect_equal(relist(unlist(psd,use.names = FALSE),psd),psd)
})
FelixErnst/RNAmodR documentation built on March 27, 2024, 2:42 a.m.