tests/testthat/test_estimatePsite.R

gtf <- system.file("extdata",
                   "Danio_rerio.GRCz10.91.chr1.gtf.gz",
                   package="ribosomeProfilingQC")
txdb <- makeTxDbFromGFF(gtf,
                        organism = "Danio rerio",
                        chrominfo = seqinfo(Drerio)["chr1"],
                        taxonomyId = 7955)
CDS <- prepareCDS(txdb)
tmpbam <- tempdir()
bamfilenames <- character(0)
samples <- character(0)
yieldSize <- 10000000

possiblePsites <- 13 #c(12, 13, 14)
Drerio_chr1 <- getSeq(Drerio, as(seqinfo(Drerio)["chr1"], 'GRanges'))

bamfilename13 <- tempfile(tmpdir = tmpbam, fileext = ".bam")
test_that("simulateRPF works not correct for DNAStringSet", {
  sample <- sub(".bam", "", basename(bamfilename13))
  reads <- simulateRPF(txdb, tmpbam, samples=sample, genome=Drerio_chr1,
                       readsPerSample = 1e4, psite = 13,
                       frame0=.90, frame1=.05, frame2=.05,
                       includeReadsSeq = TRUE)
})
test_that("codonBias works not correct", {
    cb <- codonBias(bamfilename13, gtf=gtf, genome=Drerio_chr1, bestpsite = 13)
    reads.vs.ref <- cb$reads[, -seq.int(3)]/cb$reference[, -seq.int(3)]
    expect_equal(mean(reads.vs.ref), 1, tolerance = 0.01)
    expect_true(sd(reads.vs.ref)<0.05)
    p <- t.test(cb$reads[, 4], cb$reference[, 4])$p.value
    expect_true(p>0.99)
})

for(psite in possiblePsites){
  bamfilename <- tempfile(tmpdir = tmpbam, fileext = ".bam")
  sample <- sub(".bam", "", basename(bamfilename))
  reads <- simulateRPF(txdb, tmpbam, samples=sample, genome=Drerio,
                       readsPerSample = 1e4, psite = psite,
                       frame0=.90, frame1=.05, frame2=.05)
  bamfilenames[psite] <- bamfilename
  samples[psite] <- sample
}

bamfile <- lapply(bamfilenames[possiblePsites], BamFile, yieldSize = yieldSize)
names(bamfile) <- possiblePsites

test_that("estimatePsite works not correct", {
  for(psite in possiblePsites){
    bestpsite <- estimatePsite(bamfile[[as.character(psite)]], CDS, Drerio)
    expect_equal(bestpsite, psite)
    ## test for DNAStringSet
    bestpsite <- estimatePsite(bamfile[[as.character(psite)]], CDS, Drerio_chr1)
    expect_equal(bestpsite, psite)
    ## from 3'end
    bestpsite <- estimatePsite(bamfile[[as.character(psite)]], CDS, Drerio, anchor='3end')
    expect_equal(bestpsite, psite-29)
  }
})

test_that("readsEndPlot works not correct", {
  for(psite in possiblePsites){
    h <- readsEndPlot(bamfile[[as.character(psite)]], CDS, toStartCodon=TRUE)
    h <- h$heights
    dist <- as.numeric(names(h))
    gp <- c(dist[dist<0&dist>-10] %% 3, (dist[dist>0]-1) %% 3)
    gph <- rowsum(h[dist>-10], gp)
    m <- c(13, 12, 14)[which.max(gph)]
    expect_equal(m, psite)
  }
})

pcs <- mapply(getPsiteCoordinates, bamfile, possiblePsites)

test_that("summaryReadsLength works not correct", {
  for(psite in possiblePsites){
    readsLen <- summaryReadsLength(pcs[[as.character(psite)]])
    expect_equal(readsLen, c("28"=1))
  }
})

test_that("strandPlot works not correct", {
  for(psite in possiblePsites){
    sP <- strandPlot(pcs[[as.character(psite)]], CDS = CDS)$data
    sP <- sP[sP$x=="sense", "y"]
    expect_equal(sP, 100, tolerance=.1)
  }
})

pcs <- lapply(pcs, assignReadingFrame, CDS=CDS)

test_that("assignReadingFrame works not correct", {
  for(psite in possiblePsites){
    m <- table(pcs[[as.character(psite)]]$readingFrame)
    expect_gt(m["0"], m["1"])
    expect_gt(m["0"], m["2"])
    m0 <- plotFrameDensity(pcs[[as.character(psite)]])
    m <- round(m0$data$y)
    names(m) <- m0$data$x
    expect_equal(unname(m['0']), 90, tolerance=1)
    expect_equal(unname(m['1']), 5, tolerance=1)
    expect_equal(unname(m['2']), 5, tolerance=1)
  }
})

pcs <- lapply(pcs, readsDistribution, txdb=txdb, plot=FALSE)
test_that("readsDistribution works not correct", {
  for(psite in possiblePsites){
    cs <- mcols(pcs[[as.character(psite)]])[, c("Intron",
                                                "upstream",
                                                "downstream",
                                                "InterGenic")]
    cs <- as.data.frame(cs)
    cs <- colSums(cs)
    expect_true(all(cs==0))
  }
})


test_that("codonUsage works not correct", {
  for(psite in possiblePsites){
    startcodon <- codonUsage(pcs[[as.character(psite)]],
                             start = TRUE, genome = Drerio)
    expect_true(names(startcodon)[1] == "ATG")
    stopcodon <- codonUsage(pcs[[as.character(psite)]],
                            start = FALSE, genome = Drerio)
    expect_true(names(stopcodon)[1] %in% c("TAG", "TAA", "TGA"))
    ## test for DNAStringSet
    startcodon <- codonUsage(pcs[[as.character(psite)]],
                             start = TRUE, genome = Drerio_chr1)
    expect_true(names(startcodon)[1] == "ATG")
    stopcodon <- codonUsage(pcs[[as.character(psite)]],
                            start = FALSE, genome = Drerio_chr1)
    expect_true(names(stopcodon)[1] %in% c("TAG", "TAA", "TGA"))
  }
})
jianhong/ribosomeProfilingQC documentation built on Jan. 6, 2025, 10:01 a.m.