test_that("Filter SNPs based on FRQ", {
## Call uses reference genome as default with more than 2GB of memory,
## which is more than what 32-bit Windows can handle so remove tests
is_32bit_windows <-
.Platform$OS.type == "windows" && .Platform$r_arch == "i386"
if (!is_32bit_windows) {
file <- tempfile()
# write the Educational Attainment GWAS to a temp file for testing
eduAttainOkbay <- readLines(system.file("extdata", "eduAttainOkbay.txt",
package = "MungeSumstats"
))
writeLines(eduAttainOkbay, con = file)
# read it in and make N
sumstats_dt <- data.table::fread(file, nThread = 1)
# Add N column and make it not an integer
set.seed(101)
sumstats_dt[, FRQ := runif(nrow(sumstats_dt)) * 2]
# get SNPs with INFO<0.9
rmv_snps <- sumstats_dt[FRQ < 0.9, ]$MarkerName
data.table::fwrite(x = sumstats_dt, file = file, sep = "\t")
# Run MungeSumstats code
reformatted <- MungeSumstats::format_sumstats(file,
ref_genome = "GRCh37",
FRQ_filter = 0.9,
on_ref_genome = FALSE,
strand_ambig_filter = FALSE,
bi_allelic_filter = FALSE,
allele_flip_check = FALSE,
log_folder_ind = TRUE,
imputation_ind = TRUE,
dbSNP=144
)
res_dt <- data.table::fread(reformatted$sumstats, nThread = 1)
testthat::expect_equal(all(!rmv_snps %in% res_dt$SNP), TRUE)
# Now check with renaming FRQ column to major
reformatted2 <- MungeSumstats::format_sumstats(file,
ref_genome = "GRCh37",
FRQ_filter = 0.9,
on_ref_genome = FALSE,
strand_ambig_filter = FALSE,
bi_allelic_filter = FALSE,
allele_flip_check = FALSE,
frq_is_maf = FALSE,
log_folder_ind = TRUE,
imputation_ind = TRUE,
dbSNP=144
)
# should be the same as above if column renamed
res_dt2 <- data.table::fread(reformatted2$sumstats, nThread = 1)
setnames(res_dt2, "MAJOR_ALLELE_FRQ", "FRQ")
testthat::expect_equal(all.equal(res_dt, res_dt2), TRUE)
}
else{
expect_equal(is_32bit_windows, TRUE)
expect_equal(is_32bit_windows, TRUE)
}
})
Add the following code to your website.
For more information on customizing the embed code, read Embedding Snippets.