test_that("test simplify marix needs a data frame", {
expect_error(summarize_by_patient(gene_binary = c(1:10)))
})
test_that("test no error in summarize_by_patient", {
samples <- as.character(unique(gnomeR::mutations$sampleId))[1:50]
gen_dat <- create_gene_binary(samples = samples,
mutation = gnomeR::mutations,
fusion = gnomeR::sv) %>%
mutate(patient_id = extract_patient_id(sample_id))
expect_no_error(gen_dat2 <- summarize_by_patient(gen_dat))
})
test_that("test output matches summarize_by_gene if only 1 sample per patient", {
# restrict to 1 sample/patient
samples <- gnomeR::mutations %>%
mutate(patient_id = gnomeR::extract_patient_id(sampleId)) %>%
distinct(patient_id, .keep_all = TRUE) %>%
pull(sampleId)
gen_dat <- create_gene_binary(samples = samples,
mutation = gnomeR::mutations,
fusion = gnomeR::sv) %>%
mutate(patient_id = extract_patient_id(sample_id))
expect_equal(summarize_by_gene(gen_dat, other_vars = patient_id) %>% select(-sample_id, -patient_id),
summarize_by_patient(gen_dat) %>% select(-patient_id))
})
test_that("test error when no patient_id", {
# restrict to 1 sample/patient
samples <- gnomeR::mutations %>%
pull(sampleId)
gen_dat <- create_gene_binary(samples = samples,
mutation = gnomeR::mutations,
fusion = gnomeR::sv)
expect_error(summarize_by_patient(gen_dat), "Can't find")
})
test_that("test that results are the same with and without sample_id", {
# restrict to 1 sample/patient
samples <- gnomeR::mutations %>%
pull(sampleId)
gen_dat <- create_gene_binary(samples = samples[1:20],
mutation = gnomeR::mutations,
fusion = gnomeR::sv) %>%
mutate(patient_id = extract_patient_id(sample_id))
a <- summarize_by_patient(gen_dat)
b <- summarize_by_patient(select(gen_dat, -sample_id))
expect_equal(a, b)
})
test_that("test that output is only 1 row/patient", {
# restrict to 1 sample/patient
# bind gnomeR::mutations to ensure there are duplicates
samples <- bind_rows(gnomeR::mutations,
gnomeR::mutations) %>%
mutate(patient_id = gnomeR::extract_patient_id(sampleId)) %>%
pull(sampleId)
gen_dat <- create_gene_binary(samples = samples,
mutation = gnomeR::mutations,
fusion = gnomeR::sv) %>%
mutate(patient_id = gnomeR::extract_patient_id(sample_id))
n_rec_pt <- summarize_by_patient(gen_dat) %>%
count(patient_id, name = "n_rec_pt") %>%
distinct(n_rec_pt) %>%
pull(n_rec_pt)
expect_equal(n_rec_pt, 1)
})
test_that("test that genes are properly summarized", {
samples <- Reduce(intersect, list(gnomeR::mutations$sampleId, gnomeR::cna$sampleId,
gnomeR::sv$sampleId))
expect_message(bin_impact <- create_gene_binary(samples=samples,
mutation = gnomeR::mutations,
cna = gnomeR::cna,
fusion = gnomeR::sv,
specify_panel = "impact") %>%
mutate(patient_id = gnomeR::extract_patient_id(sample_id)) %>%
dplyr::select(c(sample_id, patient_id, starts_with("ARI"), starts_with("MAPK1"), starts_with("ERG"))))
sum_impact <- summarize_by_patient(bin_impact) %>%
dplyr::mutate(across(!patient_id, as.numeric)) %>%
arrange(patient_id)
bin_impact_test <- bin_impact %>%
mutate(patient_id = gnomeR::extract_patient_id(sample_id)) %>%
select(-sample_id) %>%
tidyr::pivot_longer(cols = c(everything(), -patient_id)) %>%
mutate(name = str_remove(name, ".Amp|.Del|.fus"))%>%
tidyr::pivot_wider(names_from = name, values_from = value, values_fn = function (x) sum(x)) %>%
mutate(across(.cols = c(-patient_id),
~ifelse(. > 0, 1, 0))) %>%
mutate_if(~ all(is.na(.)), ~as.numeric(NA_integer_)) %>%
relocate(colnames(sum_impact)) %>%
arrange(patient_id)
expect_equal(sum_impact, bin_impact_test)
})
test_that("test alteration hierarchy", {
# alteration if alteration on any sample
# no alteration if no alteration on all samples (no NAs)
# else NA
# dummy binary matrix with comparisons of interest
bin_impact_dummy <- tribble(~sample_id, ~ALK, ~EGFR, ~KRAS, ~TP53, ~KMT2D, ~SMARCA4,
paste0(gnomeR::mutations$patientId[1], "-T01", "-IM5"), 1, 0, 1, 1, 0, NA_integer_,
paste0(gnomeR::mutations$patientId[1], "-T01", "-IM5"), 1, 0, 0, NA_integer_, NA_integer_, NA_integer_) %>%
mutate(patient_id = gnomeR::mutations$patientId[1])
sum_impact <- summarize_by_patient(bin_impact_dummy) %>%
dplyr::mutate(across(!patient_id, as.numeric)) %>%
arrange(patient_id)
bin_impact_expected <- tribble(~patient_id, ~ALK, ~EGFR, ~KRAS, ~TP53, ~KMT2D, ~SMARCA4,
gnomeR::mutations$patientId[1], 1, 0, 1, 1, NA_integer_, NA_integer_) %>%
mutate(across(-patient_id, as.numeric))
expect_equal(sum_impact, bin_impact_expected)
})
test_that("test what happens to columns with all NA", {
samples <- Reduce(intersect, list(gnomeR::mutations$sampleId, gnomeR::cna$sampleId,
gnomeR::sv$sampleId))
bin_impact <- create_gene_binary(samples=samples,
mutation = gnomeR::mutations,
cna = gnomeR::cna,
fusion = gnomeR::sv,
specify_panel = "impact") %>%
mutate(patient_id = gnomeR::extract_patient_id(sample_id)) %>%
select(c(sample_id, patient_id, starts_with("AR"), starts_with("PLCG2"), starts_with("PPM1D")))
sum_impact <- summarize_by_patient(bin_impact)%>%
mutate(across(!patient_id, as.numeric)) %>%
arrange(patient_id)
bin_impact_test <- bin_impact %>%
mutate(patient_id = gnomeR::extract_patient_id(sample_id)) %>%
select(-sample_id) %>%
tidyr::pivot_longer(cols = c(everything(), -patient_id)) %>%
mutate(name = str_remove(name, ".Amp|.Del|.fus"))%>%
tidyr::pivot_wider(names_from = name, values_from = value, values_fn = function (x) sum(x)) %>%
mutate(across(.cols = c(-patient_id),
~ifelse(. > 0, 1, 0))) %>%
mutate_if(~ all(is.na(.)), ~as.numeric(NA_integer_)) %>%
relocate(colnames(sum_impact)) %>%
arrange(patient_id)
expect_equal(sum_impact, bin_impact_test)
expect_equal(ncol(as.data.frame(
sum_impact[,sapply(sum_impact, function(x) all(is.na(x)))])), 1)
})
test_that("other vars are retained", {
samples <- gnomeR::mutations %>%
head(50) %>%
pull(sampleId) %>%
unique()
bin_impact <- create_gene_binary(samples = samples,
mutation = gnomeR::mutations,
cna = gnomeR::cna,
fusion = gnomeR::sv,
specify_panel = "impact") %>%
mutate(patient_id = gnomeR::extract_patient_id(sample_id)) %>%
select(c(sample_id, patient_id, starts_with("AR"), starts_with("PLCG2"), starts_with("PPM1D")))
set.seed(20230828)
bin_impact$random_color = sample(c("blue", "red", "yellow"),
size = length(samples), replace = TRUE)
expect_true("random_color" %in% names(bin_impact))
sum_impact <- summarize_by_patient(bin_impact,
other_vars = "random_color")
expect_true("random_color" %in% names(sum_impact))
expect_true("blue" %in% sum_impact$random_color)
# one patient retains two observations
expect_length(sum_impact$patient_id, 40)
sum_impact_no_other_var <- summarize_by_patient(select(bin_impact, -random_color))
# expect that keeping additional var creates a data frame with more rows
expect_gt(nrow(sum_impact), nrow(sum_impact_no_other_var))
})
test_that("other vars resulting in non-unique samples will throw warning", {
samples <- gnomeR::mutations %>%
head(50) %>%
pull(sampleId) %>%
unique()
bin_impact <- create_gene_binary(samples = samples,
mutation = gnomeR::mutations,
cna = gnomeR::cna,
fusion = gnomeR::sv,
specify_panel = "impact") %>%
mutate(patient_id = gnomeR::extract_patient_id(sample_id)) %>%
select(c(sample_id, patient_id, starts_with("AR"), starts_with("PLCG2"), starts_with("PPM1D")))
set.seed(20230828)
bin_impact$random_color = sample(c("blue", "red", "yellow"),
size = length(samples), replace = TRUE)
expect_true("random_color" %in% names(bin_impact))
expect_message(summarize_by_patient(bin_impact,
other_vars = "random_color"))
})
test_that("no warning message thrown when only 1 alt type", {
samples <- gnomeR::mutations$sampleId
bin.mut <- create_gene_binary(
samples = samples, mutation = gnomeR::mutations,
mut_type = "omit_germline", snp_only = FALSE,
include_silent = FALSE
) %>%
mutate(patient_id = gnomeR::extract_patient_id(sample_id))
expect_no_warning(summarize_by_patient(bin.mut))
})
Add the following code to your website.
For more information on customizing the embed code, read Embedding Snippets.