R/utils_depmap.R

Defines functions .make_gene_tag .make_dependency_tag get_depmap_essentiality build_depmap_db .error_if_no_mygene .error_if_no_pool .error_if_no_rsqlite .error_if_no_depmap

Documented in build_depmap_db get_depmap_essentiality

# nocov start
.error_if_no_depmap <- function() {
    if (!requireNamespace("depmap", quietly = TRUE)) {
        stop("'depmap' installation required for using depmap data.")
    }
}


.error_if_no_rsqlite <- function() {
    if (!requireNamespace("RSQLite", quietly = TRUE)) {
        stop("'RSQLite' installation required for building and using depmap database.")
    }
}


.error_if_no_pool <- function() {
    if (!requireNamespace("pool", quietly = TRUE)) {
        stop("'pool' installation required for building and using depmap database.")
    }
}


.error_if_no_mygene <- function() {
    if (!requireNamespace("mygene", quietly = TRUE)) {
        stop("'mygene' installation required to display gene information.")
    }
}
# nocov end

#' Build SQLite database of DepMap data
#'
#' @param retrieve Character vector of data to retrieve from DepMap. Options include:
#' \itemize{
#'   \item \code{rnai}: RNAi screen data from \code{\link[depmap]{depmap_rnai}}.
#'   \item \code{crispr}: CRISPR screen data from \code{\link[depmap]{depmap_crispr}}.
#'   \item \code{cn}: Copy number data from \code{\link[depmap]{depmap_copyNumber}}.
#'   \item \code{ccle_tpm}: TPM data from \code{\link[depmap]{depmap_TPM}}.
#'   \item \code{meta}: Cell line metadata from \code{\link[depmap]{depmap_metadata}}.
#'   \item \code{drug}: Drug sensitivity data from \code{\link[depmap]{depmap_drug_sensitivity}}.
#'   \item \code{gene.summary}: Gene summary data from \code{\link[depmap]{depmap_gene_summary}}.
#'   \item \code{release}: DepMap release information from from \code{\link[depmap]{depmap_release}}.
#' }
#' @param file Name of SQLite database file to create.
#'
#' @return Name of SQLite database containing DepMap data.
#'
#' @export
#' @author Jared Andrews
#'
#' @seealso \code{\link[depmap]{depmap_rnai}}, \code{\link[depmap]{depmap_crispr}},
#' \code{\link[depmap]{depmap_copyNumber}}, \code{\link[depmap]{depmap_TPM}},
#' \code{\link[depmap]{depmap_metadata}}, \code{\link[depmap]{depmap_gene_summary}},
#' \code{\link[depmap]{depmap_drug_sensitivity}}, \code{\link[depmap]{depmap_release}}
#' \code{\link[pool]{dbPool}}, \code{\link[DBI]{dbWriteTable}}
#'
#' @examples
#' library(CRISPRball)
#' build_depmap_db(retrieve = "release")
build_depmap_db <- function(retrieve = c(
                                "rnai", "crispr", "dependency", "cn",
                                "ccle_tpm", "meta", "drug", "gene.summary",
                                "release"
                            ),
                            file = "depmap_db.sqlite") {
    .error_if_no_depmap()
    .error_if_no_pool()
    .error_if_no_rsqlite()

    pool <- pool::dbPool(RSQLite::SQLite(), dbname = file)

    # Get depmap data and make table in database.
    if ("rnai" %in% retrieve) {
        rnai <- depmap::depmap_rnai()
        rnai$gene <- NULL
        rnai$cell_line <- NULL
        pool::dbWriteTable(pool, "rnai", rnai, overwrite = TRUE, append = FALSE)
        rm(rnai)
    }

    if ("crispr" %in% retrieve) {
        crispr <- depmap::depmap_crispr()
        crispr$gene <- NULL
        crispr$cell_line <- NULL
        pool::dbWriteTable(pool, "crispr", crispr, overwrite = TRUE, append = FALSE)
        rm(crispr)
    }

    if ("cn" %in% retrieve) {
        cn <- depmap::depmap_copyNumber()
        cn$gene <- NULL
        cn$cell_line <- NULL
        pool::dbWriteTable(pool, "cn", cn, overwrite = TRUE, append = FALSE)
        rm(cn)
    }

    if ("ccle_tpm" %in% retrieve) {
        ccle_tpm <- depmap::depmap_TPM()
        ccle_tpm$gene <- NULL
        ccle_tpm$cell_line <- NULL
        pool::dbWriteTable(pool, "ccle_tpm", ccle_tpm, overwrite = TRUE, append = FALSE)
        rm(ccle_tpm)
    }

    if ("meta" %in% retrieve) {
        meta <- depmap::depmap_metadata()
        pool::dbWriteTable(pool, "meta", as.data.frame(meta), overwrite = TRUE, append = FALSE)
        rm(meta)
    }

    if ("drug" %in% retrieve) {
        drug <- depmap::depmap_drug_sensitivity()
        drug$gene <- NULL
        drug$cell_line <- NULL
        drug$smiles <- NULL
        pool::dbWriteTable(pool, "drug", drug, overwrite = TRUE, append = FALSE)
        rm(drug)
    }

    if ("gene.summary" %in% retrieve) {
        gene.summary <- depmap::depmap_gene_summary()
        pool::dbWriteTable(pool, "gene.summary", as.data.frame(gene.summary), overwrite = TRUE, append = FALSE)
        rm(gene.summary)
    }

    if ("release" %in% retrieve) {
        release <- depmap::depmap_release()
        pool::dbWriteTable(pool, "release", as.data.frame(list("depmap_release" = depmap::depmap_release())), overwrite = TRUE, append = FALSE)
        rm(release)
    }

    pool::poolClose(pool)

    file
}


#' Get essential/selective gene information from DepMap summary table.
#'
#' @param gene Character scalar for gene symbol.
#' @param depmap.summary data.frame containing DepMap gene summary information.
#' @return Named list containing RNAi and CRISPR named lists containing dataset information for the provided gene,
#'   if available. If the gene is not found in the summary data.frame, the \code{avail} element for the RNAi and CRISPR lists
#'   will be set to \code{FALSE}.
#'
#' @export
#' @author Jared Andrews
#'
#' @examples
#' library(CRISPRball)
#' build_depmap_db(retrieve = "gene.summary")
#' pool <- pool::dbPool(RSQLite::SQLite(), dbname = "depmap_db.sqlite")
#' depmap.gene <- pool::dbGetQuery(pool, "SELECT * FROM 'gene.summary'")
#'
#' essentials <- get_depmap_essentiality(gene = "CDK2", depmap.summary = depmap.gene)
get_depmap_essentiality <- function(gene, depmap.summary) {
    crispr <- list(avail = FALSE)
    rnai <- list(avail = FALSE)

    if (gene %in% depmap.summary$gene_name) {
        df <- depmap.summary[depmap.summary$gene_name == gene, ]

        if ("RNAi_merged" %in% df$dataset) {
            rnai$avail <- TRUE
            rnai$dataset <- "RNAi_merged"
            rnai$dep_lines <- df$dependent_cell_lines[df$dataset == rnai$dataset]
            rnai$total_lines <- df$cell_lines_with_data[df$dataset == rnai$dataset]

            if (df$common_essential[df$gene_name == gene & df$dataset == rnai$dataset] == 1) {
                rnai$label <- "COMMON ESSENTIAL"
            } else if (df$strongly_selective[df$gene_name == gene & df$dataset == rnai$dataset] == 1) {
                rnai$label <- "STRONGLY SELECTIVE"
            }
        }

        # Check for various potential CRISPR datasets.
        if ("Chronos_Combined" %in% df$dataset) {
            crispr$dataset <- "Chronos_Combined"
        } else if ("Chronos_Achilles" %in% df$dataset) {
            crispr$dataset <- "Chronos_Achilles"
        } else if ("Chronos_Score" %in% df$dataset) {
            crispr$dataset <- "Chronos_Score"
        }

        if (!is.null(crispr$dataset)) {
            crispr$avail <- TRUE
            crispr$dep_lines <- df$dependent_cell_lines[df$dataset == crispr$dataset]
            crispr$total_lines <- df$cell_lines_with_data[df$dataset == crispr$dataset]

            if (df$common_essential[df$gene_name == gene & df$dataset == crispr$dataset] == 1) {
                crispr$label <- "COMMON ESSENTIAL"
            } else if (df$strongly_selective[df$gene_name == gene & df$dataset == crispr$dataset] == 1) {
                crispr$label <- "STRONGLY SELECTIVE"
            }
        }
    }

    outs <- list(crispr = crispr, rnai = rnai)
    return(outs)
}


#' Generate dependency summary info tagList
#' @param dep.info Named list containing summary CRISPR and RNAi info.
#' @param dep.release Character scalar for DepMap release as returned by \code{\link[depmap]{depmap_release}}.
#' @param crispr.color Character scalar for color to use for CRISPR title.
#' @param rnai.color Character scalar for color to use for RNAi title.
#'
#' @return TagList containing dependency summary information.
#'
#' @importFrom shiny span strong tagList div icon
#' @importFrom shinyBS popify
#' @author Jared Andrews
#' @rdname INTERNAL_make_dependency_tag
.make_dependency_tag <- function(dep.info, dep.release, crispr.color, rnai.color) {
    cinfo <- "N/A"
    if (dep.info$crispr$avail) {
        cinfo <- paste0(dep.info$crispr$dep_lines, "/", dep.info$crispr$total_lines)
    }

    rinfo <- "N/A"
    if (dep.info$rnai$avail) {
        rinfo <- paste0(dep.info$rnai$dep_lines, "/", dep.info$rnai$total_lines)
    }

    c.lab <- NULL
    r.lab <- NULL

    cess.mess <- c(
        "A gene which, in a large, pan-cancer screen, ranks in the top X most ",
        "depleting genes in at least 90% of cell lines. X is chosen empirically ",
        "using the minimum of the distribution of gene ranks in their 90th percentile ",
        "least depleting lines."
    )

    ssel.mess <- c(
        "A gene whose dependency is at least 100 times more likely to have been sampled",
        "from a skewed distribution than a normal distribution."
    )

    if (!is.null(dep.info$crispr$label)) {
        outpop <- if (dep.info$crispr$label == "COMMON ESSENTIAL") cess.mess else ssel.mess
        c.lab <- span(strong(dep.info$crispr$label),
            popify(icon("info-circle", style = "font-size: 12px"), dep.info$crispr$label,
                outpop,
                placement = "right", trigger = c("hover", "click"), options = list(container = "body")
            ), br(),
            style = paste0("background: ", crispr.color, "; color: #ffffff; border-radius: 5px; padding: 3px;")
        )
    }

    if (!is.null(dep.info$rnai$label)) {
        outpop <- if (dep.info$rnai$label == "COMMON ESSENTIAL") cess.mess else ssel.mess
        r.lab <- span(strong(dep.info$rnai$label),
            popify(icon("info-circle", style = "font-size: 12px"), dep.info$rnai$label,
                outpop,
                placement = "right", trigger = c("hover", "click"), options = list(container = "body")
            ), br(),
            style = paste0("background: ", rnai.color, "; color: #ffffff; border-radius: 5px; padding: 3px;")
        )
    }

    out <- tagList(
        div(span(strong(paste0("CRISPR (DepMap ", dep.release, ", ", dep.info$crispr$dataset, "): ", cinfo)),
            style = paste0("color: ", crispr.color, ";")
        ), style = "margin-bottom: 7px;"),
        c.lab,
        div(span(strong(paste0("RNAi (DepMap ", dep.release, ", ", dep.info$rnai$dataset, "): ", rinfo)),
            style = paste0("color: ", rnai.color, ";")
        ), style = "margin-bottom: 7px; margin-top: 8px"),
        r.lab
    )

    return(out)
}


#' Generate gene tagList via mygene API
#'
#' Given a query gene symbol, this function will query the mygene API and parse the results
#' into a tagList of relevant information for display in the UI.
#'
#' @details
#' Occasionally, the top hit returned by mygene will not be the gene symbol of interest.
#' Typically, this occurs when the gene symbol is out of date or has an associated antisense gene.
#'
#' @param gene Character scalar for gene symbol to use as query.
#'
#' @return TagList containing dependency summary information.
#'
#' @author Jared Andrews
#' @seealso \code{\link[mygene]{query}}
#' @rdname INTERNAL_make_gene_tag
.make_gene_tag <- function(gene) {
    .error_if_no_mygene()
    info <- mygene::query(gene, fields = "all", size = 1)

    if (length(info$hits) > 0) {
        info <- info$hits
        out <- tagList(
            splitLayout(span(strong("Gene: "), info$symbol), span(strong("Aliases: "), paste0(unlist(info$alias), collapse = ", "))),
            splitLayout(
                span(strong("Position: "), paste0(info$genomic_pos$chr, ":", info$genomic_pos$start, "-", info$genomic_pos$end)),
                span(strong("Gene type: "), info$type_of_gene)
            ),
            splitLayout(
                span(strong("Entrez: "), a(info$entrezgene, href = paste0("https://www.ncbi.nlm.nih.gov/gene/", info$entrezgene))),
                span(strong("Ensembl: "), a(info$ensembl$gene, href = paste0("http://www.ensembl.org/id/", info$ensembl$gene)))
            ),
            div(br(), span(strong("Summary: "), info$summary))
        )
    } else {
        out <- tagList(div(span("Unable to find gene information.")))
    }

    return(out)
}
j-andrews7/CRISPRball documentation built on Dec. 23, 2024, 9:45 a.m.