####################
## Visualize data ##
####################
#' Visualize data in one function
#'
#' This function is an universal visualization function that allow calling other
#' hpaVis functions via a single function call. By default, this function will
#' use the dataset bundled with HPAanalyze, and provide a grid of all available
#' plots. The types of plots in the output can be specified via the
#' \code{visType} argument. If only one plot type is specified, this function
#' will return the exact same output as the specific hpaVis function used to
#' create the plot.
#'
#' @param data Input the list object generated by \code{hpa_download()} or
#' \code{hpa_subset()}. By default this function use the example dataset
#' bundled with HPAanalyze.
#' @param targetGene Vector of strings of HGNC gene symbols. By default it is
#' set to \code{c('TP53', 'EGFR', 'CD44', 'PTEN', 'IDH1')}. You can also mix
#' HGNC gene symbols and ensemnl ids (start with ENSG) and they will be
#' converted to HGNC gene symbols.
#' @param targetTissue Vector of strings of normal tissue names. By default it
#' is set to \code{"breast"}.
#' @param targetCellType Vector of strings of normal cell types. By default
#' inludes all available cell types in the target tissues.
#' @param targetCancer Vector of strings of normal tissues. By default it
#' is set to \code{"breast cancer"}.
#' @param visType Vector of strings indicating which plots will be generated.
#' Currently available values are \code{"all"}, \code{"Tissue"},
#' \code{"Patho"}, \code{"Cancer"}, \code{"Subcell"}.
#' @param color Vector of 4 colors used to depict different expression levels.
#' @param customTheme Logical argument. If \code{TRUE}, the function will return
#' a barebone ggplot2 plot to be customized further.
#' @param ... Additional arguments to be passed downstream to other hpaVis
#' functions being called behind the scene. These arguments includes
#' \code{targetTissue}, \code{targetCellType}, \code{targetCancer}. See
#' documentation for individual hpaVis functions for more information.
#'
#' @return If multiple visType is chosen, this function will return multiple
#' graphs in one panel. If only one visType is chosen, this function will
#' return a ggplot2 plot object, which can be further modified if desirable.
#' See help file for each of the hpaVis function for more information about
#' individual graphs.
#'
#' @seealso \code{\link{hpaDownload}}, \code{\link{hpaSubset}}
#' @family visualization functions
#'
#' @examples
#' hpaVis()
#'
#' @export
hpaVis <- function(data=NULL,
targetGene=NULL,
targetTissue=NULL,
targetCellType=NULL,
targetCancer=NULL,
visType=c('Tissue', 'Patho', 'Subcell'),
color=c("#FCFDBF", "#FE9F6D", "#DE4968", "#8C2981"),
customTheme=FALSE,
...) {
# Initiate empty variables
infoDisp <- FALSE
plot <- list()
# Check if data is provided or not
if (is.null(data)) {
message(paste0('No data provided. Use version ',
hpa_histology_data$metadata$HPAversion,
"."))
data = HPAanalyze::hpa_histology_data
}
# Check if targetGene is provided
if (is.null(targetGene)) {
message('targetGene variable not specified, default to TP53, RB1, MYC, KRAS and EGFR.')
targetGene <- c('TP53', 'EGFR', 'CD44', 'PTEN', 'IDH1')
infoDisp <- TRUE
}
# Generate a list of visType if choose 'all'
if (identical(visType,'all')) {
visType <- c('Tissue', 'Patho', 'Subcell')
}
# Make tissue plot
if ('Tissue' %in% visType) {
if (is.null(targetTissue)) {
message('targetTissue variable not specified, default to breast.')
targetTissue <- 'breast'
infoDisp <- TRUE
}
if (is.null(targetCellType)) {
message('targetCellType variable not specified, visualize all.')
targetCellType <- NULL
infoDisp <- TRUE
}
plot$Tissue <- hpaVisTissue(data=data,
targetGene=targetGene,
targetTissue=targetTissue,
targetCellType=targetCellType,
color=color,
customTheme=customTheme)
}
# Make cancer plot
if ('Patho' %in% visType | 'Cancer' %in% visType) {
if (is.null(targetCancer)) {
message('targetCancer variable not specified, default to breast cancer')
targetCancer <- 'breast cancer'
infoDisp <- TRUE
}
plot$Patho <- hpaVisPatho(data=data,
targetGene=targetGene,
targetCancer=targetCancer,
color=color,
customTheme=customTheme)
}
# Make Subcell plot
if ('Subcell' %in% visType) {
plot$Subcell <- hpaVisSubcell(data=data,
targetGene=targetGene,
color=color,
customTheme=customTheme)
}
# Show a message if any parameter is not defined
if (infoDisp) {
message('Use hpaListParam() to list possible values for target variables.')
}
# return a grid if more than one plot, otherwise return the ggplot
if (length(plot) > 1) {
return(gridExtra::grid.arrange(grobs = plot, ncol = 2))
} else {
return(plot[[1]])
}
}
#######################################
## Universal XML extraction function ##
#######################################
#' Extract details about an individual protein from XML file in one function
#'
#' This function is the umbrella function for the hpaXml function family. It
#' take the input of either one Ensembl gene id or a imported XML object
#' resulting from a \code{hpaXmlGet()} function call. By default, it will
#' extract all information available for HPAanalyze user from the XML file by
#' calling every hpaXml function and put all results into a list.
#'
#' @param inputXml Input can be either one Ensembl gene id (start with ENSG) or
#' a imported XML object resulting from a \code{hpaXmlGet()} function call.
#' You can also use HGNC gene symbol and it will be converted to ensembl id.
#' @param extractType A vector of strings indicate which information is desired
#' for extraction. By default this function will call all \code{hpaXml}
#' functions available. Other options are \code{'ProtClass'},
#' \code{'TissueExprSum'}, \code{'Antibody'}, \code{'TissueExpr'}.
#' @param ... Additional arguments to be passed downstream to other hpaXml
#' functions being called behind the scene. See help files of other hpaXml
#' functions for more information.
#'
#' @return This function returns a list. Each element of the list is information
#' extracted from the XML file specified using other hpaXml functions. See
#' help file for each XML function for more information.
#'
#' @family xml functions
#'
#' @examples
#' hpaXml(inputXml='ENSG00000131979', extractType=c('ProtClass', 'TissueExprSum', 'Antibody'))
#'
#' @export
hpaXml <- function(inputXml,
extractType = c('ProtClass', 'TissueExprSum', 'Antibody', 'TissueExpr'),
...) {
# initate variables
xml_output <- list()
# Test if input is a string or an xml object. If string, download the xml.
if (is.character(inputXml)) {
inputXml <- hpaXmlGet(targetEnsemblId=inputXml,
version = 'latest')
}
# Generate a list of extractType
if (identical(extractType,'all')) {
extractType <- c('ProtClass', 'TissueExprSum', 'Antibody', 'TissueExpr')
}
# Extract protein classes
if ('ProtClass' %in% extractType) {
xml_output$ProtClass <- hpaXmlProtClass(importedXml=inputXml)
}
# Extract tissue expression summary
if ('TissueExprSum' %in% extractType) {
xml_output$TissueExprSum <- hpaXmlTissueExprSum(importedXml=inputXml,
downloadImg=FALSE)
}
# Extract antibody
if ('Antibody' %in% extractType) {
xml_output$Antibody <- hpaXmlAntibody(importedXml=inputXml)
}
# Extract tissue expression
if ('TissueExpr' %in% extractType) {
xml_output$TissueExpr <- hpaXmlTissueExpr(importedXml=inputXml)
}
return(xml_output)
}
Add the following code to your website.
For more information on customizing the embed code, read Embedding Snippets.