.GenomicScoresMetadataFromUrl <- function(baseUrl, track) {
require(GenomeInfoDb)
## genus+species to NCBI taxon identifier from GenomeInfoDb
load(system.file("extdata", "assembly_accessions.rda", package="GenomeInfoDb"))
assembly_accessions <- get("assembly_accessions") ## just to avoid a NOTE during R CMD check
gd <- readRDS(gzcon(url(sprintf("%s%s/refgenomeGD.rds", baseUrl, track),
open="rb")))
rdsFiles <- GenomicScores:::.getSubDirs(sprintf("%s%s", baseUrl, track))
rdsFiles <- rdsFiles[grep(track, rdsFiles)]
taxonId <- as.integer(subset(assembly_accessions, organism_name == organism(gd))$taxid)[1]
obj <- readRDS(gzcon(url(sprintf("%s%s/%s", baseUrl, track, rdsFiles[1]),
open="rb")))
rDataPath <- sprintf("%s/%s", track, rdsFiles)
chr <- sub(".rds", "", sub(paste0(track, "."), "", rdsFiles))
stopifnot(all(chr %in% seqnames(gd))) ## QC
metadf <- data.frame(title=rdsFiles,
species=rep(organism(gd), length(rdsFiles)),
taxonomyId=rep(taxonId, length(rdsFiles)),
genome=rep(providerVersion(gd), length(rdsFiles)),
sourceUrl=sprintf("%s%s/%s", baseUrl, track, rdsFiles),
sourceVersion=rep(metadata(obj)$provider_version, length(rdsFiles)),
description=sprintf("CADD scores for %s on %s", organism(gd), chr),
rDataPath=rDataPath,
stringsAsFactors=FALSE)
rownames(metadf) <- NULL
metadf
}
makeMetadata_CADD.v1.3.hg19 <- function()
{
biocver <- "3.6"
baseUrl <- "http://functionalgenomics.upf.edu/annotationhub/cadd/"
meta <- .GenomicScoresMetadataFromUrl(baseUrl, "cadd.v1.3.hg19")
n <- nrow(meta)
data.frame(
BiocVersion=rep(biocver, n),
Description=meta$description,
Genome=meta$genome,
SourceUrl=meta$sourceUrl,
SourceType=rep("VCF", n),
SourceVersion=meta$sourceVersion,
Species=meta$species,
TaxonomyId=meta$taxonomyId,
Title=meta$title,
ResourceName=meta$title,
RDataPath=meta$rDataPath,
Coordinate_1_based=rep(TRUE, n),
DataProvider=rep("UWashington", n),
Maintainer=rep("Robert Castelo <robert.castelo@upf.edu>", n),
RDataClass=rep("Rle", n),
DispatchClass=rep("RDS", n),
Location_Prefix=baseUrl,
Tags=rep(paste("CADD", "GScores", sep=","), n))
}
metadata <- makeMetadata_CADD.v1.3.hg19()
write.csv(metadata, file="../extdata/metadata_CADD.v1.3.hg19.csv", row.names=FALSE)
Add the following code to your website.
For more information on customizing the embed code, read Embedding Snippets.