inst/extdata/dataRecipes/gcp_broad_gatk_hg19.R

script <- "
filename=$1
idx=$2

url=https://storage.googleapis.com/gcp-public-data--broad-references/hg19/v0/$filename
wget $url
if [[ $idx ]]; then wget $url.$idx; fi
"
gcp_broad_gatk_hg19 <- recipeMake(shscript = script,
                                  paramID = c("filename", "idx"),
                                  paramType = c("string", "string?"),
                                  outputID = "gfile",
                                  outputGlob = "$(inputs.filename)*")

gcp_broad_gatk_hg19 <- addMeta(
    gcp_broad_gatk_hg19,
    label = "gcp_broad_gatk_hg19",
    doc = "GATK annotation bundle for hg19 from GCP (gs://gcp-public-data--broad-references/hg19/v0/)",
    inputLabels = c("file name", "index"),
    inputDocs = c("The file basename to download from the broad GCP bucket",
                  "The 'idx' or 'tbi' index file if existing"),
    outputLabels = c("gfile"),
    outputDocs = c("The downloaded annotation files"),
    extensions = list(
        author = "rworkflow team",
        date = Sys.Date(),
        url = "https://console.cloud.google.com/storage/browser/gcp-public-data--broad-references/hg19/v0",
        example = paste(
            "gcp_broad_gatk_hg19 <- recipeLoad('gcp_broad_gatk_hg19')",
            "gcp_broad_gatk_hg19$filename <- '1000G_omni2.5.b37.vcf.gz'",
            "getData(gcp_broad_gatk_hg19, outdir = 'data/folder', notes = c('gcp', 'broad', 'reference', 'hg19', 'v0', '1000G', 'omni2.5'))",
            "",
            "## Get data from local catch",
            "dataUpdate('data/folder')", 
            "dataSearch(c('gcp', 'broad', 'hg19'))",
            "", 
            sep="\n"))
)
rworkflow/ReUseData documentation built on Dec. 7, 2023, 11 p.m.