Skip to content

Commit

Permalink
Sketch of using Nirvana reference disk
Browse files Browse the repository at this point in the history
  • Loading branch information
mcovarr committed Jan 24, 2023
1 parent c15e5fc commit da5537c
Show file tree
Hide file tree
Showing 2 changed files with 97 additions and 0 deletions.
8 changes: 8 additions & 0 deletions .dockstore.yml
Original file line number Diff line number Diff line change
Expand Up @@ -253,6 +253,14 @@ workflows:
branches:
- master
- ah_var_store
# Dockstore entry for the NirvanaReferenceDisk WDL workflow; the branch filter below lists the git branches this entry applies to.
- name: NirvanaReferenceDisk
subclass: WDL
primaryDescriptorPath: /scripts/variantstore/wdl/NirvanaReferenceDisk.wdl
filters:
branches:
- master
- ah_var_store
# NOTE(review): looks like a personal feature branch — confirm whether it should be dropped before this merges.
- mc_nirvana_reference_disk
- name: MitochondriaPipeline
subclass: WDL
primaryDescriptorPath: /scripts/mitochondria_m2_wdl/MitochondriaPipeline.wdl
Expand Down
89 changes: 89 additions & 0 deletions scripts/variantstore/wdl/NirvanaReferenceDisk.wdl
Original file line number Diff line number Diff line change
@@ -0,0 +1,89 @@
version 1.0

# Single-step workflow: runs ReferenceDiskTask with its default inputs and
# exposes that task's `stdout` output as the workflow output.
workflow NirvanaReferenceDisk {
    # No workflow-level inputs; the task supplies its own defaults.
    input {}

    # No call-site overrides are needed, so the call body is omitted.
    call ReferenceDiskTask

    output {
        # Passed through unchanged from the task.
        File stdout = ReferenceDiskTask.stdout
    }
}


# Lists everything found under the expected Nirvana 3.18.1 reference directory
# and returns that listing as the task's captured standard output.
#
# Inputs:
#   references - Nirvana reference files (default: the GRCh38 3.18.1 set below).
#                Declared as File inputs but never referenced in the command
#                itself; presumably declared so the backend makes them
#                available under /cromwell_root before the command runs
#                (localization or reference-disk mount) — TODO confirm.
# Outputs:
#   stdout     - File holding the command's standard output (the `find` listing).
task ReferenceDiskTask {
    input {
        # Nirvana references sourced from firecloud-develop cromwell-reference-images.conf.
        Array[File] references = [
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/phyloP_hg38.npd",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/phyloP_hg38.npd.idx",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/gnomAD_gene_scores_2.1.nga",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/1000_Genomes_Project_Phase_3_v3_plus.nsa",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/1000_Genomes_Project_Phase_3_v3_plus_refMinor.rma.idx",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/References/Homo_sapiens.GRCh38.Nirvana.dat",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/Cache/GRCh38/Both.sift.ndb",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/ClinGen_Dosage_Sensitivity_Map_20220512.nsi",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/SpliceAi_1.3.nsa",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/dbSNP_151_globalMinor.nsa",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/TOPMed_freeze_5.nsa",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/Gerp_20110522.gsa",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/Cache/GRCh38/Both.transcripts.ndb",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/MultiZ100Way_20171006.pcs",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/dbSNP_155.nsa.idx",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/ClinVar_20220505.nsa",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/dbSNP_155.nsa",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/Cache/GRCh38/Both.polyphen.ndb",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/TOPMed_freeze_5.nsa.idx",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/gnomAD_SV_2.1.nsi",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/ClinGen_disease_validity_curations_20220512.nga",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/OMIM_20220516.nga",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/REVEL_20200205.nsa",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/GME_20160618.nsa.idx",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/DANN_20200205.gsa.idx",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/PrimateAI_0.2.nsa",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/ClinVar_20220505.nsi",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/GME_20160618.nsa",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/1000_Genomes_Project_Phase_3_v3_plus.nsa.idx",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/gnomAD_LCR_2.1.lcr",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/PrimateAI_0.2.nsa.idx",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/ClinGen_Dosage_Sensitivity_Map_20220512.nga",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/MITOMAP_SV_20200819.nsi",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/REVEL_20200205.nsa.idx",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/ClinGen_20160414.nsi",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/SpliceAi_1.3.nsa.idx",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/DECIPHER_201509.nsi",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/DANN_20200205.gsa",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/gnomAD_3.1.2.nsa.idx",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/COSMIC_GeneFusions_94.gfj",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/dbSNP_151_globalMinor.nsa.idx",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/FusionCatcher_1.33.gfs",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/1000_Genomes_Project_(SV)_Phase_3_v5a.nsi",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/MITOMAP_20200819.nsa.idx",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/ClinVar_20220505.nsa.idx",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/1000_Genomes_Project_Phase_3_v3_plus_refMinor.rma",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/Gerp_20110522.gsa.idx",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/MITOMAP_20200819.nsa",
            "gs://broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1/SupplementaryAnnotation/GRCh38/gnomAD_3.1.2.nsa"
        ]
    }

    command <<<
        # Prepend date, time and pwd to xtrace log entries.
        PS4='\D{+%F %T} \w $ '
        set -o errexit -o nounset -o pipefail -o xtrace

        # Directory under which the gs:// paths above are expected to appear:
        # the bucket name and object prefix appended to /cromwell_root.
        NIRVANA_REFERENCE_DIR=/cromwell_root/broad-public-datasets/gvs/vat-annotations/Nirvana/3.18.1

        # Print every path beneath the reference directory. With errexit set,
        # a missing directory makes `find` fail and therefore fails the task.
        # The variable is quoted so the path is always passed as one argument.
        find "$NIRVANA_REFERENCE_DIR" -print
    >>>

    runtime {
        # NOTE(review): `latest` is an unpinned tag; consider pinning a
        # specific release for reproducible runs.
        docker: "ubuntu:latest"
    }

    output {
        # stdout() already yields the File that captured the command's standard
        # output. The previous read_string(stdout()) read that file's *contents*
        # into a String, which was then coerced to a File path.
        File stdout = stdout()
    }
}

0 comments on commit da5537c

Please sign in to comment.