test.config.yaml

###############################################################################
# Len Taing 2019 (TGBTG)
###############################################################################
# Automator test configuration file
###############################################################################
# Updated 2022-06-22 to use s1609 fast set

# Give the new instance a unique name, e.g. the wes run name
# NOTE: "wes-auto" will automatically be prepended to this string
instance_name: "fast-test"

# Define the number of cores for the wes instance
# Options- 32 (default), 64, 96 
cores: 32

# Define the disk size to use in GB, default 500
# the name of the persistent disk will be: "wes_auto_{instance_name}_disk"
disk_size: 200

#DEFINE the path to the google bucket path for the run
google_bucket_path: gs://lens_bucket2/wes_automator/test4/

# Uncomment the following and define the specific wes commit string to use
wes_commit: "3fc07db"

#Uncomment the following and define the specific wes GCP image to use
#NOTE: IF a specific GCP image is not set via config['image'], then
#the default behavior is to get the latest wes image
image: 'wes-ver3-01a'

#Define the wes reference snapshot to use, default wes-ref-ver1-0
wes_ref_snapshot: 'wes-human-ref-ver1-7'

# SOMATIC CALLER to use, options are {tnsnv, tnhaplotyper2, tnscope}
# tnscope is the default EVEN if the somatic_caller param is NOT defined
somatic_caller: tnscope

# CIMAC center: choices are {'mocha', 'mda', 'broad' (default)}
cimac_center: 'mda'

# Trim soft clip reads when calling somatic variants? False (default)
# NOT available for tnsnv
trim_soft_clip: False

# DEFINE the samples- each sample should have a name, e.g. SAMPLE1
# and a Google bucket path to the input file, 
# e.g. gs://mybucket/data/sample1.fastq.gz
# VALID INPUTS: fastq, fastq.gz
# NOTE: for PAIRED-END fastq/fastq.gz, give both pairs to the sample:
# SAMPLE_1_PE:
#   - gs://mybucket/data/sample1_pair1.fastq
#   - gs://mybucket/data/sample1_pair2.fastq
samples:
  C3RXBPC7E.01:
    - gs://lens_bucket2/wes_automator/jacob_s1609_fastset/C3RXBPC7E.01_N_10mill_R1.fastq.gz
    - gs://lens_bucket2/wes_automator/jacob_s1609_fastset/C3RXBPC7E.01_N_10mill_R2.fastq.gz
  C3RXBPCKM.01:
    - gs://lens_bucket2/wes_automator/jacob_s1609_fastset/C3RXBPCKM.01_T_10mill_R1.fastq.gz
    - gs://lens_bucket2/wes_automator/jacob_s1609_fastset/C3RXBPCKM.01_T_10mill_R2.fastq.gz

# metahseet- Group the samples into Tumor/Normal "runs"
# each run should have a name, e.g. run_1:
# then under each run, define a tumor and a normal sample
# EXAMPLE:
# metasheet:
#  run_1:
#    tumor: SAMPLE_Tumor
#    normal: SAMPLE_normal
metasheet:
  C3RXBPCKM.01:
    tumor: C3RXBPCKM.01
    normal: C3RXBPC7E.01

# (Optional) Define any RNA-seq expression data associated with the TUMOR
# samples only.  Currently, only expression results from Salmon are supported.
# The sample names in this section must match the same names used in the
# previous section.
#rna:
#  CA209009-Tumor:
#    bam_file: gs://lens_bucket2/wes_automator/test_rna/rna_data/B4.sorted.clean.bam
#    expression_file: gs://lens_bucket2/wes_automator/test_rna/rna_data/B4.quant.sf

# specify the GCP zone
zone: us-east1-c