-
Notifications
You must be signed in to change notification settings - Fork 0
/
test.config.yaml
84 lines (70 loc) · 3.14 KB
/
test.config.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
###############################################################################
# Len Taing 2019 (TGBTG)
###############################################################################
# Automator test configuration file
###############################################################################
# Updated 2022-06-22 to use s1609 fast set
# Give the new instance a unique name, e.g. the wes run name
# NOTE: "wes-auto" will automatically be prepended to this string
instance_name: "fast-test"
# Define the number of cores for the wes instance
# Options- 32 (default), 64, 96
cores: 32
# Define the disk size to use in GB, default 500
# the name of the persistent disk will be: "wes_auto_{instance_name}_disk"
disk_size: 200
#DEFINE the path to the google bucket path for the run
google_bucket_path: gs://lens_bucket2/wes_automator/test4/
# Uncomment the following and define the specific wes commit string to use
wes_commit: "3fc07db"
#Uncomment the following and define the specific wes GCP image to use
#NOTE: IF a specific GCP image is not set via config['image'], then
#the default behavior is to get the latest wes image
image: 'wes-ver3-01a'
#Define the wes reference snapshot to use, default wes-ref-ver1-0
wes_ref_snapshot: 'wes-human-ref-ver1-7'
# SOMATIC CALLER to use, options are {tnsnv, tnhaplotyper2, tnscope}
# tnscope is the default EVEN if the somatic_caller param is NOT defined
somatic_caller: tnscope
# CIMAC center: choices are {'mocha', 'mda', 'broad' (default)}
cimac_center: 'mda'
# Trim soft clip reads when calling somatic variants? False (default)
# NOT available for tnsnv
trim_soft_clip: False
# DEFINE the samples- each sample should have a name, e.g. SAMPLE1
# and a Google bucket path to the input file,
# e.g. gs://mybucket/data/sample1.fastq.gz
# VALID INPUTS: fastq, fastq.gz
# NOTE: for PAIRED-END fastq/fastq.gz, give both pairs to the sample:
# SAMPLE_1_PE:
# - gs://mybucket/data/sample1_pair1.fastq
# - gs://mybucket/data/sample1_pair2.fastq
samples:
C3RXBPC7E.01:
- gs://lens_bucket2/wes_automator/jacob_s1609_fastset/C3RXBPC7E.01_N_10mill_R1.fastq.gz
- gs://lens_bucket2/wes_automator/jacob_s1609_fastset/C3RXBPC7E.01_N_10mill_R2.fastq.gz
C3RXBPCKM.01:
- gs://lens_bucket2/wes_automator/jacob_s1609_fastset/C3RXBPCKM.01_T_10mill_R1.fastq.gz
- gs://lens_bucket2/wes_automator/jacob_s1609_fastset/C3RXBPCKM.01_T_10mill_R2.fastq.gz
# metahseet- Group the samples into Tumor/Normal "runs"
# each run should have a name, e.g. run_1:
# then under each run, define a tumor and a normal sample
# EXAMPLE:
# metasheet:
# run_1:
# tumor: SAMPLE_Tumor
# normal: SAMPLE_normal
metasheet:
C3RXBPCKM.01:
tumor: C3RXBPCKM.01
normal: C3RXBPC7E.01
# (Optional) Define any RNA-seq expression data associated with the TUMOR
# samples only. Currently, only expression results from Salmon are supported.
# The sample names in this section must match the same names used in the
# previous section.
#rna:
# CA209009-Tumor:
# bam_file: gs://lens_bucket2/wes_automator/test_rna/rna_data/B4.sorted.clean.bam
# expression_file: gs://lens_bucket2/wes_automator/test_rna/rna_data/B4.quant.sf
# specify the GCP zone
zone: us-east1-c