forked from dnanexus-archive/parliament2
-
Notifications
You must be signed in to change notification settings - Fork 10
/
parliament2.py
80 lines (64 loc) · 6.12 KB
/
parliament2.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
#!/usr/bin/env python
import argparse
import subprocess
import gzip
import os
def parse_arguments():
args = argparse.ArgumentParser(description='Parliament2')
args.add_argument('--bam', required=True, help="The name of the Illumina BAM file for which to call structural variants containing mapped reads.")
args.add_argument('--bai', required=False, help="(Optional) The name of the corresponding index for the Illumina BAM file.")
args.add_argument('-r', '--ref_genome', required=True, help="The name of the reference file that matches the reference used to map the Illumina inputs.")
args.add_argument('--fai', required=False, help="(Optional) The name of the corresponding index for the reference genome file.")
args.add_argument('--prefix', required=False, help="(Optional) If provided, all output files will start with this. If absent, the base of the BAM file name will be used.")
args.add_argument('--filter_short_contigs', action="store_true", help="If selected, SV calls will not be generated on contigs shorter than 1 MB.")
args.add_argument('--breakdancer', action="store_true", help="If selected, the program Breakdancer will be one of the SV callers run.")
args.add_argument('--breakseq', action="store_true", help="If selected, the program BreakSeq2 will be one of the SV callers run.")
args.add_argument('--manta', action="store_true", help="If selected, the program Manta will be one of the SV callers run.")
args.add_argument('--cnvnator', action="store_true", help="If selected, the program CNVnator will be one of the SV callers run.")
args.add_argument('--lumpy', action="store_true", help="If selected, the program Lumpy will be one of the SV callers run.")
args.add_argument('--delly_deletion', action="store_true", help="If selected, the deletion module of the program Delly2 will be one of the SV callers run.")
args.add_argument('--delly_insertion', action="store_true", help="If selected, the insertion module of the program Delly2 will be one of the SV callers run.")
args.add_argument('--delly_inversion', action="store_true", help="If selected, the inversion module of the program Delly2 will be one of the SV callers run.")
args.add_argument('--delly_duplication', action="store_true", help="If selected, the duplication module of the program Delly2 will be one of the SV callers run.")
args.add_argument('--genotype', action="store_true", help="If selected, candidate events determined from the individual callers will be genotyped and merged to create a consensus output.")
args.add_argument('--svviz', action="store_true", help="If selected, visualizations of genotyped SV events will be produced with SVVIZ, one screenshot of support per event. For this option to take effect, Genotype must be selected.")
args.add_argument('--svviz_only_validated_candidates', action="store_true", help="Run SVVIZ only on validated candidates? For this option to be relevant, SVVIZ must be selected. NOT selecting this will make the SVVIZ component run longer.")
args.add_argument('--dnanexus', action="store_true", help=argparse.SUPPRESS)
return args.parse_args()
def gunzip_input(input_file):
if input_file.endswith('.gz'):
if os.path.isfile(input_file[:-3]):
return input_file[:-3]
else:
subprocess.check_call(['gunzip', input_file])
return input_file[:-3]
else:
return input_file
def run_parliament(bam, bai, ref_genome, fai, prefix, filter_short_contigs, breakdancer, breakseq, manta, cnvnator, lumpy, delly_deletion, delly_insertion, delly_inversion, delly_duplication, genotype, svviz, svviz_only_validated_candidates, dnanexus):
if bai is not None:
if fai is not None:
subprocess.check_call(['bash', 'parliament2.sh', bam, bai, ref_genome, fai, prefix, str(filter_short_contigs), str(breakdancer), str(breakseq), str(manta), str(cnvnator), str(lumpy), str(delly_deletion), str(delly_insertion), str(delly_inversion), str(delly_duplication), str(genotype), str(svviz), str(svviz_only_validated_candidates), str(dnanexus)])
else:
subprocess.check_call(['bash', 'parliament2.sh', bam, bai, ref_genome, "None", prefix, str(filter_short_contigs), str(breakdancer), str(breakseq), str(manta), str(cnvnator), str(lumpy), str(delly_deletion), str(delly_insertion), str(delly_inversion), str(delly_duplication), str(genotype), str(svviz), str(svviz_only_validated_candidates), str(dnanexus)])
else:
if fai is not None:
subprocess.check_call(['bash', 'parliament2.sh', bam, "None", ref_genome, fai, prefix, str(filter_short_contigs), str(breakdancer), str(breakseq), str(manta), str(cnvnator), str(lumpy), str(delly_deletion), str(delly_insertion), str(delly_inversion), str(delly_duplication), str(genotype), str(svviz), str(svviz_only_validated_candidates), str(dnanexus)])
else:
subprocess.check_call(['bash', 'parliament2.sh', bam, "None", ref_genome, "None", prefix, str(filter_short_contigs), str(breakdancer), str(breakseq), str(manta), str(cnvnator), str(lumpy), str(delly_deletion), str(delly_insertion), str(delly_inversion), str(delly_duplication), str(genotype), str(svviz), str(svviz_only_validated_candidates), str(dnanexus)])
def main():
args = parse_arguments()
prefix = args.prefix
if prefix is None:
if args.bam.endswith(".bam"):
prefix = args.bam[:-4]
else:
prefix = args.bam[:-5]
if not args.bam.startswith("/home/dnanexus/in/"):
args.bam = "/home/dnanexus/in/{0}".format(args.bam)
args.bai = "/home/dnanexus/in/{0}".format(args.bai)
args.ref_genome = "/home/dnanexus/in/{0}".format(args.ref_genome)
args.fai = "/home/dnanexus/in/{0}".format(args.fai)
ref_genome_name = gunzip_input(args.ref_genome)
run_parliament(args.bam, args.bai, ref_genome_name, args.fai, prefix, args.filter_short_contigs, args.breakdancer, args.breakseq, args.manta, args.cnvnator, args.lumpy, args.delly_deletion, args.delly_insertion, args.delly_inversion, args.delly_duplication, args.genotype, args.svviz, args.svviz_only_validated_candidates, args.dnanexus)
if __name__ == '__main__':
main()