comparison breakdancer.xml @ 0:694cbef83948 draft

planemo upload for repository https://github.com/portiahollyoak/Tools commit 9700cff725be112c4a813f914eca946e158fbebd-dirty
author portiahollyoak
date Fri, 13 May 2016 11:47:32 -0400
parents
children 8c1e654262b1
comparison
equal deleted inserted replaced
-1:000000000000 0:694cbef83948
1 <tool id="breakdancer_max" name="BreakdancerMax" version="1.3.6">
2 <description></description>
3 <requirements>
4 <requirement type="package" version="0.1.19">samtools</requirement>
5 <requirement type="package" version="1.4.5">breakdancer</requirement>
6 </requirements>
7 <stdio>
8 <exit_code range="1:" />
9 </stdio>
10 <command><![CDATA[
11 ln -f -s "$input_file.metadata.bam_index" alignment.bam.bai &&
12 ln -f -s "$input_file" alignment.bam &&
13 python $__tool_directory__/create_config_file.py
14 --input_file alignment.bam
15 --mean "$mean"
16 --std_dev "$std_dev"
17 --read_length "$read_length"
18 --sample_name "$sample_name"
19 --output_config_file output_config_file &&
20 cat output_config_file &&
21 breakdancer-max
22 -s "$min_length"
23 -c "$cutoff"
24 -m "$maximum_sv"
25 -q "$quality"
26 -r "$min_rp"
27 -x "$hap_seq_threshold"
28 -b "$buffer_size"
29 $transchr_rearr
30 -d "$sample_name"
31 -g "$sample_name"
32 $illumina_long
33 $copy_number_bam
34 $allele_freq
35 -y "$output_score_filter"
36 output_config_file &&
37 mv "$sample_name" "$results_bed"
38 ]]></command>
39 <inputs>
40 <param name="input_file" type="data" format="bam" label="One or more alignment files"/>
41 <param name="mean" type="integer" value="" label="Mean Insert Size"/>
42 <param name="std_dev" type="integer" value="" label="The standard deviation of insert size"/>
43 <param name="read_length" type="integer" value="" label="Average read length"/>
44 <param name="sample_name" type="text" label="Sample name"/>
45 <param name="min_length" type="integer" value="7"
46 label="Minimal required size of a SV anchoring region from which the anomalously mapped reads are found"/>
47 <param name="cutoff" type="integer" value="3" label="Cutoff in unit of standard deviation"/>
48 <param name="maximum_sv" type="integer" value="1000000000" label="Maximum SV Size"/>
49 <param name="quality" type="integer" value="35" label="Minimum MAQ mapping quality threshold"/>
50 <param name="min_rp" type="integer" value="2"
51 label="Minimum number of read pairs required to establish a connection"/>
52 <param name="hap_seq_threshold" type="integer" value="1000"
53 label="Maximum threshold of haploid sequence coverage for regions to be ignored"/>
54 <param name="buffer_size" type="integer" value="100"
55 label="Buffer size for building connection"/>
56 <param name="transchr_rearr" type="boolean" checked="false" truevalue="-t" falsevalue=""
57 label="Only detect transchromosomal rearrangement (Default = No)"/>
58 <param name="illumina_long" type="boolean" checked="false" truevalue="-l" falsevalue=""
59 label="Analyze Illumina long insert (mate-pair) library"/>
60 <param name="copy_number_bam" type="boolean" checked="false" truevalue="-a" falsevalue=""
61 label="Compute copy number and support reads per library rather than per bam (Default = No)"/>
62 <param name="allele_freq" type="boolean" checked="false" truevalue="-h" falsevalue=""
63 label="Print out Allele Frequencing column (Default= No)"/>
64 <param name="output_score_filter" type="integer" value="30" label="Output Score filter"/>
65 </inputs>
66 <outputs>
67 <data name="results_bed" type="data" format="bed" help="BED file containing SVs and supporting reads" label="${sample_name}.bed"/>
68 </outputs>
69 <tests>
70 <test>
71 <param name="input_file" value="X_Hum1.bwa.bam" ftype="bam"/>
72 <param name="mean" value="227"/>
73 <param name="std_dev" value="98"/>
74 <param name="read_length" value="125"/>
75 <param name="sample_name" value="X_HUM1"/>
76 <param name="output_config_file" value="config_X_HUM1" ftype="txt"/>
77 <param name="chromosome" value="ALL"/>
78 <param name="min_length" value="7"/>
79 <param name="cutoff" value="3"/>
80 <param name="maximum_sv" value="1000000000"/>
81 <param name="quality" value="35"/>
82 <param name="min_rp" value="2"/>
83 <param name="hap_seq_threshold" value="1000"/>
84 <param name="buffer_size" value="100"/>
85 <param name="transchr_rearr" value=""/>
86 <param name="prefix" value=""/>
87 <param name="illumina_long" value=""/>
88 <param name="copy_number_bam" value=""/>
89 <param name="allele_freq" value=""/>
90 <param name="output_score_filter" value="40"/>
91 <output name="results_bed" file="X_HUM1" ftype="bed"/>
92 </test>
93 </tests>
94 <help> <![CDATA[
95 BreakDancer (previously BreakDancerMax) provides genome-wide detection of five types of structural variants: insertions, deletions, inversions, inter- and intra-chromosomal translocations from next-generation short paired-end sequencing reads using read pairs that are mapped with unexpected separation distances or orientation.
96
97 The following inputs are required:
98 ----------------------------------
99
100 - One or more BAM alignment files produced by a front-end aligner such as MAQ, BWA, NovoAlign or Bfast. Listing multiple alignment files enables pooled analysis. For individual analysis, run alignment files through Breakdancer individually.
101 - Mean Insert Size for each alignment file
102 - The standard deviation for each alignment file
103 - The Average Read length for each alignment file
104 - The sample name for each alignment file
105 - Name of BED output file containg SVs and supporting reads
106
107 The following parameters can be set:
108 ------------------------------------
109
110 - Which chromosome to operate on (chromosome name must match one used in alignment file.
111 - The minimal required size of a SV anchoring region from which the anomalously mapped reads are found. (Default = 7). This parameter has some small effects on the SV detection accuracy. Increasing minimal required size improves the specificity but also reduces the sensitivity.
112 - Cutoff in unit of standard deviation. (Default = 3). Therefore, the upper and the lower separation threshold would be: mean + 3 std and mean - 3 std respectively. It is useful to explicitly specify the upper and the lower separation thresholds when the insert size distribution is not symmetric to the mean.
113 - Maximum SV size. (Default = 1000000000)
114 - Minimum MAQ mapping quality threshold. Can be used to skip reads that are not confidently mapped. (Default = 35)
115 - Minimum number of read pairs required to establish a connection. (Default = 2)
116 - Maximum threshold of haploid sequence coverage for regions to be ignored. (Default = 1000)
117 - Buffer size for building connection. The -b parameter specifies the number of anomalous regions resides in the RAM before SV hypotheses begin to form among these regions. For dataset that is exceptionally large, it may be helpful to reduce it to cut the resident RAM usage. (Default = 100)
118 - Only detect transchromosomal rearrangement. (Default = off)
119 - Prefix of fastq files to which SV supporting reads will be saved to, by library
120 - Analyze Illumina long insert (mate-pair) library (Default = off)
121 - Compute copy number by bam file rather than by library (Default = on)
122 - Print out Allele Frequencing column (Default = off)
123 - Output Score filter (Default = 40)
124
125 Output files
126 ------------
127 BreakDancer output is a BED file containing SVs and supporting reads. It has the following columns:
128 1. Chromosome 1
129 2. Position 1
130 3. Orientation 1
131 4. Chromosome 2
132 5. Position 2
133 6. Orientation 2
134 7. Type of a SV
135 8. Size of a SV
136 9. Confidence Score
137 10. Total number of supporting read pairs
138 11. Total number of supporting read pairs from each map file
139 12. Estimated allele frequency
140 13. Software version
141 14. The run parameters
142
143 Columns 1-3 and 4-6 are used to specify the coordinates of the two SV breakpoints. The orientation is a string that records the number of reads mapped to the plus (+) or the minus (-) strand in the anchoring regions.
144
145 Column 7 is the type of SV detected: DEL (deletions), INS (insertion), INV (inversion), ITX (intra-chromosomal translocation), CTX (inter-chromosomal translocation), and Unknown.
146 Column 8 is the size of the SV in bp. It is meaningless for inter-chromosomal translocations.
147 Column 9 is the confidence score associated with the prediction.
148 Column 11 can be used to dissect the origin of the supporting read pairs, which is useful in pooled analysis. For example, one may want to give SVs that are supported by more than one libraries higher confidence than those detected in only one library. It can also be used to distinguish somatic events from the germline, i.e., those detected in only the tumor libraries versus those detected in both the tumor and the normal libraries.
149 Column 12 is currently a placeholder for displaying estimated allele frequency. The allele frequencies estimated in this version are not accurate and should not be trusted.
150 Column 13 and 14 are information useful to reproduce the results.
151
152 Example 1:
153 1 10000 10+0- 2 20000 7+10- CTX -296 99 10 tB|10 1.00 BreakDancerMax-0.0.1 t1
154
155 An inter-chromosomal translocation that starts from chr1:10000 and goes into chr2:20000 with 10 supporting read pairs from the library tB and a confidence score of 99.
156
157 Example 2:
158 1 59257 5+1- 1 60164 0+5- DEL 862 99 5 nA|2:tB|1 0.56 BreakDancerMax-0.0.1 c4
159
160 A deletion between chr1:59257 and chr1:60164 connected by 5 read pairs, among which 2 in library nA and 1 in library tB support the deletion hypothesis. This deletion is detected by BreakDancerMax-0.0.1 with a separation threshold of 4 s.d.
161
162 Example 3:
163 1 62767 10+0- 1 63126 0+10- INS -13 36 10 NA|10 1.00 BreakDancerMini-0.0.1 q10
164
165 An 13 bp insertion detected by BreakDancerMini between chr1:62767 and chr1:63126 with 10 supporting read pairs from a single library 'NA' and a confidence score of 36.
166
167 Notes:
168 Real SV breakpoints are expected to reside within the predicted boundaries with a margin > the read length.
169
170
171
172 ]]> </help>
173 <citations>
174 <citation type="doi">doi:10.1038/nmeth.1363</citation>
175 </citations>
176 </tool>
177