annotate bwa-mem.xml @ 5:fbf460831036 draft

planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
author devteam
date Tue, 21 Jul 2015 13:51:02 -0400
parents ac30bfd3e2a8
children 09a7281d24c5
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
1 <?xml version="1.0"?>
5
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
2 <tool id="bwa_mem" name="Map with BWA-MEM" version="0.3">
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
3 <description>- map medium and long reads (&gt; 100 bp) against reference genome</description>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
4 <macros>
5
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
5 <import>read_group_macros.xml</import>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
6 <import>bwa_macros.xml</import>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
7 </macros>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
8 <requirements>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
9 <requirement type="package" version="0.7.10.039ea20639">bwa</requirement>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
10 <requirement type="package" version="1.1">samtools</requirement>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
11 </requirements>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
12 <stdio>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
13 <exit_code range="1:" />
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
14 </stdio>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
15 <command>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
16 #set $reference_fasta_filename = "localref.fa"
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
17
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
18 #if str( $reference_source.reference_source_selector ) == "history":
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
19 ln -s "${reference_source.ref_file}" "${reference_fasta_filename}" &amp;&amp;
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
20
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
21 ## The following shell commands decide which of the BWA indexing algorithms (IS or BWTSW) will be run
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
22 ## depending on the size of the input FASTA dataset
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
23 (
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
24 size=`stat -c %s "${reference_fasta_filename}" 2&gt;/dev/null`; ## Linux
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
25 if [ $? -eq 0 ];
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
26 then
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
27 if [ "\$size" -lt 2000000000 ];
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
28 then
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
29 bwa index -a is "${reference_fasta_filename}";
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
30 echo "Generating BWA index with is algorithm";
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
31 else
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
32 bwa index -a bwtsw "${reference_fasta_filename}";
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
33 echo "Generating BWA index with bwtsw algorithm";
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
34 fi;
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
35 fi;
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
36
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
37 eval \$(stat -s "${reference_fasta_filename}" 2&gt;/dev/null); ## OSX
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
38 if [ -n "\$st_size" ];
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
39 then
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
40 if [ "\$st_size" -lt 2000000000 ];
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
41 then
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
42 bwa index -a is "${reference_fasta_filename}";
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
43 echo "Generating BWA index with is algorithm";
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
44 else
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
45 bwa index -a bwtsw "${reference_fasta_filename}";
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
46 echo "Generating BWA index with bwtsw algorithm";
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
47 fi;
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
48 fi;
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
49 ) &amp;&amp;
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
50
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
51 #else:
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
52 #set $reference_fasta_filename = str( $reference_source.ref_file.fields.path )
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
53 #end if
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
54
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
55 ## Begin BWA-MEM command line
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
56
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
57 bwa mem
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
58 -t "\${GALAXY_SLOTS:-1}"
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
59 -v 1 ## Verbosity is set to 1 (errors only)
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
60
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
61 #if str( $fastq_input.fastq_input_selector ) == "paired_iv": ## For interleaved fastq files set -p option
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
62 -p
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
63 #if str( $fastq_input.iset_stats ): ## check that insert statistics is used
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
64 -I "${fastq_input.iset_stats}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
65 #end if
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
66 #end if
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
67
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
68 #if str( $analysis_type.analysis_type_selector ) == "pacbio":
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
69 -x pacbio
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
70 #elif str( $analysis_type.analysis_type_selector ) == "full":
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
71 #if str( $analysis_type.algorithmic_options.algorithmic_options_selector ) == "set": ## Algorithmic options
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
72 -k "${analysis_type.algorithmic_options.k}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
73 -w "${analysis_type.algorithmic_options.w}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
74 -d "${analysis_type.algorithmic_options.d}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
75 -r "${analysis_type.algorithmic_options.r}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
76 -y "${analysis_type.algorithmic_options.y}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
77 -c "${analysis_type.algorithmic_options.c}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
78 -D "${analysis_type.algorithmic_options.D}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
79 -W "${analysis_type.algorithmic_options.W}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
80 -m "${analysis_type.algorithmic_options.m}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
81 ${analysis_type.algorithmic_options.S}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
82 ${analysis_type.algorithmic_options.P}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
83 ${analysis_type.algorithmic_options.e}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
84 #end if
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
85
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
86 #if str( $analysis_type.scoring_options.scoring_options_selector ) == "set": ## Scoring options
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
87 -A "${analysis_type.scoring_options.A}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
88 -B "${analysis_type.scoring_options.B}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
89 -O "${analysis_type.scoring_options.O}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
90 -E "${analysis_type.scoring_options.E}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
91 -L "${analysis_type.scoring_options.L}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
92 -U "${analysis_type.scoring_options.U}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
93 #end if
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
94
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
95 #if str( $analysis_type.io_options.io_options_selector ) == "set": ## IO options
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
96 -T "${analysis_type.io_options.T}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
97 -h "${analysis_type.io_options.h}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
98 ${analysis_type.io_options.a}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
99 ${analysis_type.io_options.C}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
100 ${analysis_type.io_options.V}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
101 ${analysis_type.io_options.Y}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
102 ${analysis_type.io_options.M}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
103 #end if
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
104
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
105 #end if
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
106
5
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
107 ## Handle read group options...
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
108 @define_read_group_helpers@
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
109 #if str( $fastq_input.fastq_input_selector ) == "paired":
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
110 #set $rg_auto_name = $read_group_name_default($fastq_input.fastq_input1, $fastq_input.fastq_input2)
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
111 #else:
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
112 #set $rg_auto_name = $read_group_name_default($fastq_input.fastq_input1)
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
113 #end if
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
114 @set_use_rg_var@
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
115 @set_read_group_vars@
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
116 #if $use_rg
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
117 @set_rg_string@
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
118 -R '$rg_string'
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
119 #end if
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
120
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
121 #if str( $fastq_input.fastq_input_selector ) == "paired":
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
122 #if str( $fastq_input.iset_stats ): ## check that insert statistics is used
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
123 -I "${fastq_input.iset_stats}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
124 #end if
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
125
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
126 "${reference_fasta_filename}"
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
127 "${fastq_input.fastq_input1}" "${fastq_input.fastq_input2}"
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
128 #elif str( $fastq_input.fastq_input_selector ) == "paired_collection":
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
129 #if str( $fastq_input.iset_stats ): ## check that insert statistics is used
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
130 -I "${fastq_input.iset_stats}"
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
131 #end if
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
132
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
133 "${reference_fasta_filename}"
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
134 "${fastq_input.fastq_input1.forward}" "${fastq_input.fastq_input1.reverse}"
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
135 #else:
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
136 "${reference_fasta_filename}"
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
137 "${fastq_input.fastq_input1}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
138 #end if
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
139
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
140 | samtools view -Sb - > temporary_bam_file.bam &amp;&amp;
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
141
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
142 samtools sort -f temporary_bam_file.bam ${bam_output}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
143 </command>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
144
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
145 <inputs>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
146
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
147 <conditional name="reference_source">
4
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
148 <param name="reference_source_selector" type="select" label="Will you select a reference genome from your history or use a built-in index?" help="Built-ins were indexed using default options. See `Indexes` section of help below">
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
149 <option value="cached">Use a built-in genome index</option>
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
150 <option value="history">Use a genome from history and build index</option>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
151 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
152 <when value="cached">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
153 <param name="ref_file" type="select" label="Using reference genome" help="Select genome from the list">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
154 <options from_data_table="bwa_mem_indexes">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
155 <filter type="sort_by" column="2" />
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
156 <validator type="no_options" message="No indexes are available" />
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
157 </options>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
158 <validator type="no_options" message="A built-in reference genome is not available for the build associated with the selected input file"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
159 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
160 </when>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
161 <when value="history">
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
162 <param name="ref_file" type="data" format="fasta" label="Use the following dataset as the reference sequence" help="You can upload a FASTA sequence to the history and use it as reference" />
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
163 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
164 </conditional>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
165 <conditional name="fastq_input">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
166 <param name="fastq_input_selector" type="select" label="Single or Paired-end reads" help="Select between paired and single end data">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
167 <option value="paired">Paired</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
168 <option value="single">Single</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
169 <option value="paired_collection">Paired Collection</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
170 <option value="paired_iv">Paired Interleaved</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
171 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
172 <when value="paired">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
173 <param name="fastq_input1" type="data" format="fastqsanger" label="Select first set of reads" help="Specify dataset with forward reads"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
174 <param name="fastq_input2" type="data" format="fastqsanger" label="Select second set of reads" help="Specify dataset with reverse reads"/>
4
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
175 <param name="iset_stats" type="text" optional="True" size="10" label="Enter mean, standard deviation, max, and min for insert lengths." help="-I; This parameter is only used for paired reads. Only mean is required while sd, max, and min will be inferred. Examples: both &quot;250&quot; and &quot;250,25&quot; will work while &quot;250,,10&quot; will not. See below for details.">
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
176 <sanitizer invalid_char="">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
177 <valid initial="string.digits"><add value=","/> </valid>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
178 </sanitizer>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
179 </param>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
180 </when>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
181 <when value="single">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
182 <param name="fastq_input1" type="data" format="fastqsanger" label="Select fastq dataset" help="Specify dataset with single reads"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
183 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
184 <when value="paired_collection">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
185 <param name="fastq_input1" format="fastqsanger" type="data_collection" collection_type="paired" label="Select a paired collection" help="See help section for an explanation of dataset collections"/>
4
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
186 <param name="iset_stats" type="text" optional="True" size="10" label="Enter mean, standard deviation, max, and min for insert lengths." help="-I; This parameter is only used for paired reads. Only mean is required while sd, max, and min will be inferred. Examples: both &quot;250&quot; and &quot;250,25&quot; will work while &quot;250,,10&quot; will not. See below for details.">
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
187 <sanitizer invalid_char="">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
188 <valid initial="string.digits"><add value=","/> </valid>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
189 </sanitizer>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
190 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
191 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
192 <when value="paired_iv">
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
193 <param name="fastq_input1" type="data" format="fastqsanger" label="Select fastq dataset" help="Specify dataset with interleaved reads"/>
4
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
194 <param name="iset_stats" type="text" optional="True" size="10" label="Enter mean, standard deviation, max, and min for insert lengths." help="-I; This parameter is only used for paired reads. Only mean is required while sd, max, and min will be inferred. Examples: both &quot;250&quot; and &quot;250,25&quot; will work while &quot;250,,10&quot; will not. See below for details.">
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
195 <sanitizer invalid_char="">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
196 <valid initial="string.digits"><add value=","/> </valid>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
197 </sanitizer>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
198 </param>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
199 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
200 </conditional>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
201
5
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
202 <expand macro="read_group_conditional" />
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
203
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
204 <conditional name="analysis_type">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
205 <param name="analysis_type_selector" type="select" label="Select analysis mode">
4
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
206 <option value="illumina">1.Simple Illumina mode</option>
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
207 <option value="pacbio">2.PacBio mode (-x pacbio)</option>
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
208 <option value="full">3.Full list of options</option>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
209 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
210 <when value="illumina">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
211 <!-- do nothing -->
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
212 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
213 <when value="pacbio">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
214 <!-- do nothing. all magic happens within <command> tag -->
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
215 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
216 <when value="full">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
217 <conditional name="algorithmic_options">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
218 <param name="algorithmic_options_selector" type="select" label="Set algorithmic options?" help="Sets -k, -w, -d, -r, -y, -c, -D, -W, -m, -S, -P, and -e options.">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
219 <option value="set">Set</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
220 <option value="do_not_set" selected="True">Do not set</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
221 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
222 <when value="set">
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
223 <param name="k" type="integer" value="19" label="Minimum seed length" help="-k; default=19"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
224 <param name="w" type="integer" value="100" label="Band width for banded alignment" help="-w; default=100"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
225 <param name="d" type="integer" value="100" label="Off-diagonal X-dropoff" help="-d; default=100"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
226 <param name="r" type="float" value="1.5" label="Look for internal seeds inside a seed longer than -k * THIS VALUE" help="-r; default=1.5; This is a key heuristic parameter for tuning the performance. Larger value yields fewer seeds, which leads to faster alignment speed but lower accuracy" />
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
227 <param name="y" type="integer" value="20" label="Seed occurrence for the 3rd round seeding" help="-y; default=20" />
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
228 <param name="c" type="integer" value="500" label="Skip seeds with more than that many occurrences" help="-c; default=500"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
229 <param name="D" type="float" value="0.5" label="Drop chains shorter than this fraction of the longest overlapping chain" help="-D; default=0.5"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
230 <param name="W" type="integer" value="0" label="Discard a chain if seeded bases shorter than THIS VALUE" help="-W; default=0"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
231 <param name="m" type="integer" value="50" label="Perform at most this many rounds of mate rescues for each read" help="-m; default=50"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
232 <param name="S" type="boolean" truevalue="-S" falsevalue="" label="Skip mate rescue" help="-S"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
233 <param name="P" type="boolean" truevalue="-P" falsevalue="" label="Skip pairing; mate rescue performed unless -S also in use" help="-P"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
234 <param name="e" type="boolean" truevalue="-e" falsevalue="" label="Discard full-length exact matches" help="-e"/>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
235 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
236 <when value="do_not_set">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
237 <!-- do nothing -->
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
238 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
239 </conditional>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
240
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
241 <conditional name="scoring_options">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
242 <param name="scoring_options_selector" type="select" label="Set scoring options?" help="Sets -A, -B, -O, -E, -L, and -U options.">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
243 <option value="set">Set</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
244 <option value="do_not_set" selected="True">Do not set</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
245 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
246 <when value="set">
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
247 <param name="A" type="integer" value="1" label="Score for a sequence match" help="-A; scales options -T, -d, -B, -O, -E, -L, and -U unless overridden; default=1"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
248 <param name="B" type="integer" value="4" label="Penalty for a mismatch" help="-B; default=4"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
249 <param name="O" type="text" value="6,6" label="Gap open penalties for deletions and insertions" help="-O; default=6,6">
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
250 <sanitizer invalid_char="">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
251 <valid initial="string.digits"><add value=","/> </valid>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
252 </sanitizer>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
253 </param>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
254 <param name="E" type="text" value="1,1" label="Gap extension penalties; a gap of size k cost &#39;-O + -E*k&#39;. If two numbers are specified, the first is the penalty of extending a deletion and the second for extending an insertion" help="-E; default=1,1">
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
255 <sanitizer invalid_char="">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
256 <valid initial="string.digits"><add value=","/> </valid>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
257 </sanitizer>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
258 </param>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
259 <param name="L" type="text" value="5,5" label="Penalties for 5&#39;-end and 3&#39;-end clipping" help="-L; default=5,5; When performing Smith-Waterman extension, BWA-MEM keeps track of the best score reaching the end of query. If this score is larger than the best Smith-Waterman score minus the clipping penalty, clipping will not be applied. Note that in this case, the SAM AS tag reports the best Smith-Waterman score; clipping penalty is not deducted">
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
260 <sanitizer invalid_char="">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
261 <valid initial="string.digits"><add value=","/> </valid>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
262 </sanitizer>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
263 </param>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
264 <param name="U" type="integer" value="17" label="Penalty for an unpaired read pair" help="-U; default=17"/>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
265 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
266 <when value="do_not_set">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
267 <!-- do nothing -->
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
268 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
269 </conditional>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
270
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
271 <conditional name="io_options">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
272 <param name="io_options_selector" type="select" label="Set input/output options" help="Sets -T, -h, -a, -C, -V, -Y, and -M options.">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
273 <option value="set">Set</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
274 <option value="do_not_set" selected="True">Do not set</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
275 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
276 <when value="set">
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
277 <param name="T" type="integer" value="30" label="Minimum score to output" help="-T; default=30"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
278 <param name="h" type="integer" value="5" label="If there are less than THIS VALUE hits with score &gt;80% of the max score, output them all in the XA tag" help="-h; default=5" />
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
279 <param name="a" type="boolean" truevalue="-a" falsevalue="" label="Output all alignments for single-ends or unpaired paired-ends" help="-a; These alignments will be flagged as secondary alignments"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
280 <param name="C" type="boolean" truevalue="-C" falsevalue="" label="Append FASTA/FASTQ comment to BAM output" help="-C"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
281 <param name="V" type="boolean" truevalue="-V" falsevalue="" label="Output the reference FASTA header in the XR tag" help="-V"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
282 <param name="Y" type="boolean" truevalue="-Y" falsevalue="" label="Use soft clipping for supplementary alignments" help="-Y; By default, BWA-MEM uses soft clipping for the primary alignment and hard clipping for supplementary alignments" />
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
283 <param name="M" type="boolean" truevalue="-M" falsevalue="" label="Mark shorter split hits of a chimeric alignment in the FLAG field as 'secondary alignment' instead of 'supplementary alignment'" help="-M; For Picard&lt;1.96 compatibility" />
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
284 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
285 <when value="do_not_set">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
286 <!-- do nothing -->
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
287 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
288 </conditional>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
289 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
290 </conditional>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
291 </inputs>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
292
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
293 <outputs>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
294 <data format="bam" name="bam_output" label="${tool.name} on ${on_string} (mapped reads in BAM format)"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
295 </outputs>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
296
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
297 <tests>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
298 <test>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
299 <param name="reference_source_selector" value="history" />
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
300 <param name="ref_file" ftype="fasta" value="bwa-mem-mt-genome.fa"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
301 <param name="fastq_input_selector" value="paired"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
302 <param name="fastq_input1" ftype="fastqsanger" value="bwa-mem-fastq1.fq"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
303 <param name="fastq_input2" ftype="fastqsanger" value="bwa-mem-fastq2.fq"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
304 <param name="analysis_type_selector" value="illumina"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
305 <output name="bam_output" ftype="bam" file="bwa-mem-test1.bam" lines_diff="2" />
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
306 </test>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
307 <test>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
308 <param name="reference_source_selector" value="history" />
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
309 <param name="ref_file" ftype="fasta" value="bwa-mem-mt-genome.fa"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
310 <param name="fastq_input_selector" value="paired"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
311 <param name="fastq_input1" ftype="fastqsanger" value="bwa-mem-fastq1.fq"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
312 <param name="fastq_input2" ftype="fastqsanger" value="bwa-mem-fastq2.fq"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
313 <param name="rg_selector" value="set"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
314 <param name="ID" value="rg1"/>
4
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
315 <param name="PL" value="CAPILLARY"/>
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
316 <param name="LB" value="AARDVARK-1" />
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
317 <param name="analysis_type_selector" value="illumina"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
318 <output name="bam_output" ftype="bam" file="bwa-mem-test2.bam" lines_diff="2" />
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
319 </test>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
320 </tests>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
321 <help>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
322 **What it does**
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
323
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
324 From http://arxiv.org/abs/1303.3997:
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
325
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
326 BWA-MEM is a new alignment algorithm for aligning sequence reads or long query sequences against a large reference genome such as human.
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
327 It automatically chooses between local and end-to-end alignments, supports paired-end reads and performs chimeric alignment.
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
328 The algorithm is robust to sequencing errors and applicable to a wide range of sequence lengths from 70bp to a few megabases.
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
329 For mapping 100bp sequences, BWA-MEM shows better performance than several state-of-art read aligners to date.
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
330
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
331 It is best suited for mapping long (>70 nt) reads against large reference genomes.
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
332
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
333 This Galaxy tool wraps the bwa-mem module of the bwa read mapping tool. The Galaxy implementation takes fastq files as input and produces output in BAM (not SAM) format, which can be further processed using various BAM utilities existing in Galaxy (BAMTools, SAMTools, Picard).
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
334
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
335 -----
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
336
4
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
337 **Indices: Selecting reference genomes for BWA**
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
338
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
339 Galaxy wrapper for BWA allows you to select between precomputed and user-defined indices for reference genomes using the **Will you select a reference genome from your history or use a built-in index?** flag. This flag has two options:
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
340
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
341 1. **Use a built-in genome index** - when selected (this is default), Galaxy provides the user with **Select reference genome index** dropdown. Genomes listed in this dropdown have been pre-indexed with bwa index utility and are ready to be mapped against.
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
342 2. **Use a genome from the history and build index** - when selected, Galaxy provides the user with **Select reference genome sequence** dropdown. This dropdown is populated by all FASTA formatted files listed in your current history. If your genome of interest is uploaded into history it will be shown there. Selecting a genome from this dropdown will cause Galaxy to first transparently index it using `bwa index` command, and then run mapping with `bwa mem`.
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
343
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
344 If your genome of interest is not listed here you have two choices:
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
345
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
346 1. Contact galaxy team using **Help->Support** link at the top of the interface and let us know that an index needs to be added
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
347 2. Upload your genome of interest as a FASTA file to Galaxy history and select the **Use a genome from the history and build index** option.
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
348
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
349 -----
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
350
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
351 **Galaxy-specific option**
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
352
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
353 Galaxy allows three levels of control over bwa-mem options provided by the **Select analysis mode** menu option. These are:
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
354
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
355 1. *Simple Illumina mode*: The simplest possible bwa mem application in which it aligns single or paired-end data to reference using default parameters. It is equivalent to the following command: bwa mem &lt;reference index&gt; &lt;fastq dataset1&gt; [fastq dataset2]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
356 2. *PacBio mode*: The mode adjusted specifically for mapping of long PacBio subreads. Equivalent to the following command: bwa mem -k17 -W40 -r10 -A1 -B1 -O1 -E1 -L0 &lt;reference index&gt; &lt;PacBio dataset in fastq format&gt;
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
357 3. *Full list of options*: Allows access to all options through Galaxy interface.
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
358
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
359 ------
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
360
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
361 **BWA MEM options**
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
362
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
363 Each Galaxy parameter widget corresponds to command line flags listed below:
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
364
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
365 Algorithm options::
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
366
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
367 -k INT minimum seed length [19]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
368 -w INT band width for banded alignment [100]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
369 -d INT off-diagonal X-dropoff [100]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
370 -r FLOAT look for internal seeds inside a seed longer than {-k} * FLOAT [1.5]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
371 -y INT find MEMs longer than {-k} * {-r} with size less than INT [0]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
372 -c INT skip seeds with more than INT occurrences [500]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
373 -D FLOAT drop chains shorter than FLOAT fraction of the longest overlapping chain [0.50]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
374 -W INT discard a chain if seeded bases shorter than INT [0]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
375 -m INT perform at most INT rounds of mate rescues for each read [50]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
376 -S skip mate rescue
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
377 -P skip pairing; mate rescue performed unless -S also in use
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
378 -e discard full-length exact matches
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
379
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
380 Scoring options::
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
381
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
382 -A INT score for a sequence match, which scales options -TdBOELU unless overridden [1]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
383 -B INT penalty for a mismatch [4]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
384 -O INT[,INT] gap open penalties for deletions and insertions [6,6]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
385 -E INT[,INT] gap extension penalty; a gap of size k cost '{-O} + {-E}*k' [1,1]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
386 -L INT[,INT] penalty for 5'- and 3'-end clipping [5,5]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
387 -U INT penalty for an unpaired read pair [17]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
388
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
389 Input/output options::
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
390
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
391 -p first query file consists of interleaved paired-end sequences
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
392 -R STR read group header line such as '@RG\tID:foo\tSM:bar' [null]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
393
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
394 -v INT verbose level: 1=error, 2=warning, 3=message, 4+=debugging [3]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
395 -T INT minimum score to output [30]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
396 -h INT if there are &lt;INT hits with score &gt;80% of the max score, output all in XA [5]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
397 -a output all alignments for SE or unpaired PE
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
398 -C append FASTA/FASTQ comment to SAM output
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
399 -V output the reference FASTA header in the XR tag
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
400 -Y use soft clipping for supplementary alignments
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
401 -M mark shorter split hits as secondary
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
402
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
403 -I FLOAT[,FLOAT[,INT[,INT]]]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
404 specify the mean, standard deviation (10% of the mean if absent), max
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
405 (4 sigma from the mean if absent) and min of the insert size distribution.
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
406 FR orientation only. [inferred]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
407
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
408 @dataset_collections@
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
409
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
410 @RG@
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
411
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
412 @info@
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
413 </help>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
414 <citations>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
415 <citation type="doi">10.1093/bioinformatics/btp324</citation>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
416 <citation type="doi">10.1093/bioinformatics/btp698</citation>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
417 <citation type="bibtex">@misc{1303.3997,
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
418 Author = {Heng Li},
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
419 Title = {Aligning sequence reads, clone sequences and assembly contigs with BWA-MEM},
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
420 Year = {2013},
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
421 Eprint = {arXiv:1303.3997},
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
422 url = {http://arxiv.org/abs/1303.3997},
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
423 }</citation>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
424 </citations>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
425 </tool>