annotate bwa-mem.xml @ 7:d8c9597bfb09 draft

planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bwa commit ddb8bdb9d62399f086b06b3469450d0aad2113bd
author devteam
date Tue, 03 Nov 2015 09:36:45 -0500
parents 09a7281d24c5
children 7bee165c3a44
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
1 <?xml version="1.0"?>
7
d8c9597bfb09 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bwa commit ddb8bdb9d62399f086b06b3469450d0aad2113bd
devteam
parents: 6
diff changeset
2 <tool id="bwa_mem" name="Map with BWA-MEM" version="0.4.1">
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
3 <description>- map medium and long reads (&gt; 100 bp) against reference genome</description>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
4 <macros>
5
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
5 <import>read_group_macros.xml</import>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
6 <import>bwa_macros.xml</import>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
7 </macros>
7
d8c9597bfb09 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bwa commit ddb8bdb9d62399f086b06b3469450d0aad2113bd
devteam
parents: 6
diff changeset
8 <expand macro="requirements" />
6
09a7281d24c5 planemo upload commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents: 5
diff changeset
9 <expand macro="stdio" />
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
10 <command>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
11 #set $reference_fasta_filename = "localref.fa"
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
12
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
13 #if str( $reference_source.reference_source_selector ) == "history":
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
14 ln -s "${reference_source.ref_file}" "${reference_fasta_filename}" &amp;&amp;
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
15
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
16 ## The following shell commands decide which of the BWA indexing algorithms (IS or BWTSW) will be run
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
17 ## depending on the size of the input FASTA dataset
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
18 (
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
19 size=`stat -c %s "${reference_fasta_filename}" 2&gt;/dev/null`; ## Linux
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
20 if [ $? -eq 0 ];
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
21 then
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
22 if [ "\$size" -lt 2000000000 ];
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
23 then
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
24 bwa index -a is "${reference_fasta_filename}";
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
25 echo "Generating BWA index with is algorithm";
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
26 else
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
27 bwa index -a bwtsw "${reference_fasta_filename}";
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
28 echo "Generating BWA index with bwtsw algorithm";
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
29 fi;
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
30 fi;
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
31
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
32 eval \$(stat -s "${reference_fasta_filename}" 2&gt;/dev/null); ## OSX
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
33 if [ -n "\$st_size" ];
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
34 then
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
35 if [ "\$st_size" -lt 2000000000 ];
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
36 then
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
37 bwa index -a is "${reference_fasta_filename}";
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
38 echo "Generating BWA index with is algorithm";
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
39 else
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
40 bwa index -a bwtsw "${reference_fasta_filename}";
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
41 echo "Generating BWA index with bwtsw algorithm";
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
42 fi;
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
43 fi;
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
44 ) &amp;&amp;
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
45
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
46 #else:
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
47 #set $reference_fasta_filename = str( $reference_source.ref_file.fields.path )
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
48 #end if
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
49
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
50 ## Begin BWA-MEM command line
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
51
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
52 bwa mem
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
53 -t "\${GALAXY_SLOTS:-1}"
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
54 -v 1 ## Verbosity is set to 1 (errors only)
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
55
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
56 #if str( $fastq_input.fastq_input_selector ) == "paired_iv": ## For interleaved fastq files set -p option
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
57 -p
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
58 #if str( $fastq_input.iset_stats ): ## check that insert statistics is used
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
59 -I "${fastq_input.iset_stats}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
60 #end if
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
61 #end if
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
62
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
63 #if str( $analysis_type.analysis_type_selector ) == "pacbio":
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
64 -x pacbio
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
65 #elif str( $analysis_type.analysis_type_selector ) == "full":
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
66 #if str( $analysis_type.algorithmic_options.algorithmic_options_selector ) == "set": ## Algorithmic options
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
67 -k "${analysis_type.algorithmic_options.k}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
68 -w "${analysis_type.algorithmic_options.w}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
69 -d "${analysis_type.algorithmic_options.d}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
70 -r "${analysis_type.algorithmic_options.r}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
71 -y "${analysis_type.algorithmic_options.y}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
72 -c "${analysis_type.algorithmic_options.c}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
73 -D "${analysis_type.algorithmic_options.D}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
74 -W "${analysis_type.algorithmic_options.W}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
75 -m "${analysis_type.algorithmic_options.m}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
76 ${analysis_type.algorithmic_options.S}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
77 ${analysis_type.algorithmic_options.P}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
78 ${analysis_type.algorithmic_options.e}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
79 #end if
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
80
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
81 #if str( $analysis_type.scoring_options.scoring_options_selector ) == "set": ## Scoring options
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
82 -A "${analysis_type.scoring_options.A}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
83 -B "${analysis_type.scoring_options.B}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
84 -O "${analysis_type.scoring_options.O}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
85 -E "${analysis_type.scoring_options.E}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
86 -L "${analysis_type.scoring_options.L}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
87 -U "${analysis_type.scoring_options.U}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
88 #end if
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
89
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
90 #if str( $analysis_type.io_options.io_options_selector ) == "set": ## IO options
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
91 -T "${analysis_type.io_options.T}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
92 -h "${analysis_type.io_options.h}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
93 ${analysis_type.io_options.a}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
94 ${analysis_type.io_options.C}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
95 ${analysis_type.io_options.V}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
96 ${analysis_type.io_options.Y}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
97 ${analysis_type.io_options.M}
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
98 #end if
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
99
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
100 #end if
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
101
5
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
102 ## Handle read group options...
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
103 @define_read_group_helpers@
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
104 #if str( $fastq_input.fastq_input_selector ) == "paired":
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
105 #set $rg_auto_name = $read_group_name_default($fastq_input.fastq_input1, $fastq_input.fastq_input2)
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
106 #else:
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
107 #set $rg_auto_name = $read_group_name_default($fastq_input.fastq_input1)
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
108 #end if
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
109 @set_use_rg_var@
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
110 @set_read_group_vars@
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
111 #if $use_rg
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
112 @set_rg_string@
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
113 -R '$rg_string'
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
114 #end if
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
115
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
116 #if str( $fastq_input.fastq_input_selector ) == "paired":
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
117 #if str( $fastq_input.iset_stats ): ## check that insert statistics is used
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
118 -I "${fastq_input.iset_stats}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
119 #end if
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
120
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
121 "${reference_fasta_filename}"
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
122 "${fastq_input.fastq_input1}" "${fastq_input.fastq_input2}"
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
123 #elif str( $fastq_input.fastq_input_selector ) == "paired_collection":
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
124 #if str( $fastq_input.iset_stats ): ## check that insert statistics is used
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
125 -I "${fastq_input.iset_stats}"
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
126 #end if
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
127
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
128 "${reference_fasta_filename}"
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
129 "${fastq_input.fastq_input1.forward}" "${fastq_input.fastq_input1.reverse}"
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
130 #else:
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
131 "${reference_fasta_filename}"
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
132 "${fastq_input.fastq_input1}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
133 #end if
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
134
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
135 | samtools view -Sb - > temporary_bam_file.bam &amp;&amp;
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
136
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
137 samtools sort -f temporary_bam_file.bam "${bam_output}"
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
138 </command>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
139
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
140 <inputs>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
141
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
142 <conditional name="reference_source">
4
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
143 <param name="reference_source_selector" type="select" label="Will you select a reference genome from your history or use a built-in index?" help="Built-ins were indexed using default options. See `Indexes` section of help below">
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
144 <option value="cached">Use a built-in genome index</option>
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
145 <option value="history">Use a genome from history and build index</option>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
146 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
147 <when value="cached">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
148 <param name="ref_file" type="select" label="Using reference genome" help="Select genome from the list">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
149 <options from_data_table="bwa_mem_indexes">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
150 <filter type="sort_by" column="2" />
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
151 <validator type="no_options" message="No indexes are available" />
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
152 </options>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
153 <validator type="no_options" message="A built-in reference genome is not available for the build associated with the selected input file"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
154 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
155 </when>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
156 <when value="history">
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
157 <param name="ref_file" type="data" format="fasta" label="Use the following dataset as the reference sequence" help="You can upload a FASTA sequence to the history and use it as reference" />
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
158 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
159 </conditional>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
160 <conditional name="fastq_input">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
161 <param name="fastq_input_selector" type="select" label="Single or Paired-end reads" help="Select between paired and single end data">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
162 <option value="paired">Paired</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
163 <option value="single">Single</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
164 <option value="paired_collection">Paired Collection</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
165 <option value="paired_iv">Paired Interleaved</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
166 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
167 <when value="paired">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
168 <param name="fastq_input1" type="data" format="fastqsanger" label="Select first set of reads" help="Specify dataset with forward reads"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
169 <param name="fastq_input2" type="data" format="fastqsanger" label="Select second set of reads" help="Specify dataset with reverse reads"/>
7
d8c9597bfb09 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bwa commit ddb8bdb9d62399f086b06b3469450d0aad2113bd
devteam
parents: 6
diff changeset
170 <param name="iset_stats" type="text" optional="True" label="Enter mean, standard deviation, max, and min for insert lengths." help="-I; This parameter is only used for paired reads. Only mean is required while sd, max, and min will be inferred. Examples: both &quot;250&quot; and &quot;250,25&quot; will work while &quot;250,,10&quot; will not. See below for details.">
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
171 <sanitizer invalid_char="">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
172 <valid initial="string.digits"><add value=","/> </valid>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
173 </sanitizer>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
174 </param>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
175 </when>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
176 <when value="single">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
177 <param name="fastq_input1" type="data" format="fastqsanger" label="Select fastq dataset" help="Specify dataset with single reads"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
178 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
179 <when value="paired_collection">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
180 <param name="fastq_input1" format="fastqsanger" type="data_collection" collection_type="paired" label="Select a paired collection" help="See help section for an explanation of dataset collections"/>
7
d8c9597bfb09 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bwa commit ddb8bdb9d62399f086b06b3469450d0aad2113bd
devteam
parents: 6
diff changeset
181 <param name="iset_stats" type="text" optional="True" label="Enter mean, standard deviation, max, and min for insert lengths." help="-I; This parameter is only used for paired reads. Only mean is required while sd, max, and min will be inferred. Examples: both &quot;250&quot; and &quot;250,25&quot; will work while &quot;250,,10&quot; will not. See below for details.">
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
182 <sanitizer invalid_char="">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
183 <valid initial="string.digits"><add value=","/> </valid>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
184 </sanitizer>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
185 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
186 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
187 <when value="paired_iv">
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
188 <param name="fastq_input1" type="data" format="fastqsanger" label="Select fastq dataset" help="Specify dataset with interleaved reads"/>
7
d8c9597bfb09 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bwa commit ddb8bdb9d62399f086b06b3469450d0aad2113bd
devteam
parents: 6
diff changeset
189 <param name="iset_stats" type="text" optional="True" label="Enter mean, standard deviation, max, and min for insert lengths." help="-I; This parameter is only used for paired reads. Only mean is required while sd, max, and min will be inferred. Examples: both &quot;250&quot; and &quot;250,25&quot; will work while &quot;250,,10&quot; will not. See below for details.">
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
190 <sanitizer invalid_char="">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
191 <valid initial="string.digits"><add value=","/> </valid>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
192 </sanitizer>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
193 </param>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
194 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
195 </conditional>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
196
5
fbf460831036 planemo upload commit d0e3412c58bd3bdc1a483a1e2f7f9c2aa5c87a1f-dirty
devteam
parents: 4
diff changeset
197 <expand macro="read_group_conditional" />
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
198
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
199 <conditional name="analysis_type">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
200 <param name="analysis_type_selector" type="select" label="Select analysis mode">
4
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
201 <option value="illumina">1.Simple Illumina mode</option>
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
202 <option value="pacbio">2.PacBio mode (-x pacbio)</option>
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
203 <option value="full">3.Full list of options</option>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
204 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
205 <when value="illumina">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
206 <!-- do nothing -->
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
207 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
208 <when value="pacbio">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
209 <!-- do nothing. all magic happens within <command> tag -->
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
210 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
211 <when value="full">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
212 <conditional name="algorithmic_options">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
213 <param name="algorithmic_options_selector" type="select" label="Set algorithmic options?" help="Sets -k, -w, -d, -r, -y, -c, -D, -W, -m, -S, -P, and -e options.">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
214 <option value="set">Set</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
215 <option value="do_not_set" selected="True">Do not set</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
216 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
217 <when value="set">
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
218 <param name="k" type="integer" value="19" label="Minimum seed length" help="-k; default=19"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
219 <param name="w" type="integer" value="100" label="Band width for banded alignment" help="-w; default=100"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
220 <param name="d" type="integer" value="100" label="Off-diagonal X-dropoff" help="-d; default=100"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
221 <param name="r" type="float" value="1.5" label="Look for internal seeds inside a seed longer than -k * THIS VALUE" help="-r; default=1.5; This is a key heuristic parameter for tuning the performance. Larger value yields fewer seeds, which leads to faster alignment speed but lower accuracy" />
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
222 <param name="y" type="integer" value="20" label="Seed occurrence for the 3rd round seeding" help="-y; default=20" />
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
223 <param name="c" type="integer" value="500" label="Skip seeds with more than that many occurrences" help="-c; default=500"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
224 <param name="D" type="float" value="0.5" label="Drop chains shorter than this fraction of the longest overlapping chain" help="-D; default=0.5"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
225 <param name="W" type="integer" value="0" label="Discard a chain if seeded bases shorter than THIS VALUE" help="-W; default=0"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
226 <param name="m" type="integer" value="50" label="Perform at most this many rounds of mate rescues for each read" help="-m; default=50"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
227 <param name="S" type="boolean" truevalue="-S" falsevalue="" label="Skip mate rescue" help="-S"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
228 <param name="P" type="boolean" truevalue="-P" falsevalue="" label="Skip pairing; mate rescue performed unless -S also in use" help="-P"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
229 <param name="e" type="boolean" truevalue="-e" falsevalue="" label="Discard full-length exact matches" help="-e"/>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
230 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
231 <when value="do_not_set">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
232 <!-- do nothing -->
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
233 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
234 </conditional>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
235
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
236 <conditional name="scoring_options">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
237 <param name="scoring_options_selector" type="select" label="Set scoring options?" help="Sets -A, -B, -O, -E, -L, and -U options.">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
238 <option value="set">Set</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
239 <option value="do_not_set" selected="True">Do not set</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
240 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
241 <when value="set">
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
242 <param name="A" type="integer" value="1" label="Score for a sequence match" help="-A; scales options -T, -d, -B, -O, -E, -L, and -U unless overridden; default=1"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
243 <param name="B" type="integer" value="4" label="Penalty for a mismatch" help="-B; default=4"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
244 <param name="O" type="text" value="6,6" label="Gap open penalties for deletions and insertions" help="-O; default=6,6">
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
245 <sanitizer invalid_char="">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
246 <valid initial="string.digits"><add value=","/> </valid>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
247 </sanitizer>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
248 </param>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
249 <param name="E" type="text" value="1,1" label="Gap extension penalties; a gap of size k cost &#39;-O + -E*k&#39;. If two numbers are specified, the first is the penalty of extending a deletion and the second for extending an insertion" help="-E; default=1,1">
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
250 <sanitizer invalid_char="">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
251 <valid initial="string.digits"><add value=","/> </valid>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
252 </sanitizer>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
253 </param>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
254 <param name="L" type="text" value="5,5" label="Penalties for 5&#39;-end and 3&#39;-end clipping" help="-L; default=5,5; When performing Smith-Waterman extension, BWA-MEM keeps track of the best score reaching the end of query. If this score is larger than the best Smith-Waterman score minus the clipping penalty, clipping will not be applied. Note that in this case, the SAM AS tag reports the best Smith-Waterman score; clipping penalty is not deducted">
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
255 <sanitizer invalid_char="">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
256 <valid initial="string.digits"><add value=","/> </valid>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
257 </sanitizer>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
258 </param>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
259 <param name="U" type="integer" value="17" label="Penalty for an unpaired read pair" help="-U; default=17"/>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
260 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
261 <when value="do_not_set">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
262 <!-- do nothing -->
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
263 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
264 </conditional>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
265
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
266 <conditional name="io_options">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
267 <param name="io_options_selector" type="select" label="Set input/output options" help="Sets -T, -h, -a, -C, -V, -Y, and -M options.">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
268 <option value="set">Set</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
269 <option value="do_not_set" selected="True">Do not set</option>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
270 </param>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
271 <when value="set">
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
272 <param name="T" type="integer" value="30" label="Minimum score to output" help="-T; default=30"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
273 <param name="h" type="integer" value="5" label="If there are less than THIS VALUE hits with score &gt;80% of the max score, output them all in the XA tag" help="-h; default=5" />
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
274 <param name="a" type="boolean" truevalue="-a" falsevalue="" label="Output all alignments for single-ends or unpaired paired-ends" help="-a; These alignments will be flagged as secondary alignments"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
275 <param name="C" type="boolean" truevalue="-C" falsevalue="" label="Append FASTA/FASTQ comment to BAM output" help="-C"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
276 <param name="V" type="boolean" truevalue="-V" falsevalue="" label="Output the reference FASTA header in the XR tag" help="-V"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
277 <param name="Y" type="boolean" truevalue="-Y" falsevalue="" label="Use soft clipping for supplementary alignments" help="-Y; By default, BWA-MEM uses soft clipping for the primary alignment and hard clipping for supplementary alignments" />
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
278 <param name="M" type="boolean" truevalue="-M" falsevalue="" label="Mark shorter split hits of a chimeric alignment in the FLAG field as 'secondary alignment' instead of 'supplementary alignment'" help="-M; For Picard&lt;1.96 compatibility" />
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
279 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
280 <when value="do_not_set">
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
281 <!-- do nothing -->
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
282 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
283 </conditional>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
284 </when>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
285 </conditional>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
286 </inputs>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
287
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
288 <outputs>
6
09a7281d24c5 planemo upload commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents: 5
diff changeset
289 <data format="bam" name="bam_output" label="${tool.name} on ${on_string} (mapped reads in BAM format)">
09a7281d24c5 planemo upload commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents: 5
diff changeset
290 <expand macro="dbKeyActionsBwaMem" />
09a7281d24c5 planemo upload commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents: 5
diff changeset
291 </data>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
292 </outputs>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
293
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
294 <tests>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
295 <test>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
296 <param name="reference_source_selector" value="history" />
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
297 <param name="ref_file" ftype="fasta" value="bwa-mem-mt-genome.fa"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
298 <param name="fastq_input_selector" value="paired"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
299 <param name="fastq_input1" ftype="fastqsanger" value="bwa-mem-fastq1.fq"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
300 <param name="fastq_input2" ftype="fastqsanger" value="bwa-mem-fastq2.fq"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
301 <param name="analysis_type_selector" value="illumina"/>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
302 <output name="bam_output" ftype="bam" file="bwa-mem-test1.bam" lines_diff="2" />
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
303 </test>
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
304 <test>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
305 <param name="reference_source_selector" value="history" />
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
306 <param name="ref_file" ftype="fasta" value="bwa-mem-mt-genome.fa"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
307 <param name="fastq_input_selector" value="paired"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
308 <param name="fastq_input1" ftype="fastqsanger" value="bwa-mem-fastq1.fq"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
309 <param name="fastq_input2" ftype="fastqsanger" value="bwa-mem-fastq2.fq"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
310 <param name="rg_selector" value="set"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
311 <param name="ID" value="rg1"/>
4
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
312 <param name="PL" value="CAPILLARY"/>
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
313 <param name="LB" value="AARDVARK-1" />
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
314 <param name="analysis_type_selector" value="illumina"/>
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
315 <output name="bam_output" ftype="bam" file="bwa-mem-test2.bam" lines_diff="2" />
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
316 </test>
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
317 </tests>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
318 <help>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
319 **What it does**
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
320
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
321 From http://arxiv.org/abs/1303.3997:
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
322
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
323 BWA-MEM is a new alignment algorithm for aligning sequence reads or long query sequences against a large reference genome such as human.
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
324 It automatically chooses between local and end-to-end alignments, supports paired-end reads and performs chimeric alignment.
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
325 The algorithm is robust to sequencing errors and applicable to a wide range of sequence lengths from 70bp to a few megabases.
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
326 For mapping 100bp sequences, BWA-MEM shows better performance than several state-of-art read aligners to date.
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
327
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
328 It is best suited for mapping long (>70 nt) reads against large reference genomes.
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
329
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
330 This Galaxy tool wraps the bwa-mem module of the bwa read mapping tool. The Galaxy implementation takes fastq files as input and produces output in BAM (not SAM) format, which can be further processed using various BAM utilities existing in Galaxy (BAMTools, SAMTools, Picard).
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
331
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
332 -----
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
333
4
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
334 **Indices: Selecting reference genomes for BWA**
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
335
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
336 The Galaxy wrapper for BWA allows you to select between precomputed and user-defined indices for reference genomes using the **Will you select a reference genome from your history or use a built-in index?** flag. This flag has two options:
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
337
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
338 1. **Use a built-in genome index** - when selected (this is default), Galaxy provides the user with **Select reference genome index** dropdown. Genomes listed in this dropdown have been pre-indexed with bwa index utility and are ready to be mapped against.
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
339 2. **Use a genome from the history and build index** - when selected, Galaxy provides the user with **Select reference genome sequence** dropdown. This dropdown is populated by all FASTA formatted files listed in your current history. If your genome of interest is uploaded into history it will be shown there. Selecting a genome from this dropdown will cause Galaxy to first transparently index it using `bwa index` command, and then run mapping with `bwa mem`.
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
340
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
341 If your genome of interest is not listed here you have two choices:
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
342
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
343 1. Contact the Galaxy team using the **Help->Support** link at the top of the interface and let us know that an index needs to be added
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
344 2. Upload your genome of interest as a FASTA file to your Galaxy history and select the **Use a genome from the history and build index** option.
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
345
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
346 -----
ac30bfd3e2a8 planemo upload commit a50a3947aebc8a1d11bac39599f4efd8ed9a3bd5
devteam
parents: 2
diff changeset
347
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
348 **Galaxy-specific option**
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
349
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
350 Galaxy allows three levels of control over bwa-mem options provided by the **Select analysis mode** menu option. These are:
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
351
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
352 1. *Simple Illumina mode*: The simplest possible bwa mem application, in which it aligns single or paired-end data to the reference using default parameters. It is equivalent to the following command: bwa mem &lt;reference index&gt; &lt;fastq dataset1&gt; [fastq dataset2]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
353 2. *PacBio mode*: The mode adjusted specifically for mapping of long PacBio subreads. Equivalent to the following command: bwa mem -k17 -W40 -r10 -A1 -B1 -O1 -E1 -L0 &lt;reference index&gt; &lt;PacBio dataset in fastq format&gt;
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
354 3. *Full list of options*: Allows access to all options through Galaxy interface.
2
e29bc5c169bc Uploaded
devteam
parents: 1
diff changeset
355
0
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
356 ------
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
357
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
358 **BWA MEM options**
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
359
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
360 Each Galaxy parameter widget corresponds to command line flags listed below:
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
361
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
362 Algorithm options::
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
363
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
364 -k INT minimum seed length [19]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
365 -w INT band width for banded alignment [100]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
366 -d INT off-diagonal X-dropoff [100]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
367 -r FLOAT look for internal seeds inside a seed longer than {-k} * FLOAT [1.5]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
368 -y INT find MEMs longer than {-k} * {-r} with size less than INT [0]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
369 -c INT skip seeds with more than INT occurrences [500]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
370 -D FLOAT drop chains shorter than FLOAT fraction of the longest overlapping chain [0.50]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
371 -W INT discard a chain if seeded bases shorter than INT [0]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
372 -m INT perform at most INT rounds of mate rescues for each read [50]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
373 -S skip mate rescue
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
374 -P skip pairing; mate rescue performed unless -S also in use
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
375 -e discard full-length exact matches
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
376
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
377 Scoring options::
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
378
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
379 -A INT score for a sequence match, which scales options -TdBOELU unless overridden [1]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
380 -B INT penalty for a mismatch [4]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
381 -O INT[,INT] gap open penalties for deletions and insertions [6,6]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
382 -E INT[,INT] gap extension penalty; a gap of size k cost '{-O} + {-E}*k' [1,1]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
383 -L INT[,INT] penalty for 5'- and 3'-end clipping [5,5]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
384 -U INT penalty for an unpaired read pair [17]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
385
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
386 Input/output options::
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
387
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
388 -p first query file consists of interleaved paired-end sequences
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
389 -R STR read group header line such as '@RG\tID:foo\tSM:bar' [null]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
390
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
391 -v INT verbose level: 1=error, 2=warning, 3=message, 4+=debugging [3]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
392 -T INT minimum score to output [30]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
393 -h INT if there are &lt;INT hits with score &gt;80% of the max score, output all in XA [5]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
394 -a output all alignments for SE or unpaired PE
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
395 -C append FASTA/FASTQ comment to SAM output
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
396 -V output the reference FASTA header in the XR tag
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
397 -Y use soft clipping for supplementary alignments
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
398 -M mark shorter split hits as secondary
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
399
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
400 -I FLOAT[,FLOAT[,INT[,INT]]]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
401 specify the mean, standard deviation (10% of the mean if absent), max
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
402 (4 sigma from the mean if absent) and min of the insert size distribution.
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
403 FR orientation only. [inferred]
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
404
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
405 @dataset_collections@
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
406
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
407 @RG@
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
408
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
409 @info@
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
410 </help>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
411 <citations>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
412 <citation type="doi">10.1093/bioinformatics/btp324</citation>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
413 <citation type="doi">10.1093/bioinformatics/btp698</citation>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
414 <citation type="bibtex">@misc{1303.3997,
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
415 Author = {Heng Li},
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
416 Title = {Aligning sequence reads, clone sequences and assembly contigs with BWA-MEM},
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
417 Year = {2013},
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
418 Eprint = {arXiv:1303.3997},
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
419 url = {http://arxiv.org/abs/1303.3997},
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
420 }</citation>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
421 </citations>
ff1ae217ccc2 Uploaded
devteam
parents:
diff changeset
422 </tool>