5
|
1 <tool id="bismark_bowtie" name="Bismark" version="0.10.2">
|
3
|
2 <!-- Wrapper compatible with Bismark version 0.10 -->
|
0
|
3 <description>bisulfite mapper (bowtie)</description>
|
|
4 <!--<version_command>bismark version</version_command>-->
|
|
5 <requirements>
|
|
6 <requirement type="set_environment">SCRIPT_PATH</requirement>
|
2
|
7 <requirement type="package" version="0.1.19">samtools</requirement>
|
0
|
8 <requirement type="package" version="0.12.8">bowtie</requirement>
|
|
9 </requirements>
|
4
|
10 <stdio> <!-- Rules Galaxy uses to decide whether a job run failed -->
|
|
11 <exit_code range="1:" /> <!-- open-ended range: exit codes 1 and above -->
|
|
12 <exit_code range=":-1" /> <!-- open-ended range: exit codes -1 and below -->
|
|
13 <regex match="Error:" /> <!-- flags tool output containing "Error:" -->
|
|
14 <regex match="Exception:" /> <!-- flags tool output containing "Exception:" -->
|
|
15 </stdio> <!-- NOTE(review): no level/source attributes are set, so Galaxy's defaults apply; confirm against the tool schema -->
|
0
|
16 <command interpreter="python">
|
4
|
17 <![CDATA[
|
0
|
18 bismark_wrapper.py
|
|
19
|
4
|
20 ##--bismark_path \$SCRIPT_PATH
|
0
|
21
|
|
22 ##
|
|
23 ## Bismark Genome Preparation, if desired.
|
|
24 ##
|
|
25
|
|
26 ## Handle reference file.
|
|
27 #if $refGenomeSource.genomeSource == "history":
|
|
28 --own-file=$refGenomeSource.ownFile
|
|
29 #else:
|
|
30 --indexes-path ${refGenomeSource.index.fields.path}
|
|
31 #end if
|
|
32
|
|
33
|
|
34 ##
|
|
35 ## Input parameters
|
|
36 ##
|
|
37
|
|
38
|
|
39 #if $singlePaired.sPaired == "single":
|
|
40 --single-paired $singlePaired.input_singles
|
|
41
|
|
42 #if $singlePaired.input_singles.ext == "fastqillumina":
|
|
43 --phred64-quals
|
|
44 --fastq
|
|
45 #elif $singlePaired.input_singles.ext == "fastqsanger":
|
|
46 --fastq
|
|
47 #elif $singlePaired.input_singles.ext == "fasta":
|
|
48 --fasta
|
|
49 #end if
|
|
50 #else:
|
|
51 --mate-paired
|
|
52 #set $mate1 = list()
|
|
53 #set $mate2 = list()
|
|
54 #for $mate_pair in $singlePaired.mate_list
|
|
55 $mate1.append( str($mate_pair.input_mate1) )
|
|
56 $mate2.append( str($mate_pair.input_mate2) )
|
|
57 #end for
|
|
58
|
|
59 --mate1 #echo ','.join($mate1)
|
|
60 --mate2 #echo ','.join($mate2)
|
|
61
|
4
|
62 #for $mate_pair in $singlePaired.mate_list:
|
|
63 #if $mate_pair.input_mate1.ext == "fastqillumina":
|
|
64 --phred64-quals
|
|
65 --fastq
|
|
66 #elif $mate_pair.input_mate1.ext == "fastqsanger":
|
|
67 --fastq
|
|
68 #elif $mate_pair.input_mate1.ext == "fasta":
|
|
69 --fasta
|
|
70 #end if
|
|
71 #break
|
|
72 #end for
|
0
|
73
|
|
74 -I $singlePaired.minInsert
|
|
75 -X $singlePaired.maxInsert
|
|
76 #end if
|
|
77
|
|
78
|
|
79 ## for now hardcode the value for the required memory per thread in --best mode
|
|
80 --chunkmbs 512
|
|
81
|
|
82
|
|
83 #if $params.settingsType == "custom":
|
|
84
|
|
85 ## default 28 (the seed_len form default; Bowtie 1 seed length)
|
|
86 --seed-len $params.seed_len
|
|
87 ## Bismark default is 1 for Bowtie 1 (see help); the form preselects 2
|
|
88 --seed-mismatches $params.seed_mismatches
|
|
89
|
|
90 ## default 70
|
|
91 ##--maqerr $params.maqerr
|
|
92
|
|
93 ## default unlimited
|
|
94 #if $params.qupto != 0:
|
|
95 --qupto $params.qupto
|
|
96 #end if
|
|
97 #if $params.skip_reads != 0:
|
|
98 --skip-reads $params.skip_reads
|
|
99 #end if
|
|
100
|
|
101 #if $params.bismark_stdout:
|
|
102 --stdout $output_stdout
|
|
103 #end if
|
|
104
|
|
105 #if $params.isReportOutput:
|
|
106 --output-report-file $report_file
|
|
107 #end if
|
|
108
|
|
109 #end if
|
|
110
|
|
111 ##
|
|
112 ## Output parameters.
|
|
113 ##
|
|
114 --output $output
|
|
115 ##$suppress_header
|
|
116
|
|
117 #if str( $singlePaired.sPaired ) == "single"
|
|
118 #if $output_unmapped_reads_l
|
|
119 --output-unmapped-reads $output_unmapped_reads_l
|
|
120 #end if
|
|
121 #if $output_suppressed_reads_l
|
|
122 --output-suppressed-reads $output_suppressed_reads_l
|
|
123 #end if
|
|
124 #else
|
|
125 #if $output_unmapped_reads_l and $output_unmapped_reads_r
|
|
126 --output-unmapped-reads-l $output_unmapped_reads_l
|
|
127 --output-unmapped-reads-r $output_unmapped_reads_r
|
|
128 #end if
|
|
## Paired-end: pass the suppressed-read files only when BOTH mate outputs exist
## (the condition previously tested the left output twice and never the right one).
129 #if $output_suppressed_reads_l and $output_suppressed_reads_r
|
|
130 --output-suppressed-reads-l $output_suppressed_reads_l
|
|
131 --output-suppressed-reads-r $output_suppressed_reads_r
|
|
132 #end if
|
|
133 #end if
|
|
134
|
4
|
135 ]]>
|
0
|
136 </command>
|
|
137 <inputs>
|
|
138 <conditional name="refGenomeSource">
|
|
139 <param name="genomeSource" type="select" label="Will you select a reference genome from your history or use a built-in index?" help="Built-ins were indexed using default options">
|
|
140 <option value="indexed">Use a built-in index</option>
|
|
141 <option value="history">Use one from the history</option>
|
|
142 </param>
|
|
143 <when value="indexed">
|
|
144 <param name="index" type="select" label="Select a reference genome" help="If your genome of interest is not listed, contact your Galaxy admin.">
|
|
145 <options from_data_table="bowtie_indexes">
|
|
146 <filter type="sort_by" column="2"/>
|
|
147 <validator type="no_options" message="No indexes are available for the selected input dataset"/>
|
|
148 </options>
|
|
149 </param>
|
|
150 </when> <!-- build-in -->
|
|
151 <when value="history">
|
|
152 <param name="ownFile" type="data" format="fasta" metadata_name="dbkey" label="Select the reference genome" />
|
|
153 </when> <!-- history -->
|
|
154 </conditional> <!-- refGenomeSource -->
|
|
155
|
|
156 <!-- Input Parameters -->
|
|
157 <conditional name="singlePaired">
|
|
158 <param name="sPaired" type="select" label="Is this library mate-paired?">
|
|
159 <option value="single">Single-end</option>
|
|
160 <option value="paired">Paired-end</option>
|
|
161 </param>
|
|
162 <when value="single">
|
|
163 <param name="input_singles" type="data" format="fastqsanger,fastqillumina,fastq,fasta" label="FASTQ/FASTA file" help="FASTQ or FASTA files." />
|
|
164 </when>
|
|
165 <when value="paired">
|
|
166 <repeat name="mate_list" title="Paired End Pairs" min="1">
|
|
167 <param name="input_mate1" type="data" format="fastqsanger,fastqillumina,fastq,fasta" label="Mate pair 1" help="FASTQ or FASTA files." />
|
|
168 <param name="input_mate2" type="data" format="fastqsanger,fastqillumina,fastq,fasta" label="Mate pair 2" help="FASTQ or FASTA files." />
|
|
169 </repeat>
|
|
170 <param name="minInsert" type="integer" value="0" label="Minimum insert size for valid paired-end alignments" />
|
|
171 <param name="maxInsert" type="integer" value="500" label="Maximum insert size for valid paired-end alignments" />
|
|
172 </when>
|
|
173 </conditional>
|
|
174
|
|
175
|
|
176 <conditional name="params">
|
|
177 <param name="settingsType" type="select" label="Bismark settings to use" help="You can use the default settings or set custom values for any of Bismark's parameters.">
|
|
178 <option value="default">Use Defaults</option>
|
|
179 <option value="custom">Full parameter list</option>
|
|
180 </param>
|
|
181 <when value="default" />
|
|
182 <!-- Full/advanced params. -->
|
|
183 <when value="custom">
|
|
184 <!-- -n -->
|
|
185 <param name="seed_mismatches" type="select" label="The maximum number of mismatches permitted in the 'seed'">
|
|
186 <option value="0">0</option>
|
|
187 <option value="1">1</option>
|
|
188 <option value="2" selected="true">2</option>
|
|
189 <option value="3">3</option>
|
|
190 </param>
|
|
191 <!-- -l -->
|
|
192 <param name="seed_len" type="integer" value="28" label="The 'seed length'; The number of bases of the high quality end of the read to which the maximum number of mismatches applies" />
|
|
193 <!--
|
|
194 <param name="maqerr" type="integer" value="70" label="Maximum permitted total of quality values at all mismatched read positions throughout the entire alignment, not just in the 'seed'." />
|
|
195 -->
|
|
196 <param name="qupto" type="integer" value="0" label="Only aligns the first N reads or read pairs from the input" help="Default is 0 and means 'no-limit'." />
|
|
197 <param name="skip_reads" type="integer" value="0" label="Skip (i.e. do not align) the first N reads or read pairs from the input" />
|
|
198
|
|
199 <param name="suppressed_read_file" type="boolean" truevalue="true" falsevalue="false" checked="false" label="Write ambiguous reads to an extra output file" help="Write all reads which produce more than one valid alignment with the same number of lowest mismatches or other reads that fail to align uniquely." />
|
|
200 <param name="unmapped_read_file" type="boolean" truevalue="true" falsevalue="false" checked="false" label="Write all reads that could not be aligned to a file" />
|
|
201 <!-- output Options -->
|
|
202 <param name="bismark_stdout" type="boolean" truevalue="true" falsevalue="false" checked="false" label="Write the bismark output and summary information to an extra file" />
|
|
203 <param name="isReportOutput" type="boolean" truevalue="true" falsevalue="false" checked="false" label="Offer all report files concatenated in one file" />
|
4
|
204 <!--end output options -->
|
0
|
205 </when> <!-- full -->
|
|
206 </conditional> <!-- params -->
|
|
207 <!--
|
|
208 <param name="suppress_header" type="boolean" truevalue="..suppress-header" falsevalue="" checked="false" label="Suppress the header in the output SAM file" help="Bowtie produces SAM with several lines of header information by default." />
|
|
209 -->
|
|
210 </inputs>
|
|
211 <outputs>
|
|
212 <data format="txt" name="report_file" label="${tool.name} on ${on_string}: Report">
|
|
213 <filter>
|
|
214 ((
|
|
215 params['settingsType'] == "custom" and
|
|
216 params['isReportOutput'] is True
|
|
217 ))
|
|
218 </filter>
|
|
219 </data>
|
|
220 <data format="txt" name="output_stdout" label="${tool.name} on ${on_string}: Summary">
|
|
221 <filter>
|
|
222 ((
|
|
223 params['settingsType'] == "custom" and
|
|
224 params['bismark_stdout'] is True
|
|
225 ))
|
|
226 </filter>
|
|
227 </data>
|
|
228
|
|
229 <data format="bam" name="output" label="${tool.name} on ${on_string}: mapped reads">
|
|
230 <actions>
|
|
231 <conditional name="refGenomeSource.genomeSource">
|
|
232 <when value="indexed">
|
|
233 <action type="metadata" name="dbkey">
|
|
234 <option type="from_data_table" name="bowtie_indexes" column="1" offset="0"> <!-- same data table the "index" select is populated from; this wrapper uses Bowtie 1 indexes, not bowtie2_indexes -->
|
|
235 <filter type="param_value" column="0" value="#" compare="startswith" keep="False"/> <!-- discard rows whose column 0 starts with "#" -->
|
|
236 <filter type="param_value" ref="refGenomeSource.index" column="0"/> <!-- keep the row whose column 0 equals the selected index -->
|
|
237 </option>
|
|
238 </action>
|
|
239 </when>
|
|
240 <when value="history">
|
|
241 <action type="metadata" name="dbkey">
|
|
242 <option type="from_param" name="refGenomeSource.ownFile" param_attribute="dbkey" />
|
|
243 </action>
|
|
244 </when>
|
|
245 </conditional>
|
|
246 </actions>
|
|
247 </data>
|
|
248
|
|
249 <data format="fastq" name="output_suppressed_reads_l" label="${tool.name} on ${on_string}: suppressed reads (L)">
|
|
250 <filter>
|
|
251 ((
|
|
252 params['settingsType'] == "custom" and
|
|
253 params['suppressed_read_file'] is True
|
|
254 ))
|
|
255 </filter>
|
|
256 <actions>
|
|
257 <conditional name="singlePaired.sPaired">
|
|
258 <when value="single">
|
|
259 <action type="format">
|
|
260 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" />
|
|
261 </action>
|
|
262 </when>
|
|
263 <when value="paired">
|
4
|
264 <!--action type="format">
|
0
|
265 <option type="from_param" name="singlePaired.mate_list[0].input_mate1" param_attribute="ext" />
|
4
|
266 </action-->
|
0
|
267 </when>
|
|
268 </conditional>
|
|
269 </actions>
|
|
270 </data>
|
|
271
|
|
272 <data format="fastq" name="output_suppressed_reads_r" label="${tool.name} on ${on_string}: suppressed reads (R)">
|
|
273 <filter>singlePaired['sPaired'] == "paired"</filter>
|
|
274 <filter>params['settingsType'] == "custom"</filter>
|
|
275 <filter>params['supressed_read_file'] is True</filter>
|
|
276 <actions>
|
|
277 <conditional name="singlePaired.sPaired">
|
|
278 <when value="single">
|
|
279 <action type="format">
|
|
280 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" />
|
|
281 </action>
|
|
282 </when>
|
|
283 <when value="paired">
|
4
|
284 <!--action type="format">
|
0
|
285 <option type="from_param" name="singlePaired.mate_list[0].input_mate1" param_attribute="ext" />
|
4
|
286 </action-->
|
0
|
287 </when>
|
|
288 </conditional>
|
|
289 </actions>
|
|
290 </data>
|
|
291
|
|
292 <!-- Output unmapped reads -->
|
|
293 <data format="fastq" name="output_unmapped_reads_l" label="${tool.name} on ${on_string}: unmapped reads (L)">
|
|
294 <filter>
|
|
295 ((
|
|
296 params['settingsType'] == "custom" and
|
|
297 params['unmapped_read_file'] is True
|
|
298 ))
|
|
299 </filter>
|
|
300 <actions>
|
|
301 <conditional name="singlePaired.sPaired">
|
|
302 <when value="single">
|
|
303 <action type="format">
|
|
304 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" />
|
|
305 </action>
|
|
306 </when>
|
|
307 <when value="paired">
|
4
|
308 <!--action type="format">
|
0
|
309 <option type="from_param" name="singlePaired.mate_list[0].input_mate1" param_attribute="ext" />
|
4
|
310 </action-->
|
0
|
311 </when>
|
|
312 </conditional>
|
|
313 </actions>
|
|
314 </data>
|
|
315 <data format="fastq" name="output_unmapped_reads_r" label="${tool.name} on ${on_string}: unmapped reads (R)">
|
|
316 <filter>singlePaired['sPaired'] == "paired"</filter>
|
|
317 <filter>params['settingsType'] == "custom"</filter>
|
|
318 <filter>params['unmapped_read_file'] is True</filter>
|
|
319 <actions>
|
|
320 <conditional name="singlePaired.sPaired">
|
|
321 <when value="single">
|
|
322 <action type="format">
|
|
323 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" />
|
|
324 </action>
|
|
325 </when>
|
|
326 <when value="paired">
|
4
|
327 <!--action type="format">
|
0
|
328 <option type="from_param" name="singlePaired.mate_list[0].input_mate1" param_attribute="ext" />
|
4
|
329 </action-->
|
0
|
330 </when>
|
|
331 </conditional>
|
|
332 </actions>
|
|
333 </data>
|
|
334 </outputs>
|
|
335
|
|
336 <tests>
|
|
337 </tests>
|
|
338
|
|
339 <help>
|
4
|
340 <![CDATA[
|
0
|
341
|
|
342 **What it does**
|
|
343
|
|
344 Bismark_ is a bisulfite mapper and methylation caller. Bismark takes in FastA or FastQ files and aligns the
|
|
345 reads to a specified bisulfite genome. Sequence reads are transformed into a bisulfite converted forward strand
|
|
346 version (C->T conversion) or into a bisulfite treated reverse strand (G->A conversion of the forward strand).
|
|
347 Each of these reads is then aligned to a bisulfite treated forward strand index of a reference genome
|
|
348 (C->T converted) and a bisulfite treated reverse strand index of the genome (G->A conversion of the
|
|
349 forward strand, by doing this alignments will produce the same positions). These 4 instances of Bowtie (1 or 2)
|
|
350 are run in parallel. The sequence file(s) are then read in again sequence by sequence to pull out the original
|
|
351 sequence from the genome and determine if there were any protected C's present or not.
|
|
352
|
|
353 .. _Bismark: http://www.bioinformatics.babraham.ac.uk/projects/bismark/
|
|
354
|
|
355 As of version 0.7.0 Bismark will only run 2 alignment threads for OT and OB in parallel, the 4 strand mode can be
|
|
356 re-enabled by using non_directional mode.
|
|
357
|
|
358 It is developed by Krueger F and Andrews SR. at the Babraham Institute. Krueger F, Andrews SR. (2011) Bismark: a flexible aligner and methylation caller for Bisulfite-Seq applications. Bioinformatics, 27, 1571-2.
|
|
359
|
|
360 ------
|
|
361
|
|
362 **Know what you are doing**
|
|
363
|
|
364 .. class:: warningmark
|
|
365
|
|
366 There is no such thing (yet) as an automated gearshift in short read mapping. It is all like stick-shift driving in San Francisco. In other words = running this tool with default parameters will probably not give you meaningful results. A way to deal with this is to **understand** the parameters by carefully reading the `documentation`__ and experimenting. Fortunately, Galaxy makes experimenting easy.
|
|
367
|
|
368 .. __: http://www.bioinformatics.babraham.ac.uk/projects/bismark/
|
|
369
|
|
370
|
|
371 .. class:: warningmark
|
|
372
|
|
373 Make sure all your input reads are in the same, correct format. If that's not the case, please adjust/convert the filetype with Galaxy's built-in converters.
|
|
374
|
|
375 ------
|
|
376
|
|
377 **Input formats**
|
|
378
|
|
379 Bismark accepts files in either Sanger FASTQ format (galaxy type *fastqsanger*), Illumina FASTQ format (galaxy type *fastqillumina*) or FASTA format (galaxy type *fasta*). Use the FASTQ Groomer to prepare your files.
|
|
380
|
|
381 ------
|
|
382
|
|
383 **A Note on Built-in Reference Genomes**
|
|
384
|
|
385 The default variant for all genomes is "Full", defined as all primary chromosomes (or scaffolds/contigs) including mitochondrial plus associated unmapped, plasmid, and other segments. When only one version of a genome is available in this tool, it represents the default "Full" variant. Some genomes will have more than one variant available. The "Canonical Male" or sometimes simply "Canonical" variant contains the primary chromosomes for a genome. For example a human "Canonical" variant contains chr1-chr22, chrX, chrY, and chrM. The "Canonical Female" variant contains the primary chromosomes excluding chrY.
|
|
386
|
|
387 ------
|
|
388
|
|
389 The final output of Bismark is in SAM format by default; this Galaxy tool stores the mapped reads as a BAM dataset.
|
|
390
|
|
391 **Outputs**
|
|
392
|
|
393 The output is in SAM format, and has the following columns::
|
|
394
|
|
395 Column Description
|
|
396 -------- --------------------------------------------------------
|
|
397 1 QNAME seq-ID
|
4
|
398 2 FLAG this flag tries to take the strand a bisulfite read
|
|
399 originated from into account
|
0
|
400 (this is different from ordinary DNA alignment flags!)
|
|
401 3 RNAME chromosome
|
|
402 4 POS start position
|
|
403 5 MAPQ always 255
|
|
404 6 CIGAR extended CIGAR string
|
|
405 7 MRNM Mate Reference sequence NaMe ('=' if same as RNAME)
|
|
406 8 MPOS 1-based Mate POSition
|
|
407 9 ISIZE Inferred insert SIZE
|
|
408 10 SEQ query SEQuence on the same strand as the reference
|
|
409 11 QUAL Phred33 scale
|
|
410 12 NM-tag edit distance to the reference
|
4
|
411 13 XX-tag base-by-base mismatches to the reference.
|
0
|
412 This does not include indels.
|
|
413 14 XM-tag methylation call string
|
|
414 15 XR-tag read conversion state for the alignment
|
|
415 16 XG-tag genome conversion state for the alignment
|
4
|
416
|
0
|
417
|
|
418 Each read of paired-end alignments is written out in a separate line in the above format.
|
|
419
|
|
420
|
|
421 It looks like this (scroll sideways to see the entire example)::
|
|
422
|
|
423 QNAME FLAG RNAME POS MAPQ CIGAR MRNM MPOS ISIZE SEQ QUAL OPT
|
|
424 HWI-EAS91_1_30788AAXX:1:1:1761:343 4 * 0 0 * * 0 0 AAAAAAANNAAAAAAAAAAAAAAAAAAAAAAAAAAACNNANNGAGTNGNNNNNNNGCTTCCCACAGNNCTGG hhhhhhh;;hhhhhhhhhhh^hOhhhhghhhfhhhgh;;h;;hhhh;h;;;;;;;hhhhhhghhhh;;Phhh
|
|
425 HWI-EAS91_1_30788AAXX:1:1:1578:331 4 * 0 0 * * 0 0 GTATAGANNAATAAGAAAAAAAAAAATGAAGACTTTCNNANNTCTGNANNNNNNNTCTTTTTTCAGNNGTAG hhhhhhh;;hhhhhhhhhhhhhhhhhhhhhhhhhhhh;;h;;hhhh;h;;;;;;;hhhhhhhhhhh;;hhVh
|
|
426
|
|
427 -------
|
|
428
|
|
429 **Bismark settings**
|
|
430
|
|
431 All of the options have a default value. You can change any of them. If any Bismark function is missing please contact the tool author or your Galaxy admin.
|
|
432
|
|
433 ------
|
|
434
|
|
435 **Bismark parameter list**
|
|
436
|
|
437 This is an exhaustive list of Bismark options.
|
|
438
|
|
439 Input::
|
|
440
|
|
441 --singles A comma- or space-separated list of files containing the reads to be aligned (e.g.
|
|
442 lane1.fq,lane2.fq lane3.fq). Reads may be a mix of different lengths. Bismark will
|
|
443 produce one mapping result and one report file per input file.
|
|
444
|
|
445 -1 mates1 Comma-separated list of files containing the #1 mates (filename usually includes
|
|
446 "_1"), e.g. flyA_1.fq,flyB_1.fq). Sequences specified with this option must
|
|
447 correspond file-for-file and read-for-read with those specified in mates2.
|
|
448 Reads may be a mix of different lengths. Bismark will produce one mapping result
|
|
449 and one report file per paired-end input file pair.
|
|
450
|
|
451 -2 mates2 Comma-separated list of files containing the #2 mates (filename usually includes
|
|
452 "_2"), e.g. flyA_2.fq,flyB_2.fq). Sequences specified with this option must
|
|
453 correspond file-for-file and read-for-read with those specified in mates1.
|
|
454 Reads may be a mix of different lengths.
|
|
455
|
|
456 -q/--fastq The query input files (specified as mate1,mate2 or singles) are FASTQ
|
|
457 files (usually having extension .fq or .fastq). This is the default. See also
|
|
458 --solexa-quals.
|
|
459
|
|
460 -f/--fasta The query input files (specified as mate1,mate2 or singles) are FASTA
|
|
461 files (usually having extension .fa, .mfa, .fna or similar). All quality values
|
|
462 are assumed to be 40 on the Phred scale.
|
|
463
|
|
464 -s/--skip INT Skip (i.e. do not align) the first INT reads or read pairs from the input.
|
|
465
|
|
466 -u/--upto INT Only aligns the first INT reads or read pairs from the input. Default: no limit.
|
|
467
|
|
468 --phred33-quals FASTQ qualities are ASCII chars equal to the Phred quality plus 33. Default: on.
|
|
469
|
|
470 --phred64-quals FASTQ qualities are ASCII chars equal to the Phred quality plus 64. Default: off.
|
|
471
|
|
472 --solexa-quals Convert FASTQ qualities from solexa-scaled (which can be negative) to phred-scaled
|
4
|
473 (which can't). The formula for conversion is:
|
0
|
474 phred-qual = 10 * log(1 + 10 ** (solexa-qual/10.0)) / log(10). Used with -q. This
|
|
475 is usually the right option for use with (unconverted) reads emitted by the GA
|
|
476 Pipeline versions prior to 1.3. Works only for Bowtie 1. Default: off.
|
|
477
|
|
478 --solexa1.3-quals Same as --phred64-quals. This is usually the right option for use with (unconverted)
|
|
479 reads emitted by GA Pipeline version 1.3 or later. Default: off.
|
|
480
|
|
481
|
|
482 Alignment::
|
|
483
|
|
484 -n/--seedmms INT The maximum number of mismatches permitted in the "seed", i.e. the first L base pairs
|
4
|
485 of the read (where L is set with -l/--seedlen). This may be 0, 1, 2 or 3 and the
|
0
|
486 default is 1. This option is only available for Bowtie 1 (for Bowtie 2 see -N).
|
|
487
|
|
488 -l/--seedlen The "seed length"; i.e., the number of bases of the high quality end of the read to
|
|
489 which the -n ceiling applies. The default is 28. Bowtie (and thus Bismark) is faster for
|
|
490 larger values of -l. This option is only available for Bowtie 1 (for Bowtie 2 see -L).
|
|
491
|
|
492 -e/--maqerr INT Maximum permitted total of quality values at all mismatched read positions throughout
|
|
493 the entire alignment, not just in the "seed". The default is 70. Like Maq, bowtie rounds
|
|
494 quality values to the nearest 10 and saturates at 30. This value is not relevant for
|
|
495 Bowtie 2.
|
|
496
|
|
497 --chunkmbs INT The number of megabytes of memory a given thread is given to store path descriptors in
|
|
498 --best mode. Best-first search must keep track of many paths at once to ensure it is
|
|
499 always extending the path with the lowest cumulative cost. Bowtie tries to minimize the
|
|
500 memory impact of the descriptors, but they can still grow very large in some cases. If
|
|
501 you receive an error message saying that chunk memory has been exhausted in --best mode,
|
|
502 try adjusting this parameter up to dedicate more memory to the descriptors. This value
|
|
503 is not relevant for Bowtie 2. Default: 512.
|
|
504
|
|
505 -I/--minins INT The minimum insert size for valid paired-end alignments. E.g. if -I 60 is specified and
|
|
506 a paired-end alignment consists of two 20-bp alignments in the appropriate orientation
|
|
507 with a 20-bp gap between them, that alignment is considered valid (as long as -X is also
|
|
508 satisfied). A 19-bp gap would not be valid in that case. Default: 0.
|
|
509
|
|
510 -X/--maxins INT The maximum insert size for valid paired-end alignments. E.g. if -X 100 is specified and
|
|
511 a paired-end alignment consists of two 20-bp alignments in the proper orientation with a
|
|
512 60-bp gap between them, that alignment is considered valid (as long as -I is also satisfied).
|
|
513 A 61-bp gap would not be valid in that case. Default: 500.
|
|
514
|
|
515
|
|
516
|
|
517 Output::
|
|
518
|
|
519 --non_directional The sequencing library was constructed in a non strand-specific manner, alignments to all four
|
|
520 bisulfite strands will be reported. Default: OFF.
|
|
521
|
|
522 (The current Illumina protocol for BS-Seq is directional, in which case the strands complementary
|
|
523 to the original strands are merely theoretical and should not exist in reality. Specifying directional
|
|
524 alignments (which is the default) will only run 2 alignment threads to the original top (OT)
|
|
525 or bottom (OB) strands in parallel and report these alignments. This is the recommended option
|
|
526 for strand-specific libraries).
|
|
527
|
|
528 --sam-no-hd Suppress SAM header lines (starting with @). This might be useful when very large input files are
|
|
529 split up into several smaller files to run concurrently and the output files are to be merged.
|
|
530
|
|
531 --quiet Print nothing besides alignments.
|
|
532
|
|
533 --vanilla Performs bisulfite mapping with Bowtie 1 and prints the 'old' output (as in Bismark 0.5.X) instead
|
|
534 of SAM format output.
|
|
535
|
|
536 -un/--unmapped Write all reads that could not be aligned to a file in the output directory. Written reads will
|
|
537 appear as they did in the input, without any translation of quality values that may have
|
|
538 taken place within Bowtie or Bismark. Paired-end reads will be written to two parallel files with _1
|
|
539 and _2 inserted in their filenames, i.e. _unmapped_reads_1.txt and _unmapped_reads_2.txt. Reads
|
|
540 with more than one valid alignment with the same number of lowest mismatches (ambiguous mapping)
|
|
541 are also written to _unmapped_reads.txt unless the option --ambiguous is specified as well.
|
|
542
|
|
543 --ambiguous Write all reads which produce more than one valid alignment with the same number of lowest
|
|
544 mismatches or other reads that fail to align uniquely to a file in the output directory.
|
|
545 Written reads will appear as they did in the input, without any of the translation of quality
|
|
546 values that may have taken place within Bowtie or Bismark. Paired-end reads will be written to two
|
|
547 parallel files with _1 and _2 inserted in their filenames, i.e. _ambiguous_reads_1.txt and
|
|
548 _ambiguous_reads_2.txt. These reads are not written to the file specified with --un.
|
|
549
|
|
550 -o/--output_dir DIR Write all output files into this directory. By default the output files will be written into
|
|
551 the same folder as the input file(s). If the specified folder does not exist, Bismark will attempt
|
|
552 to create it first. The path to the output folder can be either relative or absolute.
|
|
553
|
|
554 --temp_dir DIR Write temporary files to this directory instead of into the same directory as the input files. If
|
|
555 the specified folder does not exist, Bismark will attempt to create it first. The path to the
|
|
556 temporary folder can be either relative or absolute.
|
|
557
|
4
|
558 ]]>
|
0
|
559 </help>
|
4
|
560 <citations>
|
|
561 <citation type="doi">10.1093/bioinformatics/btr167</citation>
|
|
562 </citations>
|
0
|
563 </tool>
|