comparison vsearch_macros.xml @ 0:fae6527990af draft

Imported from capsule None
author iuc
date Thu, 21 May 2015 03:58:09 -0400
parents
children 8c4e2933a17a
comparison
equal deleted inserted replaced
-1:000000000000 0:fae6527990af
1 <macros>
<!-- Package dependency shared by every vsearch wrapper. The version comes from
     the @VERSION@ token defined in this file, so the requirement and the
     advertised tool version cannot drift apart. -->
2 <xml name="requirements">
3 <requirements>
4 <requirement type="package" version="@VERSION@">vsearch</requirement>
5 </requirements>
6 </xml>
<!-- Reports the installed vsearch version: takes the first line of the version
     banner, keeps its second whitespace-separated field and strips the comma.
     stderr is merged into stdout because the banner is expected on stderr.
     NOTE(review): confirm the banner stream for the packaged vsearch build. -->
7 <xml name="version_command">
8 <version_command>vsearch --version 2&gt;&amp;1 | head -n 1 | awk '{print $2}' | sed 's/,//'</version_command>
9 </xml>
<!-- Output checks shared by all vsearch tools: exit codes of 1 and above or
     -1 and below, plus the patterns "Error:" and "Exception:". -->
10 <xml name="stdio">
11 <stdio>
12 <exit_code range="1:"/>
13 <exit_code range=":-1"/>
14 <regex match="Error:"/>
15 <regex match="Exception:"/>
16 </stdio>
17 </xml>
18
<!-- Optional integer parameter limiting the output to the first n sequences;
     empty by default. -->
19 <xml name="topn">
20 <param name="topn" type="integer" optional="True" value=""
21 label="Output just first n sequences" help="(--topn)" />
22 </xml>
23
<!-- Integer parameter for the number of hits to accept and show per strand;
     defaults to 1. -->
24 <xml name="maxaccepts">
25 <param name="maxaccepts" type="integer" value="1"
26 label="Number of hits to accept and show per strand" help="(--maxaccepts)" />
27 </xml>
<!-- Integer parameter for the number of non-matching hits to consider;
     defaults to 32. -->
28 <xml name="maxrejects">
29 <param name="maxrejects" type="integer" value="32"
30 label="Number of non-matching hits to consider" help="(--maxrejects)" />
31 </xml>
<!-- Masking mode applied to sequences; dust is the default. vsearch documents
     the accepted values as none, dust and soft, so the "No masking" choice
     emits "none".
     NOTE(review): confirm no tool XML compares this parameter against "no". -->
32 <xml name="qmask">
33 <param name="qmask" type="select" label="Mask sequences" help="(--qmask)">
34 <option value="none">No masking</option>
35 <option value="dust" selected="True">dust</option>
36 <option value="soft">soft</option>
37 </param>
38 </xml>
39
<!-- Boolean flag, off by default: mask by replacing with N instead of lower
     case. Contributes nothing to the command line when unchecked. -->
40 <xml name="hardmask">
41 <param name="hardmask" type="boolean" checked="False"
42 truevalue="--hardmask" falsevalue="" label="Mask by replacing with N instead of lower case" help="(--hardmask)" />
43 </xml>
44
<!-- Identity settings: the definition used to compute pairwise identity
     (default 2) and an optional rejection threshold. vsearch expects the
     threshold as a fraction between 0.0 and 1.0, so the form enforces that
     range instead of letting an out-of-range value fail at run time. -->
45 <xml name="id_and_iddef">
46 <param name="iddef" type="select" label="ID definition" help="(--iddef)">
47 <option value="0">CD-HIT</option>
48 <option value="1">all</option>
49 <option value="2" selected="True">int</option>
50 <option value="3">MBL</option>
51 <option value="4">BLAST</option>
52 </param>
53 <param name="id" type="float" value="" min="0.0" max="1.0" optional="True" label="Reject hit if identity is lower than this value"
54 help="Fraction between 0.0 and 1.0 (--id)"/>
55 </xml>
56
<!-- Two boolean flags, both off by default, for excluding identical labels
     and identical sequences respectively. -->
57 <xml name="self_and_selfid">
58 <param name="self_param" type="boolean" checked="False"
59 truevalue="--self" falsevalue="" label="Exclude identical labels for --uchime_ref" help="(--self)" />
60 <param name="selfid_param" type="boolean" checked="False"
61 truevalue="--selfid" falsevalue="" label="Exclude identical sequences for --uchime_ref" help="(--selfid)" />
62 </xml>
63
<!-- Strand selection: plus strand only (default) or both strands. -->
64 <xml name="strand">
65 <param name="strand" type="select" help="(--strand)" label="Strand specific clustering">
66 <option selected="True" value="plus">Plus strand</option>
67 <option value="both">Both strands</option>
68 </param>
69 </xml>
70
<!-- Boolean flag, off by default: read abundance annotation from the input. -->
71 <xml name="sizein">
72 <param name="sizein" type="boolean" checked="False"
73 truevalue="--sizein" falsevalue="" label="Read abundance annotation from input" help="(--sizein)" />
74 </xml>
75
<!-- Boolean flag, off by default: write cluster abundances to the centroid
     file. -->
76 <xml name="sizeout">
77 <param name="sizeout" type="boolean" checked="False"
78 truevalue="--sizeout" falsevalue="" label="Write cluster abundances to centroid file" help="(--sizeout)" />
79 </xml>
80
<!-- Boolean flag, off by default, requesting UCLUST-like output. -->
81 <xml name="uclust_like_output">
82 <param name="uc" type="boolean" checked="False"
83 truevalue="--uc" falsevalue="" label="UCLUST-like output" help="(--uc)" />
84 </xml>
85
<!-- Command-line fragment with options common to the vsearch tools: the thread
     count is read from the GALAXY_SLOTS shell variable, falling back to 4 when
     it is unset or empty, followed by the notrunclabels switch. The backslash
     keeps Cheetah from interpreting the shell expansion. -->
86 <token name="@GENERAL@">
87 --threads "\${GALAXY_SLOTS:-4}"
88 --notrunclabels
89 </token>
<!-- Cheetah fragment for the user-defined tabular output. When the
     userfields_output conditional is set to 'yes', the selected field keys
     (comma separated in the parameter value) are re-joined with '+' and passed
     with the userout dataset path. Emits nothing otherwise. -->
90 <token name="@USERFIELDS@">
91 #if $userfields_output.userfields_output_select == 'yes':
92 --userfields '#echo '+'.join( str($userfields_output.userfields).split(',') )#'
93 --userout $userout
94 #end if
95 </token>
<!-- Tabular output dataset "userout", created only when the user switched the
     userfields_output conditional to 'yes'. -->
96 <xml name="userfields_output">
97 <data format="tabular" name="userout" label="${tool.name} on ${on_string}: tabular output">
98 <filter>userfields_output.userfields_output_select == 'yes'</filter>
99 </data>
100 </xml>
101
<!-- Conditional that lets the user request a custom tabular output and choose
     its columns; evalue, query and target are preselected. Option labels follow
     the short descriptions in the @USERFIELDS_HELP@ table so that look-alike
     fields (qhi/qihi, qlo/qilo, id1/id2) can be told apart in the form. The
     validator rejects an empty selection, matching the general_output macro;
     presumably an empty multi-select would otherwise reach the command line as
     the string "None" (verify against the Galaxy version in use). -->
102 <xml name="userfields">
103 <conditional name="userfields_output">
104 <param name="userfields_output_select" type="select" label="User defined tabular output" help="(--userfields)">
105 <option value="yes">Yes</option>
106 <option value="no" selected="True">No</option>
107 </param>
108 <when value="yes">
109 <param name="userfields" type="select" multiple="True" label="Fields in tabular output" help="For more information about the columns please scroll down to the tool help. (--userfields)">
110 <option value="aln">Print a string of M (match), D (delete, i.e. a gap in the query) and I (insert, i.e. a gap in the target) representing the pairwise alignment</option>
111 <option value="alnlen">Print the length of the query-target alignment (number of columns)</option>
112 <option value="bits">Bit score (not computed for nucleotide alignments)</option>
113 <option value="caln">Compact representation of the pairwise alignment using the CIGAR format (Compact Idiosyncratic Gapped Alignment Report): M (match), D (deletion) and I (insertion)</option>
114 <option value="evalue" selected="True">E-value (not computed for nucleotide alignments)</option>
115 <option value="exts">Number of columns containing a gap extension (zero or positive integer value)</option>
116 <option value="gaps">Number of columns containing a gap (zero or positive integer value)</option>
117 <option value="id">Percentage of identity</option>
118 <option value="id0">CD-HIT definition of the percentage of identity</option>
119 <option value="id1">The percentage of identity defined as the edit distance</option>
120 <option value="id2">The percentage of identity defined as the edit distance, excluding terminal gaps (alias for id)</option>
121 <option value="id3">Marine Biological Lab definition of the percentage of identity</option>
122 <option value="id4">BLAST definition of the percentage of identity</option>
123 <option value="ids">Number of matches in the alignment</option>
124 <option value="mism">Number of mismatches in the alignment</option>
125 <option value="opens">Number of columns containing a gap opening</option>
126 <option value="pairs">Number of columns containing only nucleotides</option>
127 <option value="pctgaps">Number of columns containing gaps expressed as a percentage of the alignment length</option>
128 <option value="pctpv">Percentage of positive columns. When working with nucleotide sequences, this is equivalent to the percentage of matches</option>
129 <option value="pv">Number of positive columns. When working with nucleotide sequences, this is equivalent to the number of matches</option>
130 <option value="qcov">Fraction of the query sequence that is aligned with the target sequence</option>
131 <option value="qframe">Query frame (-3 to +3). That field only concerns coding sequences and is not computed by vsearch</option>
132 <option value="qhi">Last nucleotide of the query aligned with the target</option>
133 <option value="qihi">Last nucleotide of the query aligned with the target (ignoring terminal gaps)</option>
134 <option value="qilo">First nucleotide of the query aligned with the target (ignoring initial gaps)</option>
135 <option value="ql">Query sequence length</option>
136 <option value="qlo">First nucleotide of the query aligned with the target</option>
137 <option value="qrow">Print the sequence of the query segment as seen in the pairwise alignment</option>
138 <option value="qs">Query segment length</option>
139 <option value="qstrand">Query strand orientation (+ or - for nucleotide sequences)</option>
140 <option value="query" selected="True">Query label</option>
141 <option value="raw">Raw alignment score (negative, null or positive integer value)</option>
142 <option value="target" selected="True">Target label</option>
143 <option value="tcov">Fraction of the target sequence that is aligned with the query sequence</option>
144 <option value="tframe">Target frame (-3 to +3) - not computed by vsearch</option>
145 <option value="thi">Last nucleotide of the target aligned with the query</option>
146 <option value="tihi">Last nucleotide of the target aligned with the query (ignoring terminal gaps)</option>
147 <option value="tilo">First nucleotide of the target aligned with the query (ignoring initial gaps)</option>
148 <option value="tl">Target sequence length (positive integer value)</option>
149 <option value="tlo">First nucleotide of the target aligned with the query</option>
150 <option value="trow">Print the sequence of the target segment as seen in the pairwise alignment</option>
151 <option value="ts">Target segment length</option>
152 <option value="tstrand">Target strand orientation (+ or - for nucleotide sequences)</option>
<validator type="no_options" message="Please select at least one field." />
153 </param>
154 </when>
155 <when value="no" />
156 </conditional>
157 </xml>
158
<!-- Multi-select of output files to produce; the blast6out format is
     preselected. The yield point lets an expanding tool append its own options,
     and the validator rejects an empty selection. -->
159 <xml name="general_output">
160 <param name="outputs" type="select" multiple="True" help="" label="Select output files">
161 <option value="--alnout">Human-readable alignment output</option>
162 <option selected="True" value="--blast6out">Blast-like tab-separated output</option>
163 <option value="--fastapairs">Write query/target pairs of sequences</option>
164 <yield />
165 <validator type="no_options" message="Please select at least one output."/>
166 </param>
167 </xml>
168
<!-- Version string made available to tool files as the @VERSION@ token. -->
169 <token name="@VERSION@">1.1.3</token>
170 <token name="@EXTERNAL_DOCUMENTATION@">
171 <![CDATA[
172
173 For details about this tool, please refer to the `GitHub repository <https://github.com/torognes/vsearch>`_ or the `vsearch manual <https://github.com/torognes/vsearch/raw/master/doc/vsearch_manual.pdf>`_.
174
175 ]]>
176 </token>
<!-- Placeholder token for reference text; it currently holds only whitespace. -->
177 <token name="@REFERENCES@">
178 </token>
179 <token name="@USERFIELDS_HELP@">
180 **Available fields in user defined tabular output**
181
182 ========= ================
183 Key Description
184 ========= ================
185 aln Print a string of M (match), D (delete, i.e. a gap in the query) and I (insert, i.e. a gap in the target) representing the pairwise alignment. Empty field if there is no alignment.
186 alnlen Print the length of the query-target alignment (number of columns). The field is set to 0 if there is no alignment.
187 bits Bit score (not computed for nucleotide alignments). Always set to 0.
188 caln Compact representation of the pairwise alignment using the CIGAR format (Compact Idiosyncratic Gapped Alignment Report): M (match), D (deletion) and I (insertion). Empty field if there is no alignment.
189 evalue E-value (not computed for nucleotide alignments). Always set to -1.
190 exts Number of columns containing a gap extension (zero or positive integer value).
191 gaps Number of columns containing a gap (zero or positive integer value).
192 id Percentage of identity (real value ranging from 0.0 to 100.0). The percentage identity is defined as 100 * (matching columns) / (alignment length - terminal gaps).
193 id0 CD-HIT definition of the percentage of identity (real value ranging from 0.0 to 100.0) using the length of the shortest sequence in the pairwise alignment as denominator: 100 * (matching columns) / (shortest sequence length).
194 id1 The percentage of identity (real value ranging from 0.0 to 100.0) is defined as the edit distance: 100 * (matching columns) / (alignment length).
195 id2 The percentage of identity (real value ranging from 0.0 to 100.0) is defined as the edit distance, excluding terminal gaps. The field id2 is an alias for the field id.
196 id3 Marine Biological Lab definition of the percentage of identity (real value ranging from 0.0 to 100.0), counting each extended gap (internal or terminal) as a single difference and using the length of the longest sequence in the pairwise alignment as denominator: 100 * (1.0 - [(mismatches + gaps) / (longest sequence length)]).
197 id4 BLAST definition of the percentage of identity (real value ranging from 0.0 to 100.0), equivalent to --iddef 2 in a context of global pairwise alignment.
198 ids Number of matches in the alignment (zero or positive integer value).
199 mism Number of mismatches in the alignment (zero or positive integer value).
200 opens Number of columns containing a gap opening (zero or positive integer value).
201 pairs Number of columns containing only nucleotides. That value corresponds to the length of the alignment minus the gap-containing columns (zero or positive integer value).
202 pctgaps Number of columns containing gaps expressed as a percentage of the alignment length (real value ranging from 0.0 to 100.0).
203 pctpv Percentage of positive columns. When working with nucleotide sequences, this is equivalent to the percentage of matches (real value ranging from 0.0 to 100.0).
204 pv Number of positive columns. When working with nucleotide sequences, this is equivalent to the number of matches (zero or positive integer value).
205 qcov Fraction of the query sequence that is aligned with the target sequence (real value ranging from 0.0 to 100.0). The query coverage is computed as 100.0 * (matches + mismatches) / query sequence length. Internal or terminal gaps are not taken into account. The field is set to 0.0 if there is no alignment.
206 qframe Query frame (-3 to +3). That field only concerns coding sequences and is not computed by vsearch. Always set to +0.
207 qhi Last nucleotide of the query aligned with the target. Always equal to the length of the pairwise alignment. The field is set to 0 if there is no alignment.
208 qihi Last nucleotide of the query aligned with the target (ignoring terminal gaps). Nucleotide numbering starts from 1. The field is set to 0 if there is no alignment.
209 qilo First nucleotide of the query aligned with the target (ignoring initial gaps). Nucleotide numbering starts from 1. The field is set to 0 if there is no alignment.
210 ql Query sequence length (positive integer value). The field is set to 0 if there is no alignment.
211 qlo First nucleotide of the query aligned with the target. Always equal to 1 if there is an alignment, 0 otherwise.
212 qrow Print the sequence of the query segment as seen in the pairwise alignment (i.e. with gap insertions if need be). Empty field if there is no alignment.
213 qs Query segment length. Always equal to query sequence length.
214 qstrand Query strand orientation (+ or - for nucleotide sequences). Empty field if there is no alignment.
215 query Query label.
216 raw Raw alignment score (negative, null or positive integer value). The score is the sum of match rewards minus mismatch penalties, gap openings and gap extensions. The field is set to 0 if there is no alignment.
217 target Target label. The field is set to "*" if there is no alignment.
218 tcov Fraction of the target sequence that is aligned with the query sequence (real value ranging from 0.0 to 100.0). The target coverage is computed as 100.0 * (matches + mismatches) / target sequence length. Internal or terminal gaps are not taken into account. The field is set to 0.0 if there is no alignment.
219 tframe Target frame (-3 to +3). That field only concerns coding sequences and is not computed by vsearch. Always set to +0.
220 thi Last nucleotide of the target aligned with the query. Always equal to the length of the pairwise alignment. The field is set to 0 if there is no alignment.
221 tihi Last nucleotide of the target aligned with the query (ignoring terminal gaps). Nucleotide numbering starts from 1. The field is set to 0 if there is no alignment.
222 tilo First nucleotide of the target aligned with the query (ignoring initial gaps). Nucleotide numbering starts from 1. The field is set to 0 if there is no alignment.
223 tl Target sequence length (positive integer value). The field is set to 0 if there is no alignment.
224 tlo First nucleotide of the target aligned with the query. Always equal to 1 if there is an alignment, 0 otherwise.
225 trow Print the sequence of the target segment as seen in the pairwise alignment (i.e. with gap insertions if need be). Empty field if there is no alignment.
226 ts Target segment length. Always equal to target sequence length. The field is set to 0 if there is no alignment.
227 tstrand Target strand orientation (+ or - for nucleotide sequences). Always set to "+", so reverse strand matches have tstrand "+" and qstrand "-". Empty field if there is no alignment.
228 ========= ================
229
230 </token>
<!-- Citation block carrying one DOI citation; the yield point lets an
     expanding tool add further citations. -->
231 <xml name="citations">
232 <citations>
233 <citation type="doi">10.5281/zenodo.15524</citation>
234 <yield/>
235 </citations>
236 </xml>
237 </macros>