comparison search.xml @ 0:fae6527990af draft

Imported from capsule None
author iuc
date Thu, 21 May 2015 03:58:09 -0400
parents
children f29e21388219
comparison
equal deleted inserted replaced
-1:000000000000 0:fae6527990af
1 <tool id="vsearch_search" name="VSearch search" version="@VERSION@.0">
2 <description></description>
3 <macros>
4 <import>vsearch_macros.xml</import>
5 </macros>
6 <expand macro="requirements" />
7 <expand macro="stdio" />
8 <expand macro="version_command" />
9 <command>
10 <![CDATA[
11 vsearch
12
13 @GENERAL@
14 --db $dbfile
15 --dbmask $dbmask
16
17 ##--fulldp full dynamic programming alignment (always on)
18 ##--gapext STRING penalties for gap extension (2I/1E)
19 ##--gapopen STRING penalties for gap opening (20I/2E)
20 $hardmask
21 --id $id
22 --iddef $iddef
23
24 #if $qmask != 'no':
25 --qmask $qmask
26 #end if
27
28 ## --rowlen INT width of alignment lines in alnout output (64)
29
30 $self_param
31 $selfid_param
32 #if $sizeout:
33 --sizeout $sizeout
34 #end if
35 --strand $strand
36 --usearch_global $queryfile
37
38 #if '--alnout' in str($outputs):
39 --alnout $alnout
40 #end if
41 #if '--blast6out' in str($outputs):
42 --blast6out $blast6out
43 #end if
44 #if '--dbmatched' in str($outputs):
45 --dbmatched $dbmatched
46 #end if
47 #if '--dbnotmatched' in str($outputs):
48 --dbnotmatched $dbnotmatched
49 #end if
50 #if '--fastapairs' in str($outputs):
51 --fastapairs $fastapairs
52 #end if
53 #if '--notmatched' in str($outputs):
54 --notmatched $notmatched
55 #end if
56 #if '--matched' in str($outputs):
57 --matched $matched
58 #end if
59
60 #if $adv_opts.adv_opts_selector == "advanced":
61 $adv_opts.top_hits_only
62 $adv_opts.rightjust
63 $adv_opts.leftjust
64 --target_cov $adv_opts.target_cov
65 --query_cov $adv_opts.query_cov
66
67
68 #if $adv_opts.maxid:
69 --maxid $adv_opts.maxid
70 #end if
71 #if $adv_opts.maxqt:
72 --maxqt $adv_opts.maxqsize
73 #end if
74 #if $adv_opts.maxsizeratio:
75 --maxsizeratio $adv_opts.maxsizeratio
76 #end if
77 #if $adv_opts.maxsl:
78 --maxsl $adv_opts.maxsl
79 #end if
80 #if $adv_opts.mid:
81 --mid $adv_opts.mid
82 #end if
83 #if $adv_opts.minqt:
84 --minqt $adv_opts.minqt
85 #end if
86 #if $adv_opts.minsizeratio:
87 --minsizeratio $adv_opts.minseqlength
88 #end if
89 #if $adv_opts.minsl:
90 --minsl $adv_opts.minsl
91 #end if
92
93 #if $adv_opts.mintsize:
94 --mintsize $adv_opts.mintsize
95 #end if
96 #if $adv_opts.mismatch:
97 --mismatch $adv_opts.mismatch
98 #end if
99 #if $adv_opts.maxqsize:
100 --maxqsize $adv_opts.maxqsize
101 #end if
102 #if $adv_opts.mincols:
103 --mincols $adv_opts.mincols
104 #end if
105 #if $adv_opts.maxsubs:
106 --maxsubs $adv_opts.maxsubs
107 #end if
108 #if $adv_opts.maxrejects:
109 --maxrejects $adv_opts.maxrejects
110 #end if
111 #if $adv_opts.maxaccepts:
112 --maxaccepts $adv_opts.maxaccepts
113 #end if
114 #if $adv_opts.maxdiffs:
115 --maxdiffs $adv_opts.maxdiffs
116 #end if
117 #if $adv_opts.maxgaps:
118 --maxgaps $adv_opts.maxgaps
119 #end if
120 #if $adv_opts.maxhits:
121 --maxhits $adv_opts.maxhits
122 #end if
123 #if $adv_opts.match:
124 --match $adv_opts.match
125 #end if
126 #if $adv_opts.idprefix:
127 --idprefix $adv_opts.idprefix
128 #end if
129 #if $adv_opts.idsuffix:
130 --idsuffix $adv_opts.idsuffix
131 #end if
132
133 #if $adv_opts.uclust_output.uclust_output_select == 'yes':
134 --uc
135 $adv_opts.uclust_output.uc_allhits
136 #end if
137
138 #if $adv_opts.userfields_output.userfields_output_select == 'yes':
139 --userfields '#echo '+'.join( str($adv_opts.userfields_output.userfields).split(',') )#'
140 --userout $userout
141 #end if
142
143 ##--weak_id REAL include aligned hits with >= id; continue search
144 --wordlength $adv_opts.wordlength
145
146 $$adv_opts.output_no_hits
147
148 #end if
149
150
151 ]]>
152 </command>
153 <inputs>
154 <param name="queryfile" type="data" format="fasta" label="Select your query FASTA file" help="(--usearch_global)" />
155 <param name="dbfile" type="data" format="fasta" label="Select your database FASTA file" help="(--db)" />
156
157 <expand macro="qmask" />
158 <expand macro="sizeout" />
159 <expand macro="strand" />
160 <expand macro="self_and_selfid" />
161 <expand macro="id_and_iddef" />
162 <expand macro="hardmask" />
163
164 <param name="dbmask" type="select" optional="True" label="Mask database sequences" help="(--dbmask)">
165 <option value="none" selected="True">No masking</option>
166 <option value="dust" selected="True">dust</option>
167 <option value="soft">soft</option>
168 </param>
169
170 <expand macro="general_output">
171 <option value="--dbmatched">FASTA file for matching database sequences</option>
172 <option value="--dbnotmatched">FASTA file for non-matching database sequences</option>
173 <option value="--notmatched">Write non-matching query sequences to separate file</option>
174 <option value="--matched">Write matching query sequences to separate file</option>
175 </expand>
176
177 <conditional name="adv_opts">
178 <param name="adv_opts_selector" type="select" label="Advanced Options">
179 <option value="basic" selected="True">Hide Advanced Options</option>
180 <option value="advanced">Show Advanced Options</option>
181 </param>
182 <when value="basic" />
183 <when value="advanced">
184
185 <param name="top_hits_only" type="boolean" truevalue="--top_hits_only" falsevalue="" checked="False"
186 label="Output only hits with identity equal to the best" help="(--top_hits_only)"/>
187 <param name="rightjust" type="boolean" truevalue="--rightjust" falsevalue="" checked="False"
188 label="Reject if terminal gaps at alignment right end" help="(--rightjust)"/>
189 <param name="leftjust" type="boolean" truevalue="--leftjust" falsevalue="" checked="False"
190 label="Reject if terminal gaps at alignment left end" help="(--leftjust)"/>
191
192 <param name="query_cov" type="float" value="" optional="True" label="Reject if fraction of query seq. aligned lower than this value"
193 help="(--query_cov)"/>
194 <param name="target_cov" type="float" value="" optional="True" label="Reject if fraction of target seq. aligned lower than this value"
195 help="(--target_cov)"/>
196 <param name="maxid" type="float" value="" optional="True" label="Reject if identity higher than this value"
197 help="(--maxid)"/>
198 <param name="maxqt" type="float" value="" optional="True" label="Reject if query/target length ratio higher than this value"
199 help="(--maxqt)"/>
200 <param name="maxsizeratio" type="float" value="" optional="True" label="Reject if query/target abundance ratio higher than this value"
201 help="(--maxsizeratio)"/>
202 <param name="maxsl" type="float" value="" optional="True" label="Reject if shorter/longer length ratio higher than this value"
203 help="(--maxsl)"/>
204 <param name="mid" type="float" value="" optional="True" label="Reject if percent identity lower than this value, ignoring gaps"
205 help="(--mid)"/>
206 <param name="minqt" type="float" value="" optional="True" label="Reject if query/target length ratio lower than this value"
207 help="(--minqt)"/>
208 <param name="minsl" type="float" value="" optional="True" label="Reject if shorter/longer length ratio lower than this value"
209 help="(--minsl)"/>
210 <param name="minsizeratio" type="float" value="" optional="True" label="Reject if query/target abundance ratio lower than this value"
211 help="(--minsizeratio)"/>
212
213 <param name="maxqsize" type="integer" value="" optional="True" label="Reject if query abundance larger than this value"
214 help="(--maxqsize)"/>
215 <param name="mincols" type="integer" value="" optional="True" label="Reject if alignment length shorter than this value"
216 help="(--mincols)"/>
217 <param name="maxsubs" type="integer" value="" optional="True" label="Reject if more substitutions than this value"
218 help="(--maxsubs)"/>
219 <expand macro="maxrejects" />
220 <expand macro="maxaccepts" />
221 <param name="maxdiffs" type="integer" value="" optional="True" label="Reject if more substitutions or indels than this value"
222 help="(--maxdiffs)"/>
223 <param name="maxgaps" type="integer" value="" optional="True" label="Reject if more indels than this value"
224 help="(--maxgaps)"/>
225 <param name="maxhits" type="integer" value="" optional="True" label="Maximum number of hits to show"
226 help="(--maxhits)"/>
227 <param name="match" type="integer" value="2" label="Score for match"
228 help="(--match)"/>
229 <param name="idprefix" type="integer" value="" optional="True" label="Reject if first n nucleotides do not match"
230 help="(--idprefix)"/>
231 <param name="idsuffix" type="integer" value="" optional="True" label="Reject if last n nucleotides do not match"
232 help="(--idsuffix)"/>
233 <param name="mintsize" type="integer" value="" optional="True" label="Reject if target abundance lower"
234 help="(--mintsize)"/>
235 <param name="mismatch" type="integer" value="-4" label="Score for mismatch"
236 help="(--mismatch)"/>
237
238 <conditional name="uclust_output">
239 <param name="uclust_output_select" type="select" label="UCLUST-like output" help="(--uc)">
240 <option value="yes">Yes</option>
241 <option value="no" selected="True">No</option>
242 </param>
243 <when value="yes">
244 <param name="uc_allhits" type="boolean" truevalue="--uc_allhits" falsevalue="" checked="False"
245 label="Show all, not just top hits" help="(--uc_allhits)"/>
246 </when>
247 <when value="no" />
248 </conditional>
249
250 <param name="wordlength" type="integer" value="8" min="3" max="15" label="Length of words for database index 3-15"
251 help="Allowed values: 3-15 (--wordlength)"/>
252 <param name="output_no_hits" type="boolean" truevalue="--output_no_hits" falsevalue="" checked="False"
253 label="Write non-matching queries to the output file" help="(--output_no_hits)"/>
254
255 <expand macro="userfields" />
256 </when>
257 </conditional>
258
259
260 </inputs>
261 <outputs>
262 <data name="uc" format="fasta" label="${tool.name} on ${on_string}: UCLUST like output">
263 <filter>adv_opts.uclust_output.uclust_output_select == 'yes'</filter>
264 </data>
265 <data name="dbnotmatched" format="fasta" label="${tool.name} on ${on_string}: Non-matched database sequences">
266 <filter>'--dbnotmatchedt' in outputs</filter>
267 </data>
268 <data name="dbmatched" format="fasta" label="${tool.name} on ${on_string}: Matched database sequences">
269 <filter>'--dbmatched' in outputs</filter>
270 </data>
271 <data name="alnout" format="fasta" label="${tool.name} on ${on_string}: Alignment">
272 <filter>'--alnout' in outputs</filter>
273 </data>
274 <data name="blast6out" format="tabular" label="${tool.name} on ${on_string}: BLAST like tabular">
275 <filter>'--blast6out' in outputs</filter>
276 </data>
277 <data name="notmatched" format="fasta" label="${tool.name} on ${on_string}: Non-matched queries">
278 <filter>'--notmatched' in outputs</filter>
279 </data>
280 <data name="matched" format="fasta" label="${tool.name} on ${on_string}: Matching query sequences">
281 <filter>'--matched' in outputs</filter>
282 </data>
283 <data name="fastapairs" format="fasta" label="${tool.name} on ${on_string}: Query/Target sequences">
284 <filter>'--fastapairs' in outputs</filter>
285 </data>
286 <data name="userout" format="tabular" label="${tool.name} on ${on_string}: tabular output">
287 <filter>adv_opts.userfields_output.userfields_output_select == 'yes'</filter>
288 </data>
289 </outputs>
290 <tests>
291 <test>
292 <param name="dbfile" value="three_human_mRNA.fasta" ftype="fasta" />
293 <param name="queryfile" value="query.fasta" ftype="fasta" />
294 <param name="outputs" value="--blast6out,--dbmatched" />
295 <param name="dbmask" value="none" />
296 <param name="adv_opts_selector" value="advanced" />
297 <param name="top_hits_only" value="True" />
298 <output name="dbmatched" file="search_dbmatched_result1.fasta" ftype="fasta" />
299 <output name="blast6out" file="search_blast6out_result1.tabular" ftype="tabular" />
300 </test>
301 <test>
302 <param name="dbfile" value="three_human_mRNA.fasta" ftype="fasta" />
303 <param name="queryfile" value="query.fasta" ftype="fasta" />
304 <param name="outputs" value="--fastapairs,--matched" />
305 <param name="dbmask" value="none" />
306 <param name="adv_opts_selector" value="advanced" />
307 <param name="userfields_output_select" value="yes" />
308 <param name="userfields" value="query,target,evalue" />
309 <param name="top_hits_only" value="True" />
310 <param name="output_no_hits" value="True" />
311 <output name="matched" file="search_matched_result2.fasta" ftype="fasta" />
312 <output name="fastapairs" file="search_fastapairs_result2.fasta" ftype="fasta" />
313 <output name="userout" file="search_userfields_result2.tabular" ftype="tabular" />
314 </test>
315 </tests>
316 <help>
317 <![CDATA[
318 **What it does**
319
320 Sequence search based on vsearch.
321
322 @USERFIELDS_HELP@
323
324 Searching options
325 --alnout FILENAME filename for human-readable alignment output
326 --blast6out FILENAME filename for blast-like tab-separated output
327 --db FILENAME filename for FASTA formatted database for search
328 --dbmask mask db with "dust", "soft" or "none" method (dust)
329 --dbmatched FILENAME FASTA file for matching database sequences
330 --dbnotmatched FILENAME FASTA file for non-matching database sequences
331 --fastapairs FILENAME FASTA file with pairs of query and target
332 --fulldp full dynamic programming alignment (always on)
333 --gapext STRING penalties for gap extension (2I/1E)
334 --gapopen STRING penalties for gap opening (20I/2E)
335 --hardmask mask by replacing with N instead of lower case
336 --id REAL reject if identity lower
337 --iddef INT id definition, 0-4=CD-HIT,all,int,MBL,BLAST (2)
338 --idprefix INT reject if first n nucleotides do not match
339 --idsuffix INT reject if last n nucleotides do not match
340 --leftjust reject if terminal gaps at alignment left end
341 --match INT score for match (2)
342 --matched FILENAME FASTA file for matching query sequences
343 --maxaccepts INT number of hits to accept and show per strand (1)
344 --maxdiffs INT reject if more substitutions or indels
345 --maxgaps INT reject if more indels
346 --maxhits INT maximum number of hits to show (unlimited)
347 --maxid REAL reject if identity higher
348 --maxqsize INT reject if query abundance larger
349 --maxqt REAL reject if query/target length ratio higher
350 --maxrejects INT number of non-matching hits to consider (32)
351 --maxsizeratio REAL reject if query/target abundance ratio higher
352 --maxsl REAL reject if shorter/longer length ratio higher
353 --maxsubs INT reject if more substitutions
354 --mid REAL reject if percent identity lower, ignoring gaps
355 --mincols INT reject if alignment length shorter
356 --minqt REAL reject if query/target length ratio lower
357 --minsizeratio REAL reject if query/target abundance ratio lower
358 --minsl REAL reject if shorter/longer length ratio lower
359 --mintsize INT reject if target abundance lower
360 --mismatch INT score for mismatch (-4)
361 --notmatched FILENAME FASTA file for non-matching query sequences
362 --output_no_hits output non-matching queries to output files
363 --qmask mask query with "dust", "soft" or "none" method (dust)
364 --query_cov REAL reject if fraction of query seq. aligned lower
365 --rightjust reject if terminal gaps at alignment right end
366 --rowlen INT width of alignment lines in alnout output (64)
367 --self reject if labels identical
368 --selfid reject if sequences identical
369 --sizeout write abundance annotation to output
370 --strand search "plus" or "both" strands (plus)
371 --target_cov REAL reject if fraction of target seq. aligned lower
372 --top_hits_only output only hits with identity equal to the best
373 --uc FILENAME filename for UCLUST-like output
374 --uc_allhits show all, not just top hit with uc output
375 --usearch_global FILENAME filename of queries for global alignment search
376 --userfields STRING fields to output in userout file
377 --userout FILENAME filename for user-defined tab-separated output
378 --weak_id REAL include aligned hits with >= id; continue search
379 --wordlength INT length of words for database index 3-15 (8)
380
381 @EXTERNAL_DOCUMENTATION@
382
383 -------
384
385 @REFERENCES@
386
387
388 ]]>
389 </help>
390 <expand macro="citations" />
391 </tool>