annotate qiime/pick_otus.xml @ 1:2c1d19ebac20 draft default tip

Deleted selected files
author azuzolo
date Wed, 06 Jun 2012 16:41:00 -0400
parents 003162f90751
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
003162f90751 Uploaded
azuzolo
parents:
diff changeset
1 <tool id="pick_otus" name="pick_otus" version="2.0.0">
003162f90751 Uploaded
azuzolo
parents:
diff changeset
2 <description>OTU picking</description>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
3 <requirements>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
4 <requirement type="binary">pick_otus.py</requirement>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
5 </requirements>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
6 <command interpreter="python">
003162f90751 Uploaded
azuzolo
parents:
diff changeset
7 qiime_wrapper.py
003162f90751 Uploaded
azuzolo
parents:
diff changeset
8 --galaxy_outputdir='$log.extra_files_path'
003162f90751 Uploaded
azuzolo
parents:
diff changeset
9 #if $pick.otu_picking_method.__str__ == 'uclust' and $pick.refseqs_fp.__str__ != 'None':
003162f90751 Uploaded
azuzolo
parents:
diff changeset
10 --galaxy_datasets='^\S+_otus\.txt$:'$otus,'^\S+_otus\.log$:'$log,'^\S+_failures\.txt$:'$failures
003162f90751 Uploaded
azuzolo
parents:
diff changeset
11 #else:
003162f90751 Uploaded
azuzolo
parents:
diff changeset
12 --galaxy_datasets='^\S+_otus\.txt$:'$otus,'^\S+_otus\.log$:'$log
003162f90751 Uploaded
azuzolo
parents:
diff changeset
13 #end if
003162f90751 Uploaded
azuzolo
parents:
diff changeset
14 pick_otus.py
003162f90751 Uploaded
azuzolo
parents:
diff changeset
15 --input_seqs_filepath=$input_seqs_filepath
003162f90751 Uploaded
azuzolo
parents:
diff changeset
16 #if $pick.otu_picking_method.__str__ == 'uclust':
003162f90751 Uploaded
azuzolo
parents:
diff changeset
17 #if $pick.refseqs_fp.__str__ != 'None':
003162f90751 Uploaded
azuzolo
parents:
diff changeset
18 --refseqs_fp=$pick.refseqs_fp
003162f90751 Uploaded
azuzolo
parents:
diff changeset
19 --otu_picking_method='uclust_ref'
003162f90751 Uploaded
azuzolo
parents:
diff changeset
20 $pick.suppress_new_clusters
003162f90751 Uploaded
azuzolo
parents:
diff changeset
21 #else:
003162f90751 Uploaded
azuzolo
parents:
diff changeset
22 --otu_picking_method=$pick.otu_picking_method
003162f90751 Uploaded
azuzolo
parents:
diff changeset
23 #end if
003162f90751 Uploaded
azuzolo
parents:
diff changeset
24 --similarity=$pick.similarity
003162f90751 Uploaded
azuzolo
parents:
diff changeset
25 $pick.enable_rev_strand_match
003162f90751 Uploaded
azuzolo
parents:
diff changeset
26 $pick.optimal_uclust
003162f90751 Uploaded
azuzolo
parents:
diff changeset
27 $pick.exact_uclust
003162f90751 Uploaded
azuzolo
parents:
diff changeset
28 $pick.user_sort
003162f90751 Uploaded
azuzolo
parents:
diff changeset
29 $pick.suppress_presort_by_abundance_uclust
003162f90751 Uploaded
azuzolo
parents:
diff changeset
30 --max_accepts=$pick.max_accepts
003162f90751 Uploaded
azuzolo
parents:
diff changeset
31 --max_rejects=$pick.max_rejects
003162f90751 Uploaded
azuzolo
parents:
diff changeset
32 #if $pick.uclust_otu_id_prefix != None and $pick.uclust_otu_id_prefix.__str__ != 'None' and $pick.uclust_otu_id_prefix.__str__ != '':
003162f90751 Uploaded
azuzolo
parents:
diff changeset
33 --uclust_otu_id_prefix=$pick.uclust_otu_id_prefix
003162f90751 Uploaded
azuzolo
parents:
diff changeset
34 #end if
003162f90751 Uploaded
azuzolo
parents:
diff changeset
35 $pick.uclust_stable_sort
003162f90751 Uploaded
azuzolo
parents:
diff changeset
36 $pick.save_uc_files
003162f90751 Uploaded
azuzolo
parents:
diff changeset
37 #elif $pick.otu_picking_method.__str__ == 'mothur':
003162f90751 Uploaded
azuzolo
parents:
diff changeset
38 --otu_picking_method=$pick.otu_picking_method
003162f90751 Uploaded
azuzolo
parents:
diff changeset
39 --clustering_algorithm=$pick.clustering_algorithm
003162f90751 Uploaded
azuzolo
parents:
diff changeset
40 --similarity=$pick.similarity
003162f90751 Uploaded
azuzolo
parents:
diff changeset
41 #elif $pick.otu_picking_method.__str__ == 'trie':
003162f90751 Uploaded
azuzolo
parents:
diff changeset
42 --otu_picking_method=$pick.otu_picking_method
003162f90751 Uploaded
azuzolo
parents:
diff changeset
43 $pick.trie_reverse_seqs
003162f90751 Uploaded
azuzolo
parents:
diff changeset
44 #elif $pick.otu_picking_method.__str__ == 'prefix_suffix':
003162f90751 Uploaded
azuzolo
parents:
diff changeset
45 --otu_picking_method=$pick.otu_picking_method
003162f90751 Uploaded
azuzolo
parents:
diff changeset
46 --prefix_length=$pick.prefix_length
003162f90751 Uploaded
azuzolo
parents:
diff changeset
47 --suffix_length=$pick.suffix_length
003162f90751 Uploaded
azuzolo
parents:
diff changeset
48 #elif $pick.otu_picking_method.__str__ == 'blast':
003162f90751 Uploaded
azuzolo
parents:
diff changeset
49 --otu_picking_method=$pick.otu_picking_method
003162f90751 Uploaded
azuzolo
parents:
diff changeset
50 #if $pick.refseqs_fp.__str__ != 'None':
003162f90751 Uploaded
azuzolo
parents:
diff changeset
51 --refseqs_fp=$pick.refseqs_fp
003162f90751 Uploaded
azuzolo
parents:
diff changeset
52 #end if
003162f90751 Uploaded
azuzolo
parents:
diff changeset
53 #if $pick.blast_db != None and $pick.blast_db.__str__ != 'None' and $pick.blast_db.__str__ != '':
003162f90751 Uploaded
azuzolo
parents:
diff changeset
54 --blast_db=$pick.blast_db
003162f90751 Uploaded
azuzolo
parents:
diff changeset
55 #end if
003162f90751 Uploaded
azuzolo
parents:
diff changeset
56 --similarity=$pick.similarity
003162f90751 Uploaded
azuzolo
parents:
diff changeset
57 --max_e_value=$pick.max_e_value
003162f90751 Uploaded
azuzolo
parents:
diff changeset
58 --min_aligned_percent=$pick.min_aligned_percent
003162f90751 Uploaded
azuzolo
parents:
diff changeset
59 #elif $pick.otu_picking_method.__str__ == 'cdhit':
003162f90751 Uploaded
azuzolo
parents:
diff changeset
60 --otu_picking_method=$pick.otu_picking_method
003162f90751 Uploaded
azuzolo
parents:
diff changeset
61 --similarity=$pick.similarity
003162f90751 Uploaded
azuzolo
parents:
diff changeset
62 --max_cdhit_memory=$pick.max_cdhit_memory
003162f90751 Uploaded
azuzolo
parents:
diff changeset
63 #if $pick.prefix_prefilter_length.__str__ != '0':
003162f90751 Uploaded
azuzolo
parents:
diff changeset
64 --prefix_prefilter_length=$pick.prefix_prefilter_length
003162f90751 Uploaded
azuzolo
parents:
diff changeset
65 #end if
003162f90751 Uploaded
azuzolo
parents:
diff changeset
66 $pick.trie_prefilter
003162f90751 Uploaded
azuzolo
parents:
diff changeset
67 #end if
003162f90751 Uploaded
azuzolo
parents:
diff changeset
68 --output_dir='$log.extra_files_path'
003162f90751 Uploaded
azuzolo
parents:
diff changeset
69 </command>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
70 <inputs>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
71 <param name="input_seqs_filepath" type="data" format="fasta" label="input_seqs_filepath"
003162f90751 Uploaded
azuzolo
parents:
diff changeset
72 help="Input sequences [REQUIRED]"/>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
73 <conditional name="pick">
003162f90751 Uploaded
azuzolo
parents:
diff changeset
74 <param name="otu_picking_method" type="select" label="otu_picking_method"
003162f90751 Uploaded
azuzolo
parents:
diff changeset
75 help="Method for picking OTUs. Valid choices are: mothur, trie, uclust_ref, prefix_suffix, blast, cdhit, uclust. The mothur method requires an input file of aligned sequences [default: uclust]">
003162f90751 Uploaded
azuzolo
parents:
diff changeset
76 <option value="uclust" selected="true">uclust</option>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
77 <option value="mothur">mothur</option>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
78 <option value="trie">trie</option>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
79 <option value="prefix_suffix">prefix_suffix</option>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
80 <option value="blast">blast</option>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
81 <option value="cdhit">cdhit</option>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
82 </param>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
83 <when value="mothur">
003162f90751 Uploaded
azuzolo
parents:
diff changeset
84 <param name="clustering_algorithm" type="select" label="clustering_algorithm"
003162f90751 Uploaded
azuzolo
parents:
diff changeset
85 help="Clustering algorithm for mothur otu picking method. [default: furthest]">
003162f90751 Uploaded
azuzolo
parents:
diff changeset
86 <option value="furthest" selected="true">furthest</option>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
87 <option value="nearest">nearest</option>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
88 <option value="average">average</option>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
89 </param>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
90 <param name="similarity" type="float" value="0.97" label="similarity"
003162f90751 Uploaded
azuzolo
parents:
diff changeset
91 help="Sequence similarity threshold (for cdhit, uclust, or uclust_ref) [default: 0.97]"/>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
92 </when> <!-- mothur -->
003162f90751 Uploaded
azuzolo
parents:
diff changeset
93 <when value="trie">
003162f90751 Uploaded
azuzolo
parents:
diff changeset
94 <param name="trie_reverse_seqs" type="boolean" truevalue="--trie_reverse_seqs" falsevalue="" checked="false" label="trie_reverse_seqs"
003162f90751 Uploaded
azuzolo
parents:
diff changeset
95 help="Reverse seqs before picking OTUs with the Trie OTU picker for suffix (rather than prefix) collapsing [default: False]"/>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
96 </when> <!-- trie -->
003162f90751 Uploaded
azuzolo
parents:
diff changeset
97 <when value="uclust">
003162f90751 Uploaded
azuzolo
parents:
diff changeset
98 <param name="refseqs_fp" type="data" format="fasta" label="refseqs_fp" optional="true"
003162f90751 Uploaded
azuzolo
parents:
diff changeset
99 help="Reference sequences to search against when using blast, uclust_ref, or usearch_ref [OPTIONAL]"/>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
100 <param name="suppress_new_clusters" type="boolean" truevalue="--suppress_new_clusters" falsevalue="" checked="false" label="suppress_new_clusters"
003162f90751 Uploaded
azuzolo
parents:
diff changeset
101 help="Suppress creation of new clusters using seqs that don't match reference when using -m uclust_ref [default: False]"/>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
102 <param name="suppress_presort_by_abundance_uclust" type="boolean" truevalue="--suppress_presort_by_abundance_uclust" falsevalue="" checked="false" label="suppress_presort_by_abundance_uclust"
003162f90751 Uploaded
azuzolo
parents:
diff changeset
103 help="Suppress presorting of sequences by abundance when picking OTUs with uclust or uclust_ref [default: False]"/>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
104 <param name="similarity" type="float" value="0.97" label="similarity"
003162f90751 Uploaded
azuzolo
parents:
diff changeset
105 help="Sequence similarity threshold (for cdhit, uclust, or uclust_ref) [default: 0.97]"/>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
106 <param name="enable_rev_strand_match" type="boolean" truevalue="--enable_rev_strand_match" falsevalue="" checked="false" label="enable_rev_strand_match"
003162f90751 Uploaded
azuzolo
parents:
diff changeset
107 help="Enable reverse strand matching for uclust otu picking, will double the amount of memory used. [default: False]"/>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
108 <param name="optimal_uclust" type="boolean" truevalue="--optimal_uclust" falsevalue="" checked="false" label="optimal_uclust"
003162f90751 Uploaded
azuzolo
parents:
diff changeset
109 help="Pass the --optimal flag to uclust for uclust otu picking. [default: False]"/>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
110 <param name="exact_uclust" type="boolean" truevalue="--exact_uclust" falsevalue="" checked="false" label="exact_uclust"
003162f90751 Uploaded
azuzolo
parents:
diff changeset
111 help="Pass the --exact flag to uclust for uclust otu picking. [default: False]"/>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
112 <param name="user_sort" type="boolean" truevalue="--user_sort" falsevalue="" checked="false" label="user_sort"
003162f90751 Uploaded
azuzolo
parents:
diff changeset
113 help="Pass the --user_sort flag to uclust for uclust otu picking. [default: False]"/>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
114 <param name="max_accepts" type="integer" value="20" label="max_accepts"
003162f90751 Uploaded
azuzolo
parents:
diff changeset
115 help="max_accepts value to uclust and uclust_ref [default: 20]"/>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
116 <param name="max_rejects" type="integer" value="500" label="max_rejects"
003162f90751 Uploaded
azuzolo
parents:
diff changeset
117 help="max_rejects value to uclust and uclust_ref [default: 500]"/>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
118 <param name="uclust_otu_id_prefix" type="text" label="uclust_otu_id_prefix"
003162f90751 Uploaded
azuzolo
parents:
diff changeset
119 help="OTU identifier prefix (string) for the de novo uclust OTU picker [default: None, OTU ids are ascending integers]"/>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
120 <param name="uclust_stable_sort" type="boolean" truevalue="--uclust_stable_sort" falsevalue="" checked="false" label="uclust_stable_sort"
003162f90751 Uploaded
azuzolo
parents:
diff changeset
121 help="pass --stable_sort to uclust (uclust versions uclustq1.2.15 and later only) [default: False]"/>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
122 <param name="save_uc_files" type="boolean" truevalue="" falsevalue="--save_uc_files" checked="false" label="save_uc_files"
003162f90751 Uploaded
azuzolo
parents:
diff changeset
123 help="Enable preservation of intermediate uclust (.uc) files that are used to generate clusters via uclust. [default: True]"/>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
124 </when> <!-- uclust -->
003162f90751 Uploaded
azuzolo
parents:
diff changeset
125 <when value="prefix_suffix">
003162f90751 Uploaded
azuzolo
parents:
diff changeset
126 <param name="prefix_length" type="integer" value="50" label="prefix_length"
003162f90751 Uploaded
azuzolo
parents:
diff changeset
127 help="Prefix length when using the prefix_suffix otu picker; WARNING: CURRENTLY DIFFERENT FROM prefix_prefilter_length (-n)! [default: 50]"/>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
128 <param name="suffix_length" type="integer" value="50" label="suffix_length"
003162f90751 Uploaded
azuzolo
parents:
diff changeset
129 help="Suffix length when using the prefix_suffix otu picker [default: 50]"/>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
130
003162f90751 Uploaded
azuzolo
parents:
diff changeset
131 </when> <!-- prefix_suffix -->
003162f90751 Uploaded
azuzolo
parents:
diff changeset
132 <when value="blast">
003162f90751 Uploaded
azuzolo
parents:
diff changeset
133 <param name="refseqs_fp" type="data" format="fasta" label="refseqs_fp" optional="true"
003162f90751 Uploaded
azuzolo
parents:
diff changeset
134 help="Reference sequences to search against"/>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
135 <param name="blast_db" type="data" format="txt" optional="True" label="blast_db"
003162f90751 Uploaded
azuzolo
parents:
diff changeset
136 help="Pre-existing database to blast against when using -m blast [OPTIONAL]"/>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
137 <param name="min_aligned_percent" type="float" value="0.5" label="min_aligned_percent"
003162f90751 Uploaded
azuzolo
parents:
diff changeset
138 help="Minimum percent of query sequence that can be aligned to consider a hit (BLAST OTU picker only) [default: 0.5]"/>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
139 <param name="max_e_value" type="float" value="1e-10" label="max_e_value"
003162f90751 Uploaded
azuzolo
parents:
diff changeset
140 help="Max E-value when clustering with BLAST [default: 1e-10]"/>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
141 </when> <!-- blast -->
003162f90751 Uploaded
azuzolo
parents:
diff changeset
142 <when value="cdhit">
003162f90751 Uploaded
azuzolo
parents:
diff changeset
143 <param name="max_cdhit_memory" type="integer" value="400" label="max_cdhit_memory"
003162f90751 Uploaded
azuzolo
parents:
diff changeset
144 help="Maximum available memory to cd-hit-est (via the program's -M option) for cdhit OTU picking method (units of Mbyte) [default: 400]"/>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
145 <param name="similarity" type="float" value="0.97" label="similarity"
003162f90751 Uploaded
azuzolo
parents:
diff changeset
146 help="Sequence similarity threshold (for cdhit, uclust, or uclust_ref) [default: 0.97]"/>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
147 <param name="prefix_prefilter_length" type="integer" value="0" label="prefix_prefilter_length"
003162f90751 Uploaded
azuzolo
parents:
diff changeset
148 help="Prefilter data so seqs with identical first prefix_prefilter_length are automatically grouped into a single OTU. This is useful for large sequence collections where OTU picking doesn't scale well [default: None; 100 is a good value]"/>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
149 <param name="trie_prefilter" type="boolean" truevalue="--trie_prefilter" falsevalue="" checked="false" label="trie_prefilter"
003162f90751 Uploaded
azuzolo
parents:
diff changeset
150 help="prefilter data so seqs which are identical prefixes of a longer seq are automatically grouped into a single OTU; useful for large sequence collections where OTU picking doesn't scale well [default: False]"/>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
151 </when> <!-- cdhit -->
003162f90751 Uploaded
azuzolo
parents:
diff changeset
152 </conditional> <!-- pick -->
003162f90751 Uploaded
azuzolo
parents:
diff changeset
153 </inputs>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
154 <outputs>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
155 <data format="txt" name="log" label="${tool.name} on ${on_string}: log" />
003162f90751 Uploaded
azuzolo
parents:
diff changeset
156 <data format="qiimeotu" name="otus" label="${tool.name} on ${on_string}: otus" />
003162f90751 Uploaded
azuzolo
parents:
diff changeset
157 <data format="txt" name="failures" label="${tool.name} on ${on_string}: failures.txt" >
003162f90751 Uploaded
azuzolo
parents:
diff changeset
158 <filter>(pick['otu_picking_method'] == 'uclust' and pick['refseqs_fp'])</filter>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
159 </data>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
160 </outputs>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
161 <tests>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
162 </tests>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
163 <help>For more information, see pick_otus_ in the Qiime documentation.
003162f90751 Uploaded
azuzolo
parents:
diff changeset
164
003162f90751 Uploaded
azuzolo
parents:
diff changeset
165 Updated and validated 01/16/12 by Amanda Zuzolo, Microbiome Analysis Center, George Mason University, Fairfax, VA
003162f90751 Uploaded
azuzolo
parents:
diff changeset
166
003162f90751 Uploaded
azuzolo
parents:
diff changeset
167 Qiime integration courtesy Jim Johnson, Minnesota Supercomputing Institute, University of Minnesota, Minneapolis, MN
003162f90751 Uploaded
azuzolo
parents:
diff changeset
168
003162f90751 Uploaded
azuzolo
parents:
diff changeset
169 .. _pick_otus: http://qiime.org/scripts/pick_otus.html</help>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
170 </tool>
003162f90751 Uploaded
azuzolo
parents:
diff changeset
171