Mercurial > repos > iuc > das_tool
comparison das_tool.xml @ 0:a8e434ebe961 draft
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/das_tool commit 151c0e625ce20fb3ea75aa5043486e41b1da48de
author | iuc |
---|---|
date | Mon, 27 Jun 2022 12:41:23 +0000 |
parents | |
children | e23e7bf8491b |
comparison
equal
deleted
inserted
replaced
-1:000000000000 | 0:a8e434ebe961 |
---|---|
1 <tool id="das_tool" name="DAS Tool" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="@PROFILE@"> | |
2 <description> | |
3 for genome resolved metagenomics | |
4 </description> | |
5 <macros> | |
6 <import>macros.xml</import> | |
7 </macros> | |
8 <expand macro="biotools"/> | |
9 <expand macro="requirements"/> | |
10 <expand macro="version"/> | |
11 <command detect_errors="exit_code"><![CDATA[ | |
12 #set $bins = "" | |
13 #set $labels = "" | |
14 #set $sep = "" | |
15 #for $i, $s in enumerate($binning) | |
16 #set $bins += "%s%s" %($sep, $s.bins) | |
17 #set $labels += "%s%s" %($sep, $s.labels) | |
18 #set $sep = "," | |
19 #end for | |
20 | |
21 #if $adv.proteins | |
22 ln -s $adv.proteins 'proteins' && | |
23 #end if | |
24 | |
25 DAS_Tool | |
26 --contigs '$contigs' | |
27 --outputbasename 'outputs' | |
28 --bins '$bins' | |
29 --labels '$labels' | |
30 --search_engine '$adv.search_engine' | |
31 #if $adv.proteins | |
32 --proteins 'proteins' | |
33 #end if | |
34 --score_threshold $adv.score_threshold | |
35 --duplicate_penalty $adv.duplicate_penalty | |
36 --megabin_penalty $adv.megabin_penalty | |
37 $output.write_bin_evals | |
38 $output.write_bins.write_bins | |
39 #if str($output.write_bins.write_bins) != '' | |
40 $output.write_bins.write_unbinned | |
41 #end if | |
42 $output.debug | |
43 --threads \${GALAXY_SLOTS:-1} | |
44 ]]></command> | |
45 <inputs> | |
46 <param argument="--contigs" type="data" format="fasta" label="Contig sequences"/> | |
47 <repeat name="binning" title="Bins" min="1"> | |
48 <param argument="--bins" type="data" format="tabular" label="Contigs-to-bin table" help="Tabular with two columns: contig-IDs and bin-IDs. Fasta_to_Contigs2Bin can be used to Converts genome bins in fasta format to Contigs-to-bin table"/> | |
49 <param argument="--labels" type="text" value="" label="Name of binning prediction tool used to generate the table"/> | |
50 </repeat> | |
51 <section name="adv" title="Advanced options"> | |
52 <param argument="--search_engine" type="select" label="Engine used for single copy gene identification"> | |
53 <option value="diamond" selected="true">diamond</option> | |
54 <option value="blastp">blastp</option> | |
55 </param> | |
56 <param argument="--proteins" type="data" format="fasta" optional="true" label="Predicted proteins" help="The file should be prodigal fasta format: >contigID_geneNo"/> | |
57 <param argument="--score_threshold" type="float" min="0" max="1" value="0.5" label="Score threshold until selection algorithm will keep selecting bins"/> | |
58 <param argument="--duplicate_penalty" type="float" min="0" max="3" value="0.6" label="Penalty for duplicate single copy genes per bin (weight b)" help="Only change if you know what you are doing"/> | |
59 <param argument="--megabin_penalty" type="float" min="0" max="3" value="0.5" label="Penalty for megabins (weight c)" help="Only change if you know what you are doing"/> | |
60 </section> | |
61 <section name="output" title="Outputs"> | |
62 <param name="proteins" type="boolean" checked="false" label="Output predicted proteins?"/> | |
63 <param argument="--write_bin_evals" type="boolean" truevalue="--write_bin_evals" falsevalue="" checked="false" label="Write evaluation of input bin sets?"/> | |
64 <conditional name="write_bins"> | |
65 <param argument="--write_bins" type="select" label="Export bins as fasta files?"> | |
66 <option value="--write_bins" selected="true">Yes</option> | |
67 <option value="">No</option> | |
68 </param> | |
69 <when value="--write_bins"> | |
70 <param argument="--write_unbinned" type="boolean" truevalue="--write_unbinned" falsevalue="" checked="false" label="Export unbinned contigs as fasta file?"/> | |
71 </when> | |
72 <when value=""/> | |
73 </conditional> | |
74 <param argument="--debug" type="boolean" truevalue="--debug" falsevalue="" checked="false" label="Write debug information to log file?"/> | |
75 </section> | |
76 </inputs> | |
77 <outputs> | |
78 <data name="summary" format="tabular" from_work_dir="outputs_DASTool_summary.tsv" label="${tool.name} on ${on_string}: Summary of output bins" /> | |
79 <data name="contigs2bin" format="tabular" from_work_dir="outputs_DASTool_contig2bin.tsv" label="${tool.name} on ${on_string}: Contigs to bin file for the output bins" /> | |
80 <data name="log" format="txt" from_work_dir="outputs_DASTool.log" label="${tool.name} on ${on_string}: Log" /> | |
81 <data name="eval" format="tabular" from_work_dir="outputs_allBins.eval" label="${tool.name} on ${on_string}: Quality and completeness estimates of input bin sets" > | |
82 <filter>output['write_bin_evals']</filter> | |
83 </data> | |
84 <collection name="bins" type="list" label="${tool.name} on ${on_string}: Bins"> | |
85 <filter>output['write_bins']['write_bins'] != ""</filter> | |
86 <discover_datasets pattern=".*?\.(?P<designation>.*)\.fa" format="fasta" directory="outputs_DASTool_bins" /> | |
87 </collection> | |
88 <data name="unbinned_contigs" format="fasta" from_work_dir="outputs_DASTool_bins/unbinned.fa" label="${tool.name} on ${on_string}: Unbinned contigs" > | |
89 <filter>output['write_bins']['write_bins'] != "" and output['write_bins']['write_unbinned']</filter> | |
90 </data> | |
91 <data name="proteins" format="fasta" from_work_dir="outputs_proteins.faa" label="${tool.name} on ${on_string}: Proteins" > | |
92 <filter>output['proteins']</filter> | |
93 </data> | |
94 </outputs> | |
95 <tests> | |
96 <test expect_num_outputs="4"> | |
97 <param name="contigs" value="contigs.fasta"/> | |
98 <repeat name="binning"> | |
99 <param name="bins" value="metabat.tabular"/> | |
100 <param name="labels" value="metabat"/> | |
101 </repeat> | |
102 <section name="adv"> | |
103 <param name="search_engine" value="diamond"/> | |
104 <param name="proteins" value="proteins.fasta"/> | |
105 <param name="score_threshold" value="0.5"/> | |
106 <param name="duplicate_penalty" value="0.6"/> | |
107 <param name="megabin_penalty" value="0.5" /> | |
108 </section> | |
109 <section name="output"> | |
110 <param name="write_bin_evals" value="true"/> | |
111 <conditional name="write_bins"> | |
112 <param name="write_bins" value=""/> | |
113 </conditional> | |
114 <param name="debug" value="true"/> | |
115 </section> | |
116 <output name="summary" ftype="tabular"> | |
117 <assert_contents> | |
118 <has_text text="unique_SCGs"/> | |
119 <has_text text="metabat.8"/> | |
120 <has_text text="bacteria"/> | |
121 </assert_contents> | |
122 </output> | |
123 <output name="contigs2bin" ftype="tabular"> | |
124 <assert_contents> | |
125 <has_text text="Ley3_66761_scaffold_6"/> | |
126 </assert_contents> | |
127 </output> | |
128 <output name="log" ftype="txt"> | |
129 <assert_contents> | |
130 <has_text text="Skipping gene prediction"/> | |
131 <has_text text="#Target sequences to report alignments for: 1"/> | |
132 </assert_contents> | |
133 </output> | |
134 <output name="eval" ftype="tabular"> | |
135 <assert_contents> | |
136 <has_text text="unique_SCGs"/> | |
137 <has_text text="metabat.8"/> | |
138 </assert_contents> | |
139 </output> | |
140 </test> | |
141 <test expect_num_outputs="6"> | |
142 <param name="contigs" value="contigs.fasta"/> | |
143 <repeat name="binning"> | |
144 <param name="bins" value="metabat.tabular"/> | |
145 <param name="labels" value="metabat"/> | |
146 </repeat> | |
147 <section name="adv"> | |
148 <param name="search_engine" value="diamond"/> | |
149 <param name="score_threshold" value="0.5"/> | |
150 <param name="duplicate_penalty" value="0.6"/> | |
151 <param name="megabin_penalty" value="0.5" /> | |
152 </section> | |
153 <section name="output"> | |
154 <param name="proteins" value="true"/> | |
155 <param name="write_bin_evals" value="false"/> | |
156 <conditional name="write_bins"> | |
157 <param name="write_bins" value="--write_bins"/> | |
158 <param name="write_unbinned" value="true"/> | |
159 </conditional> | |
160 <param name="debug" value="true"/> | |
161 </section> | |
162 <output name="summary" ftype="tabular"> | |
163 <assert_contents> | |
164 <has_text text="unique_SCGs"/> | |
165 <has_text text="metabat.8"/> | |
166 <has_text text="bacteria"/> | |
167 </assert_contents> | |
168 </output> | |
169 <output name="contigs2bin" ftype="tabular"> | |
170 <assert_contents> | |
171 <has_text text="Ley3_66761_scaffold_6"/> | |
172 </assert_contents> | |
173 </output> | |
174 <output name="log" ftype="txt"> | |
175 <assert_contents> | |
176 <has_text text="Parameters"/> | |
177 <has_text text="Predicting genes"/> | |
178 </assert_contents> | |
179 </output> | |
180 <output_collection name="bins" count="1"> | |
181 <element name="8" ftype="fasta"> | |
182 <assert_contents> | |
183 <has_text text=">Ley3_66761_scaffold_6"/> | |
184 </assert_contents> | |
185 </element> | |
186 </output_collection> | |
187 <output name="unbinned_contigs" ftype="fasta"> | |
188 <assert_contents> | |
189 <has_text text=">Ley3_66761_scaffold_505"/> | |
190 </assert_contents> | |
191 </output> | |
192 <output name="proteins" ftype="fasta"> | |
193 <assert_contents> | |
194 <has_text text="Ley3_66761_scaffold_6_1 # 1 # 786 # 1 #"/> | |
195 </assert_contents> | |
196 </output> | |
197 </test> | |
198 </tests> | |
199 <help><![CDATA[ | |
200 @HELP_HEADER@ | |
201 | |
202 Inputs | |
203 ====== | |
204 | |
205 - Bins: Tab separated files of contig-IDs and bin-IDs. Contigs to bin file example: :: | |
206 | |
207 Contig_1 bin.01 | |
208 Contig_8 bin.01 | |
209 Contig_42 bin.02 | |
210 Contig_49 bin.03 | |
211 | |
212 - Contigs: Assembled contigs in fasta format: :: | |
213 | |
214 >Contig_1 | |
215 ATCATCGTCCGCATCGACGAATTCGGCGAACGAGTACCCCTGACCATCTCCGATTA... | |
216 >Contig_2 | |
217 GATCGTCACGCAGGCTATCGGAGCCTCGACCCGCAAGCTCTGCGCCTTGGAGCAGG... | |
218 | |
219 - [Optional] Proteins: Predicted proteins in prodigal fasta format. Header contains contig-ID and gene number: :: | |
220 | |
221 >Contig_1_1 | |
222 MPRKNKKLPRHLLVIRTSAMGDVAMLPHALRALKEAYPEVKVTVATKSLFHPFFEG... | |
223 >Contig_1_2 | |
224 MANKIPRVPVREQDPKVRATNFEEVCYGYNVEEATLEASRCLNCKNPRCVAACPVN... | |
225 | |
226 Outputs | |
227 ======= | |
228 | |
229 - Summary of output bins including quality and completeness estimates | |
230 - Contigs to bin file of output bins | |
231 - [Optional] Quality and completeness estimates of input bin sets | |
232 - [Optional] Bins in fasta format | |
233 - [Optional] Unbinned contigs | |
234 | |
235 ]]></help> | |
236 <expand macro="citations"/> | |
237 </tool> |