Mercurial > repos > iuc > rnaquast
comparison rna_quast.xml @ 3:a9edbe21bf47 draft
"planemo upload for repository https://git.ufz.de/lehmanju/rnaquast commit 5ba8cddaafd411e30baa19da0f93959ef5ccaca0"
author | iuc |
---|---|
date | Fri, 14 Jan 2022 18:42:15 +0000 |
parents | 96f74538896e |
children | f9f2ad782d8f |
comparison
equal
deleted
inserted
replaced
2:96f74538896e | 3:a9edbe21bf47 |
---|---|
1 <tool id="rna_quast" name="rnaQUAST" version="@TOOL_VERSION@"> | 1 <tool id="rna_quast" name="rnaQUAST" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@"> |
2 <description>A Quality Assessment Tool for De Novo Transcriptome Assemblies</description> | 2 <description>A quality assessment tool for De Novo transcriptome assemblies</description> |
3 <xrefs> | 3 <xrefs> |
4 <xref type="bio.tools">rnaQUAST</xref> | 4 <xref type="bio.tools">rnaQUAST</xref> |
5 </xrefs> | 5 </xrefs> |
6 <macros> | 6 <macros> |
7 <token name="@TOOL_VERSION@">2.2.1</token> | 7 <token name="@TOOL_VERSION@">2.2.1</token> |
8 <token name="@VERSION_SUFFIX@">1</token> | |
8 <xml name="element_matching_line" token_name="" token_expression=""> | 9 <xml name="element_matching_line" token_name="" token_expression=""> |
9 <element name="@NAME@"> | 10 <element name="@NAME@"> |
10 <assert_contents> | 11 <assert_contents> |
11 <has_line_matching expression="@EXPRESSION@" /> | 12 <has_line_matching expression="@EXPRESSION@" /> |
12 </assert_contents> | 13 </assert_contents> |
90 <stdio> | 91 <stdio> |
91 <regex match="Traceback " source="both" level="fatal" description="rnaQuast failed" /> | 92 <regex match="Traceback " source="both" level="fatal" description="rnaQuast failed" /> |
92 </stdio> | 93 </stdio> |
93 <command detect_errors="exit_code"><![CDATA[ | 94 <command detect_errors="exit_code"><![CDATA[ |
94 #import re | 95 #import re |
95 #for $i in $in_fasta | 96 #for $i in $transcripts |
96 ln -s '$i' '${re.sub('[^\w\-.]', '_', i.element_identifier)}' && | 97 ln -s '$i' '${re.sub('[^\w\-.]', '_', i.element_identifier)}' && |
97 #end for | 98 #end for |
98 #if $r | 99 #if $r |
99 #for $rf in $r | 100 #for $rf in $r |
100 ln -s '$rf' '${re.sub('[^\w\-.]', '_', rf.element_identifier)}' && | 101 ln -s '$rf' '${re.sub('[^\w\-.]', '_', rf.element_identifier)}' && |
107 #end if | 108 #end if |
108 mkdir outputdir && | 109 mkdir outputdir && |
109 rnaQUAST.py | 110 rnaQUAST.py |
110 --threads \${GALAXY_SLOTS:-1} | 111 --threads \${GALAXY_SLOTS:-1} |
111 --transcripts | 112 --transcripts |
112 #for $i in $in_fasta | 113 #for $i in $transcripts |
113 '${re.sub('[^\w\-.]', '_', i.element_identifier)}' | 114 '${re.sub('[^\w\-.]', '_', i.element_identifier)}' |
114 #end for | 115 #end for |
115 $strand_specific | 116 $strand_specific |
116 #if $r | 117 #if $r |
117 -r | 118 -r |
131 --min_alignment '$min_alignment' | 132 --min_alignment '$min_alignment' |
132 #if "pdf" not in $out_sr and "plots" not in $out_add | 133 #if "pdf" not in $out_sr and "plots" not in $out_add |
133 --no_plots | 134 --no_plots |
134 #end if | 135 #end if |
135 $blat | 136 $blat |
136 $busco_lineage | 137 #if $busco_option.busco == 'true' |
137 ##GeneMarkS-T is not available in conda $gene_mark | 138 --busco $busco_option.lineage |
139 #end if | |
140 ##$gene_mark | |
138 $meta | 141 $meta |
139 --lower_threshold $lower_threshold | 142 --lower_threshold $lower_threshold |
140 --upper_threshold $upper_threshold | 143 --upper_threshold $upper_threshold |
141 -o outputdir | 144 -o outputdir |
142 | 145 |
143 && mkdir details | 146 && mkdir details |
144 | 147 |
145 ## move per outputs that are generated for each input (outputdir/ASSEMBLER_output) | 148 ## move per outputs that are generated for each input (outputdir/ASSEMBLER_output) |
146 ## to a joint dir (details) to make them discoverable | 149 ## to a joint dir (details) to make them discoverable |
147 ## also remove "ASSEMBLER." prefixes from files (otherwise the test macros don't work) | 150 ## also remove "ASSEMBLER." prefixes from files (otherwise the test macros don't work) |
148 #for $i in $in_fasta | 151 #for $i in $transcripts |
149 #set basename = os.path.splitext(re.sub('[^\w\-.]', '_', $i.element_identifier))[0] | 152 #set basename = os.path.splitext(re.sub('[^\w\-.]', '_', $i.element_identifier))[0] |
150 && | 153 && |
151 (for f in \$(find 'outputdir/'$basename'_output' -type f); | 154 (for f in \$(find 'outputdir/'$basename'_output' -type f); |
152 do | 155 do |
153 d=\$(dirname \$f | cut -d"/" -f2 | cut -d'_' -f1) && | 156 d=\$(dirname \$f | cut -d"/" -f2 | cut -d'_' -f1) && |
159 ## the final `true` seems needed since otherwise the `;` at the end is swallowed | 162 ## the final `true` seems needed since otherwise the `;` at the end is swallowed |
160 && find details/ -name "*.list" -exec mv {} {}.txt \; | 163 && find details/ -name "*.list" -exec mv {} {}.txt \; |
161 && true | 164 && true |
162 ]]> </command> | 165 ]]> </command> |
163 <inputs> | 166 <inputs> |
164 <param name="in_fasta" type="data" format="fasta" multiple="true" label="Chromosomes/scaffolds file" /> | 167 <param argument="--transcripts" type="data" format="fasta" multiple="true" label="Transcripts" help="File(s) with transcripts in FASTA format."/> |
165 <param name="strand_specific" argument="-ss" type="boolean" truevalue="-ss" falsevalue="" checked="false" label="Strand-specific" /> | 168 <param name="strand_specific" argument="-ss" type="boolean" truevalue="-ss" falsevalue="" checked="false" label="Strand-specific" |
166 <param name="r" optional="true" argument="-r" type="data" format="fasta" multiple="true" label="Reference genome" /> | 169 help="Set if transcripts were assembled using strand-specific RNA-Seq data in order to benefit from knowing whether the transcript originated from the + or - strand"/> |
170 <param name="r" optional="true" argument="-r" type="data" format="fasta" multiple="true" label="Reference genome" help="File with reference genome containing all chromosomes/scaffolds in FASTA forma." /> | |
167 <conditional name="gene_coordinates"> | 171 <conditional name="gene_coordinates"> |
168 <param name="use_gtf" type="select" label="Use file with gene coordinates in GTF/GFF format?" help="We recommend to use files downloaded from GENCODE or Ensembl."> | 172 <param name="use_gtf" type="select" label="Use file with gene coordinates in GTF/GFF format?" help="We recommend to use files downloaded from GENCODE or Ensembl."> |
169 <option value="true" selected="true">Yes</option> | 173 <option value="true" selected="true">Yes</option> |
170 <option value="false">No</option> | 174 <option value="false">No</option> |
171 </param> | 175 </param> |
172 <when value="true"> | 176 <when value="true"> |
173 <param name="gtf" argument="--gtf" type="data" format="gtf,gff,gff3" multiple="true" label="GTF/GFF file" /> | 177 <param name="gtf" argument="--gtf" type="data" format="gtf,gff,gff3" multiple="true" label="GTF/GFF file" /> |
174 <param argument="--disable_infer_genes" type="boolean" truevalue="--disable_infer_genes" falsevalue="" checked="false" label=" GTF file contains genes records?" /> | 178 <param argument="--disable_infer_genes" type="boolean" truevalue="--disable_infer_genes" falsevalue="" checked="false" label=" GTF file contains genes records?" |
175 <param argument="--disable_infer_transcripts" type="boolean" truevalue="--disable_infer_transcripts" falsevalue="" checked="false" label="GTF file contains transcripts records?" /> | 179 help="Use this option if your GTF file already contains genes records, otherwise gffutils will fix it. Note that gffutils may work for quite a long time"/> |
180 <param argument="--disable_infer_transcripts" type="boolean" truevalue="--disable_infer_transcripts" falsevalue="" checked="false" label="GTF file contains transcripts records?" help="Is option if your GTF file already contains transcripts records, otherwise gffutils will fix it."/> | |
176 </when> | 181 </when> |
177 <when value="false"> | 182 <when value="false"> |
178 </when> | 183 </when> |
179 </conditional> | 184 </conditional> |
180 <param argument="--prokaryote" type="boolean" truevalue="--prokaryote" falsevalue="" checked="false" label="Is genome prokararyotic?" /> | 185 <param argument="--prokaryote" type="boolean" truevalue="--prokaryote" falsevalue="" checked="false" label="Is genome prokararyotic?" help="Use this option if the genome is prokaryotic."/> |
181 <param argument="--min_alignment" type="integer" value="50" label="Minimal alignment length to be used" /> | 186 <param argument="--min_alignment" type="integer" value="50" label="Minimal alignment length to be used" help="Default value is 50"/> |
182 <param argument="--blat" type="boolean" truevalue="--blat" falsevalue="" checked="false" label="Run with BLAT alignment tool instead of GMAP?" /> | 187 <param argument="--blat" type="boolean" truevalue="--blat" falsevalue="" checked="false" label="Run with BLAT alignment tool instead of GMAP?" help="Blat is especially useful for aligning long sequences and gapped mapping, which cannot be performed properly by other fast sequence mappers designed for short reads. " /> |
183 <param argument="--busco_lineage" type="boolean" truevalue="--busco_lineage" falsevalue="" checked="false" label="Run BUSCO tool?" help="The BUSCO tool detects core genes in the assembly. Use this option to provide path to the BUSCO lineage data (Eukaryota, Metazoa, Arthropoda, Vertebrata or Fungi)." /> | 188 <conditional name="busco_option"> |
184 <!-- GeneMarkS-T is not available in conda <param argument="\-\-gene_mark" type="boolean" truevalue="\-\-gene_mark" falsevalue="" checked="false" label="Run with GeneMarkS-T gene prediction tool?"/>--> | 189 <param argument="--busco" type="select" label="Run BUSCO tool?" help="BUSCO allows to detect core genes in the assembled transcripts"> |
185 <param argument="--meta" type="boolean" truevalue="--meta" falsevalue="" checked="false" label="Meta Transcriptome" help="Run quality asessment for Meta Transcriptome" /> | 190 <option value="false">Disabled</option> |
186 <param argument="--lower_threshold" type="integer" value="50" label="Lower threshold for x_assembled/covered/matched metrics." /> | 191 <option value="true">Enabled</option> |
187 <param argument="--upper_threshold" type="integer" value="95" label="Upper threshold for x_assembled/covered/matched metrics." /> | 192 </param> |
193 <when value="false"/> | |
194 <when value="true"> | |
195 <param name="lineage" type="select" label="Lineage" help="Select a lineage for using BUSCO"> | |
196 <option value="metazoa">Metazoa</option> | |
197 <option value="eukaryota">Eukaryota</option> | |
198 <option value="arthropoda">Arthropoda</option> | |
199 <option value="vertebrata">Vertebrata</option> | |
200 <option value="fungi">Fungi</option> | |
201 <option value="bacteria">Bacteria</option> | |
202 </param> | |
203 </when> | |
204 </conditional> | |
205 <!--param argument="-\-gene_mark" type="boolean" truevalue="-\-gene_mark" falsevalue="" checked="false" label="Run with GeneMarkS-T gene prediction tool?" help="GeneMarkS-T allows to predict genes in the assembled transcripts without reference genome"/--> | |
206 <param argument="--meta" type="boolean" truevalue="--meta" falsevalue="" checked="false" label="Meta Transcriptome" help="Run quality asessment for meta-transcriptome assemblies" /> | |
207 <param argument="--lower_threshold" type="integer" value="50" label="Lower threshold for x-assembled/covered/matched metrics." /> | |
208 <param argument="--upper_threshold" type="integer" value="95" label="Upper threshold for x-assembled/covered/matched metrics." /> | |
188 <param name="out_sr" type="select" multiple="true" label="Short report formats"> | 209 <param name="out_sr" type="select" multiple="true" label="Short report formats"> |
189 <option value="tsv" selected="true">tabular</option> | 210 <option value="tsv" selected="true">tabular</option> |
190 <option value="txt">txt</option> | 211 <option value="txt">txt</option> |
191 <option value="tex">tex</option> | 212 <option value="tex">tex</option> |
192 <option value="pdf" selected="true">pdf</option> | 213 <option value="pdf" selected="true">pdf</option> |
216 <collection name="list_logs" type="list" label="${tool.name} on ${on_string}: logs"> | 237 <collection name="list_logs" type="list" label="${tool.name} on ${on_string}: logs"> |
217 <discover_datasets ext="txt" pattern="(?P<name>.+)\.log" directory="outputdir/logs/" visible="false" /> | 238 <discover_datasets ext="txt" pattern="(?P<name>.+)\.log" directory="outputdir/logs/" visible="false" /> |
218 <filter>"logs" in out_add</filter> | 239 <filter>"logs" in out_add</filter> |
219 </collection> | 240 </collection> |
220 <!-- note the output filter of the next two outputs checks if there is | 241 <!-- note the output filter of the next two outputs checks if there is |
221 more than 1 input for in_fasta (for 1 its a HDA, for more list or HDAs) --> | 242 more than 1 input for transcripts (for 1 its a HDA, for more list or HDAs) --> |
222 <collection name="comparison_png" type="list" label="${tool.name} on ${on_string}: comparison plots"> | 243 <collection name="comparison_png" type="list" label="${tool.name} on ${on_string}: comparison plots"> |
223 <discover_datasets ext="png" pattern="(?P<name>.+)\.png" directory="outputdir/comparison_output/" visible="false" recurse="true" /> | 244 <discover_datasets ext="png" pattern="(?P<name>.+)\.png" directory="outputdir/comparison_output/" visible="false" recurse="true" /> |
224 <filter> isinstance(in_fasta, list) and "plots" in out_add</filter> | 245 <filter> isinstance(transcripts, list) and "plots" in out_add</filter> |
225 </collection> | 246 </collection> |
226 <collection name="comparison" type="list" label="${tool.name} on ${on_string}: comparison"> | 247 <collection name="comparison" type="list" label="${tool.name} on ${on_string}: comparison"> |
227 <discover_datasets ext="txt" pattern="(?P<name>.+)\.txt" directory="outputdir/comparison_output/" visible="false" recurse="true" /> | 248 <discover_datasets ext="txt" pattern="(?P<name>.+)\.txt" directory="outputdir/comparison_output/" visible="false" recurse="true" /> |
228 <filter> isinstance(in_fasta, list) and "comparison" in out_add</filter> | 249 <filter> isinstance(transcripts, list) and "comparison" in out_add</filter> |
229 </collection> | 250 </collection> |
230 <collection name="details" type="list:list" label="${tool.name} on ${on_string}: detailed output"> | 251 <collection name="details" type="list:list" label="${tool.name} on ${on_string}: detailed output"> |
231 <discover_datasets pattern="(?P<identifier_0>.+)_____(?P<identifier_1>.+)\.(?P<ext>txt)" directory="details/" visible="false" /> | 252 <discover_datasets pattern="(?P<identifier_0>.+)_____(?P<identifier_1>.+)\.(?P<ext>txt)" directory="details/" visible="false" /> |
232 <filter>"details" in out_add</filter> | 253 <filter>"details" in out_add</filter> |
233 </collection> | 254 </collection> |
236 <filter>"details_plots" in out_add</filter> | 257 <filter>"details_plots" in out_add</filter> |
237 </collection> | 258 </collection> |
238 </outputs> | 259 </outputs> |
239 <tests> | 260 <tests> |
240 <test expect_num_outputs="7"> | 261 <test expect_num_outputs="7"> |
241 <param name="in_fasta" value="idba.fasta,Trinity.fasta" ftype="fasta" /> | 262 <param name="transcripts" value="idba.fasta,Trinity.fasta" ftype="fasta" /> |
242 <param name="r" value="Saccharomyces_cerevisiae.R64-1-1.75.dna.toplevel.fa" ftype="fasta" /> | 263 <param name="r" value="Saccharomyces_cerevisiae.R64-1-1.75.dna.toplevel.fa" ftype="fasta" /> |
243 <conditional name="gene_coordinates"> | 264 <conditional name="gene_coordinates"> |
244 <param name="use_gtf" value="true" /> | 265 <param name="use_gtf" value="true" /> |
245 <param name="gtf" value="Saccharomyces_cerevisiae.R64-1-1.75.gtf" ftype="gtf" /> | 266 <param name="gtf" value="Saccharomyces_cerevisiae.R64-1-1.75.gtf" ftype="gtf" /> |
246 <param name="disable_infer_genes" value="true" /> | 267 <param name="disable_infer_genes" value="true" /> |
258 <expand macro="details_output_test" assembler="Trinity" /> | 279 <expand macro="details_output_test" assembler="Trinity" /> |
259 <expand macro="details_output_test" assembler="idba" /> | 280 <expand macro="details_output_test" assembler="idba" /> |
260 </output_collection> | 281 </output_collection> |
261 </test> | 282 </test> |
262 <test expect_num_outputs="6"> | 283 <test expect_num_outputs="6"> |
263 <param name="in_fasta" value="Trinity.fasta" ftype="fasta" /> | 284 <param name="transcripts" value="Trinity.fasta" ftype="fasta" /> |
264 <conditional name="gene_coordinates"> | 285 <conditional name="gene_coordinates"> |
265 <param name="use_gtf" value="false" /> | 286 <param name="use_gtf" value="false" /> |
266 </conditional> | 287 </conditional> |
267 <param name="min_alignment" value="30" /> | 288 <param name="min_alignment" value="30" /> |
268 <param name="lower_threshold" value="45" /> | 289 <param name="lower_threshold" value="45" /> |
282 <element name="Trinity"> | 303 <element name="Trinity"> |
283 <expand macro="element_has_text" name="Nx" text="PNG" /> | 304 <expand macro="element_has_text" name="Nx" text="PNG" /> |
284 <expand macro="element_has_text" name="transcript_length" text="PNG" /> | 305 <expand macro="element_has_text" name="transcript_length" text="PNG" /> |
285 </element> | 306 </element> |
286 </output_collection> | 307 </output_collection> |
308 </test> | |
309 <test expect_num_outputs="6"> | |
310 <param name="transcripts" value="Trinity.fasta" ftype="fasta" /> | |
311 <conditional name="gene_coordinates"> | |
312 <param name="use_gtf" value="false" /> | |
313 </conditional> | |
314 <param name="min_alignment" value="30" /> | |
315 <param name="lower_threshold" value="45" /> | |
316 <param name="upper_threshold" value="95" /> | |
317 <param name="out_sr" value="txt,tex,tsv,pdf" /> | |
318 <param name="out_add" value="logs,details_plots" /> | |
319 <conditional name="busco_option"> | |
320 <param name="busco" value="true"/> | |
321 <param name="lineage" value="metazoa"/> | |
322 </conditional> | |
323 <expand macro="pdf_output_test" /> | |
324 <expand macro="tex_output_test" /> | |
325 <expand macro="tsv_output_test" /> | |
326 <expand macro="txt_output_test" /> | |
327 <output_collection name="list_logs" type="list"> | |
328 <expand macro="element_has_text" name="Trinity.GeneMarkS_T.err" text="" /> | |
329 <expand macro="element_matching_line" name="rnaQUAST" expression="Thank you for using rnaQUAST!" /> | |
330 </output_collection> | |
331 <output_collection name="details_png" type="list:list" count="1"> | |
332 <element name="Trinity"> | |
333 <expand macro="element_has_text" name="Nx" text="PNG" /> | |
334 <expand macro="element_has_text" name="transcript_length" text="PNG" /> | |
335 </element> | |
336 </output_collection> | |
337 <assert_command> | |
338 <has_text text="--busco metazoa"/> | |
339 </assert_command> | |
287 </test> | 340 </test> |
288 </tests> | 341 </tests> |
289 <help><![CDATA[ | 342 <help><![CDATA[ |
290 **What is rnaQUAST** | 343 **What is rnaQUAST** |
291 - a quality assessment tool for de novo transcriptome assemblies | 344 - a quality assessment tool for de novo transcriptome assemblies |