Mercurial > repos > mbernt > maxbin2
comparison maxbin2.xml @ 6:2bc40bfbcfb4 draft
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/maxbin2/ commit e0e4e512a0858295ce3d445b9413de2b5bcfcd78
author | iuc |
---|---|
date | Mon, 16 Oct 2023 07:46:13 +0000 |
parents | 8a0473eb465e |
children | 28a0b1446d2b |
comparison
equal
deleted
inserted
replaced
5:8a0473eb465e | 6:2bc40bfbcfb4 |
---|---|
1 <tool id="maxbin2" name="MaxBin2" version="@MAXBIN_VERSION@+galaxy3"> | 1 <tool id="maxbin2" name="MaxBin2" version="@MAXBIN_VERSION@+galaxy4"> |
2 <description>clusters metagenomic contigs into bins</description> | 2 <description>clusters metagenomic contigs into bins</description> |
3 <xrefs> | |
4 <xref type="bio.tools">masigpro</xref> | |
5 </xrefs> | |
6 <macros> | 3 <macros> |
7 <token name="@MAXBIN_VERSION@">2.2.7</token> | 4 <token name="@MAXBIN_VERSION@">2.2.7</token> |
8 <xml name="contig"> | 5 <xml name="contig"> |
9 <param argument="-contig" type="data" format="fasta,fasta.gz" label="Contig file"/> | 6 <param argument="-contig" type="data" format="fasta,fasta.gz" label="Contig file"/> |
10 </xml> | 7 </xml> |
17 <xml name="reads_extra_params"> | 14 <xml name="reads_extra_params"> |
18 <param name="output_abundances" type="boolean" checked="false" label="Output abundances" help="" /> | 15 <param name="output_abundances" type="boolean" checked="false" label="Output abundances" help="" /> |
19 <param argument="--reassembly" type="boolean" truevalue="-reassembly" falsevalue="" checked="false" label="Reassembly" help="Reassembly option is still highly experimental. To use this function, you need to feed MaxBin interleaved paired-end fastq or fasta file." /> | 16 <param argument="--reassembly" type="boolean" truevalue="-reassembly" falsevalue="" checked="false" label="Reassembly" help="Reassembly option is still highly experimental. To use this function, you need to feed MaxBin interleaved paired-end fastq or fasta file." /> |
20 </xml> | 17 </xml> |
21 </macros> | 18 </macros> |
19 <xrefs> | |
20 <xref type="bio.tools">maxbin</xref> | |
21 </xrefs> | |
22 <requirements> | 22 <requirements> |
23 <requirement type="package" version="@MAXBIN_VERSION@">maxbin2</requirement> | 23 <requirement type="package" version="@MAXBIN_VERSION@">maxbin2</requirement> |
24 </requirements> | 24 </requirements> |
25 <version_command><![CDATA[run_MaxBin.pl -version | head -n 1]]></version_command> | 25 <version_command><![CDATA[run_MaxBin.pl -version | head -n 1]]></version_command> |
26 <command detect_errors="exit_code"><![CDATA[ | 26 <command detect_errors="exit_code"><![CDATA[ |
27 ## generate read or abundance files | 27 ## generate read or abundance files |
28 #import re | |
28 #if $assembly.inputs.type == 'reads' | 29 #if $assembly.inputs.type == 'reads' |
29 #if $assembly.type == 'individual' | 30 #if $assembly.type == 'individual' |
30 echo '$assembly.inputs.reads' >> reads_list && | 31 ## uncompress .gz reads files if necessary |
32 #set $e = $assembly.inputs.reads | |
33 #set $identifier = re.sub('[^\s\w\-\\.]', '_', str($e.element_identifier)) | |
34 #if $e.ext.endswith(".gz") | |
35 gunzip -c '$e' > '$identifier' && | |
36 echo '$identifier' >> reads_list && | |
37 #else | |
38 ln -s '$e' '$identifier' && | |
39 echo '$identifier' >> reads_list && | |
40 #end if | |
31 #else | 41 #else |
32 #for $r in $assembly.inputs.reads | 42 #for $i, $r in enumerate($assembly.inputs.reads) |
33 #if $r | 43 #if $r |
34 echo '$r' >> reads_list && | 44 #set $identifier = re.sub('[^\s\w\-\\.]', '_', str($r.element_identifier)) |
45 #set $newid = $identifier + '_' + str($i) | |
46 #if $r.ext.endswith(".gz") | |
47 gunzip -c '$r' > '$newid' && | |
48 echo '$newid' >> reads_list && | |
49 #else | |
50 ln -s '$r' '$newid' && | |
51 echo '$newid' >> reads_list && | |
52 #end if | |
35 #end if | 53 #end if |
36 #end for | 54 #end for |
37 #end if | 55 #end if |
38 #else if $assembly.inputs.type == 'abund' | 56 #else if $assembly.inputs.type == 'abund' |
39 #if $assembly.type == 'individual' | 57 #if $assembly.type == 'individual' |
92 </param> | 110 </param> |
93 <when value="individual"> | 111 <when value="individual"> |
94 <conditional name="inputs"> | 112 <conditional name="inputs"> |
95 <expand macro="input_type"/> | 113 <expand macro="input_type"/> |
96 <when value="reads"> | 114 <when value="reads"> |
97 <param argument="-reads" type="data" format="fasta,fastq" label="Reads file"/> | 115 <param argument="-reads" type="data" format="fasta,fastq,fastq.gz,fasta.gz" label="Reads file"/> |
98 <expand macro="reads_extra_params"/> | 116 <expand macro="reads_extra_params"/> |
99 </when> | 117 </when> |
100 <when value="abund"> | 118 <when value="abund"> |
101 <param argument="-abund" type="data" format="tabular" label="Abundance file"/> | 119 <param argument="-abund" type="data" format="tabular" label="Abundance file"/> |
102 </when> | 120 </when> |
342 <has_text text="out.002.fasta"/> | 360 <has_text text="out.002.fasta"/> |
343 <has_text text="2878"/> | 361 <has_text text="2878"/> |
344 </assert_contents> | 362 </assert_contents> |
345 </output> | 363 </output> |
346 </test> | 364 </test> |
365 <!-- test w contigs and reads in fastqsanger format as input --> | |
366 <test expect_num_outputs="4"> | |
367 <param name="contig" value="test4_contigs.fasta" ftype="fasta" /> | |
368 <conditional name="assembly"> | |
369 <param name="type" value="individual"/> | |
370 <conditional name="inputs"> | |
371 <param name="type" value="reads"/> | |
372 <param name="reads" value="test4_reads.fastqsanger" ftype="fastqsanger"/> | |
373 <param name="output_abundances" value="false"/> | |
374 <param name="reassembly" value=""/> | |
375 </conditional> | |
376 </conditional> | |
377 <section name="adv"> | |
378 <param name="min_contig_length" value="1000"/> | |
379 <param name="max_iteration" value="50"/> | |
380 <param name="prob_threshold" value="0.5"/> | |
381 </section> | |
382 <section name="output"> | |
383 <param name="plotmarker" value=""/> | |
384 <param name="marker" value="false"/> | |
385 <param name="markers" value="false" /> | |
386 <param name="log" value="false"/> | |
387 <param name="markerset" value="107"/> | |
388 </section> | |
389 <output_collection name="bins" type="list" count="2"> | |
390 <element name="001" file="4/out.001.fasta" ftype="fasta"/> | |
391 <element name="002" file="4/out.002.fasta" ftype="fasta"/> | |
392 </output_collection> | |
393 <output name="summary" file="4/out.summary" ftype="tabular" /> | |
394 <output name="noclass" file="4/out.noclass" ftype="fasta" /> | |
395 <output name="toshort" file="4/out.tooshort" ftype="fasta" /> | |
396 </test> | |
397 <!-- test w contigs and reads in fastqsanger.gz format as input --> | |
398 <test expect_num_outputs="4"> | |
399 <param name="contig" value="test4_contigs.fasta" ftype="fasta" /> | |
400 <conditional name="assembly"> | |
401 <param name="type" value="individual"/> | |
402 <conditional name="inputs"> | |
403 <param name="type" value="reads"/> | |
404 <param name="reads" value="test4_reads.fastqsanger.gz" ftype="fastqsanger.gz"/> | |
405 <param name="output_abundances" value="false"/> | |
406 <param name="reassembly" value=""/> | |
407 </conditional> | |
408 </conditional> | |
409 <section name="adv"> | |
410 <param name="min_contig_length" value="1000"/> | |
411 <param name="max_iteration" value="50"/> | |
412 <param name="prob_threshold" value="0.5"/> | |
413 </section> | |
414 <section name="output"> | |
415 <param name="plotmarker" value=""/> | |
416 <param name="marker" value="false"/> | |
417 <param name="markers" value="false" /> | |
418 <param name="log" value="false"/> | |
419 <param name="markerset" value="107"/> | |
420 </section> | |
421 <output_collection name="bins" type="list" count="2"> | |
422 <element name="001" file="4/out.001.fasta" ftype="fasta"/> | |
423 <element name="002" file="4/out.002.fasta" ftype="fasta"/> | |
424 </output_collection> | |
425 <output name="summary" file="4/out.summary" ftype="tabular" /> | |
426 <output name="noclass" file="4/out.noclass" ftype="fasta" /> | |
427 <output name="toshort" file="4/out.tooshort" ftype="fasta" /> | |
428 </test> | |
429 <!-- test w co-assembled contigs and multiple reads as .gz and optional outputs --> | |
430 <test expect_num_outputs="9"> | |
431 <param name="contig" value="test4_contigs.fasta" ftype="fasta" /> | |
432 <conditional name="assembly"> | |
433 <param name="type" value="coassembly"/> | |
434 <conditional name="inputs"> | |
435 <param name="type" value="reads"/> | |
436 <param name="reads" value="test4_reads.fastqsanger.gz,test4_reads.fastqsanger.gz" ftype="fasta"/> | |
437 <param name="output_abundances" value="true"/> | |
438 <param name="reassembly" value=""/> | |
439 </conditional> | |
440 </conditional> | |
441 <section name="adv"> | |
442 <param name="min_contig_length" value="1000"/> | |
443 <param name="max_iteration" value="50"/> | |
444 <param name="prob_threshold" value="0.5"/> | |
445 </section> | |
446 <section name="output"> | |
447 <param name="plotmarker" value="true"/> | |
448 <param name="marker" value="true"/> | |
449 <param name="markers" value="true" /> | |
450 <param name="log" value="true"/> | |
451 <param name="markerset" value="107"/> | |
452 </section> | |
453 <output_collection name="bins" type="list" count="2"> | |
454 <element name="001" file="4/out.001.fasta" ftype="fasta"/> | |
455 <element name="002" file="4/out.002.fasta" ftype="fasta"/> | |
456 </output_collection> | |
457 <output name="summary" ftype="tabular"> | |
458 <assert_contents> | |
459 <has_text text="Completeness"/> | |
460 <has_text text="out.001.fasta"/> | |
461 </assert_contents> | |
462 </output> | |
463 <output name="noclass" file="4/out.noclass" ftype="fasta" /> | |
464 <output name="toshort" file="4/out.tooshort" ftype="fasta" /> | |
465 <output name="log" ftype="txt" > | |
466 <assert_contents> | |
467 <has_text text="Input contig"/> | |
468 <has_text text="Elapsed time"/> | |
469 <has_text text="Yielded 2 bins for contig (scaffold) file"/> | |
470 </assert_contents> | |
471 </output> | |
472 <output name="abundout" file="4/out.abund1" ftype="tabular" /> | |
473 <output name="marker" file="4/out.marker" ftype="tabular" /> | |
474 <output name="plot" file="4/out.marker.pdf" ftype="pdf" compare="sim_size" /> | |
475 <output_collection name="markers" type="list" count="2"> | |
476 <element name="001" ftype="fasta"> | |
477 <assert_contents> | |
478 <has_text text=">out.001.Methyltransf_5"/> | |
479 </assert_contents> | |
480 </element> | |
481 <element name="002" ftype="fasta"> | |
482 <assert_contents> | |
483 <has_text text=">out.002.Methyltransf_5"/> | |
484 </assert_contents> | |
485 </element> | |
486 </output_collection> | |
487 </test> | |
347 </tests> | 488 </tests> |
348 <help><![CDATA[ | 489 <help><![CDATA[ |
349 MaxBin is a software that clusters metagenomic contigs into different bins, | 490 MaxBin is a software that clusters metagenomic contigs into different bins, |
350 each consists (hopefully) of contigs from one species. MaxBin uses the | 491 each consists (hopefully) of contigs from one species. MaxBin uses the |
351 nucleotide composition information and contig abundance information to do | 492 nucleotide composition information and contig abundance information to do |