Mercurial > repos > iuc > metaphlan
comparison metaphlan.xml @ 2:a92a632c4d9b draft
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/metaphlan/ commit f1c6f4fe1e572ace84cf9106bc253603f55aac55"
author | iuc |
---|---|
date | Mon, 14 Jun 2021 12:48:10 +0000 |
parents | b89b0765695d |
children | ff8f55893e7d |
comparison
equal
deleted
inserted
replaced
1:b89b0765695d | 2:a92a632c4d9b |
---|---|
193 python '$__tool_directory__/formatoutput.py' | 193 python '$__tool_directory__/formatoutput.py' |
194 split_levels | 194 split_levels |
195 --metaphlan_output '$output_file' | 195 --metaphlan_output '$output_file' |
196 --outdir 'split_levels' | 196 --outdir 'split_levels' |
197 $out.legacy_output | 197 $out.legacy_output |
198 && | 198 |
199 ls split_levels | |
200 #end if | 199 #end if |
201 | 200 |
202 #if $out.krona_output | 201 #if $out.krona_output |
203 && | 202 && |
204 python '$__tool_directory__/formatoutput.py' | 203 python '$__tool_directory__/formatoutput.py' |
209 ]]></command> | 208 ]]></command> |
210 <inputs> | 209 <inputs> |
211 <section name="inputs" title="Inputs" expanded="true"> | 210 <section name="inputs" title="Inputs" expanded="true"> |
212 <conditional name="in"> | 211 <conditional name="in"> |
213 <param name="selector" type="select" label="Input(s)"> | 212 <param name="selector" type="select" label="Input(s)"> |
214 <option value="raw" selected="true">Fasta/FastQ file(s) with metagenomic reads</option> | 213 <option value="raw" selected="true">Fasta/FastQ file(s) with microbiota reads</option> |
215 <option value="sam">Externally BowTie2-mapped SAM file</option> | 214 <option value="sam">Externally BowTie2-mapped SAM file</option> |
216 <option value="bowtie2out">Intermediary mapping file of the metagenome generated by a previous MetaPhlAn run</option> | 215 <option value="bowtie2out">Intermediary mapping file of the microbiota generated by a previous MetaPhlAn run</option> |
217 </param> | 216 </param> |
218 <when value="raw"> | 217 <when value="raw"> |
219 <conditional name="raw_in"> | 218 <conditional name="raw_in"> |
220 <param name="selector" type="select" label="Fasta/FastQ file(s) with metagenomic reads"> | 219 <param name="selector" type="select" label="Fasta/FastQ file(s) with microbiota reads"> |
221 <option value="single" selected="true">One single-end file</option> | 220 <option value="single" selected="true">One single-end file</option> |
222 <option value="multiple">Multiple single-end files</option> | 221 <option value="multiple">Multiple single-end files</option> |
223 <option value="paired">Paired-end files</option> | 222 <option value="paired">Paired-end files</option> |
224 </param> | 223 </param> |
225 <when value="single"> | 224 <when value="single"> |
226 <param name="in" type="data" format="@FILE_FORMATS@" label="Single-end Fasta/FastQ file with metagenomic reads"/> | 225 <param name="in" type="data" format="@FILE_FORMATS@" label="Single-end Fasta/FastQ file with microbiota reads"/> |
227 </when> | 226 </when> |
228 <when value="multiple"> | 227 <when value="multiple"> |
229 <param name="in" type="data" format="@FILE_FORMATS@" multiple="true" label="Single-end Fasta/FastQ files with metagenomic reads"/> | 228 <param name="in" type="data" format="@FILE_FORMATS@" multiple="true" label="Single-end Fasta/FastQ files with microbiota reads"/> |
230 </when> | 229 </when> |
231 <when value="paired"> | 230 <when value="paired"> |
232 <param name="in_f" type="data" format="@FILE_FORMATS@" label="Forward paired-end Fasta/FastQ file with metagenomic reads"/> | 231 <param name="in_f" type="data" format="@FILE_FORMATS@" label="Forward paired-end Fasta/FastQ file with microbiota reads"/> |
233 <param name="in_r" type="data" format="@FILE_FORMATS@" label="Reverse paired-end Fasta/FastQ file with metagenomic reads"/> | 232 <param name="in_r" type="data" format="@FILE_FORMATS@" label="Reverse paired-end Fasta/FastQ file with microbiota reads"/> |
234 </when> | 233 </when> |
235 </conditional> | 234 </conditional> |
236 <param argument="--read_min_len" type="integer" value="70" label="Minimum length of the reads to be considered when parsing the input file"/> | 235 <param argument="--read_min_len" type="integer" value="70" label="Minimum length of the reads to be considered when parsing the input file"/> |
237 <section name="mapping" title="Mapping" expanded="true"> | 236 <section name="mapping" title="Mapping" expanded="true"> |
238 <param argument="--bt2_ps" type="select" label="Presets options for BowTie2" help="Applied only with FASTA files"> | 237 <param argument="--bt2_ps" type="select" label="Presets options for BowTie2" help="Applied only with FASTA files"> |
243 </param> | 242 </param> |
244 <param argument="--min_mapq_val" type="integer" value="5" label="Minimum mapping quality value (MAPQ)"/> | 243 <param argument="--min_mapq_val" type="integer" value="5" label="Minimum mapping quality value (MAPQ)"/> |
245 </section> | 244 </section> |
246 </when> | 245 </when> |
247 <when value="sam"> | 246 <when value="sam"> |
248 <param name="in" type="data" format="sam" label="Externally BowTie2-mapped SAM file" help="BowTie2 needs to be used first to map metagenom reads"/> | 247 <param name="in" type="data" format="sam" label="Externally BowTie2-mapped SAM file" help="BowTie2 needs to be used first to map microbiota reads"/> |
249 </when> | 248 </when> |
250 <when value="bowtie2out"> | 249 <when value="bowtie2out"> |
251 <param name="in" type="data" format="tabular" label="Intermediary mapping file of the metagenome generated by a previous MetaPhlAn run" | 250 <param name="in" type="data" format="tabular" label="Intermediary mapping file of the microbiota generated by a previous MetaPhlAn run" |
252 help="File needs to be generated with MetaPhlAn versions >3.0"/> | 251 help="File needs to be generated with MetaPhlAn versions >3.0"/> |
253 </when> | 252 </when> |
254 </conditional> | 253 </conditional> |
255 <conditional name="db"> | 254 <conditional name="db"> |
256 <param name="db_selector" type="select" label="Database with clade-specific marker genes"> | 255 <param name="db_selector" type="select" label="Database with clade-specific marker genes"> |
271 </conditional> | 270 </conditional> |
272 </section> | 271 </section> |
273 <section name="analysis" title="Analysis" expanded="true"> | 272 <section name="analysis" title="Analysis" expanded="true"> |
274 <conditional name="analysis_type"> | 273 <conditional name="analysis_type"> |
275 <param argument="-t" type="select" label="Type of analysis to perform"> | 274 <param argument="-t" type="select" label="Type of analysis to perform"> |
276 <option value="rel_ab" selected="true">rel_ab: Profiling a metagenomes in terms of relative abundances</option> | 275 <option value="rel_ab" selected="true">rel_ab: Profiling a microbiota in terms of relative abundances</option> |
277 <option value="rel_ab_w_read_stats">rel_ab_w_read_stats: Profiling a metagenomes in terms of relative abundances and estimate the number of reads comming from each clade</option> | 276 <option value="rel_ab_w_read_stats">rel_ab_w_read_stats: Profiling a microbiota in terms of relative abundances and estimate the number of reads comming from each clade</option> |
278 <option value="reads_map">reads_map: Mapping from reads to clades (only reads hitting a marker)</option> | 277 <option value="reads_map">reads_map: Mapping from reads to clades (only reads hitting a marker)</option> |
279 <option value="clade_profiles">clade_profiles: Normalized marker counts for clades with at least a non-null marker</option> | 278 <option value="clade_profiles">clade_profiles: Normalized marker counts for clades with at least a non-null marker</option> |
280 <option value="clade_specific_strain_tracker">clade_specific_strain_tracker: List of markers present for a specific clade and all its subclades</option> | 279 <option value="clade_specific_strain_tracker">clade_specific_strain_tracker: List of markers present for a specific clade and all its subclades</option> |
281 <option value="marker_ab_table">marker_ab_table: Normalized marker counts (only when > 0.0 and normalized by metagenome size if number of reads is specified)</option> | 280 <option value="marker_ab_table">marker_ab_table: Normalized marker counts (only when > 0.0 and normalized by microbiota size if number of reads is specified)</option> |
282 <option value="marker_counts">marker_counts: Non-normalized marker counts (use with extreme caution)</option> | 281 <option value="marker_counts">marker_counts: Non-normalized marker counts (use with extreme caution)</option> |
283 <option value="marker_pres_table">marker_pres_table: List of markers present in the sample (threshold at 1.0 if not differently specified with --pres_th</option> | 282 <option value="marker_pres_table">marker_pres_table: List of markers present in the sample (threshold at 1.0 if not differently specified with --pres_th</option> |
284 </param> | 283 </param> |
285 <when value="rel_ab"> | 284 <when value="rel_ab"> |
286 <expand macro="tax_lev"/> | 285 <expand macro="tax_lev"/> |
294 <param argument="--clade" type="text" value="" label="Clade for which to extract list of markers present" | 293 <param argument="--clade" type="text" value="" label="Clade for which to extract list of markers present" |
295 help="Markers are also extracted for subclades" /> | 294 help="Markers are also extracted for subclades" /> |
296 <param argument="--min_ab" type="float" optional="true" label="The minimum percentage abundance for the clade"/> | 295 <param argument="--min_ab" type="float" optional="true" label="The minimum percentage abundance for the clade"/> |
297 </when> | 296 </when> |
298 <when value="marker_ab_table"> | 297 <when value="marker_ab_table"> |
299 <param argument="--nreads" type="integer" optional="true" label="Total number of reads in the original metagenome" | 298 <param argument="--nreads" type="integer" optional="true" label="Total number of reads in the original microbiota" |
300 help="It is used for normalizing the length-normalized counts with the metagenome size as well. No normalization applied if the value is not specified"/> | 299 help="It is used for normalizing the length-normalized counts with the microbiota size as well. No normalization applied if the value is not specified"/> |
301 </when> | 300 </when> |
302 <when value="marker_counts"/> | 301 <when value="marker_counts"/> |
303 <when value="marker_pres_table"> | 302 <when value="marker_pres_table"> |
304 <param argument="--pres_th" type="integer" optional="true" label="Threshold for calling a marker present"/> | 303 <param argument="--pres_th" type="integer" optional="true" label="Threshold for calling a marker present"/> |
305 </when> | 304 </when> |
367 <conditional name="in"> | 366 <conditional name="in"> |
368 <param name="selector" value="raw"/> | 367 <param name="selector" value="raw"/> |
369 <conditional name="raw_in"> | 368 <conditional name="raw_in"> |
370 <!-- Single GZ file --> | 369 <!-- Single GZ file --> |
371 <param name="selector" value="single"/> | 370 <param name="selector" value="single"/> |
371 <param name="in" value="no_taxon_input.fasta"/> | |
372 </conditional> | |
373 <param name="read_min_len" value="70"/> | |
374 <section name="mapping"> | |
375 <param name="bt2_ps" value="sensitive"/> | |
376 <param name="min_mapq_val" value="5"/> | |
377 </section> | |
378 </conditional> | |
379 <conditional name="db"> | |
380 <!-- Cached db --> | |
381 <param name="db_selector" value="cached"/> | |
382 <param name="cached_db" value="test-db-20210409"/> | |
383 </conditional> | |
384 </section> | |
385 <section name="analysis"> | |
386 <conditional name="analysis_type"> | |
387 <param name="t" value="rel_ab"/> | |
388 <conditional name="tax_lev"> | |
389 <param name="tax_lev" value="a"/> | |
390 <param name="split_levels" value="true"/> | |
391 </conditional> | |
392 </conditional> | |
393 <param name="min_cu_len" value="2000"/> | |
394 <param name="organism_profiling" value="add_viruses"/> | |
395 <param name="stat" value="avg_g"/> | |
396 <param name="stat_q" value="0.2"/> | |
397 <param name="perc_nonzero" value="0.33"/> | |
398 <param name="avoid_disqm" value="true"/> | |
399 </section> | |
400 <section name="out"> | |
401 <param name="sample_id_key" value="SampleID"/> | |
402 <param name="sample_id" value="Metaphlan_Analysis"/> | |
403 <param name="use_group_representative" value="false"/> | |
404 <param name="legacy_output" value="false"/> | |
405 <param name="CAMI_format_output" value="false"/> | |
406 <param name="unknown_estimation" value="false"/> | |
407 <param name="krona_output" value="true"/> | |
408 </section> | |
409 <output name="output_file" ftype="tabular"> | |
410 <assert_contents> | |
411 <has_text text="UNKNOWN"/> | |
412 </assert_contents> | |
413 </output> | |
414 <output name="bowtie2out" ftype="tabular"> | |
415 <assert_contents> | |
416 <not_has_text text="HWI-EAS109_102883399:3:104:7342:14360/1"/> | |
417 <has_n_lines n="2"/> | |
418 </assert_contents> | |
419 </output> | |
420 <output name="sam_output_file" ftype="sam"> | |
421 <assert_contents> | |
422 <has_text text="SN:13076__A0A2I1PE66__CYJ72_10760"/> | |
423 </assert_contents> | |
424 </output> | |
425 <output name="biom_output_file" ftype="biom1"> | |
426 <assert_contents> | |
427 <not_has_text text="k__Bacteria"/> | |
428 <not_has_text text="p__Actinobacteria"/> | |
429 </assert_contents> | |
430 </output> | |
431 <output_collection name="levels" type="list" > | |
432 <element name="all" ftype="tabular"> | |
433 <assert_contents> | |
434 <has_text text="class"/> | |
435 <has_n_columns n="17"/> | |
436 <has_n_lines n="1"/> | |
437 </assert_contents> | |
438 </element> | |
439 <element name="kingdom" ftype="tabular"> | |
440 <assert_contents> | |
441 <has_text text="kingdom_id"/> | |
442 <has_n_columns n="3"/> | |
443 <has_n_lines n="1"/> | |
444 </assert_contents> | |
445 </element> | |
446 <element name="phylum" ftype="tabular"> | |
447 <assert_contents> | |
448 <has_text text="phylum_id"/> | |
449 <not_has_text text="kingdom_id"/> | |
450 <has_n_columns n="3"/> | |
451 <has_n_lines n="1"/> | |
452 </assert_contents> | |
453 </element> | |
454 <element name="class" ftype="tabular"> | |
455 <assert_contents> | |
456 <has_text text="class_id"/> | |
457 <not_has_text text="phylum_id"/> | |
458 <has_n_columns n="3"/> | |
459 <has_n_lines n="1"/> | |
460 </assert_contents> | |
461 </element> | |
462 <element name="order" ftype="tabular"> | |
463 <assert_contents> | |
464 <has_text text="order_id"/> | |
465 <not_has_text text="class_id"/> | |
466 <has_n_columns n="3"/> | |
467 <has_n_lines n="1"/> | |
468 </assert_contents> | |
469 </element> | |
470 <element name="family" ftype="tabular"> | |
471 <assert_contents> | |
472 <has_text text="family_id"/> | |
473 <not_has_text text="order"/> | |
474 <has_n_columns n="3"/> | |
475 <has_n_lines n="1"/> | |
476 </assert_contents> | |
477 </element> | |
478 <element name="genus" ftype="tabular"> | |
479 <assert_contents> | |
480 <has_text text="genus_id"/> | |
481 <not_has_text text="family"/> | |
482 <has_n_columns n="3"/> | |
483 <has_n_lines n="1"/> | |
484 </assert_contents> | |
485 </element> | |
486 <element name="species" ftype="tabular"> | |
487 <assert_contents> | |
488 <has_text text="species_id"/> | |
489 <not_has_text text="genus"/> | |
490 <has_n_columns n="3"/> | |
491 <has_n_lines n="1"/> | |
492 </assert_contents> | |
493 </element> | |
494 <element name="strains" ftype="tabular"> | |
495 <assert_contents> | |
496 <has_text text="strains_id"/> | |
497 <not_has_text text="species_id"/> | |
498 <has_n_columns n="3"/> | |
499 <has_n_lines n="1"/> | |
500 </assert_contents> | |
501 </element> | |
502 </output_collection> | |
503 <output name="krona_output_file" ftype="tabular"> | |
504 <assert_contents> | |
505 <not_has_text text="k__Bacteria"/> | |
506 <has_n_lines n="0"/> | |
507 </assert_contents> | |
508 </output> | |
509 </test> | |
510 <test expect_num_outputs="6"> | |
511 <section name="inputs"> | |
512 <conditional name="in"> | |
513 <param name="selector" value="raw"/> | |
514 <conditional name="raw_in"> | |
515 <!-- Single GZ file --> | |
516 <param name="selector" value="single"/> | |
372 <param name="in" value="SRS014464-Anterior_nares.fasta.gz"/> | 517 <param name="in" value="SRS014464-Anterior_nares.fasta.gz"/> |
373 </conditional> | 518 </conditional> |
374 <param name="read_min_len" value="70"/> | 519 <param name="read_min_len" value="70"/> |
375 <section name="mapping"> | 520 <section name="mapping"> |
376 <param name="bt2_ps" value="sensitive"/> | 521 <param name="bt2_ps" value="sensitive"/> |
914 - unambiguous taxonomic assignments; | 1059 - unambiguous taxonomic assignments; |
915 - accurate estimation of organismal relative abundance; | 1060 - accurate estimation of organismal relative abundance; |
916 - species-level resolution for bacteria, archaea, eukaryotes and viruses; | 1061 - species-level resolution for bacteria, archaea, eukaryotes and viruses; |
917 - strain identification and tracking | 1062 - strain identification and tracking |
918 - orders of magnitude speedups compared to existing methods. | 1063 - orders of magnitude speedups compared to existing methods. |
919 - metagenomic strain-level population genomics | 1064 - microbiota strain-level population genomics |
920 | 1065 |
921 MetaPhlAn clade-abundance estimation | 1066 MetaPhlAn clade-abundance estimation |
922 ------------------------------------ | 1067 ------------------------------------ |
923 | 1068 |
924 The basic usage of MetaPhlAn consists in the identification of the clades (from phyla to species and | 1069 The basic usage of MetaPhlAn consists in the identification of the clades (from phyla to species and |
925 strains in particular cases) present in the metagenome obtained from a microbiome sample and their | 1070 strains in particular cases) present in the microbiota obtained from a microbiome sample and their |
926 relative abundance. | 1071 relative abundance. |
927 | 1072 |
928 Marker level analysis | 1073 Marker level analysis |
929 --------------------- | 1074 --------------------- |
930 | 1075 |
942 | 1087 |
943 Metaphlan takes as input either: | 1088 Metaphlan takes as input either: |
944 | 1089 |
945 - one or several sequence files in Fasta, FastQ (compressed or not) | 1090 - one or several sequence files in Fasta, FastQ (compressed or not) |
946 - a BowTie2 produced SAM file | 1091 - a BowTie2 produced SAM file |
947 - an intermediary mapping file of the metagenome generated by a previous MetaPhlAn run | 1092 - an intermediary mapping file of the microbiota generated by a previous MetaPhlAn run |
948 | 1093 |
949 It also need the reference database, which can be locally installed or customized using the dedicated tools. | 1094 It also need the reference database, which can be locally installed or customized using the dedicated tools. |
950 | 1095 |
951 Outputs | 1096 Outputs |
952 ======= | 1097 ======= |