diff metaphlan.xml @ 5:6dee4abadccb draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/metaphlan/ commit f3a89af137b13715f9fb13383577aceb2c445ce6
author iuc
date Sat, 03 Dec 2022 10:43:21 +0000
parents ff8f55893e7d
children 2131d7dca455
line wrap: on
line diff
--- a/metaphlan.xml	Wed Feb 02 22:03:11 2022 +0000
+++ b/metaphlan.xml	Sat Dec 03 10:43:21 2022 +0000
@@ -107,7 +107,7 @@
 #if $inputs.db.db_selector == "history"
 mkdir 'ref_db'
 &&
-bowtie2-build '$inputs.db.bowtie2db' 'ref_db/custom_db'
+bowtie2-build --large-index '$inputs.db.bowtie2db' 'ref_db/custom_db'
 &&
 python '$__tool_directory__/customizemetadata.py'
     transform_json_to_pkl
@@ -123,9 +123,15 @@
     --read_min_len $inputs.in.read_min_len
     --bt2_ps '$inputs.in.mapping.bt2_ps'
     --min_mapq_val $inputs.in.mapping.min_mapq_val
+    #if $ext == "sam"
+        --nreads \$(cat '$file_path' | grep -c -v '^@')
+    #end if
 #else
     '$inputs.in.in'
     --input_type '$inputs.in.selector'
+    #if $inputs.in.selector == "sam"
+        --nreads \$(cat '$inputs.in.in' | grep -c -v '^@')
+    #end if
 #end if
 #if $inputs.db.db_selector == "cached"
     --bowtie2db '$inputs.db.cached_db.fields.path'
@@ -334,7 +340,7 @@
             <param argument="--sample_id" type="text" value="Metaphlan_Analysis" label="Sample ID for this analysis"/>
             <param argument="--use_group_representative" type='boolean' checked="false" truevalue='--use_group_representative' falsevalue='' 
                 label="Use a species as representative for species groups?"/>
-            <param name="legacy_output" argument="--legacy-output" type='boolean' checked="false" truevalue='--legacy-output' falsevalue='' 
+            <param argument="--legacy-output" type='boolean' checked="false" truevalue='--legacy-output' falsevalue='' 
                 label="Old MetaPhlAn2 two columns output?"/>
             <param argument="--CAMI_format_output" type='boolean' checked="false" truevalue='--CAMI_format_output' falsevalue='' 
                 label="Report the profiling using the CAMI output format?"/>
@@ -408,7 +414,7 @@
             </section>
             <output name="output_file" ftype="tabular">
                 <assert_contents>
-                    <has_text text="UNKNOWN"/>
+                    <has_text text="UNCLASSIFIED"/>
                 </assert_contents>
             </output>
             <output name="bowtie2out" ftype="tabular">
@@ -503,7 +509,8 @@
             <output name="krona_output_file" ftype="tabular">
                 <assert_contents>
                     <not_has_text text="k__Bacteria"/>
-                    <has_n_lines n="0"/>
+                    <has_n_lines n="1" delta="1"/>
+                    <has_size value="1" delta="1"/>
                 </assert_contents>
             </output>
         </test>
@@ -1051,7 +1058,7 @@
 ============
 
 MetaPhlAn is a computational tool for profiling the composition of microbial communities (Bacteria, 
-Archaea and Eukaryotes) from metagenomic shotgun sequencing data (i.e. not 16S) with species-level. 
+Archaea and Eukaryotes) from metagenomic shotgun sequencing data (i.e. not 16S) at species-level. 
 
 MetaPhlAn relies on ~1.1M unique clade-specific marker genes identified from ~100,000 reference genomes 
 (~99,500 bacterial and archaeal and ~500 eukaryotic), allowing:
@@ -1077,8 +1084,8 @@
 aggregated marker information. Such capability comes with several slightly different flavours and 
 are a way to perform strain tracking and comparison across multiple samples.
 
-Usually, MetaPhlAn is first ran with the default parameter for the type of analysis to profile the 
-species present in the community, and then a strain-level profiling can be performed to zoom-in into 
+Usually, MetaPhlAn is first ran with default parameters for the type of analysis to profile the 
+species present in the community, and then a strain-level profiling can be performed to zoom-in on 
 specific species of interest. This operation can be performed quickly as it exploits the bowtie2out 
 intermediate file saved during the execution of the default analysis type.
 
@@ -1087,16 +1094,16 @@
 
 Metaphlan takes as input either:
 
-- one or several sequence files in Fasta, FastQ (compressed or not)
+- one or several sequence files in Fasta, FastQ (whether compressed or not)
 - a BowTie2 produced SAM file
 - an intermediary mapping file of the microbiota generated by a previous MetaPhlAn run
 
-It also need the reference database, which can be locally installed or customized using the dedicated tools.
+It also needs the reference database, which can be locally installed or customized using the dedicated tools.
 
 Outputs
 =======
 
-The main output file is a tab-separated file with the predicted taxon relative abundances.
+The main output is a tab-separated file with the predicted taxon relative abundances.
 
 It also generates a BIOM file and some intermediate files (SAM and BowTie2out) if sequence files are given as inputs.
 
@@ -1106,7 +1113,7 @@
 
 To get more information about MetaPhlAn usage and use cases, please refer to the `Metaphlan documentation`_.
 
-.. _Metaphlan documentation: https://github.com/biobakery/MetaPhlAn/wiki/MetaPhlAn-3.0#basic-usage
+.. _Metaphlan documentation: https://github.com/biobakery/MetaPhlAn/wiki/MetaPhlAn-4#Basic-Usage
 
     ]]></help>
     <expand macro="citations"/>