Mercurial > repos > thanhlv > metaphlan4
comparison metaphlan.xml @ 0:12e29dbb7041 draft default tip
planemo upload for repository https://github.com/quadram-institute-bioscience/galaxy-tools/tree/master/tools/metaphlan/
| author | thanhlv |
|---|---|
| date | Mon, 13 Feb 2023 11:36:42 +0000 |
| parents | |
| children |
comparison
equal
deleted
inserted
replaced
| -1:000000000000 | 0:12e29dbb7041 |
|---|---|
| 1 <tool id="metaphlan4" name="MetaPhlAn4" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@"> | |
| 2 <description>to profile the composition of microbial communities</description> | |
| 3 <macros> | |
| 4 <import>macros.xml</import> | |
| 5 <xml name="tax_lev"> | |
| 6 <conditional name="tax_lev"> | |
| 7 <param argument="--tax_lev" type="select" label="Taxonomic level for the relative abundance output"> | |
| 8 <option value="a" selected="true">All taxonomic levels</option> | |
| 9 <option value="k">Kingdoms only</option> | |
| 10 <option value="p">Phyla only</option> | |
| 11 <option value="c">Classes only</option> | |
| 12 <option value="o">Orders only</option> | |
| 13 <option value="f">Families only</option> | |
| 14 <option value="g">Genera only</option> | |
| 15 <option value="s">Species only</option> | |
| 16 </param> | |
| 17 <when value="a"> | |
| 18 <param name="split_levels" type='boolean' checked="false" truevalue='true' falsevalue='false' | |
| 19 label="Generate a report for each taxonomic level?" help="It will be in addition to the default output"/> | |
| 20 </when> | |
| 21 <when value="k"/> | |
| 22 <when value="p"/> | |
| 23 <when value="c"/> | |
| 24 <when value="o"/> | |
| 25 <when value="f"/> | |
| 26 <when value="g"/> | |
| 27 <when value="s"/> | |
| 28 </conditional> | |
| 29 </xml> | |
| 30 <token name="@FILE_FORMATS@">fastq,fastq.gz,fastq.bz2,fasta,fasta.gz,fasta.bz2</token> | |
| 31 </macros> | |
| 32 <expand macro="edam_ontology"/> | |
| 33 <expand macro="requirements"/> | |
| 34 <version_command>metaphlan -v</version_command> | |
| 35 <command detect_errors="aggressive"><![CDATA[ | |
| 36 #if $inputs.in.selector == "raw" | |
| 37 #if $inputs.in.raw_in.selector == "single" | |
| 38 #set full_ext=$inputs.in.raw_in.in.datatype.file_ext | |
| 39 #if $full_ext.endswith("gz") | |
| 40 #set $file_path="in" | |
| 41 zcat '$inputs.in.raw_in.in' > '$file_path' | |
| 42 && | |
| 43 #else if $full_ext.endswith("bz2") | |
| 44 #set $file_path="in" | |
| 45 bzcat '$inputs.in.raw_in.in' > '$file_path' | |
| 46 && | |
| 47 #else | |
| 48 #set $file_path=$inputs.in.raw_in.in | |
| 49 #end if | |
| 50 #else if $inputs.in.raw_in.selector == "multiple" | |
| 51 #set full_ext=$inputs.in.raw_in.in[0].datatype.file_ext | |
| 52 #set file_path="" | |
| 53 #set sep="" | |
| 54 #for $i, $f in enumerate($inputs.in.raw_in.in) | |
| 55 #if $f.datatype.file_ext != $full_ext | |
| 56 echo "Different datatypes for input files" | |
| 57 && | |
| 58 exit 1 | |
| 59 #end if | |
| 60 #if $full_ext.endswith("gz") | |
| 61 #set fp="input_%s" % ($i) | |
| 62 zcat '$f' > '$fp' | |
| 63 && | |
| 64 #else if $full_ext.endswith("bz2") | |
| 65 #set fp="input_%s" % ($i) | |
| 66 bzcat '$f' > '$fp' | |
| 67 && | |
| 68 #else | |
| 69 #set fp=$f | |
| 70 #end if | |
| 71 #set $file_path+="%s%s" % ($sep, $fp) | |
| 72 #set $sep="," | |
| 73 #end for | |
| 74 #else if $inputs.in.raw_in.selector == "paired" | |
| 75 #set full_ext=$inputs.in.raw_in.in_f.datatype.file_ext | |
| 76 #if $full_ext != $inputs.in.raw_in.in_r.datatype.file_ext | |
| 77 echo "Different datatypes for input paired-end files" | |
| 78 && | |
| 79 exit 1 | |
| 80 #end if | |
| 81 #if $full_ext.endswith("gz") | |
| 82 zcat '$inputs.in.raw_in.in_f' > 'in_f' | |
| 83 && | |
| 84 zcat '$inputs.in.raw_in.in_r' > 'in_r' | |
| 85 && | |
| 86 #set file_path="in_f,in_r" | |
| 87 #else if $full_ext.endswith("bz2") | |
| 88 bzcat '$inputs.in.raw_in.in_f' > 'in_f' | |
| 89 && | |
| 90 bzcat '$inputs.in.raw_in.in_r' > 'in_r' | |
| 91 && | |
| 92 #set file_path="in_f,in_r" | |
| 93 #else | |
| 94 #set file_path="%s,%s" % ($inputs.in.raw_in.in_f,$inputs.in.raw_in.in_r) | |
| 95 #end if | |
| 96 #end if | |
| 97 | |
| 98 #if $full_ext.startswith("fastq") | |
| 99 #set ext='fastq' | |
| 100 #else if $full_ext.startswith("fasta") and $full_ext.endswith(("gz","bz2")) | |
| 101 #set ext='fasta' | |
| 102 #else | |
| 103 #set ext=$full_ext | |
| 104 #end if | |
| 105 #end if | |
| 106 | |
| 107 #if $inputs.db.db_selector == "history" | |
| 108 mkdir 'ref_db' | |
| 109 && | |
| 110 bowtie2-build --large-index '$inputs.db.bowtie2db' 'ref_db/custom_db' | |
| 111 && | |
| 112 python '$__tool_directory__/customizemetadata.py' | |
| 113 transform_json_to_pkl | |
| 114 --json '$inputs.db.mpa_pkl' | |
| 115 --pkl 'ref_db/custom_db.pkl' | |
| 116 && | |
| 117 #end if | |
| 118 | |
| 119 metaphlan | |
| 120 #if $inputs.in.selector == "raw" | |
| 121 '$file_path' | |
| 122 --input_type '$ext' | |
| 123 --read_min_len $inputs.in.read_min_len | |
| 124 --bt2_ps '$inputs.in.mapping.bt2_ps' | |
| 125 --min_mapq_val $inputs.in.mapping.min_mapq_val | |
| 126 #if $ext == "sam" | |
| 127 --nreads \$(cat '$file_path' | grep -c -v '^@') | |
| 128 #end if | |
| 129 #else | |
| 130 '$inputs.in.in' | |
| 131 --input_type '$inputs.in.selector' | |
| 132 #if $inputs.in.selector == "sam" | |
| 133 --nreads \$(cat '$inputs.in.in' | grep -c -v '^@') | |
| 134 #end if | |
| 135 #end if | |
| 136 #if $inputs.db.db_selector == "cached" | |
| 137 --bowtie2db '$inputs.db.cached_db.fields.path' | |
| 138 --index '$inputs.db.cached_db.fields.dbkey' | |
| 139 #else | |
| 140 --bowtie2db 'ref_db/' | |
| 141 --index 'custom_db' | |
| 142 #end if | |
| 143 -t '$analysis.analysis_type.t' | |
| 144 #if $analysis.analysis_type.t == "rel_ab" or $analysis.analysis_type.t == "rel_ab_w_read_stats" | |
| 145 --tax_lev '$analysis.analysis_type.tax_lev.tax_lev' | |
| 146 #else if $analysis.analysis_type.t == "clade_specific_strain_tracker" | |
| 147 --clade '$analysis.analysis_type.clade' | |
| 148 #if str($analysis.analysis_type.min_ab) != '' | |
| 149 --min_ab $analysis.analysis_type.min_ab | |
| 150 #end if | |
| 151 #else if $analysis.analysis_type.t == "marker_ab_table" and str($analysis.analysis_type.nreads) != '' | |
| 152 --nreads $$analysis.analysis_type.nreads | |
| 153 #else if $analysis.analysis_type.t == "marker_pres_table" and str($analysis.analysis_type.pres_th) != '' | |
| 154 --pres_th $analysis.analysis_type.pres_th | |
| 155 #end if | |
| 156 --min_cu_len $analysis.min_cu_len | |
| 157 #if str($analysis.min_alignment_len) != '' | |
| 158 --min_alignment_len $analysis.min_alignment_len | |
| 159 #end if | |
| 160 #if 'add_viruses' in $analysis.organism_profiling | |
| 161 --add_viruses | |
| 162 #end if | |
| 163 #if 'ignore_eukaryotes' in $analysis.organism_profiling | |
| 164 --ignore_eukaryotes | |
| 165 #end if | |
| 166 #if 'ignore_bacteria' in $analysis.organism_profiling | |
| 167 --ignore_bacteria | |
| 168 #end if | |
| 169 #if 'ignore_archaea' in $analysis.organism_profiling | |
| 170 --ignore_archaea | |
| 171 #end if | |
| 172 --stat_q $analysis.stat_q | |
| 173 --perc_nonzero $analysis.perc_nonzero | |
| 174 #if $analysis.ignore_markers | |
| 175 --ignore_markers '$analysis.ignore_markers' | |
| 176 #end if | |
| 177 $analysis.avoid_disqm | |
| 178 --sample_id_key '$out.sample_id_key' | |
| 179 --sample_id '$out.sample_id' | |
| 180 $out.use_group_representative | |
| 181 $out.legacy_output | |
| 182 $out.CAMI_format_output | |
| 183 $out.unknown_estimation | |
| 184 -o '$output_file' | |
| 185 --bowtie2out 'bowtie2out' | |
| 186 -s '$sam_output_file' | |
| 187 --biom '$biom_output_file' | |
| 188 --nproc \${GALAXY_SLOTS:-4} | |
| 189 | |
| 190 #if $inputs.in.selector == "raw" | |
| 191 && | |
| 192 mv 'bowtie2out' '$bowtie2out' | |
| 193 #end if | |
| 194 | |
| 195 #if $analysis.analysis_type.tax_lev.tax_lev == 'a' and $analysis.analysis_type.tax_lev.split_levels | |
| 196 && | |
| 197 mkdir 'split_levels' | |
| 198 && | |
| 199 python '$__tool_directory__/formatoutput.py' | |
| 200 split_levels | |
| 201 --metaphlan_output '$output_file' | |
| 202 --outdir 'split_levels' | |
| 203 $out.legacy_output | |
| 204 | |
| 205 #end if | |
| 206 | |
| 207 #if $out.krona_output | |
| 208 && | |
| 209 python '$__tool_directory__/formatoutput.py' | |
| 210 format_for_krona | |
| 211 --metaphlan_output '$output_file' | |
| 212 --krona_output '$krona_output_file' | |
| 213 #end if | |
| 214 ]]></command> | |
| 215 <inputs> | |
| 216 <section name="inputs" title="Inputs" expanded="true"> | |
| 217 <conditional name="in"> | |
| 218 <param name="selector" type="select" label="Input(s)"> | |
| 219 <option value="raw" selected="true">Fasta/FastQ file(s) with microbiota reads</option> | |
| 220 <option value="sam">Externally BowTie2-mapped SAM file</option> | |
| 221 <option value="bowtie2out">Intermediary mapping file of the microbiota generated by a previous MetaPhlAn run</option> | |
| 222 </param> | |
| 223 <when value="raw"> | |
| 224 <conditional name="raw_in"> | |
| 225 <param name="selector" type="select" label="Fasta/FastQ file(s) with microbiota reads"> | |
| 226 <option value="single" selected="true">One single-end file</option> | |
| 227 <option value="multiple">Multiple single-end files</option> | |
| 228 <option value="paired">Paired-end files</option> | |
| 229 </param> | |
| 230 <when value="single"> | |
| 231 <param name="in" type="data" format="@FILE_FORMATS@" label="Single-end Fasta/FastQ file with microbiota reads"/> | |
| 232 </when> | |
| 233 <when value="multiple"> | |
| 234 <param name="in" type="data" format="@FILE_FORMATS@" multiple="true" label="Single-end Fasta/FastQ files with microbiota reads"/> | |
| 235 </when> | |
| 236 <when value="paired"> | |
| 237 <param name="in_f" type="data" format="@FILE_FORMATS@" label="Forward paired-end Fasta/FastQ file with microbiota reads"/> | |
| 238 <param name="in_r" type="data" format="@FILE_FORMATS@" label="Reverse paired-end Fasta/FastQ file with microbiota reads"/> | |
| 239 </when> | |
| 240 </conditional> | |
| 241 <param argument="--read_min_len" type="integer" value="70" label="Minimum length of the reads to be considered when parsing the input file"/> | |
| 242 <section name="mapping" title="Mapping" expanded="true"> | |
| 243 <param argument="--bt2_ps" type="select" label="Presets options for BowTie2" help="Applied only with FASTA files"> | |
| 244 <option value="sensitive">Sensitive</option> | |
| 245 <option value="very-sensitive" selected="true">Very sensitive</option> | |
| 246 <option value="sensitive-local">Sensitive local</option> | |
| 247 <option value="very-sensitive-local">Very sensitive local</option> | |
| 248 </param> | |
| 249 <param argument="--min_mapq_val" type="integer" value="5" label="Minimum mapping quality value (MAPQ)"/> | |
| 250 </section> | |
| 251 </when> | |
| 252 <when value="sam"> | |
| 253 <param name="in" type="data" format="sam" label="Externally BowTie2-mapped SAM file" help="BowTie2 needs to be used first to map microbiota reads"/> | |
| 254 </when> | |
| 255 <when value="bowtie2out"> | |
| 256 <param name="in" type="data" format="tabular" label="Intermediary mapping file of the microbiota generated by a previous MetaPhlAn run" | |
| 257 help="File needs to be generated with MetaPhlAn versions >3.0"/> | |
| 258 </when> | |
| 259 </conditional> | |
| 260 <conditional name="db"> | |
| 261 <param name="db_selector" type="select" label="Database with clade-specific marker genes"> | |
| 262 <option value="cached" selected="true">Locally cached</option> | |
| 263 <option value="history">From history</option> | |
| 264 </param> | |
| 265 <when value="cached"> | |
| 266 <param name="cached_db" type="select" label="Cached database with clade-specific marker genes"> | |
| 267 <options from_data_table="@IDX_DATA_TABLE@"> | |
| 268 <filter type="static_value" column="4" value="@IDX_VERSION@"/> | |
| 269 <validator message="No compatible MetaPhlAn database is available" type="no_options"/> | |
| 270 </options> | |
| 271 </param> | |
| 272 </when> | |
| 273 <when value="history"> | |
| 274 <param argument="--bowtie2db" type="data" format="fasta" label="Database with clade-specific marker genes from history"/> | |
| 275 <param argument="--mpa_pkl" type="data" format="json" label="Metadata associated to the database with clade-specific marker genes from history"/> | |
| 276 </when> | |
| 277 </conditional> | |
| 278 </section> | |
| 279 <section name="analysis" title="Analysis" expanded="true"> | |
| 280 <conditional name="analysis_type"> | |
| 281 <param argument="-t" type="select" label="Type of analysis to perform"> | |
| 282 <option value="rel_ab" selected="true">rel_ab: Profiling a microbiota in terms of relative abundances</option> | |
| 283 <option value="rel_ab_w_read_stats">rel_ab_w_read_stats: Profiling a microbiota in terms of relative abundances and estimate the number of reads comming from each clade</option> | |
| 284 <option value="reads_map">reads_map: Mapping from reads to clades (only reads hitting a marker)</option> | |
| 285 <option value="clade_profiles">clade_profiles: Normalized marker counts for clades with at least a non-null marker</option> | |
| 286 <option value="clade_specific_strain_tracker">clade_specific_strain_tracker: List of markers present for a specific clade and all its subclades</option> | |
| 287 <option value="marker_ab_table">marker_ab_table: Normalized marker counts (only when > 0.0 and normalized by microbiota size if number of reads is specified)</option> | |
| 288 <option value="marker_counts">marker_counts: Non-normalized marker counts (use with extreme caution)</option> | |
| 289 <option value="marker_pres_table">marker_pres_table: List of markers present in the sample (threshold at 1.0 if not differently specified with --pres_th</option> | |
| 290 </param> | |
| 291 <when value="rel_ab"> | |
| 292 <expand macro="tax_lev"/> | |
| 293 </when> | |
| 294 <when value="rel_ab_w_read_stats"> | |
| 295 <expand macro="tax_lev"/> | |
| 296 </when> | |
| 297 <when value="reads_map"/> | |
| 298 <when value="clade_profiles"/> | |
| 299 <when value="clade_specific_strain_tracker"> | |
| 300 <param argument="--clade" type="text" value="" label="Clade for which to extract list of markers present" | |
| 301 help="Markers are also extracted for subclades" /> | |
| 302 <param argument="--min_ab" type="float" optional="true" label="The minimum percentage abundance for the clade"/> | |
| 303 </when> | |
| 304 <when value="marker_ab_table"> | |
| 305 <param argument="--nreads" type="integer" optional="true" label="Total number of reads in the original microbiota" | |
| 306 help="It is used for normalizing the length-normalized counts with the microbiota size as well. No normalization applied if the value is not specified"/> | |
| 307 </when> | |
| 308 <when value="marker_counts"/> | |
| 309 <when value="marker_pres_table"> | |
| 310 <param argument="--pres_th" type="integer" optional="true" label="Threshold for calling a marker present"/> | |
| 311 </when> | |
| 312 </conditional> | |
| 313 <param argument="--min_cu_len" type="integer" value="2000" | |
| 314 label="Minimum total nucleotide length for the markers in a clade for estimating the abundance without considering sub-clade abundances"/> | |
| 315 <param argument="--min_alignment_len" type="integer" optional="true" | |
| 316 label="Sam records for aligned reads with the longest subalignment length smaller than this threshold will be discarded."/> | |
| 317 <param name="organism_profiling" type="select" multiple="true" optional="true" label="Organisms to profile"> | |
| 318 <option value="add_viruses" selected="true">Profile viral organisms (add_viruses)</option> | |
| 319 <option value="ignore_eukaryotes">Ignore eukaryotic organisms (ignore_eukaryotes)</option> | |
| 320 <option value="ignore_bacteria">Ignore bacteria organisms (ignore_bacteria)</option> | |
| 321 <option value="ignore_archaea">Ignore archea organisms (ignore_archaea)</option> | |
| 322 </param> | |
| 323 <param argument="--stat" type="select" label="Statistical approach for converting marker abundances into clade abundances"> | |
| 324 <option value="avg_g">avg_g: Clade global (i.e. normalizing all markers together) average (avg_g)</option> | |
| 325 <option value="avg_l">avg_l: Average of length-normalized marker counts</option> | |
| 326 <option value="tavg_g" selected="true">tavg_g: Truncated clade global average at --stat_q quantile</option> | |
| 327 <option value="tavg_l">tavg_l: Truncated average of length-normalized marker counts (at --stat_q)</option> | |
| 328 <option value="wavg_g">wavg_g: Winsorized clade global average (at --stat_q)</option> | |
| 329 <option value="wavg_l">wavg_l: Winsorized average of length-normalized marker counts (at --stat_q)</option> | |
| 330 <option value="med">med: Median of length-normalized marker counts</option> | |
| 331 </param> | |
| 332 <param argument="--stat_q" type="float" value="0.2" label="Quantile value for the robust average"/> | |
| 333 <param argument="--perc_nonzero" type="float" value="0.33" label="Percentage of markers with a non zero relative abundance for misidentify a species"/> | |
| 334 <param argument="--ignore_markers" type="data" format="txt,tabular" optional="true" label="File containing a list of markers to ignore" help="One marker per line"/> | |
| 335 <param argument="--avoid_disqm" type='boolean' checked="true" truevalue='--avoid_disqm' falsevalue='' | |
| 336 label="Deactivate the procedure of disambiguating the quasi-markers based on the marker abundance pattern found in the sample?" | |
| 337 help="It is generally recommended to keep the disambiguation procedure in order to minimize false positives"/> | |
| 338 </section> | |
| 339 <section name="out" title="Outputs" expanded="true"> | |
| 340 <param argument="--sample_id_key" type="text" value="SampleID" label="Sample ID key for this analysis"/> | |
| 341 <param argument="--sample_id" type="text" value="Metaphlan_Analysis" label="Sample ID for this analysis"/> | |
| 342 <param argument="--use_group_representative" type='boolean' checked="false" truevalue='--use_group_representative' falsevalue='' | |
| 343 label="Use a species as representative for species groups?"/> | |
| 344 <param argument="--legacy-output" type='boolean' checked="false" truevalue='--legacy-output' falsevalue='' | |
| 345 label="Old MetaPhlAn2 two columns output?"/> | |
| 346 <param argument="--CAMI_format_output" type='boolean' checked="false" truevalue='--CAMI_format_output' falsevalue='' | |
| 347 label="Report the profiling using the CAMI output format?"/> | |
| 348 <param argument="--unknown_estimation" type='boolean' checked="false" truevalue='--unknown_estimation' falsevalue='' | |
| 349 label="Scale relative abundances to the number of reads mapping to known clades in order to estimate unknowness?"/> | |
| 350 <param name="krona_output" type='boolean' checked="false" truevalue='true' falsevalue='false' label="Output for Krona?"/> | |
| 351 </section> | |
| 352 </inputs> | |
| 353 <outputs> | |
| 354 <data name="output_file" format="tabular" label="${tool.name} on ${on_string}: Predicted taxon relative abundances" /> | |
| 355 <data name="bowtie2out" format="tabular" label="${tool.name} on ${on_string}: Bowtie2 output"> | |
| 356 <filter>inputs['in']['selector'] == "raw"</filter> | |
| 357 </data> | |
| 358 <data name="sam_output_file" format="sam" label="${tool.name} on ${on_string}: SAM file"> | |
| 359 <filter>inputs['in']['selector'] == "raw"</filter> | |
| 360 </data> | |
| 361 <data name="biom_output_file" format="biom1" label="${tool.name} on ${on_string}: BIOM file" /> | |
| 362 <collection name="levels" type="list" label="${tool.name} on ${on_string}: Predicted taxon relative abundances at each taxonomic levels" > | |
| 363 <discover_datasets pattern="(?P<designation>.+)" directory="split_levels/" format="tabular"/> | |
| 364 <filter>analysis['analysis_type']['tax_lev']['tax_lev'] == "a" and analysis['analysis_type']['tax_lev']['split_levels']</filter> | |
| 365 </collection> | |
| 366 <data name="krona_output_file" format="tabular" label="${tool.name} on ${on_string}: Predicted taxon relative abundances for Krona"> | |
| 367 <filter>out['krona_output']</filter> | |
| 368 </data> | |
| 369 </outputs> | |
| 370 <tests> | |
| 371 <test expect_num_outputs="6"> | |
| 372 <section name="inputs"> | |
| 373 <conditional name="in"> | |
| 374 <param name="selector" value="raw"/> | |
| 375 <conditional name="raw_in"> | |
| 376 <!-- Single GZ file --> | |
| 377 <param name="selector" value="single"/> | |
| 378 <param name="in" value="no_taxon_input.fasta"/> | |
| 379 </conditional> | |
| 380 <param name="read_min_len" value="70"/> | |
| 381 <section name="mapping"> | |
| 382 <param name="bt2_ps" value="sensitive"/> | |
| 383 <param name="min_mapq_val" value="5"/> | |
| 384 </section> | |
| 385 </conditional> | |
| 386 <conditional name="db"> | |
| 387 <!-- Cached db --> | |
| 388 <param name="db_selector" value="cached"/> | |
| 389 <param name="cached_db" value="test-db-20210409"/> | |
| 390 </conditional> | |
| 391 </section> | |
| 392 <section name="analysis"> | |
| 393 <conditional name="analysis_type"> | |
| 394 <param name="t" value="rel_ab"/> | |
| 395 <conditional name="tax_lev"> | |
| 396 <param name="tax_lev" value="a"/> | |
| 397 <param name="split_levels" value="true"/> | |
| 398 </conditional> | |
| 399 </conditional> | |
| 400 <param name="min_cu_len" value="2000"/> | |
| 401 <param name="organism_profiling" value="add_viruses"/> | |
| 402 <param name="stat" value="avg_g"/> | |
| 403 <param name="stat_q" value="0.2"/> | |
| 404 <param name="perc_nonzero" value="0.33"/> | |
| 405 <param name="avoid_disqm" value="true"/> | |
| 406 </section> | |
| 407 <section name="out"> | |
| 408 <param name="sample_id_key" value="SampleID"/> | |
| 409 <param name="sample_id" value="Metaphlan_Analysis"/> | |
| 410 <param name="use_group_representative" value="false"/> | |
| 411 <param name="legacy_output" value="false"/> | |
| 412 <param name="CAMI_format_output" value="false"/> | |
| 413 <param name="unknown_estimation" value="false"/> | |
| 414 <param name="krona_output" value="true"/> | |
| 415 </section> | |
| 416 <output name="output_file" ftype="tabular"> | |
| 417 <assert_contents> | |
| 418 <has_text text="UNCLASSIFIED"/> | |
| 419 </assert_contents> | |
| 420 </output> | |
| 421 <output name="bowtie2out" ftype="tabular"> | |
| 422 <assert_contents> | |
| 423 <not_has_text text="HWI-EAS109_102883399:3:104:7342:14360/1"/> | |
| 424 <has_n_lines n="2"/> | |
| 425 </assert_contents> | |
| 426 </output> | |
| 427 <output name="sam_output_file" ftype="sam"> | |
| 428 <assert_contents> | |
| 429 <has_text text="SN:13076__A0A2I1PE66__CYJ72_10760"/> | |
| 430 </assert_contents> | |
| 431 </output> | |
| 432 <output name="biom_output_file" ftype="biom1"> | |
| 433 <assert_contents> | |
| 434 <not_has_text text="k__Bacteria"/> | |
| 435 <not_has_text text="p__Actinobacteria"/> | |
| 436 </assert_contents> | |
| 437 </output> | |
| 438 <output_collection name="levels" type="list" > | |
| 439 | |
| 440 <element name="all" ftype="tabular"> | |
| 441 <assert_contents> | |
| 442 <has_text text="class"/> | |
| 443 <has_n_columns n="17"/> | |
| 444 <has_n_lines n="1"/> | |
| 445 </assert_contents> | |
| 446 </element> | |
| 447 <element name="class" ftype="tabular"> | |
| 448 <assert_contents> | |
| 449 <has_text text="class_id"/> | |
| 450 <not_has_text text="phylum_id"/> | |
| 451 <has_n_columns n="3"/> | |
| 452 <has_n_lines n="1"/> | |
| 453 </assert_contents> | |
| 454 </element> | |
| 455 <element name="family" ftype="tabular"> | |
| 456 <assert_contents> | |
| 457 <has_text text="family_id"/> | |
| 458 <not_has_text text="order"/> | |
| 459 <has_n_columns n="3"/> | |
| 460 <has_n_lines n="1"/> | |
| 461 </assert_contents> | |
| 462 </element> | |
| 463 <element name="genus" ftype="tabular"> | |
| 464 <assert_contents> | |
| 465 <has_text text="genus_id"/> | |
| 466 <not_has_text text="family"/> | |
| 467 <has_n_columns n="3"/> | |
| 468 <has_n_lines n="1"/> | |
| 469 </assert_contents> | |
| 470 </element> | |
| 471 <element name="kingdom" ftype="tabular"> | |
| 472 <assert_contents> | |
| 473 <has_text text="kingdom_id"/> | |
| 474 <has_n_columns n="3"/> | |
| 475 <has_n_lines n="1"/> | |
| 476 </assert_contents> | |
| 477 </element> | |
| 478 <element name="order" ftype="tabular"> | |
| 479 <assert_contents> | |
| 480 <has_text text="order_id"/> | |
| 481 <not_has_text text="class_id"/> | |
| 482 <has_n_columns n="3"/> | |
| 483 <has_n_lines n="1"/> | |
| 484 </assert_contents> | |
| 485 </element> | |
| 486 <element name="phylum" ftype="tabular"> | |
| 487 <assert_contents> | |
| 488 <has_text text="phylum_id"/> | |
| 489 <not_has_text text="kingdom_id"/> | |
| 490 <has_n_columns n="3"/> | |
| 491 <has_n_lines n="1"/> | |
| 492 </assert_contents> | |
| 493 </element> | |
| 494 <element name="species" ftype="tabular"> | |
| 495 <assert_contents> | |
| 496 <has_text text="species_id"/> | |
| 497 <not_has_text text="genus"/> | |
| 498 <has_n_columns n="3"/> | |
| 499 <has_n_lines n="1"/> | |
| 500 </assert_contents> | |
| 501 </element> | |
| 502 <element name="strains" ftype="tabular"> | |
| 503 <assert_contents> | |
| 504 <has_text text="strains_id"/> | |
| 505 <not_has_text text="species_id"/> | |
| 506 <has_n_columns n="3"/> | |
| 507 <has_n_lines n="1"/> | |
| 508 </assert_contents> | |
| 509 </element> | |
| 510 </output_collection> | |
| 511 <output name="krona_output_file" ftype="tabular"> | |
| 512 <assert_contents> | |
| 513 <not_has_text text="k__Bacteria"/> | |
| 514 <has_n_lines n="1" delta="1"/> | |
| 515 <has_size value="1" delta="1"/> | |
| 516 </assert_contents> | |
| 517 </output> | |
| 518 </test> | |
| 519 <test expect_num_outputs="6"> | |
| 520 <section name="inputs"> | |
| 521 <conditional name="in"> | |
| 522 <param name="selector" value="raw"/> | |
| 523 <conditional name="raw_in"> | |
| 524 <!-- Single GZ file --> | |
| 525 <param name="selector" value="single"/> | |
| 526 <param name="in" value="SRS014464-Anterior_nares.fasta.gz"/> | |
| 527 </conditional> | |
| 528 <param name="read_min_len" value="70"/> | |
| 529 <section name="mapping"> | |
| 530 <param name="bt2_ps" value="sensitive"/> | |
| 531 <param name="min_mapq_val" value="5"/> | |
| 532 </section> | |
| 533 </conditional> | |
| 534 <conditional name="db"> | |
| 535 <!-- Cached db --> | |
| 536 <param name="db_selector" value="cached"/> | |
| 537 <param name="cached_db" value="test-db-20210409"/> | |
| 538 </conditional> | |
| 539 </section> | |
| 540 <section name="analysis"> | |
| 541 <conditional name="analysis_type"> | |
| 542 <param name="t" value="rel_ab"/> | |
| 543 <conditional name="tax_lev"> | |
| 544 <param name="tax_lev" value="a"/> | |
| 545 <param name="split_levels" value="true"/> | |
| 546 </conditional> | |
| 547 </conditional> | |
| 548 <param name="min_cu_len" value="2000"/> | |
| 549 <param name="organism_profiling" value="add_viruses"/> | |
| 550 <param name="stat" value="avg_g"/> | |
| 551 <param name="stat_q" value="0.2"/> | |
| 552 <param name="perc_nonzero" value="0.33"/> | |
| 553 <param name="avoid_disqm" value="true"/> | |
| 554 </section> | |
| 555 <section name="out"> | |
| 556 <param name="sample_id_key" value="SampleID"/> | |
| 557 <param name="sample_id" value="Metaphlan_Analysis"/> | |
| 558 <param name="use_group_representative" value="false"/> | |
| 559 <param name="legacy_output" value="false"/> | |
| 560 <param name="CAMI_format_output" value="false"/> | |
| 561 <param name="unknown_estimation" value="false"/> | |
| 562 <param name="krona_output" value="true"/> | |
| 563 </section> | |
| 564 <output name="output_file" ftype="tabular" file="SRS014464-Anterior_nares-abundances.tabular" compare="sim_size"> | |
| 565 <assert_contents> | |
| 566 <has_text text="k__Bacteria|p__Actinobacteria|c__Actinobacteria|o__Corynebacteriales|f__Corynebacteriaceae|g__Corynebacterium|s__Corynebacterium_accolens"/> | |
| 567 </assert_contents> | |
| 568 </output> | |
| 569 <output name="bowtie2out" ftype="tabular" file="SRS014464-Anterior_nares-bowtie2out.tabular" compare="sim_size"> | |
| 570 <assert_contents> | |
| 571 <has_text text="HWI-EAS109_102883399:3:104:7342:14360/1"/> | |
| 572 <has_text text="37637__U2I1U8__N579_01580"/> | |
| 573 </assert_contents> | |
| 574 </output> | |
| 575 <output name="sam_output_file" ftype="sam" file="SRS014464-Anterior_nares.sam" compare="sim_size"> | |
| 576 <assert_contents> | |
| 577 <has_text text="SN:13076__A0A2I1PE66__CYJ72_10760"/> | |
| 578 </assert_contents> | |
| 579 </output> | |
| 580 <output name="biom_output_file" ftype="biom1" file="SRS014464-Anterior_nares.biom" compare="sim_size"> | |
| 581 <assert_contents> | |
| 582 <has_text text="k__Bacteria|p__Proteobacteria|c__Gammaproteobacteria|o__Pseudomonadales|f__Moraxellaceae|g__Moraxella|s__Moraxella_lacunata"/> | |
| 583 </assert_contents> | |
| 584 </output> | |
| 585 <output_collection name="levels" type="list" > | |
| 586 <element name="all" ftype="tabular"> | |
| 587 <assert_contents> | |
| 588 <has_text text="Gammaproteobacteria"/> | |
| 589 <has_text text="Corynebacterium accolens"/> | |
| 590 <has_n_columns n="17"/> | |
| 591 </assert_contents> | |
| 592 </element> | |
| 593 <element name="class" ftype="tabular"> | |
| 594 <assert_contents> | |
| 595 <has_text text="class_id"/> | |
| 596 <not_has_text text="phylum_id"/> | |
| 597 <has_text text="Actinobacteria"/> | |
| 598 <has_n_columns n="3"/> | |
| 599 </assert_contents> | |
| 600 </element> | |
| 601 <element name="family" ftype="tabular"> | |
| 602 <assert_contents> | |
| 603 <has_text text="family_id"/> | |
| 604 <not_has_text text="order"/> | |
| 605 <has_text text="Propionibacteriaceae"/> | |
| 606 <has_n_columns n="3"/> | |
| 607 </assert_contents> | |
| 608 </element> | |
| 609 <element name="genus" ftype="tabular"> | |
| 610 <assert_contents> | |
| 611 <has_text text="genus_id"/> | |
| 612 <not_has_text text="family"/> | |
| 613 <has_text text="Cutibacterium"/> | |
| 614 <has_n_columns n="3"/> | |
| 615 </assert_contents> | |
| 616 </element> | |
| 617 <element name="kingdom" ftype="tabular"> | |
| 618 <assert_contents> | |
| 619 <has_text text="kingdom_id"/> | |
| 620 <has_text text="Bacteria"/> | |
| 621 <has_n_columns n="3"/> | |
| 622 </assert_contents> | |
| 623 </element> | |
| 624 <element name="order" ftype="tabular"> | |
| 625 <assert_contents> | |
| 626 <has_text text="order_id"/> | |
| 627 <not_has_text text="class_id"/> | |
| 628 <has_text text="Propionibacteriales"/> | |
| 629 <has_n_columns n="3"/> | |
| 630 </assert_contents> | |
| 631 </element> | |
| 632 <element name="phylum" ftype="tabular"> | |
| 633 <assert_contents> | |
| 634 <has_text text="phylum_id"/> | |
| 635 <not_has_text text="kingdom_id"/> | |
| 636 <has_text text="Firmicutes"/> | |
| 637 <has_n_columns n="3"/> | |
| 638 </assert_contents> | |
| 639 </element> | |
| 640 <element name="species" ftype="tabular"> | |
| 641 <assert_contents> | |
| 642 <has_text text="species_id"/> | |
| 643 <not_has_text text="genus"/> | |
| 644 <has_text text="Corynebacterium accolens"/> | |
| 645 <has_n_columns n="3"/> | |
| 646 </assert_contents> | |
| 647 </element> | |
| 648 <element name="strains" ftype="tabular"> | |
| 649 <assert_contents> | |
| 650 <has_text text="strains_id"/> | |
| 651 <not_has_text text="species_id"/> | |
| 652 <has_n_columns n="3"/> | |
| 653 </assert_contents> | |
| 654 </element> | |
| 655 </output_collection> | |
| 656 <output name="krona_output_file" ftype="tabular"> | |
| 657 <assert_contents> | |
| 658 <not_has_text text="k__Bacteria"/> | |
| 659 <has_text text="Corynebacterium accolens"/> | |
| 660 <has_n_columns n="9"/> | |
| 661 </assert_contents> | |
| 662 </output> | |
| 663 </test> | |
| 664 <test expect_num_outputs="4"> | |
| 665 <section name="inputs"> | |
| 666 <conditional name="in"> | |
| 667 <param name="selector" value="raw"/> | |
| 668 <conditional name="raw_in"> | |
| 669 <!-- Multiple GZ file --> | |
| 670 <param name="selector" value="multiple"/> | |
| 671 <param name="in" value="SRS014464-Anterior_nares.fasta.gz,SRS014464-Anterior_nares.fasta.gz"/> | |
| 672 </conditional> | |
| 673 <param name="read_min_len" value="70"/> | |
| 674 <section name="mapping"> | |
| 675 <param name="bt2_ps" value="sensitive"/> | |
| 676 <param name="min_mapq_val" value="5"/> | |
| 677 </section> | |
| 678 </conditional> | |
| 679 <conditional name="db"> | |
| 680 <!-- Local db --> | |
| 681 <param name="db_selector" value="history"/> | |
| 682 <param name="bowtie2db" value="test-db.fasta"/> | |
| 683 <param name="mpa_pkl" value="test-db.json"/> | |
| 684 </conditional> | |
| 685 </section> | |
| 686 <section name="analysis"> | |
| 687 <conditional name="analysis_type"> | |
| 688 <param name="t" value="rel_ab"/> | |
| 689 <conditional name="tax_lev"> | |
| 690 <param name="tax_lev" value="a"/> | |
| 691 <param name="split_levels" value="false"/> | |
| 692 </conditional> | |
| 693 </conditional> | |
| 694 <param name="min_cu_len" value="2000"/> | |
| 695 <param name="organism_profiling" value="add_viruses"/> | |
| 696 <param name="stat" value="avg_g"/> | |
| 697 <param name="stat_q" value="0.2"/> | |
| 698 <param name="perc_nonzero" value="0.33"/> | |
| 699 <param name="avoid_disqm" value="true"/> | |
| 700 </section> | |
| 701 <section name="out"> | |
| 702 <param name="sample_id_key" value="SampleID"/> | |
| 703 <param name="sample_id" value="Metaphlan_Analysis"/> | |
| 704 <param name="use_group_representative" value="false"/> | |
| 705 <param name="legacy_output" value="false"/> | |
| 706 <param name="CAMI_format_output" value="false"/> | |
| 707 <param name="unknown_estimation" value="false"/> | |
| 708 <param name="krona_output" value="false"/> | |
| 709 </section> | |
| 710 <output name="output_file" ftype="tabular" file="SRS014464-Anterior_nares-abundances.tabular" compare="sim_size"> | |
| 711 <assert_contents> | |
| 712 <has_text text="k__Bacteria|p__Actinobacteria|c__Actinobacteria|o__Corynebacteriales|f__Corynebacteriaceae|g__Corynebacterium|s__Corynebacterium_accolens"/> | |
| 713 <has_text text="relative_abundance"/> | |
| 714 <has_text text="NCBI_tax_id"/> | |
| 715 <has_text text="clade_name"/> | |
| 716 </assert_contents> | |
| 717 </output> | |
| 718 <output name="bowtie2out" ftype="tabular" file="SRS014464-Anterior_nares-two-inputs-bowtie2out.tabular" compare="sim_size"> | |
| 719 <assert_contents> | |
| 720 <has_text text="HWI-EAS109_102883399:3:104:7342:14360/1"/> | |
| 721 <has_text text="37637__U2I1U8__N579_01580"/> | |
| 722 </assert_contents> | |
| 723 </output> | |
| 724 <output name="sam_output_file" ftype="sam" file="SRS014464-Anterior_nares-two-inputs.sam" compare="sim_size"> | |
| 725 <assert_contents> | |
| 726 <has_text text="SN:13076__A0A2I1PE66__CYJ72_10760"/> | |
| 727 </assert_contents> | |
| 728 </output> | |
| 729 <output name="biom_output_file" ftype="biom1" file="SRS014464-Anterior_nares.biom" compare="sim_size"> | |
| 730 <assert_contents> | |
| 731 <has_text text="k__Bacteria|p__Proteobacteria|c__Gammaproteobacteria|o__Pseudomonadales|f__Moraxellaceae|g__Moraxella|s__Moraxella_lacunata"/> | |
| 732 </assert_contents> | |
| 733 </output> | |
| 734 </test> | |
| 735 <test expect_num_outputs="4"> | |
| 736 <section name="inputs"> | |
| 737 <conditional name="in"> | |
| 738 <param name="selector" value="raw"/> | |
| 739 <conditional name="raw_in"> | |
| 740 <!-- Paired GZ file --> | |
| 741 <param name="selector" value="paired"/> | |
| 742 <param name="in_f" value="SRS014464-Anterior_nares.fasta.gz"/> | |
| 743 <param name="in_r" value="SRS014464-Anterior_nares.fasta.gz"/> | |
| 744 </conditional> | |
| 745 <param name="read_min_len" value="70"/> | |
| 746 <section name="mapping"> | |
| 747 <param name="bt2_ps" value="sensitive"/> | |
| 748 <param name="min_mapq_val" value="5"/> | |
| 749 </section> | |
| 750 </conditional> | |
| 751 <conditional name="db"> | |
| 752 <!-- Cached db --> | |
| 753 <param name="db_selector" value="cached"/> | |
| 754 <param name="cached_db" value="test-db-20210409"/> | |
| 755 </conditional> | |
| 756 </section> | |
| 757 <section name="analysis"> | |
| 758 <conditional name="analysis_type"> | |
| 759 <param name="t" value="rel_ab"/> | |
| 760 <conditional name="tax_lev"> | |
| 761 <param name="tax_lev" value="a"/> | |
| 762 <param name="split_levels" value="false"/> | |
| 763 </conditional> | |
| 764 </conditional> | |
| 765 <param name="min_cu_len" value="2000"/> | |
| 766 <param name="organism_profiling" value="add_viruses"/> | |
| 767 <param name="stat" value="avg_g"/> | |
| 768 <param name="stat_q" value="0.2"/> | |
| 769 <param name="perc_nonzero" value="0.33"/> | |
| 770 <param name="avoid_disqm" value="true"/> | |
| 771 </section> | |
| 772 <section name="out"> | |
| 773 <param name="sample_id_key" value="SampleID"/> | |
| 774 <param name="sample_id" value="Metaphlan_Analysis"/> | |
| 775 <param name="use_group_representative" value="false"/> | |
| 776 <param name="legacy_output" value="false"/> | |
| 777 <param name="CAMI_format_output" value="false"/> | |
| 778 <param name="unknown_estimation" value="false"/> | |
| 779 <param name="krona_output" value="false"/> | |
| 780 </section> | |
| 781 <output name="output_file" ftype="tabular" file="SRS014464-Anterior_nares-abundances.tabular" compare="sim_size"> | |
| 782 <assert_contents> | |
| 783 <has_text text="k__Bacteria|p__Actinobacteria|c__Actinobacteria|o__Corynebacteriales|f__Corynebacteriaceae|g__Corynebacterium|s__Corynebacterium_accolens"/> | |
| 784 <has_text text="relative_abundance"/> | |
| 785 <has_text text="NCBI_tax_id"/> | |
| 786 <has_text text="clade_name"/> | |
| 787 </assert_contents> | |
| 788 </output> | |
| 789 <output name="bowtie2out" ftype="tabular" file="SRS014464-Anterior_nares-two-inputs-bowtie2out.tabular" compare="sim_size"> | |
| 790 <assert_contents> | |
| 791 <has_text text="HWI-EAS109_102883399:3:104:7342:14360/1"/> | |
| 792 <has_text text="37637__U2I1U8__N579_01580"/> | |
| 793 </assert_contents> | |
| 794 </output> | |
| 795 <output name="sam_output_file" ftype="sam" file="SRS014464-Anterior_nares-two-inputs.sam" compare="sim_size"> | |
| 796 <assert_contents> | |
| 797 <has_text text="SN:13076__A0A2I1PE66__CYJ72_10760"/> | |
| 798 </assert_contents> | |
| 799 </output> | |
| 800 <output name="biom_output_file" ftype="biom1" file="SRS014464-Anterior_nares.biom" compare="sim_size"> | |
| 801 <assert_contents> | |
| 802 <has_text text="k__Bacteria|p__Proteobacteria|c__Gammaproteobacteria|o__Pseudomonadales|f__Moraxellaceae|g__Moraxella|s__Moraxella_lacunata"/> | |
| 803 </assert_contents> | |
| 804 </output> | |
| 805 </test> | |
| 806 <test expect_num_outputs="2"> | |
| 807 <section name="inputs"> | |
| 808 <conditional name="in"> | |
| 809 <!-- SAM --> | |
| 810 <param name="selector" value="sam"/> | |
| 811 <param name="in" value="SRS014464-Anterior_nares.sam"/> | |
| 812 </conditional> | |
| 813 <conditional name="db"> | |
| 814 <!-- Cached db --> | |
| 815 <param name="db_selector" value="cached"/> | |
| 816 <param name="cached_db" value="test-db-20210409"/> | |
| 817 </conditional> | |
| 818 </section> | |
| 819 <section name="analysis"> | |
| 820 <conditional name="analysis_type"> | |
| 821 <param name="t" value="rel_ab"/> | |
| 822 <conditional name="tax_lev"> | |
| 823 <param name="tax_lev" value="a"/> | |
| 824 <param name="split_levels" value="false"/> | |
| 825 </conditional> | |
| 826 </conditional> | |
| 827 <param name="min_cu_len" value="2000"/> | |
| 828 <param name="organism_profiling" value="add_viruses"/> | |
| 829 <param name="stat" value="avg_g"/> | |
| 830 <param name="stat_q" value="0.2"/> | |
| 831 <param name="perc_nonzero" value="0.33"/> | |
| 832 <param name="avoid_disqm" value="true"/> | |
| 833 </section> | |
| 834 <section name="out"> | |
| 835 <param name="sample_id_key" value="SampleID"/> | |
| 836 <param name="sample_id" value="Metaphlan_Analysis"/> | |
| 837 <param name="use_group_representative" value="false"/> | |
| 838 <param name="legacy_output" value="false"/> | |
| 839 <param name="CAMI_format_output" value="false"/> | |
| 840 <param name="unknown_estimation" value="false"/> | |
| 841 <param name="krona_output" value="false"/> | |
| 842 </section> | |
| 843 <output name="output_file" ftype="tabular" file="SRS014464-Anterior_nares-abundances.tabular" compare="sim_size"> | |
| 844 <assert_contents> | |
| 845 <has_text text="k__Bacteria|p__Actinobacteria|c__Actinobacteria|o__Corynebacteriales|f__Corynebacteriaceae|g__Corynebacterium|s__Corynebacterium_accolens"/> | |
| 846 <has_text text="relative_abundance"/> | |
| 847 <has_text text="NCBI_tax_id"/> | |
| 848 <has_text text="clade_name"/> | |
| 849 </assert_contents> | |
| 850 </output> | |
| 851 <output name="biom_output_file" ftype="biom1" file="SRS014464-Anterior_nares.biom" compare="sim_size"> | |
| 852 <assert_contents> | |
| 853 <has_text text="k__Bacteria|p__Proteobacteria|c__Gammaproteobacteria|o__Pseudomonadales|f__Moraxellaceae|g__Moraxella|s__Moraxella_lacunata"/> | |
| 854 </assert_contents> | |
| 855 </output> | |
| 856 </test> | |
| 857 <test expect_num_outputs="2"> | |
| 858 <section name="inputs"> | |
| 859 <conditional name="in"> | |
| 860 <!-- bowtie2out --> | |
| 861 <param name="selector" value="bowtie2out"/> | |
| 862 <param name="in" value="SRS014464-Anterior_nares-bowtie2out.tabular"/> | |
| 863 </conditional> | |
| 864 <conditional name="db"> | |
| 865 <!-- Cached db --> | |
| 866 <param name="db_selector" value="cached"/> | |
| 867 <param name="cached_db" value="test-db-20210409"/> | |
| 868 </conditional> | |
| 869 </section> | |
| 870 <conditional name="in"> | |
| 871 <param name="selector" value="bowtie2out"/> | |
| 872 <param name="in" value="SRS014464-Anterior_nares-bowtie2out.tabular"/> | |
| 873 </conditional> | |
| 874 <section name="mapping"> | |
| 875 <param name="bt2_ps" value="sensite"/> | |
| 876 <param name="min_mapq_val" value="5"/> | |
| 877 </section> | |
| 878 <section name="analysis"> | |
| 879 <conditional name="analysis_type"> | |
| 880 <param name="t" value="rel_ab"/> | |
| 881 <conditional name="tax_lev"> | |
| 882 <param name="tax_lev" value="a"/> | |
| 883 <param name="split_levels" value="false"/> | |
| 884 </conditional> | |
| 885 </conditional> | |
| 886 <param name="min_cu_len" value="2000"/> | |
| 887 <param name="organism_profiling" value="add_viruses"/> | |
| 888 <param name="stat" value="avg_g"/> | |
| 889 <param name="stat_q" value="0.2"/> | |
| 890 <param name="perc_nonzero" value="0.33"/> | |
| 891 <param name="avoid_disqm" value="true"/> | |
| 892 </section> | |
| 893 <section name="out"> | |
| 894 <param name="sample_id_key" value="SampleID"/> | |
| 895 <param name="sample_id" value="Metaphlan_Analysis"/> | |
| 896 <param name="use_group_representative" value="false"/> | |
| 897 <param name="legacy_output" value="false"/> | |
| 898 <param name="CAMI_format_output" value="false"/> | |
| 899 <param name="unknown_estimation" value="false"/> | |
| 900 <param name="krona_output" value="false"/> | |
| 901 </section> | |
| 902 <output name="output_file" ftype="tabular" file="SRS014464-Anterior_nares-abundances.tabular" compare="sim_size"> | |
| 903 <assert_contents> | |
| 904 <has_text text="k__Bacteria|p__Actinobacteria|c__Actinobacteria|o__Corynebacteriales|f__Corynebacteriaceae|g__Corynebacterium|s__Corynebacterium_accolens"/> | |
| 905 <has_text text="relative_abundance"/> | |
| 906 <has_text text="NCBI_tax_id"/> | |
| 907 <has_text text="clade_name"/> | |
| 908 </assert_contents> | |
| 909 </output> | |
| 910 <output name="biom_output_file" ftype="biom1" file="SRS014464-Anterior_nares.biom" compare="sim_size"> | |
| 911 <assert_contents> | |
| 912 <has_text text="k__Bacteria|p__Proteobacteria|c__Gammaproteobacteria|o__Pseudomonadales|f__Moraxellaceae|g__Moraxella|s__Moraxella_lacunata"/> | |
| 913 </assert_contents> | |
| 914 </output> | |
| 915 </test> | |
| 916 <test expect_num_outputs="6"> | |
| 917 <section name="inputs"> | |
| 918 <conditional name="in"> | |
| 919 <param name="selector" value="raw"/> | |
| 920 <conditional name="raw_in"> | |
| 921 <!-- Single FASTA file --> | |
| 922 <param name="selector" value="single"/> | |
| 923 <param name="in" value="SRS014464-Anterior_nares.fasta"/> | |
| 924 </conditional> | |
| 925 <param name="read_min_len" value="70"/> | |
| 926 <section name="mapping"> | |
| 927 <param name="bt2_ps" value="sensitive"/> | |
| 928 <param name="min_mapq_val" value="5"/> | |
| 929 </section> | |
| 930 </conditional> | |
| 931 <conditional name="db"> | |
| 932 <!-- Cached db --> | |
| 933 <param name="db_selector" value="cached"/> | |
| 934 <param name="cached_db" value="test-db-20210409"/> | |
| 935 </conditional> | |
| 936 </section> | |
| 937 <section name="analysis"> | |
| 938 <conditional name="analysis_type"> | |
| 939 <param name="t" value="rel_ab"/> | |
| 940 <conditional name="tax_lev"> | |
| 941 <param name="tax_lev" value="a"/> | |
| 942 <param name="split_levels" value="true"/> | |
| 943 </conditional> | |
| 944 </conditional> | |
| 945 <param name="min_cu_len" value="2000"/> | |
| 946 <param name="organism_profiling" value="add_viruses"/> | |
| 947 <param name="stat" value="avg_g"/> | |
| 948 <param name="stat_q" value="0.2"/> | |
| 949 <param name="perc_nonzero" value="0.33"/> | |
| 950 <param name="ignore_markers" value="marker.txt"/> | |
| 951 <param name="avoid_disqm" value="true"/> | |
| 952 </section> | |
| 953 <section name="out"> | |
| 954 <param name="sample_id_key" value="SampleID"/> | |
| 955 <param name="sample_id" value="Metaphlan_Analysis"/> | |
| 956 <param name="use_group_representative" value="false"/> | |
| 957 <param name="legacy_output" value="true"/> | |
| 958 <param name="CAMI_format_output" value="false"/> | |
| 959 <param name="unknown_estimation" value="false"/> | |
| 960 <param name="krona_output" value="true"/> | |
| 961 </section> | |
| 962 <output name="output_file" ftype="tabular" file="SRS014464-Anterior_nares-legacy-abundances.tabular" compare="sim_size"> | |
| 963 <assert_contents> | |
| 964 <has_text text="k__Bacteria|p__Actinobacteria|c__Actinobacteria|o__Corynebacteriales|f__Corynebacteriaceae|g__Corynebacterium|s__Corynebacterium_accolens"/> | |
| 965 <has_text text="SampleID"/> | |
| 966 <has_text text="Metaphlan_Analysis"/> | |
| 967 </assert_contents> | |
| 968 </output> | |
| 969 <output name="bowtie2out" ftype="tabular" file="SRS014464-Anterior_nares-bowtie2out.tabular" compare="sim_size"> | |
| 970 <assert_contents> | |
| 971 <has_text text="HWI-EAS109_102883399:3:104:7342:14360/1"/> | |
| 972 <has_text text="37637__U2I1U8__N579_01580"/> | |
| 973 </assert_contents> | |
| 974 </output> | |
| 975 <output name="sam_output_file" ftype="sam" file="SRS014464-Anterior_nares.sam" compare="sim_size"> | |
| 976 <assert_contents> | |
| 977 <has_text text="SN:13076__A0A2I1PE66__CYJ72_10760"/> | |
| 978 </assert_contents> | |
| 979 </output> | |
| 980 <output name="biom_output_file" ftype="biom1" file="SRS014464-Anterior_nares.biom" compare="sim_size"> | |
| 981 <assert_contents> | |
| 982 <has_text text="k__Bacteria|p__Proteobacteria|c__Gammaproteobacteria|o__Pseudomonadales|f__Moraxellaceae|g__Moraxella|s__Moraxella_lacunata"/> | |
| 983 </assert_contents> | |
| 984 </output> | |
| 985 <output_collection name="levels" type="list" > | |
| 986 <element name="all" ftype="tabular"> | |
| 987 <assert_contents> | |
| 988 <has_text text="Gammaproteobacteria"/> | |
| 989 <has_text text="Corynebacterium accolens"/> | |
| 990 <has_n_columns n="9"/> | |
| 991 </assert_contents> | |
| 992 </element> | |
| 993 <element name="class" ftype="tabular"> | |
| 994 <assert_contents> | |
| 995 <has_text text="class"/> | |
| 996 <has_text text="Actinobacteria"/> | |
| 997 <has_n_columns n="2"/> | |
| 998 </assert_contents> | |
| 999 </element> | |
| 1000 <element name="family" ftype="tabular"> | |
| 1001 <assert_contents> | |
| 1002 <has_text text="family"/> | |
| 1003 <has_text text="Propionibacteriaceae"/> | |
| 1004 <has_n_columns n="2"/> | |
| 1005 </assert_contents> | |
| 1006 </element> | |
| 1007 <element name="genus" ftype="tabular"> | |
| 1008 <assert_contents> | |
| 1009 <has_text text="genus"/> | |
| 1010 <has_text text="Cutibacterium"/> | |
| 1011 <has_n_columns n="2"/> | |
| 1012 </assert_contents> | |
| 1013 </element> | |
| 1014 <element name="kingdom" ftype="tabular"> | |
| 1015 <assert_contents> | |
| 1016 <has_text text="kingdom"/> | |
| 1017 <has_text text="Bacteria"/> | |
| 1018 <has_n_columns n="2"/> | |
| 1019 </assert_contents> | |
| 1020 </element> | |
| 1021 <element name="order" ftype="tabular"> | |
| 1022 <assert_contents> | |
| 1023 <has_text text="order"/> | |
| 1024 <has_text text="Propionibacteriales"/> | |
| 1025 <has_n_columns n="2"/> | |
| 1026 </assert_contents> | |
| 1027 </element> | |
| 1028 <element name="phylum" ftype="tabular"> | |
| 1029 <assert_contents> | |
| 1030 <has_text text="phylum"/> | |
| 1031 <has_text text="Firmicutes"/> | |
| 1032 <has_n_columns n="2"/> | |
| 1033 </assert_contents> | |
| 1034 </element> | |
| 1035 <element name="species" ftype="tabular"> | |
| 1036 <assert_contents> | |
| 1037 <has_text text="species"/> | |
| 1038 <has_text text="Corynebacterium accolens"/> | |
| 1039 <has_n_columns n="2"/> | |
| 1040 </assert_contents> | |
| 1041 </element> | |
| 1042 <element name="strains" ftype="tabular"> | |
| 1043 <assert_contents> | |
| 1044 <has_text text="strains"/> | |
| 1045 <has_n_columns n="2"/> | |
| 1046 </assert_contents> | |
| 1047 </element> | |
| 1048 </output_collection> | |
| 1049 <output name="krona_output_file" ftype="tabular"> | |
| 1050 <assert_contents> | |
| 1051 <not_has_text text="k__Bacteria"/> | |
| 1052 <has_text text="Corynebacterium accolens"/> | |
| 1053 <has_n_columns n="9"/> | |
| 1054 </assert_contents> | |
| 1055 </output> | |
| 1056 </test> | |
| 1057 </tests> | |
| 1058 <help><![CDATA[ | |
| 1059 What it does | |
| 1060 ============ | |
| 1061 | |
| 1062 MetaPhlAn is a computational tool for profiling the composition of microbial communities (Bacteria, | |
| 1063 Archaea and Eukaryotes) from metagenomic shotgun sequencing data (i.e. not 16S) at species-level. | |
| 1064 | |
| 1065 MetaPhlAn relies on ~1.1M unique clade-specific marker genes identified from ~100,000 reference genomes | |
| 1066 (~99,500 bacterial and archaeal and ~500 eukaryotic), allowing: | |
| 1067 | |
| 1068 - unambiguous taxonomic assignments; | |
| 1069 - accurate estimation of organismal relative abundance; | |
| 1070 - species-level resolution for bacteria, archaea, eukaryotes and viruses; | |
| 1071 - strain identification and tracking | |
| 1072 - orders of magnitude speedups compared to existing methods. | |
| 1073 - microbiota strain-level population genomics | |
| 1074 | |
| 1075 MetaPhlAn clade-abundance estimation | |
| 1076 ------------------------------------ | |
| 1077 | |
| 1078 The basic usage of MetaPhlAn consists in the identification of the clades (from phyla to species and | |
| 1079 strains in particular cases) present in the microbiota obtained from a microbiome sample and their | |
| 1080 relative abundance. | |
| 1081 | |
| 1082 Marker level analysis | |
| 1083 --------------------- | |
| 1084 | |
| 1085 MetaPhlAn introduces the capability of characterizing organisms at the strain level using non | |
| 1086 aggregated marker information. Such capability comes with several slightly different flavours and | |
| 1087 are a way to perform strain tracking and comparison across multiple samples. | |
| 1088 | |
| 1089 Usually, MetaPhlAn is first ran with default parameters for the type of analysis to profile the | |
| 1090 species present in the community, and then a strain-level profiling can be performed to zoom-in on | |
| 1091 specific species of interest. This operation can be performed quickly as it exploits the bowtie2out | |
| 1092 intermediate file saved during the execution of the default analysis type. | |
| 1093 | |
| 1094 Inputs | |
| 1095 ====== | |
| 1096 | |
| 1097 Metaphlan takes as input either: | |
| 1098 | |
| 1099 - one or several sequence files in Fasta, FastQ (whether compressed or not) | |
| 1100 - a BowTie2 produced SAM file | |
| 1101 - an intermediary mapping file of the microbiota generated by a previous MetaPhlAn run | |
| 1102 | |
| 1103 It also needs the reference database, which can be locally installed or customized using the dedicated tools. | |
| 1104 | |
| 1105 Outputs | |
| 1106 ======= | |
| 1107 | |
| 1108 The main output is a tab-separated file with the predicted taxon relative abundances. | |
| 1109 | |
| 1110 It also generates a BIOM file and some intermediate files (SAM and BowTie2out) if sequence files are given as inputs. | |
| 1111 | |
| 1112 | |
| 1113 More help and use cases | |
| 1114 ======================= | |
| 1115 | |
| 1116 To get more information about MetaPhlAn usage and use cases, please refer to the `Metaphlan documentation`_. | |
| 1117 | |
| 1118 .. _Metaphlan documentation: https://github.com/biobakery/MetaPhlAn/wiki/MetaPhlAn-4#Basic-Usage | |
| 1119 | |
| 1120 ]]></help> | |
| 1121 <expand macro="citations"/> | |
| 1122 </tool> |
