Mercurial > repos > ufz > iphop_predict
comparison iphop.xml @ 2:be0d13020aec draft default tip
planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/iphop/ commit e93300e2db7217d84659e199d3f23e280de80ccb
| author | ufz |
|---|---|
| date | Wed, 11 Feb 2026 14:31:52 +0000 |
| parents | d357350b6da0 |
| children |
comparison
equal
deleted
inserted
replaced
| 1:d357350b6da0 | 2:be0d13020aec |
|---|---|
| 1 <tool id="iphop_predict" name="iPHoP predict" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="23.0" license="MIT"> | 1 <tool id="iphop_predict" name="iPHoP predict" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="23.0" license="MIT"> |
| 2 <description>host of input bacteriophage/archaeal virus genomes</description> | 2 <description>host of input bacteriophage/archaeal virus genomes</description> |
| 3 <macros> | 3 <macros> |
| 4 <token name="@TOOL_VERSION@">1.3.3</token> | 4 <token name="@TOOL_VERSION@">1.4.2</token> |
| 5 <token name="@VERSION_SUFFIX@">0</token> | 5 <token name="@VERSION_SUFFIX@">0</token> |
| 6 </macros> | 6 </macros> |
| 7 <xrefs> | 7 <xrefs> |
| 8 <xref type="bio.tools">iphop</xref> | 8 <xref type="bio.tools">iphop</xref> |
| 9 </xrefs> | 9 </xrefs> |
| 23 ]]></command> | 23 ]]></command> |
| 24 <inputs> | 24 <inputs> |
| 25 <param argument="--fa_file" type="data" format="fasta" label="FASTA formatted virus sequences"/> | 25 <param argument="--fa_file" type="data" format="fasta" label="FASTA formatted virus sequences"/> |
| 26 <param argument="--db_dir" type="select" label="Reference database"> | 26 <param argument="--db_dir" type="select" label="Reference database"> |
| 27 <options from_data_table="iphop"> | 27 <options from_data_table="iphop"> |
| 28 <filter type="regexp" column="version" value="^(iPHoP_db_Jun25_rw|test_version)$"/> | |
| 28 <validator type="no_options" message="No reference data available. Contact your Galaxy admin."/> | 29 <validator type="no_options" message="No reference data available. Contact your Galaxy admin."/> |
| 29 </options> | 30 </options> |
| 30 </param> | 31 </param> |
| 31 <param argument="--min_score" type="integer" value="90" min="75" max="100" label="Minimum confidence score" help="Minimum confidence score for final output. Default of 90 corresponds to ~10% FDR (roughly). For ~5% overall (roughly) estimated FDR, use a minimum score of 95, etc."/> | 32 <param argument="--min_score" type="integer" value="90" min="75" max="100" label="Minimum confidence score" help="Minimum confidence score for final output. Default of 90 corresponds to ~10% FDR (roughly). For ~5% overall (roughly) estimated FDR, use a minimum score of 95, etc."/> |
| 32 <param argument="--no_qc" type="boolean" truevalue="--no_qc" falsevalue="" label="Bypass the automated QC" help="Bypass the automated QC that filters out input sequences with > 10% Ns or with characters other than ATCGN. Warning: if set to true, low-quality sequences (with Ns or unusual characters) may lead to unexpected failures at multiple steps. (default = False)"/> | 33 <param argument="--no_qc" type="boolean" truevalue="--no_qc" falsevalue="" label="Bypass the automated QC" help="Bypass the automated QC that filters out input sequences with > 10% Ns or with characters other than ATCGN. Warning: if set to true, low-quality sequences (with Ns or unusual characters) may lead to unexpected failures at multiple steps. (default = False)"/> |
| 40 <!-- <test> | 41 <!-- <test> |
| 41 <param name="fa_file" value="test_input_phages.fna" ftype="fasta"/> | 42 <param name="fa_file" value="test_input_phages.fna" ftype="fasta"/> |
| 42 <param name="db_dir" value="db2"/> | 43 <param name="db_dir" value="db2"/> |
| 43 <output name="detailed_per_tool"> | 44 <output name="detailed_per_tool"> |
| 44 <assert_contents> | 45 <assert_contents> |
| 45 <has_n_lines n="190"/> | 46 <has_n_lines n="192"/> |
| 46 <has_n_columns n="10" sep="," comment="#"/> | 47 <has_n_columns n="10" sep="," comment="#"/> |
| 47 </assert_contents> | 48 </assert_contents> |
| 48 </output> | 49 </output> |
| 49 <output name="host_genome"> | 50 <output name="host_genome"> |
| 50 <assert_contents> | 51 <assert_contents> |
| 51 <has_line line="Virus,Host genome,Host taxonomy,Main method,Confidence score,Additional methods"/> | 52 <has_line line="Virus,Host genome,Host taxonomy,Main method,Confidence score,Additional methods"/> |
| 52 <has_n_lines n="119"/> | 53 <has_n_lines n="27"/> |
| 53 <has_n_columns n="6" sep=","/> | 54 <has_n_columns n="6" sep=","/> |
| 54 </assert_contents> | 55 </assert_contents> |
| 55 </output> | 56 </output> |
| 56 <output name="host_genus"> | 57 <output name="host_genus"> |
| 57 <assert_contents> | 58 <assert_contents> |
| 58 <has_line line="Virus,AAI to closest RaFAH reference,Host genus,Confidence score,List of methods"/> | 59 <has_line line="Virus,AAI to closest RaFAH reference,Host genus,Confidence score,List of methods"/> |
| 59 <has_n_lines n="6"/> | 60 <has_n_lines n="8"/> |
| 60 <has_n_columns n="5" sep=","/> | 61 <has_n_columns n="5" sep=","/> |
| 61 </assert_contents> | 62 </assert_contents> |
| 62 </output> | 63 </output> |
| 63 </test> --> | 64 </test> --> |
| 64 </tests> | 65 </tests> |
| 85 - the level of amino-acid similarity (AAI) between the query and the genomes in the RaFAH phage database, | 86 - the level of amino-acid similarity (AAI) between the query and the genomes in the RaFAH phage database, |
| 86 - the predicted host genus, | 87 - the predicted host genus, |
| 87 - the confidence score calculated from all tools, and | 88 - the confidence score calculated from all tools, and |
| 88 - the list of scores for individual classifiers obtained for this virus-host pair. | 89 - the list of scores for individual classifiers obtained for this virus-host pair. |
| 89 | 90 |
| 90 - for the detailed score by classifier, "RaFAH" represents the score derived from RaFAH (https://pubmed.ncbi.nlm.nih.gov/34286299/), iPHoP-RF is the score derived from all host-based tools, CRISPR the score derived only from CRISPR hits, and blast the score derived only from blastn hits | 91 - for the detailed score by classifier, "RaFAH" represents the score derived from RaFAH (https://doi.org/10.1016/j.patter.2021.100274), iPHoP-RF is the score derived from all host-based tools, CRISPR the score derived only from CRISPR hits, and blast the score derived only from blastn hits |
| 91 - all virus-host pairs for which the confidence score is higher than the selected score cutoff (default = 90) are included, so each virus may be associated with multiple predictions | 92 - all virus-host pairs for which the confidence score is higher than the selected score cutoff (default = 90) are included, so each virus may be associated with multiple predictions |
| 92 - when multiple predictions are available for a query virus, typical standard practices is to use the one with the highest score | 93 - when multiple predictions are available for a query virus, typical standard practices is to use the one with the highest score |
| 93 | 94 |
| 94 Host prediction to genome | 95 Host prediction to genome |
| 95 | 96 |
