Mercurial > repos > iuc > roary
comparison roary.xml @ 7:78608ec02d62 draft
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/roary commit 442b1247ee31ec9872633be18784f346e4762486"
author | iuc |
---|---|
date | Sat, 13 Feb 2021 11:59:15 +0000 |
parents | 15ac71df11a0 |
children | e88a7de55d6e |
comparison
equal
deleted
inserted
replaced
6:15ac71df11a0 | 7:78608ec02d62 |
---|---|
1 <tool id="roary" name="Roary" version="3.13.0+galaxy0"> | 1 <tool id="roary" name="Roary" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@"> |
2 <description>the pangenome pipeline - Quickly generate a core gene alignment from gff3 files</description> | 2 <description>the pangenome pipeline - Quickly generate a core gene alignment from gff3 files</description> |
3 | 3 <macros> |
4 <token name="@TOOL_VERSION@">3.13.0</token> | |
5 <token name="@VERSION_SUFFIX@">1</token> | |
6 </macros> | |
4 <requirements> | 7 <requirements> |
5 <requirement type="package" version="3.13.0">roary</requirement> | 8 <requirement type="package" version="@TOOL_VERSION@">roary</requirement> |
6 </requirements> | 9 </requirements> |
7 | 10 |
8 <command detect_errors="exit_code"><![CDATA[ | 11 <command detect_errors="exit_code"><![CDATA[ |
9 #set $filenames = list() | 12 #set $filenames = list() |
10 #for $gff in $gff_input.gffs | 13 #for $gff in $gff_input.gffs |
11 cp '$gff' '${gff.element_identifier}.gff' && | 14 cp '$gff' '${gff.element_identifier}.gff' && |
12 #set $filename = str($gff.element_identifier) + '.gff' | 15 #set $filename = str($gff.element_identifier) + '.gff' |
13 $filenames.append(str($filename)) | 16 $filenames.append(str($filename)) |
14 #end for | 17 #end for |
15 | 18 |
16 roary | 19 roary |
17 -f out | 20 -f out |
18 -p \${GALAXY_SLOTS:-1} | 21 -p \${GALAXY_SLOTS:-1} |
27 | 30 |
28 #for $f in $filenames | 31 #for $f in $filenames |
29 '$f' | 32 '$f' |
30 #end for | 33 #end for |
31 | 34 |
32 ]]></command> | 35 ]]> </command> |
33 | 36 |
34 <inputs> | 37 <inputs> |
35 <conditional name="gff_input"> | 38 <conditional name="gff_input"> |
36 <param name="gff_input_selector" type="select" label="Individual gff files or a dataset collection" help="Select between individual gff files or a collection of gff files"> | 39 <param name="gff_input_selector" type="select" label="Individual gff files or a dataset collection" help="Select between individual gff files or a collection of gff files"> |
37 <option value="individual">Individual</option> | 40 <option value="individual">Individual</option> |
38 <option value="collection">Collection</option> | 41 <option value="collection">Collection</option> |
42 </param> | |
43 <when value="individual"> | |
44 <param name="gffs" type="data" multiple="true" min="2" format="gff,gff3" label="select gff inputs to Roary" help="Select the files you wish to send to Roary, must be in gff3 format with the sequence data at the end of the file." /> | |
45 </when> | |
46 <when value='collection'> | |
47 <param name="gffs" type="data_collection" collection_type="list" format="gff,gff3" label="Dataset collection to submit to Roary" help="A dataset list collection of gff3 files to send to Roary for analysis." /> | |
48 </when> | |
49 </conditional> | |
50 <param name="percent_ident" type="integer" value="95" label="minimum percentage identity for blastp" help="Sets the minimum percentage identity for protein matches" /> | |
51 <param name="core_diff" type="float" value="99.0" label="percentage of isolates a gene must be in to be core" help="The total percentage of the isolates that must have the gene for it to be considered a core gene." /> | |
52 | |
53 <param name="outputs" type="select" multiple="true" display="checkboxes" label="Additional outputs" help="Summary statistics, core gene alignments and Gene Presence/Absence tables are always produced."> | |
54 <option value="abg_nw">Accessory binary genes in newick format</option> | |
55 <option value="abg_fa">Accessory binary genes in fasta format</option> | |
56 <option value="accgraph">Accessory graph in dot format</option> | |
57 <option value="acchead_embl">Accessory header file in embl format</option> | |
58 <option value="acctab">Accessory gene table in tabular format</option> | |
59 <option value="blastfreq">Blast Identity Frequency Rtab file</option> | |
60 <option value="clust">Clustered proteins file</option> | |
61 <option value="coreaccgraph">Core Accessory Graph in dot format</option> | |
62 <option value="coreaccembl">Core Accessory table in embl format</option> | |
63 <option value="coreacctab">Core Accessory table in tabular format</option> | |
64 <option value="genepa_rtab">Gene Presence Absence file in Rtab format</option> | |
65 <option value="numcons_rtab">Number of Conserved Genes in Rtab format</option> | |
66 <option value="numpangene_rtab">Number of Genes in Pan Genome in Rtab format</option> | |
67 <option value="numnew_rtab">Number of New Genes in Rtab format</option> | |
68 <option value="numuniq_rtab">Number of Unique Genes in Rtab format</option> | |
69 <option value="pangenomeref">FASTA file which contains a single representative nucleotide sequence from each of the clusters in the pan genome (core and accessory)</option> | |
39 </param> | 70 </param> |
40 <when value="individual"> | |
41 <param name="gffs" type="data" multiple="true" format="gff,gff3" label="select gff inputs to Roary" help="Select the files you wish to send to Roary, must be in gff3 format with the sequence data at the end of the file." /> | |
42 </when> | |
43 <when value='collection'> | |
44 <param name="gffs" type="data_collection" collection_type="list" format="gff,gff3" label="Dataset collection to submit to Roary" help="A dataset list collection of gff3 files to send to Roary for analysis." /> | |
45 </when> | |
46 </conditional> | |
47 <param name="percent_ident" type="integer" label="minimum percentage identity for blastp" help="Sets the minimum percentage identity for protein matches" value="95"/> | |
48 <param name="core_diff" type="float" label="percentage of isolates a gene must be in to be core" help="The total percentage of the isolates that must have the gene for it to be considered a core gene." value="99.0"/> | |
49 | 71 |
50 <param name="outputs" type="select" multiple="true" display="checkboxes" label="Additional outputs" help="Summary statistics, core gene alignments and Gene Presence/Absence tables are always produced."> | 72 <section name="advanced" title="Advanced options" expanded="false"> |
51 <option value="abg_nw">Accessory binary genes in newick format</option> | 73 <param name="maxclust" type="integer" value="50000" label="Maximum number of clusters" help="The maximum number of clusters to assign proteins" /> |
52 <option value="abg_fa">Accessory binary genes in fasta format</option> | 74 <param name="split_para" type="boolean" checked="False" truevalue="-s" falsevalue="" label="Don't split paralogs" help="Click yes so that paralogs aren't split." /> |
53 <option value="accgraph">Accessory graph in dot format</option> | 75 <param name="trans_tab" type="integer" value="11" label="Translation table to use [1 or 4 or 11]" help="DNA -> RNA translation table to use. Roary is designed for prokaryotes and so tables 1, 4 or 11 will work, others could be problematic." /> |
54 <option value="acchead_embl">Accessory header file in embl format</option> | 76 <param name="mcl" type="float" value="1.5" label="MCL inflation value" help="This is an advanced setting, change only if you know what you are doing and then at your own risk!" /> |
55 <option value="acctab">Accessory gene table in tabular format</option> | 77 </section> |
56 <option value="blastfreq">Blast Identity Frequency Rtab file</option> | |
57 <option value="clust">Clustered proteins file</option> | |
58 <option value="coreaccgraph">Core Accessory Graph in dot format</option> | |
59 <option value="coreaccembl">Core Accessory table in embl format</option> | |
60 <option value="coreacctab">Core Accessory table in tabular format</option> | |
61 <option value="genepa_rtab">Gene Presence Absence file in Rtab format</option> | |
62 <option value="numcons_rtab">Number of Conserved Genes in Rtab format</option> | |
63 <option value="numpangene_rtab">Number of Genes in Pan Genome in Rtab format</option> | |
64 <option value="numnew_rtab">Number of New Genes in Rtab format</option> | |
65 <option value="numuniq_rtab">Number of Unique Genes in Rtab format</option> | |
66 <option value="pangenomeref">FASTA file which contains a single representative nucleotide sequence from each of the clusters in the pan genome (core and accessory)</option> | |
67 </param> | |
68 | |
69 <section name="advanced" title="Advanced options" expanded="false"> | |
70 <param name="maxclust" type="integer" value="50000" label="Maximum number of clusters" help="The maximum number of clusters to assign proteins" /> | |
71 <param name="split_para" type="boolean" checked="False" truevalue="-s" falsevalue="" label="Don't split paralogs" help="Click yes so that paralogs aren't split."/> | |
72 <param name="trans_tab" type="integer" value="11" label="Translation table to use [1 or 4 or 11]" help="DNA -> RNA translation table to use. Roary is designed for prokaryotes and so tables 1, 4 or 11 will work, others could be problematic." /> | |
73 <param name="mcl" type="float" value="1.5" label="MCL inflation value" help="This is an advanced setting, change only if you know what you are doing and then at your own risk!" /> | |
74 </section> | |
75 | 78 |
76 </inputs> | 79 </inputs> |
77 | 80 |
78 <outputs> | 81 <outputs> |
79 <data format="tabular" name="sumstats" label="${tool.name} on ${on_string} Summary statistics" from_work_dir="out/summary_statistics.txt" /> | 82 <data format="tabular" name="sumstats" label="${tool.name} on ${on_string} Summary statistics" from_work_dir="out/summary_statistics.txt" /> |
80 <data format="fasta" name="core_gene_aln" label="${tool.name} on ${on_string} Core Gene Alignment" from_work_dir="out/core_gene_alignment.aln" /> | 83 <data format="fasta" name="core_gene_aln" label="${tool.name} on ${on_string} Core Gene Alignment" from_work_dir="out/core_gene_alignment.aln" /> |
81 <data format="csv" name="gene_p_a" label="${tool.name} on ${on_string} Gene Presence Absence" from_work_dir="out/gene_presence_absence.csv" /> | 84 <data format="csv" name="gene_p_a" label="${tool.name} on ${on_string} Gene Presence Absence" from_work_dir="out/gene_presence_absence.csv" /> |
82 <data format="fasta" name="acc_bin" label="${tool.name} on ${on_string} Accessory Binary Genes" from_work_dir="out/accessory_binary_genes.fa" > | 85 <data format="fasta" name="acc_bin" label="${tool.name} on ${on_string} Accessory Binary Genes" from_work_dir="out/accessory_binary_genes.fa"> |
83 <filter>outputs and 'abg_fa' in outputs</filter> | 86 <filter>outputs and 'abg_fa' in outputs</filter> |
84 </data> | 87 </data> |
85 <data format="nhx" name="acc_bin_new" label="${tool.name} on ${on_string} Accessory Binary Genes (Newick)" from_work_dir="out/accessory_binary_genes.fa.newick" > | 88 <data format="nhx" name="acc_bin_new" label="${tool.name} on ${on_string} Accessory Binary Genes (Newick)" from_work_dir="out/accessory_binary_genes.fa.newick"> |
86 <filter>outputs and 'abg_nw' in outputs</filter> | 89 <filter>outputs and 'abg_nw' in outputs</filter> |
87 </data> | 90 </data> |
88 <data format="dot" name="acc_graph" label="${tool.name} on ${on_string} Acsessory Graph" from_work_dir="out/accessory_graph.dot"> | 91 <data format="dot" name="acc_graph" label="${tool.name} on ${on_string} Acsessory Graph" from_work_dir="out/accessory_graph.dot"> |
89 <filter>outputs and 'accgraph' in outputs</filter> | 92 <filter>outputs and 'accgraph' in outputs</filter> |
90 </data> | 93 </data> |
91 <data format="embl" name="acc_head_embl" label="${tool.name} on ${on_string} Accessory Header" from_work_dir="out/accessory.header.embl" > | 94 <data format="embl" name="acc_head_embl" label="${tool.name} on ${on_string} Accessory Header" from_work_dir="out/accessory.header.embl"> |
92 <filter>outputs and 'acchead_embl' in outputs</filter> | 95 <filter>outputs and 'acchead_embl' in outputs</filter> |
93 </data> | 96 </data> |
94 <data format="tabular" name="acc_tab" label="${tool.name} on ${on_string} Accessory Gene Table" from_work_dir="out/accessory.tab" > | 97 <data format="tabular" name="acc_tab" label="${tool.name} on ${on_string} Accessory Gene Table" from_work_dir="out/accessory.tab"> |
95 <filter>outputs and 'acctab' in outputs</filter> | 98 <filter>outputs and 'acctab' in outputs</filter> |
96 </data> | 99 </data> |
97 <data format="txt" name="blast_freq" label="${tool.name} on ${on_string} Blast Identity Frequencies" from_work_dir="out/blast_identity_frequency.Rtab" > | 100 <data format="txt" name="blast_freq" label="${tool.name} on ${on_string} Blast Identity Frequencies" from_work_dir="out/blast_identity_frequency.Rtab"> |
98 <filter>outputs and 'blastfreq' in outputs</filter> | 101 <filter>outputs and 'blastfreq' in outputs</filter> |
99 </data> | 102 </data> |
100 <data format="txt" name="clust_file" label="${tool.name} on ${on_string} Clustered Proteins" from_work_dir="out/clustered_proteins" > | 103 <data format="txt" name="clust_file" label="${tool.name} on ${on_string} Clustered Proteins" from_work_dir="out/clustered_proteins"> |
101 <filter>outputs and 'clust' in outputs</filter> | 104 <filter>outputs and 'clust' in outputs</filter> |
102 </data> | 105 </data> |
103 <data format="dot" name="core_acc_graph" label="${tool.name} on ${on_string} Core Accessory Graph" from_work_dir="out/core_accessory_graph.dot" > | 106 <data format="dot" name="core_acc_graph" label="${tool.name} on ${on_string} Core Accessory Graph" from_work_dir="out/core_accessory_graph.dot"> |
104 <filter>outputs and 'coreaccgraph' in outputs</filter> | 107 <filter>outputs and 'coreaccgraph' in outputs</filter> |
105 </data> | 108 </data> |
106 <data format="embl" name="core_acc_embl" label="${tool.name} on ${on_string} Core Accessory EMBL" from_work_dir="out/core_accessory.header.embl" > | 109 <data format="embl" name="core_acc_embl" label="${tool.name} on ${on_string} Core Accessory EMBL" from_work_dir="out/core_accessory.header.embl"> |
107 <filter>outputs and 'coreaccembl' in outputs</filter> | 110 <filter>outputs and 'coreaccembl' in outputs</filter> |
108 </data> | 111 </data> |
109 <data format="tabular" name="core_acc_tab" label="${tool.name} on ${on_string} Core Accessory Table" from_work_dir="out/core_accessory.tab" > | 112 <data format="tabular" name="core_acc_tab" label="${tool.name} on ${on_string} Core Accessory Table" from_work_dir="out/core_accessory.tab"> |
110 <filter>outputs and 'coreacctab' in outputs</filter> | 113 <filter>outputs and 'coreacctab' in outputs</filter> |
111 </data> | 114 </data> |
112 <data format="txt" name="gene_p_a_rtab" label="${tool.name} on ${on_string} Gene Presence Absence Rtab" from_work_dir="out/gene_presence_absence.Rtab" > | 115 <data format="txt" name="gene_p_a_rtab" label="${tool.name} on ${on_string} Gene Presence Absence Rtab" from_work_dir="out/gene_presence_absence.Rtab"> |
113 <filter>outputs and 'genepa_rtab' in outputs</filter> | 116 <filter>outputs and 'genepa_rtab' in outputs</filter> |
114 </data> | 117 </data> |
115 <data format="txt" name="num_cons_rtab" label="${tool.name} on ${on_string} Number of Conserved Genes" from_work_dir="out/number_of_conserved_genes.Rtab" > | 118 <data format="txt" name="num_cons_rtab" label="${tool.name} on ${on_string} Number of Conserved Genes" from_work_dir="out/number_of_conserved_genes.Rtab"> |
116 <filter>outputs and 'numcons_rtab' in outputs</filter> | 119 <filter>outputs and 'numcons_rtab' in outputs</filter> |
117 </data> | 120 </data> |
118 <data format="txt" name="num_pangene_rtab" label="${tool.name} on ${on_string} Number of Genes in Pan Geneome" from_work_dir="out/number_of_genes_in_pan_genome.Rtab" > | 121 <data format="txt" name="num_pangene_rtab" label="${tool.name} on ${on_string} Number of Genes in Pan Geneome" from_work_dir="out/number_of_genes_in_pan_genome.Rtab"> |
119 <filter>outputs and 'numpangene_rtab' in outputs</filter> | 122 <filter>outputs and 'numpangene_rtab' in outputs</filter> |
120 </data> | 123 </data> |
121 <data format="txt" name="num_new_rtab" label="${tool.name} on ${on_string} Number of New Genes" from_work_dir="out/number_of_new_genes.Rtab" > | 124 <data format="txt" name="num_new_rtab" label="${tool.name} on ${on_string} Number of New Genes" from_work_dir="out/number_of_new_genes.Rtab"> |
122 <filter>outputs and 'numnew_rtab' in outputs</filter> | 125 <filter>outputs and 'numnew_rtab' in outputs</filter> |
123 </data> | 126 </data> |
124 <data format="txt" name="num_uniq_rtab" label="${tool.name} on ${on_string} Number of Unique Genes" from_work_dir="out/number_of_unique_genes.Rtab" > | 127 <data format="txt" name="num_uniq_rtab" label="${tool.name} on ${on_string} Number of Unique Genes" from_work_dir="out/number_of_unique_genes.Rtab"> |
125 <filter>outputs and 'numuniq_rtab' in outputs</filter> | 128 <filter>outputs and 'numuniq_rtab' in outputs</filter> |
126 </data> | 129 </data> |
127 <data format="fasta" name="pan_genome_ref" label="${tool.name} on ${on_string} pan-genome reference" from_work_dir="out/pan_genome_reference.fa" > | 130 <data format="fasta" name="pan_genome_ref" label="${tool.name} on ${on_string} pan-genome reference" from_work_dir="out/pan_genome_reference.fa"> |
128 <filter>outputs and 'pangenomeref' in outputs</filter> | 131 <filter>outputs and 'pangenomeref' in outputs</filter> |
129 </data> | 132 </data> |
130 </outputs> | 133 </outputs> |
131 | 134 |
132 <tests> | 135 <tests> |
133 <test> | 136 <test> |
134 <param name="gff_input_selector" value="individual"/> | 137 <param name="gff_input_selector" value="individual" /> |
135 <param name="gffs" value="ex1.gff,ex2.gff" ftype="gff3"/> | 138 <param name="gffs" value="ex1.gff,ex2.gff" ftype="gff3" /> |
136 <output name="sumstats" file="out/summary_statistics.txt" ftype="tabular"/> | 139 <output name="sumstats" file="out/summary_statistics.txt" ftype="tabular" /> |
137 </test> | 140 </test> |
138 <test> | 141 <test> |
139 <param name="gff_input_selector" value="individual"/> | 142 <param name="gff_input_selector" value="individual" /> |
140 <param name="gffs" value="ex1.gff,ex2.gff" ftype="gff3"/> | 143 <param name="gffs" value="ex1.gff,ex2.gff" ftype="gff3" /> |
141 <param name="percent_ident" value="50"/> | 144 <param name="percent_ident" value="50" /> |
142 <param name="core_diff" value="50.0"/> | 145 <param name="core_diff" value="50.0" /> |
143 <output name="sumstats" file="test2/summary_statistics.txt" ftype="tabular"/> | 146 <output name="sumstats" file="test2/summary_statistics.txt" ftype="tabular" /> |
144 </test> | 147 </test> |
145 </tests> | 148 </tests> |
146 | 149 |
147 <help><![CDATA[ | 150 <help><![CDATA[ |
148 **Roary** | 151 **Roary** |
149 | 152 |
174 - Change the MCL inflation value - a float, default is [1.5] | 177 - Change the MCL inflation value - a float, default is [1.5] |
175 | 178 |
176 | 179 |
177 For further info see: http://sanger-pathogens.github.io/Roary/ | 180 For further info see: http://sanger-pathogens.github.io/Roary/ |
178 | 181 |
179 ]]></help> | 182 ]]> </help> |
180 | 183 |
181 <citations> | 184 <citations> |
182 <citation type="doi">10.1093/bioinformatics/btv421</citation> | 185 <citation type="doi">10.1093/bioinformatics/btv421</citation> |
183 </citations> | 186 </citations> |
184 | 187 |