comparison braker.xml @ 3:ac13de106677 draft default tip

planemo upload for repository https://github.com/genouest/galaxy-tools/tree/master/tools/braker commit d6e73c0417506d93c905b4aeb77d92350b662fbb
author genouest
date Wed, 06 Sep 2023 09:50:12 +0000
parents
children
comparison
equal deleted inserted replaced
2:cf241e076f7b 3:ac13de106677
1 <tool id="braker" name="Braker genome annotation" profile="20.01" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@">
2 <description></description>
3 <macros>
4 <import>macros.xml</import>
5 </macros>
6 <requirements>
7 <expand macro="requirements" />
8 </requirements>
9 <version_command><![CDATA[braker.pl --version; "$GENEMARK_PATH/gmes_petap.pl" | grep version]]></version_command> <!-- Prints the braker.pl version, then the lines of gmes_petap.pl output that contain "version"; the path is quoted so an install directory with spaces is not word-split -->
10 <command><![CDATA[
11 if [ -z "\$GENEMARK_PATH" ] ; then echo "GeneMark is not installed on this Galaxy server." >&2 ; exit 1 ; fi &&
12 if [ ! -f "\$GENEMARK_PATH/gmes_petap.pl" ] ; then echo "GeneMark is not installed properly on this Galaxy server." >&2 ; exit 1 ; fi &&
13 ## GeneMark only looks for its license in ~/.gm_key, so the user-supplied license is copied there
14 cp '${genemark_license}' ~/.gm_key &&
15
16 braker.pl
17 --genome '${genome}'
18
19 $softmasking
20 ## Optional evidence files; every dataset path is single-quoted so unusual file names cannot break the shell command
21 #if $evidences.bam:
22 --bam '${evidences.bam}'
23 #end if
24
25 #if $evidences.prot_seq:
26 --prot_seq '${evidences.prot_seq}'
27 #end if
28
29 ## No hints, use esmode
30 #if not $evidences.bam and not $evidences.prot_seq
31 --esmode
32 #end if
33
34 ## Both proteins and rnaseq hints, use etpmode
35 #if $evidences.bam and $evidences.prot_seq
36 --etpmode
37 #end if
38
39 #if $output_format == 'gff3'
40 --gff3
41 #end if
42 ## Boolean params below expand to their flag when checked and to an empty string otherwise
43 $genemark.fungus
44
45 $augustus.crf
46 --rounds $augustus.rounds
47
48 $advanced.UTR
49
50 $advanced.filterOutShort
51
52 #if $advanced.eval:
53 --eval '${advanced.eval}'
54 #end if
55
56 #if $advanced.eval_pseudo:
57 --eval_pseudo '${advanced.eval_pseudo}'
58 #end if
59 ## Use the number of cores allocated by Galaxy, falling back to 2 when GALAXY_SLOTS is unset
60 --cores \${GALAXY_SLOTS:-2}
61 ]]></command>
62 <inputs>
63 <param name="genemark_license" type="data" format="txt" label="GeneMark license file" help="Braker uses GeneMark, which is not free software. To use it, download and unzip a license from http://topaz.gatech.edu/GeneMark/license_download.cgi (ES/ET/EP version). GeneMark needs to be installed manually by Galaxy administrators." />
64
65 <param argument="--genome" type="data" format="fasta" label="Assembly to annotate" help="The assembly should be soft-masked (with RepeatMasker for example)" />
66
67 <param argument="--softmasking" type="boolean" checked="false" truevalue="--softmasking" falsevalue="" label="Genome sequence is soft-masked" />
68 <!-- Both evidence inputs are optional; the command section picks the BRAKER mode from which of them are set -->
69 <section name="evidences" expanded="true" title="Evidences">
70 <param argument="--bam" type="data" format="bam" optional="true" label="RNA-seq mapped to genome to train Augustus/GeneMark" />
71 <param argument="--prot_seq" type="data" format="fasta" optional="true" label="Proteins to map to genome" />
72 </section>
73
74 <section name="genemark" expanded="true" title="GeneMark">
75 <param argument="--fungus" type="boolean" checked="false" truevalue="--fungus" falsevalue="" label="Fungal genome" help="GeneMark-EX option, run algorithm with branch point model (most useful for fungal genomes)" />
76 </section>
77
78 <section name="augustus" expanded="true" title="Augustus">
79 <param argument="--crf" type="boolean" checked="false" truevalue="--crf" falsevalue="" label="Use CRF training for Augustus" help="Alternate training method (Conditional Random Field)" />
80 <param argument="--rounds" type="integer" value="5" label="Number of optimization rounds used in optimize_augustus.pl" />
81 </section>
82
83 <section name="advanced" expanded="false" title="Advanced">
84 <param argument="--UTR" type="boolean" checked="false" truevalue="--UTR=on" falsevalue="" label="Train Augustus UTR parameters and predict genes with UTRs" help="Experimental, requires RNASeq data (bam) and a softmasked genome" />
85 <param argument="--filterOutShort" type="boolean" checked="false" truevalue="--filterOutShort" falsevalue="" label="Filter out too short training genes predicted by GeneMark-EX" />
86 <param argument="--eval" type="data" format="gtf" optional="true" label="Reference set to evaluate predictions" help="using evaluation scripts from GaTech" />
87 <param argument="--eval_pseudo" type="data" format="gff3" optional="true" label="File with pseudogenes that will be excluded from accuracy evaluation" />
88 </section>
89 <!-- Selects which output dataset is created and whether the gff3 flag is passed to braker.pl -->
90 <param name="output_format" type="select" label="Output format">
91 <option value="gtf" selected="true">GTF</option>
92 <option value="gff3">GFF3</option>
93 </param>
94 </inputs>
95 <outputs> <!-- Exactly one dataset is produced, selected by the output_format parameter -->
96 <data name="output_gtf" format="gtf" from_work_dir="braker/braker.gtf" label="${tool.name} on ${on_string}: GTF annotation">
97 <filter>output_format == 'gtf'</filter>
98 </data>
99 <data name="output_gff" format="gff3" from_work_dir="braker/braker.gff3" label="${tool.name} on ${on_string}: GFF annotation">
100 <filter>output_format == 'gff3'</filter>
101 </data>
102 </outputs>
103 <tests>
104 <!-- NOTE(review): this test expects the job to fail, presumably because GeneMark is not installed on CI and the command exits early; confirm -->
105 <test expect_failure="true">
106 <param name="genemark_license" value="gm_key_64"/>
107 <param name="genome" value="genome_masked.fa"/>
108 <section name="evidences">
109 <param name="bam" value="SRR7458692.bam"/>
110 </section>
111 <param name="output_format" value="gtf"/>
112 </test>
113
114 <!-- The next 2 tests are disabled for CI (they should pass locally) -->
115 <!--test>
116 <param name="genome" value="genome_masked.fa" />
117 <param name="softmasking" value="true" />
118 <param name="genemark_license" value="genemark_license.gm_key" />
119 <output name="output_gtf" file="out_genome/braker.gtf" sort="true" />
120 </test>
121 <test>
122 <param name="genome" value="genome_masked.fa" />
123 <param name="softmasking" value="true" />
124 <param name="genemark_license" value="genemark_license.gm_key" />
125 <param name="output_format" value="gff3" />
126 <output name="output_gff" file="out_genome/braker.gff3" sort="true" />
127 </test-->
128 <!-- The following 2 tests are disabled: they throw an error because the test dataset is too small -->
129 <!--test>
130 <param name="genome" value="genome_masked.fa" />
131 <param name="softmasking" value="true" />
132 <param name="genemark_license" value="genemark_license.gm_key" />
133 <section name="evidences">
134 <param name="bam" value="SRR7458692.bam" />
135 </section>
136 <output name="output_gtf" file="out_bam/braker.gtf" sort="true" />
137 </test>
138 <test>
139 <param name="genome" value="genome_masked.fa" />
140 <param name="softmasking" value="true" />
141 <param name="genemark_license" value="genemark_license.gm_key" />
142 <section name="evidences">
143 <param name="prot_seq" value="proteins.fa" />
144 </section>
145 <output name="output_gtf" file="out_prot/braker.gtf" sort="true" />
146 </test-->
147 </tests>
148 <help><![CDATA[
149 Braker_
150 -------
151
152 Braker_ is a pipeline for fully automated training of the gene prediction tools GeneMark-EX and AUGUSTUS from RNA-Seq and/or protein homology information; it then integrates this extrinsic evidence from RNA-Seq and protein homology into the prediction.
153
154 In contrast to other available methods that rely on protein homology information, BRAKER reaches high gene prediction accuracy even in the absence of the annotation of very closely related species and in the absence of RNA-Seq data.
155
156 .. _Braker: https://github.com/Gaius-Augustus/BRAKER
157 ]]></help>
158 <expand macro="citations" />
159 </tool>