Mercurial > repos > bgruening > augustus
comparison augustus.xml @ 2:a77a4e9921e0 draft
Uploaded
author | bgruening |
---|---|
date | Wed, 06 May 2015 14:31:02 -0400 |
parents | e2b822d7408f |
children | f5075dee9d6b |
comparison
equal
deleted
inserted
replaced
1:e2b822d7408f | 2:a77a4e9921e0 |
---|---|
1 <tool id="augustus" name="Augustus" version="0.3.1"> | 1 <tool id="augustus" name="Augustus" version="0.3.1"> |
2 <description>gene prediction for eukaryotic genomes</description> | 2 <description>gene prediction for eukaryotic genomes</description> |
3 <parallelism method="multi" split_inputs="input_genome" split_mode="to_size" split_size="10" merge_outputs="output,protein_output,codingseq_output"></parallelism> | 3 <parallelism method="multi" split_inputs="input_genome" split_mode="to_size" split_size="10" merge_outputs="output,protein_output,codingseq_output"></parallelism> |
4 <requirements> | 4 <requirements> |
5 <requirement type="package" version="2.7">augustus</requirement> | 5 <requirement type="package" version="2.7">augustus</requirement> |
6 <requirement type="set_environment">AUGUSTUS_SCRIPT_PATH</requirement> | |
7 </requirements> | 6 </requirements> |
7 <stdio> | |
8 <exit_code range="1:" /> | |
9 <exit_code range=":-1" /> | |
10 <regex match="Error:" /> | |
11 <regex match="Exception:" /> | |
12 </stdio> | |
8 <command> | 13 <command> |
14 <![CDATA[ | |
9 ## please set export AUGUSTUS_CONFIG_PATH=/path_to_augustus/augustus/config | 15 ## please set export AUGUSTUS_CONFIG_PATH=/path_to_augustus/augustus/config |
10 ## or use the --AUGUSTUS_CONFIG_PATH=path if you are not installing through the toolshed | 16 ## or use the --AUGUSTUS_CONFIG_PATH=path if you are not installing through the toolshed |
11 ## Augustus writes the protein and coding sequences as comment into the gff/gtf file an external script is used to extract the sequences into additional files | 17 ## Augustus writes the protein and coding sequences as comment into the gff/gtf file an external script is used to extract the sequences into additional files |
12 | 18 |
13 augustus | 19 augustus |
14 --strand=$strand | 20 --strand=$strand |
15 $noInFrameStop | 21 $noInFrameStop |
16 $gff | 22 $gff |
17 | 23 |
18 #if 'protein' in str($outputs).split(','): | 24 #if 'protein' in str($outputs).split(','): |
19 --protein=on | 25 --protein=on |
20 #else: | 26 #else: |
21 --protein=off | 27 --protein=off |
22 #end if | 28 #end if |
24 #if 'codingseq' in str($outputs).split(','): | 30 #if 'codingseq' in str($outputs).split(','): |
25 --codingseq=on | 31 --codingseq=on |
26 #else: | 32 #else: |
27 --codingseq=off | 33 --codingseq=off |
28 #end if | 34 #end if |
29 | 35 |
30 #if 'introns' in str($outputs).split(','): | 36 #if 'introns' in str($outputs).split(','): |
31 --introns=on | 37 --introns=on |
32 #else: | 38 #else: |
33 --introns=off | 39 --introns=off |
34 #end if | 40 #end if |
56 $mea | 62 $mea |
57 $utr | 63 $utr |
58 --genemodel=$genemodel | 64 --genemodel=$genemodel |
59 --species=$organism | 65 --species=$organism |
60 ##--outfile=$output | 66 ##--outfile=$output |
61 | tee $output | 67 | tee $output |
62 #if 'protein' in str($outputs).split(',') or 'codingseq' in str($outputs).split(','): | 68 #if 'protein' in str($outputs).split(',') or 'codingseq' in str($outputs).split(','): |
63 | python \$AUGUSTUS_SCRIPT_PATH/extract_features.py | 69 | python $__tool_directory__/extract_features.py |
64 #if 'protein' in str($outputs).split(','): | 70 #if 'protein' in str($outputs).split(','): |
65 --protein $protein_output | 71 --protein $protein_output |
66 #end if | 72 #end if |
67 #if 'codingseq' in str($outputs).split(','): | 73 #if 'codingseq' in str($outputs).split(','): |
68 --codingseq $codingseq_output | 74 --codingseq $codingseq_output |
69 #end if | 75 #end if |
70 #end if | 76 #end if |
77 ]]> | |
71 </command> | 78 </command> |
72 <inputs> | 79 <inputs> |
73 <param name="input_genome" type="data" format="fasta" label="Genome Sequence"/> | 80 <param name="input_genome" type="data" format="fasta" label="Genome Sequence"/> |
74 <param name="noInFrameStop" type="boolean" label="Don't report transcripts with in-frame stop codons (--noInFrameStop)" truevalue="--noInFrameStop=true" falsevalue="--noInFrameStop=false" checked="false" help="Otherwise, intron-spanning stop codons could occur" /> | 81 <param name="noInFrameStop" type="boolean" label="Don't report transcripts with in-frame stop codons (--noInFrameStop)" truevalue="--noInFrameStop=true" falsevalue="--noInFrameStop=false" checked="false" help="Otherwise, intron-spanning stop codons could occur" /> |
75 <param name="singlestrand" type="boolean" label="Predict genes independently on each strand, allow overlapping genes on opposite strands (--singlestrand)" truevalue="--singlestrand=true" falsevalue="--singlestrand=false" checked="false" /> | 82 <param name="singlestrand" type="boolean" label="Predict genes independently on each strand, allow overlapping genes on opposite strands (--singlestrand)" truevalue="--singlestrand=true" falsevalue="--singlestrand=false" checked="false" /> |
134 <option value="pneumocystis">Pneumocystis jirovecii</option> | 141 <option value="pneumocystis">Pneumocystis jirovecii</option> |
135 <option value="chicken">Gallus gallus domesticus (chicken)</option> | 142 <option value="chicken">Gallus gallus domesticus (chicken)</option> |
136 <option value="cacao">Theobroma cacao (cacao)</option> | 143 <option value="cacao">Theobroma cacao (cacao)</option> |
137 <option value="heliconius_melpomene1">Heliconius melpomene</option> | 144 <option value="heliconius_melpomene1">Heliconius melpomene</option> |
138 <option value="xenoturbella">Xenoturbella</option> | 145 <option value="xenoturbella">Xenoturbella</option> |
139 </param> | 146 </param> |
140 | 147 |
141 <param name="strand" type="select" multiple="false" format="text" help="Report predicted genes on both strands, just the forward or just the backward strand."> | 148 <param name="strand" type="select" multiple="false" format="text" help="Report predicted genes on both strands, just the forward or just the backward strand."> |
142 <option value="both">both</option> | 149 <option value="both">both</option> |
143 <option value="forward">forward</option> | 150 <option value="forward">forward</option> |
144 <option value="backward">backward</option> | 151 <option value="backward">backward</option> |
145 </param> | 152 </param> |
146 | 153 |
147 <param name="genemodel" label="Gene Model" type="select" multiple="false" format="text" help="Gene Model to predict, for more information please refere to the help."> | 154 <param name="genemodel" label="Gene Model" type="select" multiple="false" format="text" help="Gene Model to predict, for more information please refere to the help."> |
148 <option value="complete">complete</option> | 155 <option value="complete">complete</option> |
149 <option value="partial">partial</option> | 156 <option value="partial">partial</option> |
150 <option value="intronless">intronless</option> | 157 <option value="intronless">intronless</option> |
211 <output name="codingseq_output" file="human_augustus_protein_codingseq_introns_cds_codingseq.fasta" ftype="fasta" /> | 218 <output name="codingseq_output" file="human_augustus_protein_codingseq_introns_cds_codingseq.fasta" ftype="fasta" /> |
212 <output name="protein_output" file="human_augustus_protein_codingseq_introns_cds_protein.fasta" ftype="fasta" /> | 219 <output name="protein_output" file="human_augustus_protein_codingseq_introns_cds_protein.fasta" ftype="fasta" /> |
213 </test> | 220 </test> |
214 </tests> | 221 </tests> |
215 <help> | 222 <help> |
223 <![CDATA[ | |
216 | 224 |
217 **What it does** | 225 **What it does** |
218 | 226 |
219 AUGUSTUS is a gene prediction program for eukaryotes written by Mario Stanke and Oliver Keller. | 227 AUGUSTUS is a gene prediction program for eukaryotes written by Mario Stanke and Oliver Keller. |
220 It can be used as an ab initio program, which means it bases its prediction purely on the | 228 It can be used as an ab initio program, which means it bases its prediction purely on the |
269 scaffold1|size1992969 AUGUSTUS CDS 18368 19013 0.99 + 0 transcript_id "g6.t1"; gene_id "g6"; | 277 scaffold1|size1992969 AUGUSTUS CDS 18368 19013 0.99 + 0 transcript_id "g6.t1"; gene_id "g6"; |
270 scaffold1|size1992969 AUGUSTUS CDS 19081 19379 0.31 + 2 transcript_id "g6.t1"; gene_id "g6"; | 278 scaffold1|size1992969 AUGUSTUS CDS 19081 19379 0.31 + 2 transcript_id "g6.t1"; gene_id "g6"; |
271 scaffold1|size1992969 AUGUSTUS stop_codon 19380 19382 . + 0 transcript_id "g6.t1"; gene_id "g6"; | 279 scaffold1|size1992969 AUGUSTUS stop_codon 19380 19382 . + 0 transcript_id "g6.t1"; gene_id "g6"; |
272 | 280 |
273 | 281 |
274 **References** | 282 ]]> |
275 | |
276 Mario Stanke and Stephan Waack (2003) | |
277 Gene Prediction with a Hidden-Markov Model and a new Intron Submodel. | |
278 Bioinformatics, Vol. 19, Suppl. 2, pages ii215-ii225 | |
279 | |
280 | |
281 </help> | 283 </help> |
284 <citations> | |
285 <citation type="doi">10.1093/bioinformatics/btg1080</citation> | |
286 </citations> | |
282 </tool> | 287 </tool> |