annotate glimmer_wo_icm.xml @ 2:b1ad88bbc5fa draft default tip

Uploaded
author bgruening
date Mon, 12 Aug 2013 11:55:07 -0400
parents 841357e0acbf
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
841357e0acbf Uploaded
bgruening
parents:
diff changeset
1 <tool id="glimmer_not-knowlegde-based" name="Glimmer3" version="0.2">
841357e0acbf Uploaded
bgruening
parents:
diff changeset
2 <description>Predict ORFs in prokaryotic genomes (not knowlegde-based)</description>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
3 <requirements>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
4 <requirement type="package" version="3.02b">glimmer</requirement>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
5 <requirement type="package" version="1.61">biopython</requirement>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
6 </requirements>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
7 <command interpreter="python">
841357e0acbf Uploaded
bgruening
parents:
diff changeset
8 glimmer_wo_icm.py
841357e0acbf Uploaded
bgruening
parents:
diff changeset
9 $input
841357e0acbf Uploaded
bgruening
parents:
diff changeset
10 #if $report:
841357e0acbf Uploaded
bgruening
parents:
diff changeset
11 $prediction
841357e0acbf Uploaded
bgruening
parents:
diff changeset
12 #else:
841357e0acbf Uploaded
bgruening
parents:
diff changeset
13 "None"
841357e0acbf Uploaded
bgruening
parents:
diff changeset
14 #end if
841357e0acbf Uploaded
bgruening
parents:
diff changeset
15 #if $detailed_report:
841357e0acbf Uploaded
bgruening
parents:
diff changeset
16 $detailed
841357e0acbf Uploaded
bgruening
parents:
diff changeset
17 #else:
841357e0acbf Uploaded
bgruening
parents:
diff changeset
18 "None"
841357e0acbf Uploaded
bgruening
parents:
diff changeset
19 #end if
841357e0acbf Uploaded
bgruening
parents:
diff changeset
20 $overlap
841357e0acbf Uploaded
bgruening
parents:
diff changeset
21 $gene_length
841357e0acbf Uploaded
bgruening
parents:
diff changeset
22 $threshold
841357e0acbf Uploaded
bgruening
parents:
diff changeset
23 $linear
841357e0acbf Uploaded
bgruening
parents:
diff changeset
24 $genes_output
841357e0acbf Uploaded
bgruening
parents:
diff changeset
25 </command>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
26 <inputs>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
27 <param name="input" type="data" format="fasta" label="Genome sequence" />
841357e0acbf Uploaded
bgruening
parents:
diff changeset
28 <param name="overlap" type="integer" value="0" label="Set maximum overlap length. Overlaps this short or shorter are ignored." />
841357e0acbf Uploaded
bgruening
parents:
diff changeset
29 <param name="gene_length" type="integer" value="110" label="Set minimum gene length." />
841357e0acbf Uploaded
bgruening
parents:
diff changeset
30 <param name="threshold" type="integer" value="30" label="Set threshold score for calling as gene. If the in-frame score >= N, then the region is given a number and considered a potential gene." />
841357e0acbf Uploaded
bgruening
parents:
diff changeset
31 <param name="linear" type="boolean" truevalue="true" falsevalue="false" checked="true" label="Assume linear rather than circular genome, i.e., no wraparound" />
841357e0acbf Uploaded
bgruening
parents:
diff changeset
32
841357e0acbf Uploaded
bgruening
parents:
diff changeset
33 <param name="detailed_report" type="boolean" truevalue="" falsevalue="" checked="false" label="Output a detailed gene prediction report as separate file" />
841357e0acbf Uploaded
bgruening
parents:
diff changeset
34 <param name="report" type="boolean" truevalue="" falsevalue="" checked="false" label="Report the classic glimmer table output" />
841357e0acbf Uploaded
bgruening
parents:
diff changeset
35 </inputs>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
36 <outputs>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
37 <data name="genes_output" format="fasta" label="Glimmer3 on ${on_string} (Gene Prediction FASTA)" />
841357e0acbf Uploaded
bgruening
parents:
diff changeset
38 <data name="prediction" format="txt" label="Glimmer3 on ${on_string} (Gene Prediction table)">
841357e0acbf Uploaded
bgruening
parents:
diff changeset
39 <filter>report == True</filter>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
40 </data>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
41 <data name="detailed" format="txt" label="Glimmer3 on ${on_string} (detailed report)">
841357e0acbf Uploaded
bgruening
parents:
diff changeset
42 <filter>detailed_report == True</filter>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
43 </data>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
44 </outputs>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
45 <tests>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
46 <test>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
47 <param name="input" value="streptomyces_Tue6071_plasmid_genomic.fasta" />
841357e0acbf Uploaded
bgruening
parents:
diff changeset
48 <param name="overlap" value="0" />
841357e0acbf Uploaded
bgruening
parents:
diff changeset
49 <param name="gene_length" value="110" />
841357e0acbf Uploaded
bgruening
parents:
diff changeset
50 <param name="threshold" value="30" />
841357e0acbf Uploaded
bgruening
parents:
diff changeset
51 <param name="linear" value="true" />
841357e0acbf Uploaded
bgruening
parents:
diff changeset
52 <param name="detailed_report" value="" />
841357e0acbf Uploaded
bgruening
parents:
diff changeset
53 <param name="report" value="" />
841357e0acbf Uploaded
bgruening
parents:
diff changeset
54 <output name="genes_output" file="glimmer_wo_icm_trans-table-11_plasmid_genomic.fasta" ftype="fasta" />
841357e0acbf Uploaded
bgruening
parents:
diff changeset
55 </test>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
56 </tests>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
57 <help>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
58
841357e0acbf Uploaded
bgruening
parents:
diff changeset
59 **What it does**
841357e0acbf Uploaded
bgruening
parents:
diff changeset
60
841357e0acbf Uploaded
bgruening
parents:
diff changeset
61 This tool predicts open reading frames (ORFs) from a given DNA sequence. This tool is not knowledge-based.
841357e0acbf Uploaded
bgruening
parents:
diff changeset
62
841357e0acbf Uploaded
bgruening
parents:
diff changeset
63 The recommended approach is to use Glimmer3 with a trained ICM model. Use the knowledge-based version for that and provide or generate a training set.
841357e0acbf Uploaded
bgruening
parents:
diff changeset
64
841357e0acbf Uploaded
bgruening
parents:
diff changeset
65 -----
841357e0acbf Uploaded
bgruening
parents:
diff changeset
66
841357e0acbf Uploaded
bgruening
parents:
diff changeset
67 **Glimmer Overview**
841357e0acbf Uploaded
bgruening
parents:
diff changeset
68
841357e0acbf Uploaded
bgruening
parents:
diff changeset
69 ::
841357e0acbf Uploaded
bgruening
parents:
diff changeset
70
841357e0acbf Uploaded
bgruening
parents:
diff changeset
71 ************** ************** ************** **************
841357e0acbf Uploaded
bgruening
parents:
diff changeset
72 * * * * * * * *
841357e0acbf Uploaded
bgruening
parents:
diff changeset
73 * long-orfs * ===> * Extract * ===> * build-icm * ===> * glimmer3 *
841357e0acbf Uploaded
bgruening
parents:
diff changeset
74 * * * * * * * *
841357e0acbf Uploaded
bgruening
parents:
diff changeset
75 ************** ************** ************** **************
841357e0acbf Uploaded
bgruening
parents:
diff changeset
76
841357e0acbf Uploaded
bgruening
parents:
diff changeset
77 -----
841357e0acbf Uploaded
bgruening
parents:
diff changeset
78
841357e0acbf Uploaded
bgruening
parents:
diff changeset
79 **Example**
841357e0acbf Uploaded
bgruening
parents:
diff changeset
80
841357e0acbf Uploaded
bgruening
parents:
diff changeset
81 Suppose you have the following DNA sequence::
841357e0acbf Uploaded
bgruening
parents:
diff changeset
82
841357e0acbf Uploaded
bgruening
parents:
diff changeset
83 >SQ Sequence 8667507 BP; 1203558 A; 3121252 C; 3129638 G; 1213059 T; 0 other;
841357e0acbf Uploaded
bgruening
parents:
diff changeset
84 cccgcggagcgggtaccacatcgctgcgcgatgtgcgagcgaacacccgggctgcgcccg
841357e0acbf Uploaded
bgruening
parents:
diff changeset
85 ggtgttgcgctcccgctccgcgggagcgctggcgggacgctgcgcgtcccgctcaccaag
841357e0acbf Uploaded
bgruening
parents:
diff changeset
86 cccgcttcgcgggcttggtgacgctccgtccgctgcgcttccggagttgcggggcttcgc
841357e0acbf Uploaded
bgruening
parents:
diff changeset
87 cccgctaaccctgggcctcgcttcgctccgccttgggcctgcggcgggtccgctgcgctc
841357e0acbf Uploaded
bgruening
parents:
diff changeset
88 ccccgcctcaagggcccttccggctgcgcctccaggacccaaccgcttgcgcgggcctgg
841357e0acbf Uploaded
bgruening
parents:
diff changeset
89 .......
841357e0acbf Uploaded
bgruening
parents:
diff changeset
90
841357e0acbf Uploaded
bgruening
parents:
diff changeset
91 Running this tool will produce a FASTA file with the predicted genes and, if requested, Glimmer output files like the following::
841357e0acbf Uploaded
bgruening
parents:
diff changeset
92
841357e0acbf Uploaded
bgruening
parents:
diff changeset
93 >SQ Sequence 8667507 BP; 1203558 A; 3121252 C; 3129638 G; 1213059 T; 0 other;
841357e0acbf Uploaded
bgruening
parents:
diff changeset
94 orf00001 577 699 +1 5.24
841357e0acbf Uploaded
bgruening
parents:
diff changeset
95 orf00003 800 1123 +2 5.18
841357e0acbf Uploaded
bgruening
parents:
diff changeset
96 orf00004 1144 3813 +1 10.62
841357e0acbf Uploaded
bgruening
parents:
diff changeset
97 orf00006 3857 6220 +2 6.07
841357e0acbf Uploaded
bgruening
parents:
diff changeset
98 orf00007 6226 7173 +1 1.69
841357e0acbf Uploaded
bgruening
parents:
diff changeset
99 orf00008 7187 9307 +2 8.95
841357e0acbf Uploaded
bgruening
parents:
diff changeset
100 orf00009 9424 10410 +1 8.29
841357e0acbf Uploaded
bgruening
parents:
diff changeset
101 orf00010 10515 11363 +3 7.00
841357e0acbf Uploaded
bgruening
parents:
diff changeset
102 orf00011 11812 11964 +1 2.80
841357e0acbf Uploaded
bgruening
parents:
diff changeset
103 orf00012 12360 13457 +3 4.80
841357e0acbf Uploaded
bgruening
parents:
diff changeset
104 orf00013 14379 14044 -1 7.41
841357e0acbf Uploaded
bgruening
parents:
diff changeset
105 orf00015 15029 14739 -3 12.43
841357e0acbf Uploaded
bgruening
parents:
diff changeset
106 orf00016 15066 15227 +3 1.91
841357e0acbf Uploaded
bgruening
parents:
diff changeset
107 orf00020 16061 15351 -3 2.83
841357e0acbf Uploaded
bgruening
parents:
diff changeset
108 orf00021 17513 17391 -3 2.20
841357e0acbf Uploaded
bgruening
parents:
diff changeset
109 orf00023 17529 17675 +3 0.11
841357e0acbf Uploaded
bgruening
parents:
diff changeset
110
841357e0acbf Uploaded
bgruening
parents:
diff changeset
111
841357e0acbf Uploaded
bgruening
parents:
diff changeset
112 -------
841357e0acbf Uploaded
bgruening
parents:
diff changeset
113
841357e0acbf Uploaded
bgruening
parents:
diff changeset
114 **References**
841357e0acbf Uploaded
bgruening
parents:
diff changeset
115
841357e0acbf Uploaded
bgruening
parents:
diff changeset
116 A.L. Delcher, K.A. Bratke, E.C. Powers, and S.L. Salzberg. Identifying bacterial genes and endosymbiont DNA with Glimmer. Bioinformatics (Advance online version) (2007).
841357e0acbf Uploaded
bgruening
parents:
diff changeset
117
841357e0acbf Uploaded
bgruening
parents:
diff changeset
118 </help>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
119 </tool>