comparison long-orfs_wrapper.xml @ 0:9c8ffce71f7c draft default tip

Uploaded
author crs4
date Mon, 09 Sep 2013 12:16:17 -0400
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:9c8ffce71f7c
1 <tool id="long_orfs_wrapper" name="Long-ORFs" version="0.2">
2 <description></description>
3 <requirements>
4 <requirement type="package" version="3.02">glimmer</requirement>
5 </requirements>
6 <command interpreter="python">
7 long-orfs_wrapper.py --loSequence $loSequence
8 #if $loStartCodons
9 --loStartCodons="$loStartCodons"
10 #end if
11 #if $loEntropy
12 --loEntropy=$loEntropy
13 #end if
14 #if $loFixed
15 --loFixed
16 #end if
17 #if str($loMinLen)
18 --loMinLen=$loMinLen
19 #end if
20 #if $loLinear
21 --loLinear
22 #end if
23 #if $loLengthOpt
24 --loLengthOpt
25 #end if
26 #if $loNoHeader
27 --loNoHeader
28 #end if
29 #if str($loMaxOverlap)
30 --loMaxOverlap=$loMaxOverlap
31 #end if
32 #if str($loCutoff)
33 --loCutoff=$loCutoff
34 #end if
35 #if $loWithoutStops
36 --loWithoutStops
37 #end if
38 #if str($loTransTable)
39 --loTransTable=$loTransTable
40 #end if
41 #if $loStopCodons
42 --loStopCodons="$loStopCodons"
43 #end if
44 --loOutput $loOutput --logfile $logfile
45 </command>
46
47 <inputs>
48 <param name="loSequence" type="data" format="fasta" label="DNA sequence to be analyzed" help="FASTA format" />
49
50 <param name="loStartCodons" type="text" value="" optional="true" label="Specify allowable start codons as a comma-separated list (-A, --start_codons)" help="Sample format: 'atg,gtg'. The default start codons are atg, gtg and ttg." />
51
52 <param name="loEntropy" type="data" format="glimmer_entropy_profiles" optional="true" label="Entropy profiles (-E, --entropy)" help="The entropy profiles are used only if the cutoff option is specified." />
53
54 <param name="loFixed" type="boolean" checked="false" label="Fixed minimum gene length (-f, --fixed)" help="Do NOT automatically calculate the minimum gene length that maximizes the number or length of output regions, but instead use either the value specified by the 'minimum gene length' option or else the default, which is 90." />
55
56 <param name="loMinLen" type="integer" value="" optional="true" label="Minimum gene length in number of nucleotides (-g, --min_len)" help="It does not include the bases in the stop codon." />
57
58 <param name="loLinear" type="boolean" checked="false" label="Assuming a linear genome (-l, --linear)" help="No 'wrap-around' genes with part at the beginning of the sequence and the rest at the end of the sequence." />
59
60 <param name="loLengthOpt" type="boolean" checked="false" label="Optimize minimum gene length (-L, --length_opt)" help="Find and use as the minimum gene length the value that maximizes the total length of non-overlapping genes, instead of the default behaviour, which is to maximize the total number of non-overlapping genes." />
61
62 <param name="loNoHeader" type="boolean" checked="true" label="Do not include the program-settings header information in the output file (-n, --no_header)" help="The output file will contain only the coordinates of the selected ORFs." />
63
64 <param name="loMaxOverlap" type="integer" value="" optional="true" label="Maximum overlap length (-o, --max_olap)" help="Overlaps of this many or fewer bases between genes are not regarded as overlaps." />
65
66 <param name="loCutoff" type="float" value="" optional="true" label="Only genes with an entropy distance score less than this value will be considered (-t, --cutoff)" help=" This cutoff is made before any subsequent steps in the algorithm." />
67
68 <param name="loWithoutStops" type="boolean" checked="false" label="Do NOT include the stop codon in the region described by the output coordinates (-w, --without_stops)" help="By default it is included." />
69
70 <param name="loTransTable" type="integer" value="" optional="true" label="Use GenBank translation table number n to specify stop codons (-z, --trans_table)" help="" />
71
72 <param name="loStopCodons" type="text" value="" optional="true" label="Specify allowable stop codons as a comma-separated list (-Z, --stop_codons)" help="Sample format: 'tag,tga'. The default stop codons are tag, tga and taa." />
73 </inputs>
74
75 <outputs>
76 <data name="logfile" format="txt" label="${tool.name} on ${on_string}: log" />
77 <data name="loOutput" format="glimmer_coords" label="${tool.name} on ${on_string}: output" />
78 </outputs>
79
80 <tests>
81
82 </tests>
83 <help>
84 **What it does**
85
86 This program identifies long, non-overlapping open reading frames (ORFs) in a DNA sequence file. These ORFs are very likely to contain genes, and can be used as a set of training sequences for Build-ICM. More specifically, among all ORFs longer than a minimum length, those that do not overlap any others are output. The start codon used for each ORF is the first possible one. The program, by default, automatically determines the value that maximizes the number of ORFs that are output. With the -t option, the initial set of candidate ORFs also can be filtered using entropy distance, which generally produces a larger, more accurate training set, particularly for high-GC-content genomes.
87
88
89 **License and citation**
90
91 This Galaxy tool is Copyright © 2013 `CRS4 Srl.`_ and is released under the `MIT license`_.
92
93 .. _CRS4 Srl.: http://www.crs4.it/
94 .. _MIT license: http://opensource.org/licenses/MIT
95
96 If you use this tool in Galaxy, please cite |Cuccuru2013|_.
97
98 .. |Cuccuru2013| replace:: Cuccuru, G., Orsini, M., Pinna, A., Sbardellati, A., Soranzo, N., Travaglione, A., Uva, P., Zanetti, G., Fotia, G. (2013) Orione, a web-based framework for NGS analysis in microbiology. *Submitted*
99 .. _Cuccuru2013: http://orione.crs4.it/
100
101 This tool uses `Glimmer`_, which is licensed separately. Please cite |Delcher2007|_.
102
103 .. _Glimmer: http://ccb.jhu.edu/software/glimmer/index.shtml
104 .. |Delcher2007| replace:: Delcher, A. L., Bratke, K. A., Powers, E. C., Salzberg, S. L. (2007) Identifying bacterial genes and endosymbiont DNA with Glimmer. *Bioinformatics* 23(6), 673-679
105 .. _Delcher2007: http://bioinformatics.oxfordjournals.org/content/23/6/673
106 </help>
107 </tool>