rnabob: rnabob.xml annotate

author	rnateam
date	Mon, 22 Dec 2014 09:08:31 -0500
parents
children	5a4b00c84f50

rev	line source
0 cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	1 <tool id="rbc_rnabob" name="RNABOB" version="2.2.1.0">
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	2 <description>Fast Pattern searching for RNA secondary structures</description>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	3 <requirements>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	4 <requirement type="package" version="2.2.1">rnabob</requirement>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	5 </requirements>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	6 <version_command>echo "2.2.1"</version_command>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	7 <command>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	8 <![CDATA[
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	9 rnabob
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	10 -q
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	11 $fancy
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	12 $compStrands
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	13 $skipOverlapping
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	14 $descriptorFile
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	15 $sequenceFile > $stdout
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	16 ]]>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	17 </command>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	18 <stdio>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	19 <exit_code range="1:" level="fatal" description="Error occurred. Please check Tool Standard Error" />
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	20 <exit_code range=":-1" level="fatal" description="Error occurred. Please check Tool Standard Error" />
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	21 </stdio>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	22 <inputs>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	23 <param name="descriptorFile" type="data" format="txt" multiple="false" label="Motif Descriptor File" help="This file contains the description of the motif for which to search"/>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	24 <param name="sequenceFile" type="data" format="fasta" multiple="false" label="Sequence File" help="This file specifies the sequence in which the motif will be searched"/>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	25 <param name="compStrands" type="boolean" truevalue="-c" falsevalue="" checked="false" label="Also search on complementary strands" help="-c : Search both strands of the supplied sequence"/>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	26 <param name="skipOverlapping" type="boolean" truevalue="-s" falsevalue="" checked="false" label="Skip overlapping matches" help="-s : This is a workaround to avoid a problem in the DNABANK, overlapping matches will be ignored"/>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	27 <param name="fancy" type="boolean" checked="false" truevalue="-F" falsevalue="" label="Show Alignments" help="Display full alignments to pattern"/>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	28 </inputs>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	29 <outputs>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	30 <data format="txt" name="stdout" label="${tool.name} on ${on_string}" />
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	31 </outputs>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	32 <tests>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	33 <test>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	34 <param name="descriptorFile" value="r17.des" />
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	35 <param name="sequenceFile" value="F22B7.fa" />
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	36 <param name="compStrands" value="True" />
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	37 <param name="skipOverlapping" value="False" />
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	38 <param name="fancy" value="False" />
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	39 <output name="stdout" file="r17.bob" />
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	40 </test>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	41 <test>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	42 <param name="descriptorFile" value="trna.des" />
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	43 <param name="sequenceFile" value="F22B7.fa" />
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	44 <param name="compStrands" value="True" />
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	45 <param name="skipOverlapping" value="False" />
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	46 <param name="fancy" value="False" />
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	47 <output name="stdout" file="trna.bob" />
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	48 </test>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	49 </tests>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	50 <help>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	51 **What RNABOB does**
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	52
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	53 RNABOB allows searching a sequence database for RNA structural motifs.
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	54 The probe motif is specified in a *descriptor* file,
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	55 which describes its primary sequence, secondary structure, and tertiary constraints.
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	56 The source in its original packaging can be found at http://selab.janelia.org/software/#rnabob.
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	57
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	58 -----
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	59
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	60 **Sequence database format**
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	61
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	62 RNABOB is currently restricted to reading sequence files in FASTA format.
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	63 The command line version of RNABOB can also read sequence files in GCG, EMBL, GenBank and other formats.
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	64
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	65 -----
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	66
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	67 **Descriptor file syntax**
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	68
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	69 The descriptor file syntax is fairly powerful, and allows a great deal of freedom for specifying
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	70 RNA motifs. The syntax is therefore a bit complicated.
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	71
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	72 The descriptor file has two parts: a topology description and an explicit description.
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	73
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	74 The first non-blank, non-comment line of the file is the topology description. It defines the
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	75 order of occurrence of a series of single-stranded, double-stranded and related elements. Each
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	76 element must be given a unique name (a number, typically) and must be prefixed with 's',
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	77 'h', or 'r', indicating single-strand, helical, or a relational element. Helical and
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	78 relational elements are paired to other elements, which are suffixed by a prime, \'.
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	79
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	80 For example::
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	81
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	82 \
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	83 h1 s1 h1'
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	84
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	85 describes a hairpin loop structure with a simple helix and single-stranded loop. If the helix
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	86 always contained a non-canonical base pair at one position, the topology could be described as::
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	87
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	88 \
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	89 h1 r1 h2 s1 h2' r1' h1'
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	90
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	91 where r1,r1' indicate a correlation, where the sequence r1 constrains the sequence of r1'.
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	92 (Helices are a special case of this.)
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	93
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	94 The remaining non-comment, non-blank lines are explicit descriptions of each element in turn. Each
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	95 line contains 3 or 4 fields, separated by tabs or blank space. The first field is the name of the
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	96 element, from the topology description. The second field is the number of mismatches allowed in
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	97 this element. The third field is the primary sequence constraint to apply to this element.
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	98
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	99 Helices and relational element pairs are specified on a single line rather than two. Mismatches
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	100 and primary sequence constraints are given as pairs, separated by a colon ':'. The left side
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	101 is the constraint applied to the upstream element, and the right side is applied to the downstream
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	102 elements.
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	103
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	104 The primary sequence constraint is given as a sequence of nucleotides. Any IUPAC single-letter
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	105 code is recognized, including N if the position can have any base identity. Allowed length
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	106 variations are specified with asterisks ``*``, where each ``*`` will allow either 0 or 1 N at
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	107 that position.
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	108
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	109 For example::
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	110
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	111 \
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	112 GGAGG******NNNAUG
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	113
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	114 specifies a GGAGG Shine/Dalgarno site and an AUG initiation codon, separated by a spacer of 3 to 9
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	115 nucleotides of any sequence.
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	116
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	117 An alternative syntax can be used for very long gaps::
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	118
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	119 \
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	120 GGAGG[10]NNNAUG is the same as GGAGG**********NNNAUG
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	121
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	122 Be careful defining variable length helices and relational elements; if the number and type (gap
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	123 or identity) of position do not match on left and right sides, the program will refuse to accept
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	124 the descriptor.
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	125
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	126 Relational elements have an additional field which specifies a "transformation matrix" of four
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	127 nucleotides, specifying the rule for making the ``r'`` pattern from the ``r`` sequence in order
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	128 ``A-C-G-T``. For example, the transformation matrix for a simple helix is ``TGCA``; if you allow
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	129 ``G-U`` pairs, it is ``TGYR``. RNABOB allows ``G-U`` pairing by default and uses the ``TGYR``
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	130 matrix for helical elements.
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	131
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	132 For example, the explicit description of our hairpin might be:
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	133
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	134 ::
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	135
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	136 \
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	137 h1 0:0 NNN:NNN
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	138 r1 0:0 R:N GNAN
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	139 h2 0:0 NC:GN
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	140 s1 0 UUCG
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	141
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	142 This describes a stem of 6 to 8 base pairs, in which the 4th pair from the bottom of the stem must
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	143 be a non-canonical GA pair. Note that, in general, the left side of the primary constraint for
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	144 helices and relational elements is redundant, and should be given as all N. In some cases it is
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	145 convenient to constrain the right side to require a particular base pair (GU, for instance) at one
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	146 position.
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	147
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	148 A note on mismatches: The split format for helices and relational elements works like this. The
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	149 number on the left constrains the primary sequence match of the left side of the primary
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	150 constraint. The number on the right constrains the match of the right side of the primary
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	151 constraint, after that side has been constructed according to the sequence on the left. In other
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	152 words, the number on the left constrains the mismatches in primary sequence only, while the number
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	153 on the right will constrain the number of mispaired positions in the helix.
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	154
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	155 Finally: any line that begins with a pound sign '#' is a comment line, and will not be interpreted
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	156 by the pattern compiler.
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	157
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	158 Options
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	159
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	160 The behavior of RNABOB can be modified by use of the following options:
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	161
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	162 Complement: Selecting this option will cause RNABOB to search for the pattern also on the
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	163 complementary strands.
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	164
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	165 Skip: This is a workaround to avoid a problem in the DNABANK. There are some sequences in the
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	166 database which have long stretches of ambiguous sequence (N's). Descriptors with no primary
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	167 sequence constraints will match these garbage sequences at many, many positions, and generate huge
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	168 outputs. This option toggles a search strategy that skips forward a pattern-length rather than a
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	169 single base when a match is found, thus printing out only a single match when overlapping matches
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	170 are found.
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	171
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	172 Examples
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	173
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	174 The following example descriptors are included in the source distribution
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	175 (http://selab.janelia.org/software/rnabob/rnabob.tar.gz):
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	176
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	177 - trna.des - a general descriptor of a tRNA structure
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	178 - r17.des - descriptor of the consensus binding site for the r17 phage coat protein
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	179 - pseudoknot.des - description of a simple pseudoknotted structure
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	180
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	181 An example cosmid ``F22B7.fa`` from the C. elegans genome sequencing project is also provided
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	182 for running these descriptors against.
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	183
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	184 ::
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	185
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	186 \
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	187 # trna.des
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	188 #
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	189 # Generalized descriptor of a tRNA cloverleaf. Doesn't
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	190 # find them all though.
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	191 #
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	192
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	193 h1 s1 h2 s2 h2' s3 h3 s4 h3' s5 h4 s6 h4' h1' s8
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	194
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	195 h1 0:2 NNNNNNN:NNNNNNN
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	196 h2 0:1 NNN:NNN
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	197 h3 0:1 NNNNN:NNNNN
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	198 h4 0:1 NNNNN:NNNNN
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	199 s1 0 TN
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	200 s2 0 NNNN**********
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	201 s3 0 N
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	202 s4 0 NNNNNN*
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	203 s5 0 NN********************
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	204 s6 0 TTC****
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	205 s8 0 NCCA
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	206
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	207 Running RNABOB with ``trna.des`` against ``F22B7.fa`` with the complementary-strand option enabled searches both strands of the cosmid for
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	208 the above motif. ``trna.des`` hits twice, once on each strand. (F22B7 has several other tRNA genes
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	209 in it which the pattern fails to detect - this is not a pattern to use for tRNA genefinding!).
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	210 </help>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	211 <citations>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	212 <citation type="doi">10.1093/bioinformatics/6.4.325</citation>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	213 <citation type="bibtex">@UNPUBLISHED{rnabob,
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	214 author = {Eddy S.R},
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	215 title = {RNABOB: a program to search for RNA secondary structure motifs in sequence databases},
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	216 note = {}}</citation>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	217 </citations>
cd00b4fe6552 Imported from capsule None rnateam parents: diff changeset	218 </tool>

0

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

1 <tool id="rbc_rnabob" name="RNABOB" version="2.2.1.0">

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

2 <description>Fast Pattern searching for RNA secondary structures</description>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

3 <requirements>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

4 <requirement type="package" version="2.2.1">rnabob</requirement>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

5 </requirements>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

6 <version_command>echo "2.2.1"</version_command>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

7 <command>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

8 <![CDATA[

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

9 rnabob

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

10 -q

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

11 $fancy

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

12 $compStrands

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

13 $skipOverlapping

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

14 $descriptorFile

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

15 $sequenceFile > $stdout

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

16 ]]>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

17 </command>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

18 <stdio>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

19 <exit_code range="1:" level="fatal" description="Error occurred. Please check Tool Standard Error" />

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

20 <exit_code range=":-1" level="fatal" description="Error occurred. Please check Tool Standard Error" />

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

21 </stdio>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

22 <inputs>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

23 <param name="descriptorFile" type="data" format="txt" multiple="false" label="Motif Descriptor File" help="This file contains the description of the motif for which to search"/>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

24 <param name="sequenceFile" type="data" format="fasta" multiple="false" label="Sequence File" help="This file specifies the sequence in which the motif will be searched"/>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

25 <param name="compStrands" type="boolean" truevalue="-c" falsevalue="" checked="false" label="Also search on complementary strands" help="-c : Search both strands of the supplied sequence"/>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

26 <param name="skipOverlapping" type="boolean" truevalue="-s" falsevalue="" checked="false" label="Skip overlapping matches" help="-s : This is a workaround to avoid a problem in the DNABANK, overlapping matches will be ignored"/>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

27 <param name="fancy" type="boolean" checked="false" truevalue="-F" falsevalue="" label="Show Alignments" help="Display full alignments to pattern"/>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

28 </inputs>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

29 <outputs>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

30 <data format="txt" name="stdout" label="${tool.name} on ${on_string}" />

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

31 </outputs>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

32 <tests>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

33 <test>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

34 <param name="descriptorFile" value="r17.des" />

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

35 <param name="sequenceFile" value="F22B7.fa" />

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

36 <param name="compStrands" value="True" />

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

37 <param name="skipOverlapping" value="False" />

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

38 <param name="fancy" value="False" />

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

39 <output name="stdout" file="r17.bob" />

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

40 </test>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

41 <test>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

42 <param name="descriptorFile" value="trna.des" />

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

43 <param name="sequenceFile" value="F22B7.fa" />

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

44 <param name="compStrands" value="True" />

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

45 <param name="skipOverlapping" value="False" />

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

46 <param name="fancy" value="False" />

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

47 <output name="stdout" file="trna.bob" />

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

48 </test>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

49 </tests>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

50 <help>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

51 **What RNABOB does**

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

52

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

53 RNABOB allows searching a sequence database for RNA structural motifs.

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

54 The probe motif is specified in a *descriptor* file,

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

55 which describes its primary sequence, secondary structure, and tertiary constraints.

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

56 The source in its original packaging can be found at http://selab.janelia.org/software/#rnabob.

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

57

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

58 -----

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

59

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

60 **Sequence database format**

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

61

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

62 RNABOB is currently restricted to reading sequence files in FASTA format.

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

63 The command line version of RNABOB can also read sequence files in GCG, EMBL, GenBank and other formats.

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

64

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

65 -----

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

66

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

67 **Descriptor file syntax**

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

68

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

69 The descriptor file syntax is fairly powerful, and allows a great deal of freedom for specifying

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

70 RNA motifs. The syntax is therefore a bit complicated.

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

71

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

72 The descriptor file has two parts: a **topology** description and an **explicit** description.

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

73

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

74 The first non-blank, non-comment line of the file is the topology description. It defines the

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

75 order of occurrence of a series of single-stranded, double-stranded and related elements. Each

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

76 element must be given a unique name (a number, typically) and must be prefixed with '**s**',

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

77 '**h**', or '**r**', indicating single-strand, helical, or a relational element. Helical and

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

78 relational elements are paired to other elements, which are suffixed by a prime, **\'**.

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

79

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

80 For example::

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

81

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

82 \

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

83 h1 s1 h1'

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

84

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

85 describes a hairpin loop structure with a simple helix and single-stranded loop. If the helix

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

86 always contained a non-canonical base pair at one position, the topology could be described as::

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

87

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

88 \

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

89 h1 r1 h2 s1 h2' r1' h1'

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

90

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

91 where r1,r1' indicate a correlation, where the sequence r1 constrains the sequence of r1'.

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

92 (Helices are a special case of this.)

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

93

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

94 The remaining non-comment, non-blank lines are explicit descriptions of each element in turn. Each

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

95 line contains 3 or 4 fields, separated by tabs or blank space. The first field is the name of the

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

96 element, from the topology description. The second field is the number of mismatches allowed in

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

97 this element. The third field is the primary sequence constraint to apply to this element.

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

98

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

99 Helices and relational element pairs are specified on a single line rather than two. Mismatches

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

100 and primary sequence constraints are given as pairs, separated by a colon '**:**'. The left side

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

101 is the constraint applied to the upstream element, and the right side is applied to the downstream

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

102 element.

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

103

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

104 The primary sequence constraint is given as a sequence of nucleotides. Any IUPAC single-letter

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

105 code is recognized, including N if the position can have any base identity. Allowed length

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

106 variations are specified with asterisks ``'*'``, where each ``*`` will allow either 0 or 1 N at

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

107 that position.

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

108

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

109 For example::

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

110

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

111 \

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

112 GGAGG******NNNAUG

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

113

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

114 specifies a GGAGG Shine/Dalgarno site and an AUG initiation codon, separated by a spacer of 3 to 9

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

115 nucleotides of any sequence.

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

116

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

117 An alternative syntax can be used for very long gaps::

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

118

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

119 \

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

120 GGAGG[10]NNNAUG is the same as GGAGG**********NNNAUG

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

121

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

122 Be careful defining variable length helices and relational elements; if the number and type (gap

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

123 or identity) of positions do not match on left and right sides, the program will refuse to accept

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

124 the descriptor.

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

125

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

126 Relational elements have an additional field which specifies a "transformation matrix" of four

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

127 nucleotides, specifying the rule for making the ``r'`` pattern from the ``r`` sequence in order

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

128 ``A-C-G-T``. For example, the transformation matrix for a simple helix is ``TGCA``; if you allow

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

129 ``G-U`` pairs, it is ``TGYR``. RNABOB allows ``G-U`` pairing by default and uses the ``TGYR``

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

130 matrix for helical elements.

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

131

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

132 For example, the explicit description of our hairpin might be:

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

133

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

134 ::

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

135

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

136 \

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

137 h1 0:0 NNN:NNN

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

138 r1 0:0 R:N GNAN

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

139 h2 0:0 **NC:GN**

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

140 s1 0 UUCG

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

141

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

142 This describes a stem of 6 to 8 base pairs, in which the 4th pair from the bottom of the stem must

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

143 be a non-canonical GA pair. Note that, in general, the left side of the primary constraint for

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

144 helices and relational elements is redundant, and should be given as all N. In some cases it is

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

145 convenient to constrain the right side to require a particular base pair (GU, for instance) at one

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

146 position.

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

147

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

148 A note on mismatches: The split format for helices and relational elements works like this. The

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

149 number on the left constrains the primary sequence match of the left side of the primary

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

150 constraint. The number on the right constrains the match of the right side of the primary

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

151 constraint, *after* that side has been constructed according to the sequence on the left. In other

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

152 words, the number on the left constrains the mismatches in primary sequence only, while the number

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

153 on the right will constrain the number of mispaired positions in the helix.

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

154

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

155 Finally: any line that begins with a pound sign '#' is a comment line, and will not be interpreted

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

156 by the pattern compiler.

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

157

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

158 **Options**

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

159

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

160 The behavior of RNABOB can be modified by use of the following options:

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

161

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

162 *Complement*: Selecting this option will cause RNABOB to search for the pattern also on the

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

163 complementary strands.

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

164

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

165 *Skip*: This is a workaround to avoid a problem in the DNABANK. There are some sequences in the

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

166 database which have long stretches of ambiguous sequence (N's). Descriptors with no primary

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

167 sequence constraints will match these garbage sequences at many, many positions, and generate huge

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

168 outputs. This option toggles a search strategy that skips forward a pattern-length rather than a

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

169 single base when a match is found, thus printing out only a single match when overlapping matches

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

170 are found.

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

171

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

172 **Examples**

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

173

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

174 The following example descriptors are included in the source distribution

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

175 (http://selab.janelia.org/software/rnabob/rnabob.tar.gz):

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

176

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

177 - trna.des - a general descriptor of a tRNA structure

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

178 - r17.des - descriptor of the consensus binding site for the r17 phage coat protein

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

179 - pseudoknot.des - description of a simple pseudoknotted structure

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

180

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

181 An example cosmid ``F22B7.fa`` from the *C. elegans* genome sequencing project is also provided

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

182 for running these descriptors against.

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

183

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

184 ::

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

185

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

186 \

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

187 # trna.des

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

188 #

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

189 # Generalized descriptor of a tRNA cloverleaf. Doesn't

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

190 # find them all though.

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

191 #

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

192

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

193 h1 s1 h2 s2 h2' s3 h3 s4 h3' s5 h4 s6 h4' h1' s8

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

194

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

195 h1 0:2 NNNNNNN:NNNNNNN

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

196 h2 0:1 *NNN:NNN*

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

197 h3 0:1 NNNNN:NNNNN

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

198 h4 0:1 NNNNN:NNNNN

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

199 s1 0 TN

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

200 s2 0 NNNN**********

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

201 s3 0 N

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

202 s4 0 NNNNNN*

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

203 s5 0 NN********************

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

204 s6 0 TTC****

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

205 s8 0 NCCA

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

206

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

207 Running RNABOB with ``trna.des`` against ``F22B7.fa`` searches the top strand of the cosmid for

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

208 the above motif. With the *Complement* option enabled, ``trna.des`` hits twice, once on each strand. (F22B7 has several other tRNA genes

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

209 in it which the pattern fails to detect - this is *not* a pattern to use for tRNA genefinding!).

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

210 </help>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

211 <citations>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

212 <citation type="doi">10.1093/bioinformatics/6.4.325</citation>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

213 <citation type="bibtex">@UNPUBLISHED{rnabob,

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

214 author = {Eddy S.R},

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

215 title = {RNABOB: a program to search for RNA secondary structure motifs in sequence databases},

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

216 note = {}}</citation>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

217 </citations>

cd00b4fe6552 Imported from capsule None

rnateam

parents:

diff changeset

218 </tool>

Mercurial > repos > rnateam > rnabob

annotate rnabob.xml @ 0:cd00b4fe6552 draft