annotate cmsearch.xml @ 2:fac157e22e1b draft

Uploaded
author bgruening
date Fri, 13 Feb 2015 03:10:51 -0500
parents 55bb96edfc07
children 2c2c5e5e495b
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
652f9d550531 Uploaded
bgruening
parents:
diff changeset
1 <tool id="infernal_cmsearch" name="Search covariance model(s)" version="1.1.0.2">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
2 <description>against a sequence database (cmsearch)</description>
2
fac157e22e1b Uploaded
bgruening
parents: 1
diff changeset
3 <parallelism method="multi" split_inputs="seqdb" split_mode="to_size" split_size="500" shared_inputs="" merge_outputs="outfile,multiple_alignment_output"></parallelism>
0
652f9d550531 Uploaded
bgruening
parents:
diff changeset
4 <requirements>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
5 <requirement type="package">infernal</requirement>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
6 <requirement type="package" version="1.1">infernal</requirement>
2
fac157e22e1b Uploaded
bgruening
parents: 1
diff changeset
7 <requirement type="package" version="8.22">gnu_coreutils</requirement>
0
652f9d550531 Uploaded
bgruening
parents:
diff changeset
8 </requirements>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
9 <command>
2
fac157e22e1b Uploaded
bgruening
parents: 1
diff changeset
10 <![CDATA[
0
652f9d550531 Uploaded
bgruening
parents:
diff changeset
11 ## a temp file is needed, because the standard tabular output from infernal is not useful in Galaxy
652f9d550531 Uploaded
bgruening
parents:
diff changeset
12 ## it will be converted to a tab delimited file and piped to Galaxy
652f9d550531 Uploaded
bgruening
parents:
diff changeset
13 temp_tabular_output=\$(mktemp);
652f9d550531 Uploaded
bgruening
parents:
diff changeset
14
2
fac157e22e1b Uploaded
bgruening
parents: 1
diff changeset
15 cmsearch
0
652f9d550531 Uploaded
bgruening
parents:
diff changeset
16 ## Infernal Options
652f9d550531 Uploaded
bgruening
parents:
diff changeset
17 --cpu "\${GALAXY_SLOTS:-12}"
652f9d550531 Uploaded
bgruening
parents:
diff changeset
18 -o /dev/null
2
fac157e22e1b Uploaded
bgruening
parents: 1
diff changeset
19 --tformat $seqdb.ext ##target format: fasta, embl, genbank, ddbj, stockholm, pfam, a2m, afa, clustal, and phylip
0
652f9d550531 Uploaded
bgruening
parents:
diff changeset
20 $bottomonly
652f9d550531 Uploaded
bgruening
parents:
diff changeset
21 $toponly
652f9d550531 Uploaded
bgruening
parents:
diff changeset
22 $cyk
652f9d550531 Uploaded
bgruening
parents:
diff changeset
23 $notrunc
652f9d550531 Uploaded
bgruening
parents:
diff changeset
24 $max
652f9d550531 Uploaded
bgruening
parents:
diff changeset
25 $nohmm
652f9d550531 Uploaded
bgruening
parents:
diff changeset
26 $mid
652f9d550531 Uploaded
bgruening
parents:
diff changeset
27 ##$bitscore_thresholds
652f9d550531 Uploaded
bgruening
parents:
diff changeset
28 --tblout \$temp_tabular_output
652f9d550531 Uploaded
bgruening
parents:
diff changeset
29 $g
652f9d550531 Uploaded
bgruening
parents:
diff changeset
30 #if $A:
652f9d550531 Uploaded
bgruening
parents:
diff changeset
31 $A $multiple_alignment_output
652f9d550531 Uploaded
bgruening
parents:
diff changeset
32 #end if
652f9d550531 Uploaded
bgruening
parents:
diff changeset
33
652f9d550531 Uploaded
bgruening
parents:
diff changeset
34 #if str($inclusion_thresholds_opts.inclusion_thresholds_selector) == "--incE":
652f9d550531 Uploaded
bgruening
parents:
diff changeset
35 --incE $inclusion_thresholds_opts.incE
652f9d550531 Uploaded
bgruening
parents:
diff changeset
36 #elif str($inclusion_thresholds_opts.inclusion_thresholds_selector) == "--incT":
652f9d550531 Uploaded
bgruening
parents:
diff changeset
37 --incT $inclusion_thresholds_opts.incT
652f9d550531 Uploaded
bgruening
parents:
diff changeset
38 #end if
652f9d550531 Uploaded
bgruening
parents:
diff changeset
39
652f9d550531 Uploaded
bgruening
parents:
diff changeset
40 #if str($reporting_thresholds_opts.reporting_thresholds_selector) == "-E":
652f9d550531 Uploaded
bgruening
parents:
diff changeset
41 -E $reporting_thresholds_opts.E
652f9d550531 Uploaded
bgruening
parents:
diff changeset
42 #elif str($reporting_thresholds_opts.reporting_thresholds_selector) == "-T":
652f9d550531 Uploaded
bgruening
parents:
diff changeset
43 -T $reporting_thresholds_opts.T
652f9d550531 Uploaded
bgruening
parents:
diff changeset
44 #end if
652f9d550531 Uploaded
bgruening
parents:
diff changeset
45
652f9d550531 Uploaded
bgruening
parents:
diff changeset
46 ## CM file from the history or stored as database on disc
652f9d550531 Uploaded
bgruening
parents:
diff changeset
47
652f9d550531 Uploaded
bgruening
parents:
diff changeset
48 #if str($cm_opts.cm_opts_selector) == "db":
652f9d550531 Uploaded
bgruening
parents:
diff changeset
49 $cm_opts.database.fields.path
652f9d550531 Uploaded
bgruening
parents:
diff changeset
50 #else:
652f9d550531 Uploaded
bgruening
parents:
diff changeset
51 $cm_opts.cmfile
652f9d550531 Uploaded
bgruening
parents:
diff changeset
52 #end if
652f9d550531 Uploaded
bgruening
parents:
diff changeset
53
652f9d550531 Uploaded
bgruening
parents:
diff changeset
54 ## sequence file
652f9d550531 Uploaded
bgruening
parents:
diff changeset
55 $seqdb
2
fac157e22e1b Uploaded
bgruening
parents: 1
diff changeset
56 2>&1
0
652f9d550531 Uploaded
bgruening
parents:
diff changeset
57 ;
652f9d550531 Uploaded
bgruening
parents:
diff changeset
58
652f9d550531 Uploaded
bgruening
parents:
diff changeset
59 ## 1. remove comments (everything from # to the end of the line) and delete the resulting empty lines
652f9d550531 Uploaded
bgruening
parents:
diff changeset
60 ## 2. replace the first 17 runs of whitespace with tabs; the 18th field is a free text field (can contain spaces)
1
55bb96edfc07 Uploaded
bgruening
parents: 0
diff changeset
61 sed -e 's/#.*$//' -e '/^$/d' -e 's/\s\+/\t/g' -e 's/\t/ /18g' \$temp_tabular_output > $outfile
0
652f9d550531 Uploaded
bgruening
parents:
diff changeset
62
2
fac157e22e1b Uploaded
bgruening
parents: 1
diff changeset
63 ]]>
0
652f9d550531 Uploaded
bgruening
parents:
diff changeset
64 </command>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
65 <inputs>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
66
652f9d550531 Uploaded
bgruening
parents:
diff changeset
67 <param name="seqdb" type="data" format="fasta" label="Sequence database"/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
68
652f9d550531 Uploaded
bgruening
parents:
diff changeset
69 <conditional name="cm_opts">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
70 <param name="cm_opts_selector" type="select" label="Subject covariance models">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
71 <option value="db" selected="True">Locally installed covariance models</option>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
72 <option value="histdb">Covariance model from your history</option>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
73 </param>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
74 <when value="db">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
75 <param name="database" type="select" label="Covariance models">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
76 <options from_file="infernal.loc">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
77 <column name="value" index="0"/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
78 <column name="name" index="1"/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
79 <column name="path" index="2"/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
80 </options>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
81 </param>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
82 </when>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
83 <when value="histdb">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
84 <param name="cmfile" type="data" format="cm" label="Covariance models file from the history."/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
85 </when>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
86 </conditional>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
87
2
fac157e22e1b Uploaded
bgruening
parents: 1
diff changeset
88 <param name="g" truevalue="-g" falsevalue="" checked="False" type="boolean"
0
652f9d550531 Uploaded
bgruening
parents:
diff changeset
89 label="Turn on the glocal alignment algorithm" help="... global with respect to the query model and local with respect to the target database."/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
90
2
fac157e22e1b Uploaded
bgruening
parents: 1
diff changeset
91 <param name="bottomonly" truevalue="--bottomonly" falsevalue="" checked="False" type="boolean"
0
652f9d550531 Uploaded
bgruening
parents:
diff changeset
92 label="Only search the bottom (Crick) strand of target sequences" help="in the sequence database"/>
2
fac157e22e1b Uploaded
bgruening
parents: 1
diff changeset
93 <param name="toponly" truevalue="--toponly" falsevalue="" checked="False" type="boolean"
0
652f9d550531 Uploaded
bgruening
parents:
diff changeset
94 label="Only search the top (Watson) strand of target sequences" help="in the sequence database"/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
95
2
fac157e22e1b Uploaded
bgruening
parents: 1
diff changeset
96 <param name="cyk" truevalue="--cyk" falsevalue="" checked="False" type="boolean"
0
652f9d550531 Uploaded
bgruening
parents:
diff changeset
97 label="Use the CYK algorithm, not Inside, to determine the final score of all hits" help=""/>
2
fac157e22e1b Uploaded
bgruening
parents: 1
diff changeset
98 <param name="--acyk" truevalue="--cyk" falsevalue="" checked="False" type="boolean"
0
652f9d550531 Uploaded
bgruening
parents:
diff changeset
99 label="Use the CYK algorithm to align hits" help="By default, the Durbin/Holmes optimal accuracy algorithm is used, which finds the alignment that maximizes the expected accuracy of all aligned residues."/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
100
2
fac157e22e1b Uploaded
bgruening
parents: 1
diff changeset
101 <param name="notrunc" truevalue="--notrunc" falsevalue="" checked="False" type="boolean"
0
652f9d550531 Uploaded
bgruening
parents:
diff changeset
102 label="Turn off truncated hit detection" help=""/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
103
652f9d550531 Uploaded
bgruening
parents:
diff changeset
104 <!-- acceleration pipeline -->
652f9d550531 Uploaded
bgruening
parents:
diff changeset
105
2
fac157e22e1b Uploaded
bgruening
parents: 1
diff changeset
106 <param name="max" truevalue="--max" falsevalue="" checked="False" type="boolean"
0
652f9d550531 Uploaded
bgruening
parents:
diff changeset
107 label="Turn off all filters, and run non-banded Inside on every full-length target sequence" help="This
652f9d550531 Uploaded
bgruening
parents:
diff changeset
108 increases sensitivity somewhat, at an extremely large cost in speed."/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
109
2
fac157e22e1b Uploaded
bgruening
parents: 1
diff changeset
110 <param name="nohmm" truevalue="--nohmm" falsevalue="" checked="False" type="boolean"
0
652f9d550531 Uploaded
bgruening
parents:
diff changeset
111 label="Turn off all HMM filter stages " help=""/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
112
2
fac157e22e1b Uploaded
bgruening
parents: 1
diff changeset
113 <param name="mid" truevalue="--mid" falsevalue="" checked="False" type="boolean"
0
652f9d550531 Uploaded
bgruening
parents:
diff changeset
114 label="Turn off the HMM SSV and Viterbi filter stages" help=""/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
115
652f9d550531 Uploaded
bgruening
parents:
diff changeset
116
652f9d550531 Uploaded
bgruening
parents:
diff changeset
117 <!-- Options for model-specific score thresholding -->
652f9d550531 Uploaded
bgruening
parents:
diff changeset
118 <!--
652f9d550531 Uploaded
bgruening
parents:
diff changeset
119 <param name="bitscore_thresholds" type="select" label="Bit score thresholds" help="Curated CM databases may define specific bit score thresholds for each CM, superseding any thresholding based on statistical significance alone.">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
120 <option value="" selected="true">None</option>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
121 <option value=" - -cut_ga">GA (gathering) bit scores</option>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
122 <option value=" - -cut_nc">NC (noise cutoff) bit score</option>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
123 <option value=" - -cut_tc">TC (trusted cutoff) bit score</option>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
124 </param>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
125 -->
652f9d550531 Uploaded
bgruening
parents:
diff changeset
126 <!-- Options for inclusion thresholds -->
652f9d550531 Uploaded
bgruening
parents:
diff changeset
127
652f9d550531 Uploaded
bgruening
parents:
diff changeset
128
652f9d550531 Uploaded
bgruening
parents:
diff changeset
129 <conditional name="inclusion_thresholds_opts">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
130 <param name="inclusion_thresholds_selector" type="select" label="Inclusion thresholds"
652f9d550531 Uploaded
bgruening
parents:
diff changeset
131 help="Inclusion thresholds are stricter than reporting thresholds. Inclusion thresholds control which hits are considered to be reliable enough to be included in an output alignment or in a possible subsequent search round, or marked as significant (”!”) as opposed to questionable (”?”) in hit output.">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
132 <option value="" selected="true">default</option>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
133 <option value="--incE">Use E-value</option>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
134 <option value="--incT">Use bit score</option>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
135 </param>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
136 <when value=""/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
137 <when value="--incE">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
138 <param name="incE" type="float" value="0.01" size="5" label="Use E-value" help="of &lt;= X as the hit inclusion threshold.">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
139 <sanitizer>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
140 <valid initial="string.printable">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
141 <remove value="&apos;"/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
142 </valid>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
143 </sanitizer>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
144 </param>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
145 </when>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
146 <when value="--incT">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
147 <param name="incT" type="integer" size="5" value="0" label="Use bit score" help="of >= X as the hit inclusion threshold.">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
148 <sanitizer>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
149 <valid initial="string.printable">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
150 <remove value="&apos;"/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
151 </valid>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
152 </sanitizer>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
153 </param>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
154 </when>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
155 </conditional>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
156
652f9d550531 Uploaded
bgruening
parents:
diff changeset
157 <!-- Options controlling reporting thresholds -->
652f9d550531 Uploaded
bgruening
parents:
diff changeset
158
652f9d550531 Uploaded
bgruening
parents:
diff changeset
159 <conditional name="reporting_thresholds_opts">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
160 <param name="reporting_thresholds_selector" type="select" label="reporting thresholds"
652f9d550531 Uploaded
bgruening
parents:
diff changeset
161 help="Reporting thresholds control which hits are reported in output files">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
162 <option value="" selected="true">default</option>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
163 <option value="-E">Use E-value</option>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
164 <option value="-T">Use bit score</option>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
165 </param>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
166 <when value=""/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
167 <when value="-E">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
168 <param name="E" type="float" value="10.0" size="5" label="Use E-value" help="of &lt;= X as the hit reporting threshold. The default is 10.0, meaning that on average, about 10 false positives will be reported per query, so you can see the top of the noise and decide for yourself if it’s really noise.">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
169 <sanitizer>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
170 <valid initial="string.printable">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
171 <remove value="&apos;"/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
172 </valid>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
173 </sanitizer>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
174 </param>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
175 </when>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
176 <when value="-T">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
177 <param name="T" type="integer" size="5" value="0" label="Use bit score" help="of >= X as the hit reporting threshold.">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
178 <sanitizer>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
179 <valid initial="string.printable">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
180 <remove value="&apos;"/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
181 </valid>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
182 </sanitizer>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
183 </param>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
184 </when>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
185 </conditional>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
186
2
fac157e22e1b Uploaded
bgruening
parents: 1
diff changeset
187 <param name="A" truevalue="-A" falsevalue="" checked="False" type="boolean"
0
652f9d550531 Uploaded
bgruening
parents:
diff changeset
188 label="Save a multiple alignment of all significant hits" help="... those satisfying inclusion thresholds"/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
189
652f9d550531 Uploaded
bgruening
parents:
diff changeset
190 </inputs>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
191 <outputs>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
192
652f9d550531 Uploaded
bgruening
parents:
diff changeset
193 <data format="tabular" name="outfile" label="cmsearch on ${on_string}"/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
194 <data format="tabular" name="multiple_alignment_output" label="cmsearch on ${on_string} (multi alignment)">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
195 <filter>A is True</filter>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
196 </data>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
197
652f9d550531 Uploaded
bgruening
parents:
diff changeset
198 </outputs>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
199 <help>
2
fac157e22e1b Uploaded
bgruening
parents: 1
diff changeset
200 <![CDATA[
0
652f9d550531 Uploaded
bgruening
parents:
diff changeset
201
652f9d550531 Uploaded
bgruening
parents:
diff changeset
202
652f9d550531 Uploaded
bgruening
parents:
diff changeset
203 **What it does**
652f9d550531 Uploaded
bgruening
parents:
diff changeset
204
652f9d550531 Uploaded
bgruening
parents:
diff changeset
205 Infernal is used to search sequence databases for homologs of structural RNA sequences, and to make
652f9d550531 Uploaded
bgruening
parents:
diff changeset
206 sequence- and structure-based RNA sequence alignments. Infernal needs a profile from a structurally
2
fac157e22e1b Uploaded
bgruening
parents: 1
diff changeset
207 annotated multiple sequence alignment of an RNA family with a position-specific scoring system for substitutions,
0
652f9d550531 Uploaded
bgruening
parents:
diff changeset
208 insertions, and deletions. Positions in the profile that are basepaired in the consensus secondary
652f9d550531 Uploaded
bgruening
parents:
diff changeset
209 structure of the alignment are modeled as dependent on one another, allowing Infernal’s scoring system to
652f9d550531 Uploaded
bgruening
parents:
diff changeset
210 consider the secondary structure, in addition to the primary sequence, of the family being modeled. Infernal
652f9d550531 Uploaded
bgruening
parents:
diff changeset
211 profiles are probabilistic models called “covariance models”, a specialized type of stochastic context-free
652f9d550531 Uploaded
bgruening
parents:
diff changeset
212 grammar (SCFG) (Lari and Young, 1990).
652f9d550531 Uploaded
bgruening
parents:
diff changeset
213
652f9d550531 Uploaded
bgruening
parents:
diff changeset
214 Compared to other alignment and database search tools based only on sequence comparison, Infernal
2
fac157e22e1b Uploaded
bgruening
parents: 1
diff changeset
215 aims to be significantly more accurate and more able to detect remote homologs because it models sequence
0
652f9d550531 Uploaded
bgruening
parents:
diff changeset
216 and structure.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
217
652f9d550531 Uploaded
bgruening
parents:
diff changeset
218
652f9d550531 Uploaded
bgruening
parents:
diff changeset
219 Output format
652f9d550531 Uploaded
bgruening
parents:
diff changeset
220 -------------
652f9d550531 Uploaded
bgruening
parents:
diff changeset
221
652f9d550531 Uploaded
bgruening
parents:
diff changeset
222 (1) target name: The name of the target sequence or profile.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
223 (2) accession: The accession of the target sequence or profile, or ’-’ if none.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
224 (3) query name: The name of the query sequence or profile.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
225 (4) accession: The accession of the query sequence or profile, or ’-’ if none.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
226 (5) mdl (model): Which type of model was used to compute the final score. Either ’cm’ or ’hmm’. A CM is used to compute the final hit scores unless the model has zero basepairs or the --hmmonly option is used, in which case a HMM will be used.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
227 (6) mdl from (model coord): The start of the alignment of this hit with respect to the profile (CM or HMM), numbered 1..N for a profile of N consensus positions.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
228 (7) mdl to (model coord): The end of the alignment of this hit with respect to the profile (CM or HMM), numbered 1..N for a profile of N consensus positions.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
229 (8) seq from (ali coord): The start of the alignment of this hit with respect to the sequence, numbered 1..L for a sequence of L residues.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
230 (9) seq to (ali coord): The end of the alignment of this hit with respect to the sequence, numbered 1..L for a sequence of L residues.
2
fac157e22e1b Uploaded
bgruening
parents: 1
diff changeset
231 (10) strand: The strand on which the hit occurs on the sequence. ’+’ if the hit is on the top (Watson) strand, ’-’ if the hit is on the bottom (Crick) strand. If on the top strand, the “seq from” value will be less than or equal to the “seq to” value, else it will be greater than or equal to it.
fac157e22e1b Uploaded
bgruening
parents: 1
diff changeset
232 (11) trunc: Indicates if this is predicted to be a truncated CM hit or not. This will be “no” if it is a CM hit that is not predicted to be truncated by the end of the sequence, “5’ ” or “3’ ” if the hit is predicted to have one or more 5’ or 3’ residues missing due to an artificial truncation of the sequence, or “5’&3’” if the hit is predicted to have one or more 5’ residues missing and one or more 3’ residues missing. If the hit is an HMM hit, this will always be ’-’.
0
652f9d550531 Uploaded
bgruening
parents:
diff changeset
233 (12) pass: Indicates what “pass” of the pipeline the hit was detected on. This is probably only useful for testing and debugging. Non-truncated hits are found on the first pass, truncated hits are found on successive passes.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
234 (13) gc: Fraction of G and C nucleotides in the hit.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
235 (14) bias: The biased-composition correction: the bit score difference contributed by the null3 model for CM hits, or the null2 model for HMM hits. High bias scores may be a red flag for a false positive. It is difficult to correct for all possible ways in which nonrandom but nonhomologous biological sequences can appear to be similar, such as short-period tandem repeats, so there are cases where the bias correction is not strong enough (creating false positives).
652f9d550531 Uploaded
bgruening
parents:
diff changeset
236 (15) score: The score (in bits) for this target/query comparison. It includes the biased-composition correction (the “null3” model for CM hits, or the “null2” model for HMM hits).
652f9d550531 Uploaded
bgruening
parents:
diff changeset
237 (16) E-value: The expectation value (statistical significance) of the target. This is a per query E-value; i.e. calculated as the expected number of false positives achieving this comparison’s score for a single query against the search space Z. For cmsearch Z is defined as the total number of nucleotides in the target dataset multiplied by 2 because both strands are searched. For cmscan Z is the total number of nucleotides in the query sequence multiplied by 2 because both strands are searched and multiplied by the number of models in the target database. If you search with multiple queries and if you want to control the overall false positive rate of that search rather than the false positive rate per query, you will want to multiply this per-query E-value by how many queries you’re doing.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
238 (17) inc: Indicates whether or not this hit achieves the inclusion threshold: ’!’ if it does, ’?’ if it does not (and rather only achieves the reporting threshold). By default, the inclusion threshold is an E-value of 0.01 and the reporting threshold is an E-value of 10.0, but these can be changed with command line options as described in the manual pages.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
239 (18) description of target: The remainder of the line is the target’s description line, as free text.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
240
652f9d550531 Uploaded
bgruening
parents:
diff changeset
241
652f9d550531 Uploaded
bgruening
parents:
diff changeset
242 For further questions please refer to the Infernal Userguide_.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
243
652f9d550531 Uploaded
bgruening
parents:
diff changeset
244 .. _Userguide: http://selab.janelia.org/software/infernal/Userguide.pdf
652f9d550531 Uploaded
bgruening
parents:
diff changeset
245
652f9d550531 Uploaded
bgruening
parents:
diff changeset
246
652f9d550531 Uploaded
bgruening
parents:
diff changeset
247 How do I cite Infernal?
652f9d550531 Uploaded
bgruening
parents:
diff changeset
248 -----------------------
652f9d550531 Uploaded
bgruening
parents:
diff changeset
249
2
fac157e22e1b Uploaded
bgruening
parents: 1
diff changeset
250 The recommended citation for using Infernal 1.1 is E. P. Nawrocki and S. R. Eddy, Infernal 1.1: 100-fold faster RNA homology searches, Bioinformatics 29:2933-2935 (2013).
0
652f9d550531 Uploaded
bgruening
parents:
diff changeset
251
652f9d550531 Uploaded
bgruening
parents:
diff changeset
252 **Galaxy Wrapper Author**::
652f9d550531 Uploaded
bgruening
parents:
diff changeset
253
652f9d550531 Uploaded
bgruening
parents:
diff changeset
254 * Bjoern Gruening, University of Freiburg
652f9d550531 Uploaded
bgruening
parents:
diff changeset
255
2
fac157e22e1b Uploaded
bgruening
parents: 1
diff changeset
256 ]]>
0
652f9d550531 Uploaded
bgruening
parents:
diff changeset
257 </help>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
258 </tool>