annotate cmsearch.xml @ 1:55bb96edfc07 draft

Uploaded
author bgruening
date Thu, 24 Apr 2014 15:02:05 -0400
parents 652f9d550531
children fac157e22e1b
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
652f9d550531 Uploaded
bgruening
parents:
diff changeset
1 <tool id="infernal_cmsearch" name="Search covariance model(s)" version="1.1.0.2">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
2 <description>against a sequence database (cmsearch)</description>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
3 <parallelism method="multi" split_inputs="seqdb" split_mode="to_size" split_size="100" shared_inputs="" merge_outputs="outfile,multiple_alignment_output"></parallelism>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
4 <requirements>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
5 <requirement type="package">infernal</requirement>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
6 <requirement type="package" version="1.1">infernal</requirement>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
7 <requirement type="package" version="8.21">gnu_coreutils</requirement>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
8 </requirements>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
9 <command>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
10 ## a temp file is needed, because the standard tabular output from infernal is not useful in Galaxy
652f9d550531 Uploaded
bgruening
parents:
diff changeset
11 ## it will be converted to a tab delimited file and piped to Galaxy
652f9d550531 Uploaded
bgruening
parents:
diff changeset
12 temp_tabular_output=\$(mktemp);
652f9d550531 Uploaded
bgruening
parents:
diff changeset
13
652f9d550531 Uploaded
bgruening
parents:
diff changeset
14 cmsearch
652f9d550531 Uploaded
bgruening
parents:
diff changeset
15 ## Infernal Options
652f9d550531 Uploaded
bgruening
parents:
diff changeset
16 --cpu "\${GALAXY_SLOTS:-12}"
652f9d550531 Uploaded
bgruening
parents:
diff changeset
17 -o /dev/null
652f9d550531 Uploaded
bgruening
parents:
diff changeset
18 --tformat $seqdb.ext ##target format: fasta, embl, genbank, ddbj, stockholm, pfam, a2m, afa, clustal, and phylip
652f9d550531 Uploaded
bgruening
parents:
diff changeset
19 $bottomonly
652f9d550531 Uploaded
bgruening
parents:
diff changeset
20 $toponly
652f9d550531 Uploaded
bgruening
parents:
diff changeset
21 $cyk
652f9d550531 Uploaded
bgruening
parents:
diff changeset
22 $notrunc
652f9d550531 Uploaded
bgruening
parents:
diff changeset
23 $max
652f9d550531 Uploaded
bgruening
parents:
diff changeset
24 $nohmm
652f9d550531 Uploaded
bgruening
parents:
diff changeset
25 $mid
652f9d550531 Uploaded
bgruening
parents:
diff changeset
26 ##$bitscore_thresholds
652f9d550531 Uploaded
bgruening
parents:
diff changeset
27 --tblout \$temp_tabular_output
652f9d550531 Uploaded
bgruening
parents:
diff changeset
28 $g
652f9d550531 Uploaded
bgruening
parents:
diff changeset
29 #if $A:
652f9d550531 Uploaded
bgruening
parents:
diff changeset
30 $A $multiple_alignment_output
652f9d550531 Uploaded
bgruening
parents:
diff changeset
31 #end if
652f9d550531 Uploaded
bgruening
parents:
diff changeset
32
652f9d550531 Uploaded
bgruening
parents:
diff changeset
33 #if str($inclusion_thresholds_opts.inclusion_thresholds_selector) == "--incE":
652f9d550531 Uploaded
bgruening
parents:
diff changeset
34 --incE $inclusion_thresholds_opts.incE
652f9d550531 Uploaded
bgruening
parents:
diff changeset
35 #elif str($inclusion_thresholds_opts.inclusion_thresholds_selector) == "--incT":
652f9d550531 Uploaded
bgruening
parents:
diff changeset
36 --incT $inclusion_thresholds_opts.incT
652f9d550531 Uploaded
bgruening
parents:
diff changeset
37 #end if
652f9d550531 Uploaded
bgruening
parents:
diff changeset
38
652f9d550531 Uploaded
bgruening
parents:
diff changeset
39 #if str($reporting_thresholds_opts.reporting_thresholds_selector) == "-E":
652f9d550531 Uploaded
bgruening
parents:
diff changeset
40 -E $reporting_thresholds_opts.E
652f9d550531 Uploaded
bgruening
parents:
diff changeset
41 #elif str($reporting_thresholds_opts.reporting_thresholds_selector) == "-T":
652f9d550531 Uploaded
bgruening
parents:
diff changeset
42 -T $reporting_thresholds_opts.T
652f9d550531 Uploaded
bgruening
parents:
diff changeset
43 #end if
652f9d550531 Uploaded
bgruening
parents:
diff changeset
44
652f9d550531 Uploaded
bgruening
parents:
diff changeset
45 ## CM file from the history or stored as database on disc
652f9d550531 Uploaded
bgruening
parents:
diff changeset
46
652f9d550531 Uploaded
bgruening
parents:
diff changeset
47 #if str($cm_opts.cm_opts_selector) == "db":
652f9d550531 Uploaded
bgruening
parents:
diff changeset
48 $cm_opts.database.fields.path
652f9d550531 Uploaded
bgruening
parents:
diff changeset
49 #else:
652f9d550531 Uploaded
bgruening
parents:
diff changeset
50 $cm_opts.cmfile
652f9d550531 Uploaded
bgruening
parents:
diff changeset
51 #end if
652f9d550531 Uploaded
bgruening
parents:
diff changeset
52
652f9d550531 Uploaded
bgruening
parents:
diff changeset
53 ## sequence file
652f9d550531 Uploaded
bgruening
parents:
diff changeset
54 $seqdb
652f9d550531 Uploaded
bgruening
parents:
diff changeset
55 2>&#38;1
652f9d550531 Uploaded
bgruening
parents:
diff changeset
56 ;
652f9d550531 Uploaded
bgruening
parents:
diff changeset
57
652f9d550531 Uploaded
bgruening
parents:
diff changeset
58 ## 1. remove all lines starting with # (comment lines)
652f9d550531 Uploaded
bgruening
parents:
diff changeset
59 ## 2. replace the first 17 runs of whitespace with tabs (giving 18 columns); the 18th field is a free text field (can contain spaces)
1
55bb96edfc07 Uploaded
bgruening
parents: 0
diff changeset
60 sed -e 's/#.*$//' -e '/^$/d' -e 's/\s\+/\t/g' -e 's/\t/ /18g' \$temp_tabular_output > $outfile
0
652f9d550531 Uploaded
bgruening
parents:
diff changeset
61
652f9d550531 Uploaded
bgruening
parents:
diff changeset
62 </command>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
63 <inputs>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
64
652f9d550531 Uploaded
bgruening
parents:
diff changeset
65 <param name="seqdb" type="data" format="fasta" label="Sequence database"/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
66
652f9d550531 Uploaded
bgruening
parents:
diff changeset
67 <conditional name="cm_opts">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
68 <param name="cm_opts_selector" type="select" label="Subject covariance models">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
69 <option value="db" selected="True">Locally installed covariance models</option>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
70 <option value="histdb">Covariance model from your history</option>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
71 </param>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
72 <when value="db">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
73 <param name="database" type="select" label="Covariance models">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
74 <options from_file="infernal.loc">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
75 <column name="value" index="0"/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
76 <column name="name" index="1"/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
77 <column name="path" index="2"/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
78 </options>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
79 </param>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
80 </when>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
81 <when value="histdb">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
82 <param name="cmfile" type="data" format="cm" label="Covariance models file from the history."/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
83 </when>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
84 </conditional>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
85
652f9d550531 Uploaded
bgruening
parents:
diff changeset
86 <param name="g" truevalue="-g" falsevalue="" checked="False" type="boolean"
652f9d550531 Uploaded
bgruening
parents:
diff changeset
87 label="Turn on the glocal alignment algorithm" help="... global with respect to the query model and local with respect to the target database."/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
88
652f9d550531 Uploaded
bgruening
parents:
diff changeset
89 <param name="bottomonly" truevalue="--bottomonly" falsevalue="" checked="False" type="boolean"
652f9d550531 Uploaded
bgruening
parents:
diff changeset
90 label="Only search the bottom (Crick) strand of target sequences" help="in the sequence database"/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
91 <param name="toponly" truevalue="--toponly" falsevalue="" checked="False" type="boolean"
652f9d550531 Uploaded
bgruening
parents:
diff changeset
92 label="Only search the top (Watson) strand of target sequences" help="in the sequence database"/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
93
652f9d550531 Uploaded
bgruening
parents:
diff changeset
94 <param name="cyk" truevalue="--cyk" falsevalue="" checked="False" type="boolean"
652f9d550531 Uploaded
bgruening
parents:
diff changeset
95 label="Use the CYK algorithm, not Inside, to determine the final score of all hits" help=""/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
96 <param name="--acyk" truevalue="--cyk" falsevalue="" checked="False" type="boolean"
652f9d550531 Uploaded
bgruening
parents:
diff changeset
97 label="Use the CYK algorithm to align hits" help="By default, the Durbin/Holmes optimal accuracy algorithm is used, which finds the alignment that maximizes the expected accuracy of all aligned residues."/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
98
652f9d550531 Uploaded
bgruening
parents:
diff changeset
99 <param name="notrunc" truevalue="--notrunc" falsevalue="" checked="False" type="boolean"
652f9d550531 Uploaded
bgruening
parents:
diff changeset
100 label="Turn off truncated hit detection" help=""/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
101
652f9d550531 Uploaded
bgruening
parents:
diff changeset
102 <!-- acceleration pipeline -->
652f9d550531 Uploaded
bgruening
parents:
diff changeset
103
652f9d550531 Uploaded
bgruening
parents:
diff changeset
104 <param name="max" truevalue="--max" falsevalue="" checked="False" type="boolean"
652f9d550531 Uploaded
bgruening
parents:
diff changeset
105 label="Turn off all filters, and run non-banded Inside on every full-length target sequence" help="This
652f9d550531 Uploaded
bgruening
parents:
diff changeset
106 increases sensitivity somewhat, at an extremely large cost in speed."/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
107
652f9d550531 Uploaded
bgruening
parents:
diff changeset
108 <param name="nohmm" truevalue="--nohmm" falsevalue="" checked="False" type="boolean"
652f9d550531 Uploaded
bgruening
parents:
diff changeset
109 label="Turn off all HMM filter stages " help=""/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
110
652f9d550531 Uploaded
bgruening
parents:
diff changeset
111 <param name="mid" truevalue="--mid" falsevalue="" checked="False" type="boolean"
652f9d550531 Uploaded
bgruening
parents:
diff changeset
112 label="Turn off the HMM SSV and Viterbi filter stages" help=""/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
113
652f9d550531 Uploaded
bgruening
parents:
diff changeset
114
652f9d550531 Uploaded
bgruening
parents:
diff changeset
115 <!-- Options for model-specific score thresholding -->
652f9d550531 Uploaded
bgruening
parents:
diff changeset
116 <!--
652f9d550531 Uploaded
bgruening
parents:
diff changeset
117 <param name="bitscore_thresholds" type="select" label="Bit score thresholds" help="Curated CM databases may define specific bit score thresholds for each CM, superseding any thresholding based on statistical significance alone.">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
118 <option value="" selected="true">None</option>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
119 <option value=" - -cut_ga">GA (gathering) bit scores</option>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
120 <option value=" - -cut_nc">NC (noise cutoff) bit score</option>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
121 <option value=" - -cut_tc">TC (trusted cutoff) bit score</option>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
122 </param>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
123 -->
652f9d550531 Uploaded
bgruening
parents:
diff changeset
124 <!-- Options for inclusion thresholds -->
652f9d550531 Uploaded
bgruening
parents:
diff changeset
125
652f9d550531 Uploaded
bgruening
parents:
diff changeset
126
652f9d550531 Uploaded
bgruening
parents:
diff changeset
127 <conditional name="inclusion_thresholds_opts">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
128 <param name="inclusion_thresholds_selector" type="select" label="Inclusion thresholds"
652f9d550531 Uploaded
bgruening
parents:
diff changeset
129 help="Inclusion thresholds are stricter than reporting thresholds. Inclusion thresholds control which hits are considered to be reliable enough to be included in an output alignment or in a possible subsequent search round, or marked as significant (”!”) as opposed to questionable (”?”) in hit output.">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
130 <option value="" selected="true">default</option>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
131 <option value="--incE">Use E-value</option>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
132 <option value="--incT">Use bit score</option>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
133 </param>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
134 <when value=""/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
135 <when value="--incE">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
136 <param name="incE" type="float" value="0.01" size="5" label="Use E-value" help="of &lt;= X as the hit inclusion threshold.">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
137 <sanitizer>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
138 <valid initial="string.printable">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
139 <remove value="&apos;"/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
140 </valid>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
141 </sanitizer>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
142 </param>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
143 </when>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
144 <when value="--incT">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
145 <param name="incT" type="integer" size="5" value="0" label="Use bit score" help="of >= X as the hit inclusion threshold.">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
146 <sanitizer>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
147 <valid initial="string.printable">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
148 <remove value="&apos;"/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
149 </valid>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
150 </sanitizer>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
151 </param>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
152 </when>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
153 </conditional>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
154
652f9d550531 Uploaded
bgruening
parents:
diff changeset
155 <!-- Options controlling reporting thresholds -->
652f9d550531 Uploaded
bgruening
parents:
diff changeset
156
652f9d550531 Uploaded
bgruening
parents:
diff changeset
157 <conditional name="reporting_thresholds_opts">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
158 <param name="reporting_thresholds_selector" type="select" label="reporting thresholds"
652f9d550531 Uploaded
bgruening
parents:
diff changeset
159 help="Reporting thresholds control which hits are reported in output files">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
160 <option value="" selected="true">default</option>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
161 <option value="-E">Use E-value</option>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
162 <option value="-T">Use bit score</option>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
163 </param>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
164 <when value=""/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
165 <when value="-E">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
166 <param name="E" type="float" value="10.0" size="5" label="Use E-value" help="of &lt;= X as the hit reporting threshold. The default is 10.0, meaning that on average, about 10 false positives will be reported per query, so you can see the top of the noise and decide for yourself if it’s really noise.">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
167 <sanitizer>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
168 <valid initial="string.printable">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
169 <remove value="&apos;"/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
170 </valid>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
171 </sanitizer>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
172 </param>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
173 </when>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
174 <when value="-T">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
175 <param name="T" type="integer" size="5" value="0" label="Use bit score" help="of >= X as the hit reporting threshold.">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
176 <sanitizer>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
177 <valid initial="string.printable">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
178 <remove value="&apos;"/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
179 </valid>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
180 </sanitizer>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
181 </param>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
182 </when>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
183 </conditional>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
184
652f9d550531 Uploaded
bgruening
parents:
diff changeset
185 <param name="A" truevalue="-A" falsevalue="" checked="False" type="boolean"
652f9d550531 Uploaded
bgruening
parents:
diff changeset
186 label="Save a multiple alignment of all significant hits" help="... those satisfying inclusion thresholds"/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
187
652f9d550531 Uploaded
bgruening
parents:
diff changeset
188 </inputs>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
189 <outputs>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
190
652f9d550531 Uploaded
bgruening
parents:
diff changeset
191 <data format="tabular" name="outfile" label="cmsearch on ${on_string}"/>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
192 <data format="tabular" name="multiple_alignment_output" label="cmsearch on ${on_string} (multi alignment)">
652f9d550531 Uploaded
bgruening
parents:
diff changeset
193 <filter>A is True</filter>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
194 </data>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
195
652f9d550531 Uploaded
bgruening
parents:
diff changeset
196 </outputs>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
197 <help>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
198
652f9d550531 Uploaded
bgruening
parents:
diff changeset
199
652f9d550531 Uploaded
bgruening
parents:
diff changeset
200 **What it does**
652f9d550531 Uploaded
bgruening
parents:
diff changeset
201
652f9d550531 Uploaded
bgruening
parents:
diff changeset
202 Infernal is used to search sequence databases for homologs of structural RNA sequences, and to make
652f9d550531 Uploaded
bgruening
parents:
diff changeset
203 sequence- and structure-based RNA sequence alignments. Infernal needs a profile from a structurally
652f9d550531 Uploaded
bgruening
parents:
diff changeset
204 annotated multiple sequence alignment of an RNA family with a position-specific scoring system for substitutions,
652f9d550531 Uploaded
bgruening
parents:
diff changeset
205 insertions, and deletions. Positions in the profile that are basepaired in the consensus secondary
652f9d550531 Uploaded
bgruening
parents:
diff changeset
206 structure of the alignment are modeled as dependent on one another, allowing Infernal’s scoring system to
652f9d550531 Uploaded
bgruening
parents:
diff changeset
207 consider the secondary structure, in addition to the primary sequence, of the family being modeled. Infernal
652f9d550531 Uploaded
bgruening
parents:
diff changeset
208 profiles are probabilistic models called “covariance models”, a specialized type of stochastic context-free
652f9d550531 Uploaded
bgruening
parents:
diff changeset
209 grammar (SCFG) (Lari and Young, 1990).
652f9d550531 Uploaded
bgruening
parents:
diff changeset
210
652f9d550531 Uploaded
bgruening
parents:
diff changeset
211 Compared to other alignment and database search tools based only on sequence comparison, Infernal
652f9d550531 Uploaded
bgruening
parents:
diff changeset
212 aims to be significantly more accurate and more able to detect remote homologs because it models sequence
652f9d550531 Uploaded
bgruening
parents:
diff changeset
213 and structure.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
214
652f9d550531 Uploaded
bgruening
parents:
diff changeset
215
652f9d550531 Uploaded
bgruening
parents:
diff changeset
216 Output format
652f9d550531 Uploaded
bgruening
parents:
diff changeset
217 -------------
652f9d550531 Uploaded
bgruening
parents:
diff changeset
218
652f9d550531 Uploaded
bgruening
parents:
diff changeset
219 (1) target name: The name of the target sequence or profile.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
220 (2) accession: The accession of the target sequence or profile, or ’-’ if none.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
221 (3) query name: The name of the query sequence or profile.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
222 (4) accession: The accession of the query sequence or profile, or ’-’ if none.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
223 (5) mdl (model): Which type of model was used to compute the final score. Either ’cm’ or ’hmm’. A CM is used to compute the final hit scores unless the model has zero basepairs or the --hmmonly option is used, in which case a HMM will be used.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
224 (6) mdl from (model coord): The start of the alignment of this hit with respect to the profile (CM or HMM), numbered 1..N for a profile of N consensus positions.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
225 (7) mdl to (model coord): The end of the alignment of this hit with respect to the profile (CM or HMM), numbered 1..N for a profile of N consensus positions.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
226 (8) seq from (ali coord): The start of the alignment of this hit with respect to the sequence, numbered 1..L for a sequence of L residues.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
227 (9) seq to (ali coord): The end of the alignment of this hit with respect to the sequence, numbered 1..L for a sequence of L residues.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
228 (10) strand: The strand on which the hit occurs on the sequence. ’+’ if the hit is on the top (Watson) strand, ’-’ if the hit is on the bottom (Crick) strand. If on the top strand, the “seq from” value will be less than or equal to the “seq to” value, else it will be greater than or equal to it.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
229 (11) trunc: Indicates if this is predicted to be a truncated CM hit or not. This will be “no” if it is a CM hit that is not predicted to be truncated by the end of the sequence, “5’ ” or “3’ ” if the hit is predicted to have one or more 5’ or 3’ residues missing due to an artificial truncation of the sequence, or “5’&amp;3’” if the hit is predicted to have one or more 5’ residues missing and one or more 3’ residues missing. If the hit is an HMM hit, this will always be ’-’.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
230 (12) pass: Indicates what “pass” of the pipeline the hit was detected on. This is probably only useful for testing and debugging. Non-truncated hits are found on the first pass, truncated hits are found on successive passes.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
231 (13) gc: Fraction of G and C nucleotides in the hit.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
232 (14) bias: The biased-composition correction: the bit score difference contributed by the null3 model for CM hits, or the null2 model for HMM hits. High bias scores may be a red flag for a false positive. It is difficult to correct for all possible ways in which nonrandom but nonhomologous biological sequences can appear to be similar, such as short-period tandem repeats, so there are cases where the bias correction is not strong enough (creating false positives).
652f9d550531 Uploaded
bgruening
parents:
diff changeset
233 (15) score: The score (in bits) for this target/query comparison. It includes the biased-composition correction (the “null3” model for CM hits, or the “null2” model for HMM hits).
652f9d550531 Uploaded
bgruening
parents:
diff changeset
234 (16) E-value: The expectation value (statistical significance) of the target. This is a per query E-value; i.e. calculated as the expected number of false positives achieving this comparison’s score for a single query against the search space Z. For cmsearch Z is defined as the total number of nucleotides in the target dataset multiplied by 2 because both strands are searched. For cmscan Z is the total number of nucleotides in the query sequence multiplied by 2 because both strands are searched and multiplied by the number of models in the target database. If you search with multiple queries and if you want to control the overall false positive rate of that search rather than the false positive rate per query, you will want to multiply this per-query E-value by how many queries you’re doing.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
235 (17) inc: Indicates whether or not this hit achieves the inclusion threshold: ’!’ if it does, ’?’ if it does not (and rather only achieves the reporting threshold). By default, the inclusion threshold is an E-value of 0.01 and the reporting threshold is an E-value of 10.0, but these can be changed with command line options as described in the manual pages.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
236 (18) description of target: The remainder of the line is the target’s description line, as free text.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
237
652f9d550531 Uploaded
bgruening
parents:
diff changeset
238
652f9d550531 Uploaded
bgruening
parents:
diff changeset
239 For further questions please refer to the Infernal Userguide_.
652f9d550531 Uploaded
bgruening
parents:
diff changeset
240
652f9d550531 Uploaded
bgruening
parents:
diff changeset
241 .. _Userguide: http://selab.janelia.org/software/infernal/Userguide.pdf
652f9d550531 Uploaded
bgruening
parents:
diff changeset
242
652f9d550531 Uploaded
bgruening
parents:
diff changeset
243
652f9d550531 Uploaded
bgruening
parents:
diff changeset
244 How do I cite Infernal?
652f9d550531 Uploaded
bgruening
parents:
diff changeset
245 -----------------------
652f9d550531 Uploaded
bgruening
parents:
diff changeset
246
652f9d550531 Uploaded
bgruening
parents:
diff changeset
247 The recommended citation for using Infernal 1.1 is E. P. Nawrocki and S. R. Eddy, Infernal 1.1: 100-fold faster RNA homology searches, Bioinformatics 29:2933-2935 (2013).
652f9d550531 Uploaded
bgruening
parents:
diff changeset
248
652f9d550531 Uploaded
bgruening
parents:
diff changeset
249 **Galaxy Wrapper Author**::
652f9d550531 Uploaded
bgruening
parents:
diff changeset
250
652f9d550531 Uploaded
bgruening
parents:
diff changeset
251 * Bjoern Gruening, University of Freiburg
652f9d550531 Uploaded
bgruening
parents:
diff changeset
252
652f9d550531 Uploaded
bgruening
parents:
diff changeset
253 </help>
652f9d550531 Uploaded
bgruening
parents:
diff changeset
254 </tool>