Mercurial > repos > crs4 > blat
comparison blat_wrapper.xml @ 0:0a71a7d35d09 draft
Uploaded
author | crs4 |
---|---|
date | Wed, 16 Oct 2013 13:54:38 -0400 |
parents | |
children | c4ad58c4bc7d |
comparison
equal
deleted
inserted
replaced
-1:000000000000 | 0:0a71a7d35d09 |
---|---|
1 <tool id="blat_wrapper" name="BLAT" version="0.2"> | |
2 <description></description> | |
3 <requirements> | |
4 <requirement type="package" version="35">blat</requirement> | |
5 </requirements> | |
6 <command> | |
7 blat $database $query -t=$databaseType.databaseType_select -q=$databaseType.queryType | |
8 #if str($databaseType.tileSize) | |
9 -tileSize=$databaseType.tileSize | |
10 #end if | |
11 #if str($stepSize) | |
12 -stepSize=$stepSize | |
13 #end if | |
14 #if $oneOff | |
15 -oneOff=1 | |
16 #end if | |
17 #if str($databaseType.minMatch) | |
18 -minMatch=$databaseType.minMatch | |
19 #end if | |
20 #if str($minScore) | |
21 -minScore=$minScore | |
22 #end if | |
23 #if str($databaseType.minIdentity) | |
24 -minIdentity=$databaseType.minIdentity | |
25 #end if | |
26 #if str($maxGap) | |
27 -maxGap=$maxGap | |
28 #end if | |
29 #if str($repMatch) | |
30 -repMatch=$repMatch | |
31 #end if | |
32 #if $mask.mask_select | |
33 -mask=$mask.mask_select | |
34 #else if $mask.repeats | |
35 -repeats=$mask.repeats | |
36 #end if | |
37 #if $qMask | |
38 -qMask=$qMask | |
39 #end if | |
40 #if str($dots) | |
41 -dots=$dots | |
42 #end if | |
43 #if $trimT | |
44 -trimT | |
45 #end if | |
46 #if $noTrimA | |
47 -noTrimA | |
48 #end if | |
49 #if $trimHardA | |
50 -trimHardA | |
51 #end if | |
52 #if $fastMap | |
53 -fastMap | |
54 #end if | |
55 #if $fine | |
56 -fine | |
57 #end if | |
58 #if str($maxIntron) | |
59 -maxIntron=$maxIntron | |
60 #end if | |
61 #if $extendThroughN | |
62 -extendThroughN | |
63 #end if | |
64 -out=$out | |
65 $output > $logfile | |
66 </command> | |
67 | |
68 <inputs> | |
69 <param name="database" type="data" format="fasta,twobit" label="Database" help="FASTA or 2bit format" /> | |
70 <param name="query" type="data" format="fasta,twobit" label="Query" help="FASTA or 2bit format" /> | |
71 | |
72 <conditional name="databaseType"> | |
73 <param name="databaseType_select" type="select" label="Database type (-t)"> | |
74 <option value="dna" selected="true">DNA sequence (dna)</option> | |
75 <option value="prot">Protein sequence (prot)</option> | |
76 <option value="dnax">DNA sequence translated in six frames to protein (dnax)</option> | |
77 </param> | |
78 <when value="dna"> | |
79 <param name="queryType" type="select" label="Select the query type (-q)"> | |
80 <option value="dna" selected="true">DNA sequence (dna)</option> | |
81 <option value="rna">RNA sequence (rna)</option> | |
82 </param> | |
83 <param name="tileSize" type="integer" value="11" min="6" max="18" optional="true" label="Size of match that triggers an alignment (-tileSize)" help="Usually between 8 and 12" /> | |
84 <param name="minMatch" type="integer" value="2" optional="true" label="Number of tile matches (-minMatch)"> | |
85 <validator type="in_range" min="1" /> | |
86 </param> | |
87 <param name="minIdentity" type="integer" value="90" optional="true" label="Minimum sequence identity (%) (-minIdentity)" /> | |
88 </when> | |
89 <when value="prot"> | |
90 <param name="queryType" type="select" label="Select the query type (-q)"> | |
91 <option value="prot">Protein sequence (prot)</option> | |
92 </param> | |
93 <param name="tileSize" type="integer" value="5" min="3" max="8" optional="true" label="Size of match that triggers an alignment (-tileSize)" help="Usually between 8 and 12" /> | |
94 <param name="minMatch" type="integer" value="1" optional="true" label="Number of tile matches (-minMatch)"> | |
95 <validator type="in_range" min="1" /> | |
96 </param> | |
97 <param name="minIdentity" type="integer" value="25" optional="true" label="Minimum sequence identity (%) (-minIdentity)" /> | |
98 </when> | |
99 <when value="dnax"> | |
100 <param name="queryType" type="select" label="Select the query type (-q)"> | |
101 <option value="prot">Protein sequence (prot)</option> | |
102 <option value="dnax">DNA sequence translated in six frames to protein (dnax)</option> | |
103 <option value="rnax">DNA sequence translated in three frames to protein (rnax)</option> | |
104 </param> | |
105 <param name="tileSize" type="integer" value="5" min="3" max="8" optional="true" label="Size of match that triggers an alignment (-tileSize)" help="Usually between 8 and 12" /> | |
106 <param name="minMatch" type="integer" value="1" optional="true" label="Number of tile matches (-minMatch)"> | |
107 <validator type="in_range" min="1" /> | |
108 </param> | |
109 <param name="minIdentity" type="integer" value="25" optional="true" label="Minimum sequence identity (%) (-minIdentity)" /> | |
110 </when> | |
111 </conditional> | |
112 | |
113 <!-- <param name="ooc" type="data" format="ooc" optional="true" label="Over-occuring N-mers file (-ooc) produced with blat -makeOoc" help="Use N as tileSize below." /> This should wait for a makeOoc wrapper --> | |
114 | |
115 <param name="stepSize" type="integer" value="" optional="true" label="Spacing between tiles (-stepSize)" help="Default is tileSize"> | |
116 <validator type="in_range" min="1" /> | |
117 </param> | |
118 | |
119 <param name="oneOff" type="boolean" checked="false" label="If set, this allows one mismatch in tile and still triggers an alignments (-oneOff)" /> | |
120 | |
121 <param name="minScore" type="integer" value="30" optional="true" label="Minimum score (-minScore)" help="It is the matches minus the mismatches minus some sort of gap penalty" /> | |
122 | |
123 <param name="maxGap" type="integer" value="2" optional="true" label="Maximum gap between tiles in a clump (-maxGap)" help="Usually set from 0 to 3. Only relevant for minMatch > 1" /> | |
124 | |
125 <!-- <param name="makeOoc" type="boolean" checked="false" label="Make overused tile file N.ooc (-makeOoc)" help="Target needs to be a complete genome" /> This should go in a separate wrapper since after making the ooc file, blat exits --> | |
126 | |
127 <param name="repMatch" type="integer" value="" optional="true" label="Number of repetitions of a tile allowed before it is marked as overused (-repMatch)" help="Typically this is 256 for tileSize 12, 1024 for tileSize 11, 4096 for tileSize 10. Also affected by stepSize. When stepSize is halved repMatch is doubled to compensate" /> | |
128 | |
129 <conditional name="mask"> | |
130 <param name="mask_select" type="select" label="Mask out repeats in database sequences (-mask)" help="Alignments won't be started in masked region but may extend through it in nucleotide searches. Masked areas are ignored completely in protein or translated searches"> | |
131 <option value="">No masking</option> | |
132 <option value="lower">Mask out lower cased sequence</option> | |
133 <option value="upper">Mask out upper cased sequence</option> | |
134 <!-- <option value="out">Mask out according to database.out RepeatMasker.out file</option> | |
135 <option value="file.out">Mask database according to RepeatMasker file.out</option>--> | |
136 </param> | |
137 <when value=""> | |
138 <param name="repeats" type="select" label="Select repeat type if matches in repeat areas should be reported separately from matches in other areas (-repeats)"> | |
139 <option value="">No masking</option> | |
140 <option value="lower">Mask out lower cased sequence</option> | |
141 <option value="upper">Mask out upper cased sequence</option> | |
142 <!-- <option value="out">Mask out according to database.out RepeatMasker.out file</option> | |
143 <option value="file.out">Mask database according to RepeatMasker file.out</option>--> | |
144 </param> | |
145 </when> | |
146 <when value="lower" /> | |
147 <when value="upper" /> | |
148 </conditional> | |
149 <param name="qMask" type="select" label="Mask out repeats in query sequences (-qMask)"> | |
150 <option value="">No masking</option> | |
151 <option value="lower">Mask out lower cased sequence</option> | |
152 <option value="upper">Mask out upper cased sequence</option> | |
153 <!-- <option value="out">Mask out according to database.out RepeatMasker .out file</option> | |
154 <option value="file.out">Mask database according to RepeatMasker file.out</option>--> | |
155 </param> | |
156 <!-- <param name="minRepDivergence" type="integer" optional="true" value="15" label="Minimum percent divergence of repeats to allow them to be unmasked (-minRepDivergence)" help="Only relevant for masking using RepeatMasket .out files" />--> | |
157 | |
158 <param name="dots" type="integer" value="" optional="true" label="Output a dot every N sequences in log (-dots)" help="Dots show program's progress" /> | |
159 | |
160 <param name="trimT" type="boolean" checked="false" label="Trim leading poly-T (-trimT)" /> | |
161 | |
162 <param name="noTrimA" type="boolean" checked="false" label="Don't trim trailing poly-A (-noTrimA)" /> | |
163 | |
164 <param name="trimHardA" type="boolean" checked="false" label="Remove poly-A tail from qSize and alignments in .psl output (-trimHardA)" /> | |
165 | |
166 <param name="fastMap" type="boolean" checked="false" label="Run for fast DNA/DNA remapping (-fastMap)" help="It does not allow introns and require high %ID. Query sizes must not exceed 5000" /> | |
167 | |
168 <param name="fine" type="boolean" checked="false" label="Refine search for small initial and terminal exons (-fine)" help="For high-quality mRNAs. Not recommended for ESTs" /> | |
169 <param name="maxIntron" type="integer" value="750000" optional="true" label="Maximum intron size (-maxIntron)" /> | |
170 <param name="extendThroughN" type="boolean" checked="false" label="Allow extension of alignment through large blocks of N's (-extendThroughN)" /> | |
171 <param name="out" type="select" label="Select output file format (-out)"> | |
172 <option value="psl">Tab-separated format, no sequence (psl)</option> | |
173 <option value="psl -noHead">Tab-separated format, no sequence, no header (psl -noHead)</option> | |
174 <option value="pslx">Tab-separated format with sequence (pslx)</option> | |
175 <option value="pslx -noHead">Tab-separated format with sequence, no header (pslx -noHead)</option> | |
176 <option value="axt">Blastz-associated axt format (axt)</option> | |
177 <option value="maf">Multiz-associated maf format (maf)</option> | |
178 <option value="sim4">Similar to sim4 format (sim4)</option> | |
179 <option value="wublast">Similar to WU-BLAST format (wublast)</option> | |
180 <option value="blast">Similar to NCBI BLAST format (blast)</option> | |
181 <option value="blast8">NCBI BLAST tabular format (blast8)</option> | |
182 <option value="blast9">NCBI BLAST tabular format with comments (blast9)</option> | |
183 </param> | |
184 </inputs> | |
185 | |
186 <outputs> | |
187 <data name="logfile" format="txt" label="${tool.name} on ${on_string}: log" /> | |
188 <data name="output" format="txt" label="${tool.name} on ${on_string}: alignment"> | |
189 <change_format> | |
190 <when input="out" value="psl -noHead" format="tabular" /> | |
191 <when input="out" value="pslx -noHead" format="tabular" /> | |
192 <when input="out" value="axt" format="axt" /> | |
193 <when input="out" value="maf" format="maf" /> | |
194 <when input="out" value="blast8" format="tabular" /> | |
195 </change_format> | |
196 </data> | |
197 </outputs> | |
198 | |
199 <tests> | |
200 </tests> | |
201 <help> | |
202 **What it does** | |
203 | |
204 BLAT produces two major classes of alignments: | |
205 | |
206 - at the DNA level between two sequences that are of 95% or greater identity, but which may include large inserts; | |
207 - at the protein or translated DNA level between sequences that are of 80% or greater identity and may also include large inserts. | |
208 | |
209 The output of BLAT is flexible. By default it is a simple tab-delimited file which describes the alignment, but which does not include the sequence of the alignment itself. Optionally it can produce BLAST and WU-BLAST compatible output as well as a number of other formats. | |
210 | |
211 **License and citation** | |
212 | |
213 This Galaxy tool is Copyright © 2013 `CRS4 Srl.`_ and is released under the `MIT license`_. | |
214 | |
215 .. _CRS4 Srl.: http://www.crs4.it/ | |
216 .. _MIT license: http://opensource.org/licenses/MIT | |
217 | |
218 If you use this tool in Galaxy, please cite |Cuccuru2013|_. | |
219 | |
220 .. |Cuccuru2013| replace:: Cuccuru, G., Orsini, M., Pinna, A., Sbardellati, A., Soranzo, N., Travaglione, A., Uva, P., Zanetti, G., Fotia, G. (2013) Orione, a web-based framework for NGS analysis in microbiology. *Submitted* | |
221 .. _Cuccuru2013: http://orione.crs4.it/ | |
222 | |
223 This tool uses `BLAT`_, which is licensed separately. Please cite |Kent2002|_. | |
224 | |
225 .. _BLAT: http://genome.ucsc.edu/FAQ/FAQblat.html | |
226 .. |Kent2002| replace:: Kent, W. J. (2002) BLAT – The BLAST-Like Alignment Tool. *Genome Res.* 12(4), 656-664 | |
227 .. _Kent2002: http://genome.cshlp.org/content/12/4/656 | |
228 </help> | |
229 </tool> |