comparison blat.xml @ 7:10f3a5b6f2ac draft

planemo upload commit 964ceec6b1c6371b10923c7d49446b1361fc5895-dirty
author yating-l
date Mon, 09 Jul 2018 13:07:54 -0400
parents 250a7f2b1331
children a9d863528f48
comparison
equal deleted inserted replaced
6:250a7f2b1331 7:10f3a5b6f2ac
1 <?xml version="1.0"?> 1 <?xml version="1.0"?>
2 <tool id="ucsc_blat" name="UCSC BLAT Alignment Tool" version="36"> 2 <tool id="ucsc_blat" name="UCSC BLAT Alignment Tool" version="1.1">
3 <description>BLAST-like sequence alignment tool</description> 3 <description>Standalone blat sequence search command line tool</description>
4 <requirements> 4 <requirements>
5 <requirement type="package" version="36">blat</requirement> 5 <requirement type="package" version="1.0">ucsc_tools_340_for_BLAT</requirement>
6 </requirements> 6 </requirements>
7 <command detect_errors="exit_code"><![CDATA[ 7 <command detect_errors="exit_code"><![CDATA[
8 #if str($reference_source.reference_source_selector) == "history": 8 #if str($reference_source.reference_source_selector) == "history":
9 ## blat depends on file extension 9 #set $reference_fasta_filename = "localref.fa"
10 #if $reference_source.database.is_of_type("fasta"):
11 #set $reference_fasta_filename = "localref.fa"
12 #elif $reference_source.database.is_of_type("twobit"):
13 #set $reference_fasta_filename = "localref.2bit"
14 #else
15 #set $reference_fasta_filename = "localref"
16 #end if
17
18 ln -s '${reference_source.database}' '${reference_fasta_filename}' && 10 ln -s '${reference_source.database}' '${reference_fasta_filename}' &&
19 #else: 11 #else:
20 #set $reference_fasta_filename = str($reference_source.database.fields.path) 12 #set $reference_fasta_filename = str($reference_source.database.fields.path)
21 #end if 13 #end if
22 14 blat
23 blat 15 #if $noHead == "yes"
24 16 -noHead
17 #end if
25 -q=$query_type 18 -q=$query_type
26 -t=$database_type 19 -t=$database_type
27
28 ${oneOff}
29
30 #if str($minScore)
31 -minScore=${minScore}
32 #end if
33
34 -maxGap=${maxGap}
35
36 #if str($repMatch)
37 -repMatch=${repMatch}
38 #end if
39
40 #if $mask_type.mask == "file.out": 20 #if $mask_type.mask == "file.out":
41 -mask='${mask_type.mask_file}' 21 -mask=$mask_type.mask_file
42 #else: 22 #else:
43 -mask=$mask_type.mask 23 -mask=$mask_type.mask
44 #end if 24 #end if
45
46 #if str($dots)
47 -dots=${dots}
48 #end if
49
50 ${trimT}
51 ${noTrimA}
52 ${trimHardA}
53 ${fastMap}
54 ${fine}
55
56 #if str($maxIntron)
57 -maxIntron=${maxIntron}
58 #end if
59
60 ${extendThroughN}
61
62 '$reference_fasta_filename' 25 '$reference_fasta_filename'
63 '${query}' 26 '${query}'
64 27 output
65 -out=${out} 28 && sort -k 10,10 -k 12,12n output > '${output_sorted}'
66
67 '${output}'
68 ]]></command> 29 ]]></command>
69 <inputs> 30 <inputs>
70 <conditional name="reference_source"> 31 <conditional name="reference_source">
71 <param name="reference_source_selector" type="select" label="Choose the source for the database"> 32 <param name="reference_source_selector" type="select" label="Choose the source for the database">
72 <option value="cached">Locally cached</option> 33 <option value="cached">Locally cached</option>
79 </options> 40 </options>
80 <validator type="no_options" message="A built-in database is not available" /> 41 <validator type="no_options" message="A built-in database is not available" />
81 </param> 42 </param>
82 </when> 43 </when>
83 <when value="history"> 44 <when value="history">
84 <param name="database" type="data" format="fasta, twobit" label="Using database file, either a .fa, .nib or .2bit file" /> 45 <param name="database" type="data" format="fasta,twobit" label="Using database file, either a .fa, .nib or .2bit file" />
85 </when> 46 </when>
86 </conditional> 47 </conditional>
87 <param type="data" name="query" format="fasta, twobit" label="Query data, either a .fa, .nib or .2bit file"/> 48 <param type="data" name="query" format="fasta,twobit" label="Query data, either a .fa, .nib or .2bit file"/>
88 <param type="select" name="database_type" format="text" multiple="false" label="database type" help="Choose your database type, the default is dnax" argument="-t"> 49 <param type="select" name="database_type" format="text" multiple="false" label="database type" help="Choose your database type, the default is dnax" argument="-t">
89 <option value="dna">dna - DNA sequence</option> 50 <option value="dna">dna - DNA sequence</option>
90 <option value="prot">prot - protein sequence</option> 51 <option value="prot">prot - protein sequence</option>
91 <option value="dnax" selected="true">dnax - DNA sequence translated in six frames to protein</option> 52 <option value="dnax" selected="true">dnax - DNA sequence translated in six frames to protein</option>
92 </param> 53 </param>
95 <option value="rna">rna - RNA sequence</option> 56 <option value="rna">rna - RNA sequence</option>
96 <option value="prot">prot - protein sequence</option> 57 <option value="prot">prot - protein sequence</option>
97 <option value="dnax">dnax - DNA sequence translated in six frames to protein</option> 58 <option value="dnax">dnax - DNA sequence translated in six frames to protein</option>
98 <option value="rnax" selected="true">rnax - DNA sequence translated in three frames to protein</option> 59 <option value="rnax" selected="true">rnax - DNA sequence translated in three frames to protein</option>
99 </param> 60 </param>
100 <param argument="-oneOff" type="boolean" truevalue="-oneOff=1" falsevalue="" label="If set, this allows one mismatch in tile and still triggers an alignments" /> 61 <param type="select" name="noHead" format="text" label="Suppresses .psl header (so it's just a tab-separated file)." >
101 <param argument="-minScore" type="integer" value="30" label="Minimum score" help="It is the matches minus the mismatches minus some sort of gap penalty" /> 62 <option value="yes" selected="true">Yes, suppresses .psl header</option>
102 <param argument="-maxGap" type="integer" value="2" min="0" max="3" label="Maximum gap between tiles in a clump" help="Usually set from 0 to 3. Only relevant for minMatch > 1" /> 63 <option value="no">No, do not suppresses .psl header</option>
103 <param argument="-repMatch" type="integer" value="" optional="true" label="Number of repetitions of a tile allowed before it is marked as overused" help="Typically this is 256 for tileSize 12, 1024 for tileSize 11, 4096 for tileSize 10. Also affected by stepSize. When stepSize is halved repMatch is doubled to compensate" /> 64 </param>
104 <conditional name="mask_type"> 65 <conditional name="mask_type">
105 <param name="mask" type="select" label="Mask out repeats" help="Alignments won't be started in masked region 66 <param name="mask" type="select" label="Mask out repeats" help="Alignments won't be started in masked region
106 but may extend through it in nucleotide searches. Masked areas 67 but may extend through it in nucleotide searches. Masked areas
107 are ignored entirely in protein or translated searches. Default is lower" argument="-mask"> 68 are ignored entirely in protein or translated searches. Default is lower" argument="-mask">
108 <option value="lower" selected="true">lower - mask out lower-cased sequence</option> 69 <option value="lower" selected="true">lower - mask out lower-cased sequence</option>
113 <when value="lower" /> 74 <when value="lower" />
114 <when value="upper" /> 75 <when value="upper" />
115 <when value="out" /> 76 <when value="out" />
116 <when value="file.out"> 77 <when value="file.out">
117 <param name="mask_file" type="data" format="txt" label="RepeatMasker file.out" /> 78 <param name="mask_file" type="data" format="txt" label="RepeatMasker file.out" />
118 </when> 79 </when>
119 </conditional> 80 </conditional>
120 <param argument="-dots" type="integer" value="" optional="true" label="Output a dot every N sequences in log" help="Dots show program's progress" />
121 <param argument="-trimT" type="boolean" truevalue="-trimT" falsevalue="" label="Trim leading poly-T" />
122 <param argument="-noTrimA" type="boolean" truevalue="-noTrimA" falsevalue="" label="Don't trim trailing poly-A" />
123 <param argument="-trimHardA" type="boolean" truevalue="-trimHardA" falsevalue="" label="Remove poly-A tail from qSize and alignments in .psl output" />
124 <param argument="-fastMap" type="boolean" truevalue="-fastMap" falsevalue="" label="Run for fast DNA/DNA remapping" help="It does not allow introns and require high %ID. Query sizes must not exceed 5000" />
125 <param argument="-fine" type="boolean" truevalue="-fine" falsevalue="" label="Refine search for small initial and terminal exons" help="For high-quality mRNAs. Not recommended for ESTs" />
126 <param argument="-maxIntron" type="integer" value="750000" optional="true" label="Maximum intron size" />
127 <param argument="-extendThroughN" type="boolean" truevalue="-extendThroughN" falsevalue="" label="Allow extension of alignment through large blocks of N's" />
128 <param name="out" type="select" label="Select output file format (-out)">
129 <option value="psl">Tab-separated format, no sequence (psl)</option>
130 <option value="psl -noHead">Tab-separated format, no sequence, no header (psl -noHead)</option>
131 <option value="axt">Blastz-associated axt format (axt)</option>
132 <option value="maf">Multiz-associated maf format (maf)</option>
133 <option value="sim4">Similar to sim4 format (sim4)</option>
134 <option value="wublast">Similar to WU-BLAST format (wublast)</option>
135 <option value="blast">Similar to NCBI BLAST format (blast)</option>
136 <option value="blast8">NCBI BLAST tabular format (blast8)</option>
137 <option value="blast9">NCBI BLAST tabular format with comments (blast9)</option>
138 </param>
139 </inputs> 81 </inputs>
140 <outputs> 82 <outputs>
141 <data name="output" format="tabular" label="${tool.name} on ${on_string}"> 83 <data format="psl" name="output_sorted" label="${tool.name} on ${on_string}"></data>
142 <change_format>
143 <when input="out" value="psl" format="psl" />
144 <when input="out" value="axt" format="axt" />
145 <when input="out" value="maf" format="maf" />
146 <when input="out" value="sim4" format="txt" />
147 <when input="out" value="wublast" format="txt" />
148 <when input="out" value="blast" format="txt" />
149 </change_format>
150 </data>
151 </outputs> 84 </outputs>
152 <tests> 85 <tests>
153 <!-- test on query of GenBank RefSeq records for Gallus gallus and database of Amazona vittata --> 86 <!-- test on query of GenBank RefSeq records for Gallus gallus and database of Amazona vittata -->
154 <test> 87 <test>
155 <param name="reference_source_selector" value="history" /> 88 <param name="reference_source_selector" value="history" />
156 <param name="database" value="amaVit1_Gallus/amaVit1.fa" /> 89 <param name="database" value="amaVit1_Gallus/amaVit1.fa" />
157 <param name="query" value="amaVit1_Gallus/Gallus_gallus_RefSeq.fa" /> 90 <param name="query" value="amaVit1_Gallus/Gallus_gallus_RefSeq.fa" />
158 <param name="database_type" value="dnax" /> 91 <param name="database_type" value="dnax" />
159 <param name="query_type" value="rnax" /> 92 <param name="query_type" value="rnax" />
93 <param name="noHead" value="yes" />
160 <param name="mask" value="lower" /> 94 <param name="mask" value="lower" />
161 <param name="out" value="psl -noHead" /> 95 <output name="output_sorted" value="amaVit1_Gallus/amaVit1_Gallus_gallus.psl" />
162 <output name="output" value="amaVit1_Gallus/amaVit1_Gallus_gallus_sorted.psl" sort="True"/>
163 </test> 96 </test>
164 <!-- test on query of partial mRNA of Drosophila melanogaster and the database of Drosophila biamipes dot chromosome --> 97 <!-- test on query of partial mRNA of Drosophila melanogaster and the database of Drosophila biamipes dot chromosome -->
165 <test> 98 <test>
166 <param name="reference_source_selector" value="history" /> 99 <param name="reference_source_selector" value="history" />
167 <param name="database" value="dbia3/dbia3.fa" /> 100 <param name="database" value="dbia3/dbia3.fa" />
168 <param name="query" value="dbia3/dmel-transcript.fa" /> 101 <param name="query" value="dbia3/dmel-transcript.fa" />
169 <param name="database_type" value="dnax" /> 102 <param name="database_type" value="dnax" />
170 <param name="query_type" value="rnax" /> 103 <param name="query_type" value="rnax" />
104 <param name="noHead" value="yes" />
171 <param name="mask" value="lower" /> 105 <param name="mask" value="lower" />
172 <param name="out" value="psl -noHead" /> 106 <output name="output_sorted" value="dbia3/dbia3.sorted.psl" />
173 <param name="maxIntron" value="" />
174 <output name="output" value="dbia3/dbia3.sorted.psl" sort="True"/>
175 </test> 107 </test>
176 <!-- test on the database masked by repeat masker --> 108 <!-- test on the database masked by repeat masker -->
177 <test> 109 <test>
178 <param name="reference_source_selector" value="history" /> 110 <param name="reference_source_selector" value="history" />
179 <param name="database" value="dbia3/dbia3_masked.2bit" /> 111 <param name="database" value="dbia3/dbia3_masked.2bit" />
180 <param name="query" value="dbia3/dmel-transcript.fa" /> 112 <param name="query" value="dbia3/dmel-transcript.fa" />
181 <param name="database_type" value="dnax" /> 113 <param name="database_type" value="dnax" />
182 <param name="query_type" value="rnax" /> 114 <param name="query_type" value="rnax" />
183 <param name="oneOff" value="false" /> 115 <param name="noHead" value="yes" />
184 <param name="minScore" value="30" />
185 <param name="maxGap" value="2" />
186 <param name="trimT" value="false" />
187 <param name="noTrimA" value="false" />
188 <param name="fine" value="false" />
189 <param name="maxIntron" value="750000" />
190 <param name="extendThroughN" value="false" />
191 <param name="mask" value="file.out" /> 116 <param name="mask" value="file.out" />
192 <param name="mask_file" value="dbia3/dbia3_RM.out" /> 117 <param name="mask_file" value="dbia3/dbia3_RM.out" />
193 <param name="out" value="psl -noHead" /> 118 <output name="output_sorted" value="dbia3/dbia3_masked.sorted.psl" />
194 <output name="output" value="dbia3/dbia3_masked.sorted.psl"/>
195 </test> 119 </test>
196 120
197 </tests> 121 </tests>
198 <help> 122 <help>
199 <![CDATA[ 123 <![CDATA[
200 BLAT 124 BLAT
201 ==== 125 ====
202 BLAT is a bioinformatics software a tool which performs rapid mRNA/DNA and cross-species protein alignments. 126 BLAT is a bioinformatics software a tool which performs rapid mRNA/DNA and cross-species protein alignments.
203 127
204 blat (version: v36)- Standalone blat sequence search command line tool. 128 blat (version: v340)- Standalone blat sequence search command line tool.
205 ------------------------------------------------------------------------- 129 -------------------------------------------------------------------------
206 130
207 usage: 131 usage:
208 ++++++ 132 ++++++
209 133
213 database and query are each either a .fa, .nib or .2bit file, 137 database and query are each either a .fa, .nib or .2bit file,
214 or a list of these files with one file name per line. 138 or a list of these files with one file name per line.
215 -ooc=11.ooc tells the program to load over-occurring 11-mers from 139 -ooc=11.ooc tells the program to load over-occurring 11-mers from
216 an external file. This will increase the speed 140 an external file. This will increase the speed
217 by a factor of 40 in many cases, but is not required. 141 by a factor of 40 in many cases, but is not required.
218 output.psl is the name of the output file. 142 output.psl is the name of the output file.
219 143
220 documentation: 144 documentation:
221 ++++++++++++++ 145 ++++++++++++++
222 146
223 See Blat documentation (http://genome.ucsc.edu/goldenPath/help/blatSpec.html) 147 See Blat documentation (http://genome.ucsc.edu/goldenPath/help/blatSpec.html)
224 148
225 Source code: 149 Source code:
226 ++++++++++++ 150 ++++++++++++
227 151
228 http://hgdownload.cse.ucsc.edu/admin/exe/ 152 http://hgdownload.cse.ucsc.edu/admin/exe/
229 153
230 ]]></help> 154 ]]></help>
231 <citations> 155 <citations>
232 <citation type="doi">10.1101/gr.229202</citation> 156 <citation type="doi">10.1101/gr.229202</citation>
233 </citations> 157 </citations>
234 </tool> 158 </tool>
159
160
161
162
163