comparison blat.xml @ 6:250a7f2b1331 draft

planemo upload commit 630d4a316c3b72b0d92b32e8b37303d247a41190
author iuc
date Thu, 31 May 2018 11:25:53 -0400
parents dede60f744f4
children 10f3a5b6f2ac
comparison
equal deleted inserted replaced
5:dede60f744f4 6:250a7f2b1331
1 <?xml version="1.0"?> 1 <?xml version="1.0"?>
2 <tool id="ucsc_blat" name="UCSC BLAT Alignment Tool" version="35-0"> 2 <tool id="ucsc_blat" name="UCSC BLAT Alignment Tool" version="36">
3 <description>BLAST-like sequence alignment tool</description> 3 <description>BLAST-like sequence alignment tool</description>
4 <requirements> 4 <requirements>
5 <requirement type="package" version="35">blat</requirement> 5 <requirement type="package" version="36">blat</requirement>
6 </requirements> 6 </requirements>
7 <command detect_errors="exit_code"><![CDATA[ 7 <command detect_errors="exit_code"><![CDATA[
8 #if str($reference_source.reference_source_selector) == "history": 8 #if str($reference_source.reference_source_selector) == "history":
9 ## blat depends on file extension 9 ## blat depends on file extension
10 #if $reference_source.database.is_of_type("fasta"): 10 #if $reference_source.database.is_of_type("fasta"):
18 ln -s '${reference_source.database}' '${reference_fasta_filename}' && 18 ln -s '${reference_source.database}' '${reference_fasta_filename}' &&
19 #else: 19 #else:
20 #set $reference_fasta_filename = str($reference_source.database.fields.path) 20 #set $reference_fasta_filename = str($reference_source.database.fields.path)
21 #end if 21 #end if
22 22
23 blat 23 blat
24 #if $noHead == "yes"
25 -noHead
26 #end if
27 24
28 -q=$query_type 25 -q=$query_type
29 -t=$database_type 26 -t=$database_type
27
28 ${oneOff}
29
30 #if str($minScore)
31 -minScore=${minScore}
32 #end if
33
34 -maxGap=${maxGap}
35
36 #if str($repMatch)
37 -repMatch=${repMatch}
38 #end if
30 39
31 #if $mask_type.mask == "file.out": 40 #if $mask_type.mask == "file.out":
32 -mask='${mask_type.mask_file}' 41 -mask='${mask_type.mask_file}'
33 #else: 42 #else:
34 -mask=$mask_type.mask 43 -mask=$mask_type.mask
35 #end if 44 #end if
36 45
46 #if str($dots)
47 -dots=${dots}
48 #end if
49
50 ${trimT}
51 ${noTrimA}
52 ${trimHardA}
53 ${fastMap}
54 ${fine}
55
56 #if str($maxIntron)
57 -maxIntron=${maxIntron}
58 #end if
59
60 ${extendThroughN}
61
37 '$reference_fasta_filename' 62 '$reference_fasta_filename'
38 '${query}' 63 '${query}'
39 64
40 output 65 -out=${out}
41 && sort -k 10,10 -k 12,12n output > '${output_sorted}' 66
67 '${output}'
42 ]]></command> 68 ]]></command>
43 <inputs> 69 <inputs>
44 <conditional name="reference_source"> 70 <conditional name="reference_source">
45 <param name="reference_source_selector" type="select" label="Choose the source for the database"> 71 <param name="reference_source_selector" type="select" label="Choose the source for the database">
46 <option value="cached">Locally cached</option> 72 <option value="cached">Locally cached</option>
69 <option value="rna">rna - RNA sequence</option> 95 <option value="rna">rna - RNA sequence</option>
70 <option value="prot">prot - protein sequence</option> 96 <option value="prot">prot - protein sequence</option>
71 <option value="dnax">dnax - DNA sequence translated in six frames to protein</option> 97 <option value="dnax">dnax - DNA sequence translated in six frames to protein</option>
72 <option value="rnax" selected="true">rnax - DNA sequence translated in three frames to protein</option> 98 <option value="rnax" selected="true">rnax - DNA sequence translated in three frames to protein</option>
73 </param> 99 </param>
74 <param type="select" name="noHead" format="text" label="Suppresses .psl header (so it's just a tab-separated file)." > 100 <param argument="-oneOff" type="boolean" truevalue="-oneOff=1" falsevalue="" label="If set, this allows one mismatch in tile and still triggers an alignments" />
75 <option value="yes" selected="true">Yes, suppresses .psl header</option> 101 <param argument="-minScore" type="integer" value="30" label="Minimum score" help="It is the matches minus the mismatches minus some sort of gap penalty" />
76 <option value="no">No, do not suppresses .psl header</option> 102 <param argument="-maxGap" type="integer" value="2" min="0" max="3" label="Maximum gap between tiles in a clump" help="Usually set from 0 to 3. Only relevant for minMatch > 1" />
77 </param> 103 <param argument="-repMatch" type="integer" value="" optional="true" label="Number of repetitions of a tile allowed before it is marked as overused" help="Typically this is 256 for tileSize 12, 1024 for tileSize 11, 4096 for tileSize 10. Also affected by stepSize. When stepSize is halved repMatch is doubled to compensate" />
78 <conditional name="mask_type"> 104 <conditional name="mask_type">
79 <param name="mask" type="select" label="Mask out repeats" help="Alignments won't be started in masked region 105 <param name="mask" type="select" label="Mask out repeats" help="Alignments won't be started in masked region
80 but may extend through it in nucleotide searches. Masked areas 106 but may extend through it in nucleotide searches. Masked areas
81 are ignored entirely in protein or translated searches. Default is lower" argument="-mask"> 107 are ignored entirely in protein or translated searches. Default is lower" argument="-mask">
82 <option value="lower" selected="true">lower - mask out lower-cased sequence</option> 108 <option value="lower" selected="true">lower - mask out lower-cased sequence</option>
87 <when value="lower" /> 113 <when value="lower" />
88 <when value="upper" /> 114 <when value="upper" />
89 <when value="out" /> 115 <when value="out" />
90 <when value="file.out"> 116 <when value="file.out">
91 <param name="mask_file" type="data" format="txt" label="RepeatMasker file.out" /> 117 <param name="mask_file" type="data" format="txt" label="RepeatMasker file.out" />
92 </when> 118 </when>
93 </conditional> 119 </conditional>
120 <param argument="-dots" type="integer" value="" optional="true" label="Output a dot every N sequences in log" help="Dots show program's progress" />
121 <param argument="-trimT" type="boolean" truevalue="-trimT" falsevalue="" label="Trim leading poly-T" />
122 <param argument="-noTrimA" type="boolean" truevalue="-noTrimA" falsevalue="" label="Don't trim trailing poly-A" />
123 <param argument="-trimHardA" type="boolean" truevalue="-trimHardA" falsevalue="" label="Remove poly-A tail from qSize and alignments in .psl output" />
124 <param argument="-fastMap" type="boolean" truevalue="-fastMap" falsevalue="" label="Run for fast DNA/DNA remapping" help="It does not allow introns and require high %ID. Query sizes must not exceed 5000" />
125 <param argument="-fine" type="boolean" truevalue="-fine" falsevalue="" label="Refine search for small initial and terminal exons" help="For high-quality mRNAs. Not recommended for ESTs" />
126 <param argument="-maxIntron" type="integer" value="750000" optional="true" label="Maximum intron size" />
127 <param argument="-extendThroughN" type="boolean" truevalue="-extendThroughN" falsevalue="" label="Allow extension of alignment through large blocks of N's" />
128 <param name="out" type="select" label="Select output file format (-out)">
129 <option value="psl">Tab-separated format, no sequence (psl)</option>
130 <option value="psl -noHead">Tab-separated format, no sequence, no header (psl -noHead)</option>
131 <option value="axt">Blastz-associated axt format (axt)</option>
132 <option value="maf">Multiz-associated maf format (maf)</option>
133 <option value="sim4">Similar to sim4 format (sim4)</option>
134 <option value="wublast">Similar to WU-BLAST format (wublast)</option>
135 <option value="blast">Similar to NCBI BLAST format (blast)</option>
136 <option value="blast8">NCBI BLAST tabular format (blast8)</option>
137 <option value="blast9">NCBI BLAST tabular format with comments (blast9)</option>
138 </param>
94 </inputs> 139 </inputs>
95 <outputs> 140 <outputs>
96 <data format="psl" name="output_sorted" label="${tool.name} on ${on_string}"></data> 141 <data name="output" format="tabular" label="${tool.name} on ${on_string}">
142 <change_format>
143 <when input="out" value="psl" format="psl" />
144 <when input="out" value="axt" format="axt" />
145 <when input="out" value="maf" format="maf" />
146 <when input="out" value="sim4" format="txt" />
147 <when input="out" value="wublast" format="txt" />
148 <when input="out" value="blast" format="txt" />
149 </change_format>
150 </data>
97 </outputs> 151 </outputs>
98 <tests> 152 <tests>
99 <!-- test on query of GenBank RefSeq records for Gallus gallus and database of Amazona vittata --> 153 <!-- test on query of GenBank RefSeq records for Gallus gallus and database of Amazona vittata -->
100 <test> 154 <test>
101 <param name="reference_source_selector" value="history" /> 155 <param name="reference_source_selector" value="history" />
102 <param name="database" value="amaVit1_Gallus/amaVit1.fa" /> 156 <param name="database" value="amaVit1_Gallus/amaVit1.fa" />
103 <param name="query" value="amaVit1_Gallus/Gallus_gallus_RefSeq.fa" /> 157 <param name="query" value="amaVit1_Gallus/Gallus_gallus_RefSeq.fa" />
104 <param name="database_type" value="dnax" /> 158 <param name="database_type" value="dnax" />
105 <param name="query_type" value="rnax" /> 159 <param name="query_type" value="rnax" />
106 <param name="noHead" value="yes" />
107 <param name="mask" value="lower" /> 160 <param name="mask" value="lower" />
108 <output name="output_sorted" value="amaVit1_Gallus/amaVit1_Gallus_gallus.psl" /> 161 <param name="out" value="psl -noHead" />
162 <output name="output" value="amaVit1_Gallus/amaVit1_Gallus_gallus_sorted.psl" sort="True"/>
109 </test> 163 </test>
110 <!-- test on query of partial mRNA of Drosophila melanogaster and the database of Drosophila biamipes dot chromosome --> 164 <!-- test on query of partial mRNA of Drosophila melanogaster and the database of Drosophila biamipes dot chromosome -->
111 <test> 165 <test>
112 <param name="reference_source_selector" value="history" /> 166 <param name="reference_source_selector" value="history" />
113 <param name="database" value="dbia3/dbia3.fa" /> 167 <param name="database" value="dbia3/dbia3.fa" />
114 <param name="query" value="dbia3/dmel-transcript.fa" /> 168 <param name="query" value="dbia3/dmel-transcript.fa" />
115 <param name="database_type" value="dnax" /> 169 <param name="database_type" value="dnax" />
116 <param name="query_type" value="rnax" /> 170 <param name="query_type" value="rnax" />
117 <param name="noHead" value="yes" />
118 <param name="mask" value="lower" /> 171 <param name="mask" value="lower" />
119 <output name="output_sorted" value="dbia3/dbia3.sorted.psl" /> 172 <param name="out" value="psl -noHead" />
173 <param name="maxIntron" value="" />
174 <output name="output" value="dbia3/dbia3.sorted.psl" sort="True"/>
120 </test> 175 </test>
121 <!-- test on the database masked by repeat masker --> 176 <!-- test on the database masked by repeat masker -->
122 <test> 177 <test>
123 <param name="reference_source_selector" value="history" /> 178 <param name="reference_source_selector" value="history" />
124 <param name="database" value="dbia3/dbia3_masked.2bit" /> 179 <param name="database" value="dbia3/dbia3_masked.2bit" />
125 <param name="query" value="dbia3/dmel-transcript.fa" /> 180 <param name="query" value="dbia3/dmel-transcript.fa" />
126 <param name="database_type" value="dnax" /> 181 <param name="database_type" value="dnax" />
127 <param name="query_type" value="rnax" /> 182 <param name="query_type" value="rnax" />
128 <param name="noHead" value="yes" /> 183 <param name="oneOff" value="false" />
184 <param name="minScore" value="30" />
185 <param name="maxGap" value="2" />
186 <param name="trimT" value="false" />
187 <param name="noTrimA" value="false" />
188 <param name="fine" value="false" />
189 <param name="maxIntron" value="750000" />
190 <param name="extendThroughN" value="false" />
129 <param name="mask" value="file.out" /> 191 <param name="mask" value="file.out" />
130 <param name="mask_file" value="dbia3/dbia3_RM.out" /> 192 <param name="mask_file" value="dbia3/dbia3_RM.out" />
131 <output name="output_sorted" value="dbia3/dbia3_masked.sorted.psl" /> 193 <param name="out" value="psl -noHead" />
194 <output name="output" value="dbia3/dbia3_masked.sorted.psl"/>
132 </test> 195 </test>
133 196
134 </tests> 197 </tests>
135 <help> 198 <help>
136 <![CDATA[ 199 <![CDATA[
137 BLAT 200 BLAT
138 ==== 201 ====
139 BLAT is a bioinformatics software a tool which performs rapid mRNA/DNA and cross-species protein alignments. 202 BLAT is a bioinformatics software a tool which performs rapid mRNA/DNA and cross-species protein alignments.
140 203
141 blat (version: v340)- Standalone blat sequence search command line tool. 204 blat (version: v36)- Standalone blat sequence search command line tool.
142 ------------------------------------------------------------------------- 205 -------------------------------------------------------------------------
143 206
144 usage: 207 usage:
145 ++++++ 208 ++++++
146 209
150 database and query are each either a .fa, .nib or .2bit file, 213 database and query are each either a .fa, .nib or .2bit file,
151 or a list of these files with one file name per line. 214 or a list of these files with one file name per line.
152 -ooc=11.ooc tells the program to load over-occurring 11-mers from 215 -ooc=11.ooc tells the program to load over-occurring 11-mers from
153 an external file. This will increase the speed 216 an external file. This will increase the speed
154 by a factor of 40 in many cases, but is not required. 217 by a factor of 40 in many cases, but is not required.
155 output.psl is the name of the output file. 218 output.psl is the name of the output file.
156 219
157 documentation: 220 documentation:
158 ++++++++++++++ 221 ++++++++++++++
159 222
160 See Blat documentation (http://genome.ucsc.edu/goldenPath/help/blatSpec.html) 223 See Blat documentation (http://genome.ucsc.edu/goldenPath/help/blatSpec.html)
161 224
162 Source code: 225 Source code:
163 ++++++++++++ 226 ++++++++++++
164 227
165 http://hgdownload.cse.ucsc.edu/admin/exe/ 228 http://hgdownload.cse.ucsc.edu/admin/exe/
166 229
167 ]]></help> 230 ]]></help>
168 <citations> 231 <citations>
169 <citation type="doi">10.1101/gr.229202</citation> 232 <citation type="doi">10.1101/gr.229202</citation>
170 </citations> 233 </citations>
171 </tool> 234 </tool>
172
173
174
175
176