comparison blat.xml @ 10:c449963debd5 draft

planemo upload commit c5f669e334bf65c1158855bd1eef88df78a8028c
author iuc
date Mon, 21 Nov 2022 11:12:14 +0000
parents a9d863528f48
children 2a89f630fa85
comparison
equal deleted inserted replaced
9:a9d863528f48 10:c449963debd5
1 <?xml version="1.0"?> 1 <tool id="ucsc_blat" name="UCSC BLAT Alignment Tool" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@">
2 <tool id="ucsc_blat" name="UCSC BLAT Alignment Tool" version="1.2"> 2 <description>BLAST-like sequence alignment tool</description>
3 <description>Standalone blat sequence search command line tool</description> 3 <macros>
4 <token name="@TOOL_VERSION@">377</token>
5 <token name="@VERSION_SUFFIX@">0</token>
6 </macros>
7 <xrefs>
8 <xref type="bio.tools">blat</xref>
9 </xrefs>
4 <requirements> 10 <requirements>
5 <requirement type="package" version="1.0">ucsc_tools_340_for_BLAT</requirement> 11 <requirement type="package" version="@TOOL_VERSION@">ucsc-blat</requirement>
6 </requirements> 12 </requirements>
7 <command detect_errors="exit_code"><![CDATA[ 13 <command detect_errors="exit_code"><![CDATA[
8 #if str($reference_source.reference_source_selector) == "history": 14 #if str($reference_source.reference_source_selector) == "history":
9 #set $reference_fasta_filename = "localref.fa" 15 ## blat depends on file extension
10 ln -s '${reference_source.database}' '${reference_fasta_filename}' && 16 #if $reference_source.database.is_of_type("fasta"):
11 #else: 17 #set $reference_fasta_filename = "localref.fa"
12 #set $reference_fasta_filename = str($reference_source.database.fields.path) 18 #elif $reference_source.database.is_of_type("twobit"):
13 #end if 19 #set $reference_fasta_filename = "localref.2bit"
14 blat 20 #else
15 #if $noHead == "yes" 21 #set $reference_fasta_filename = "localref"
16 -noHead 22 #end if
17 #end if 23 ln -s '$reference_source.database' '$reference_fasta_filename' &&
18 -q=$query_type 24 #else:
19 -t=$database_type 25 #set $reference_fasta_filename = str($reference_source.database.fields.path)
20 #if $mask_type.mask == "file.out": 26 #end if
21 -mask=$mask_type.mask_file 27
22 #else: 28 blat
23 -mask=$mask_type.mask 29 -q=$query_type
24 #end if 30 -t=$database_type
25 '$reference_fasta_filename' 31 $oneOff
26 '${query}' 32 #if str($minScore)
27 output 33 -minScore=$minScore
28 && sort -k 10,10 -k 12,12n output > '${output_sorted}' 34 #end if
29 ]]></command> 35 -maxGap=$maxGap
30 <inputs> 36 #if str($repMatch)
31 <conditional name="reference_source"> 37 -repMatch=$repMatch
32 <param name="reference_source_selector" type="select" label="Choose the source for the database"> 38 #end if
33 <option value="cached">Locally cached</option> 39 #if $mask_type.mask == "file.out":
34 <option value="history">History</option> 40 -mask='$mask_type.mask_file'
35 </param> 41 #else:
36 <when value="cached"> 42 -mask=$mask_type.mask
37 <param name="database" type="select" label="Select database"> 43 #end if
38 <options from_data_table="all_fasta"> 44 #if str($dots)
39 <filter type="sort_by" column="2" /> 45 -dots=$dots
40 </options> 46 #end if
41 <validator type="no_options" message="A built-in database is not available" /> 47 $trimT
42 </param> 48 $noTrimA
43 </when> 49 $trimHardA
44 <when value="history"> 50 $fastMap
45 <param name="database" type="data" format="fasta,twobit" label="Using database file, either a .fa, .nib or .2bit file" /> 51 $fine
46 </when> 52 #if str($maxIntron)
47 </conditional> 53 -maxIntron=$maxIntron
48 <param type="data" name="query" format="fasta,twobit" label="Query data, either a .fa, .nib or .2bit file"/> 54 #end if
49 <param type="select" name="database_type" format="text" multiple="false" label="database type" help="Choose your database type, the default is dnax" argument="-t"> 55 $extendThroughN
50 <option value="dna">dna - DNA sequence</option> 56 '$reference_fasta_filename'
51 <option value="prot">prot - protein sequence</option> 57 '$query'
52 <option value="dnax" selected="true">dnax - DNA sequence translated in six frames to protein</option> 58 -out=$out
59 '$output'
60 ]]></command>
61 <inputs>
62 <conditional name="reference_source">
63 <param name="reference_source_selector" type="select" label="Choose the source for the database">
64 <option value="cached">Locally cached</option>
65 <option value="history">History</option>
53 </param> 66 </param>
54 <param type="select" name="query_type" format="text" multiple="false" label="query type" help="Choose your query type, the default is rnax" argument="-q"> 67 <when value="cached">
55 <option value="dna">dna - DNA sequence </option> 68 <param name="database" type="select" label="Select database">
56 <option value="rna">rna - RNA sequence</option> 69 <options from_data_table="all_fasta">
57 <option value="prot">prot - protein sequence</option> 70 <filter type="sort_by" column="2" />
58 <option value="dnax">dnax - DNA sequence translated in six frames to protein</option> 71 </options>
59 <option value="rnax" selected="true">rnax - DNA sequence translated in three frames to protein</option> 72 <validator type="no_options" message="A built-in database is not available" />
73 </param>
74 </when>
75 <when value="history">
76 <param name="database" type="data" format="fasta, twobit" label="Using database file, either a .fa, .nib or .2bit file" />
77 </when>
78 </conditional>
79 <param name="query" type="data" format="fasta, twobit" label="Query data, either a .fa, .nib or .2bit file"/>
80 <param argument="-t" name="database_type" type="select" format="txt" multiple="false" label="database type" help="Choose your database type, the default is dnax">
81 <option value="dna">dna - DNA sequence</option>
82 <option value="prot">prot - protein sequence</option>
83 <option value="dnax" selected="true">dnax - DNA sequence translated in six frames to protein</option>
84 </param>
85 <param argument="-q" name="query_type" type="select" format="txt" multiple="false" label="query type" help="Choose your query type, the default is rnax">
86 <option value="dna">dna - DNA sequence </option>
87 <option value="rna">rna - RNA sequence</option>
88 <option value="prot">prot - protein sequence</option>
89 <option value="dnax">dnax - DNA sequence translated in six frames to protein</option>
90 <option value="rnax" selected="true">rnax - DNA sequence translated in three frames to protein</option>
91 </param>
92 <param argument="-oneOff" type="boolean" truevalue="-oneOff=1" falsevalue="" label="If set, this allows one mismatch in tile and still triggers an alignments" />
93 <param argument="-minScore" type="integer" value="30" label="Minimum score" help="It is the matches minus the mismatches minus some sort of gap penalty" />
94 <param argument="-maxGap" type="integer" value="2" min="0" max="3" label="Maximum gap between tiles in a clump" help="Usually set from 0 to 3. Only relevant for minMatch > 1" />
95 <param argument="-repMatch" type="integer" value="" optional="true" label="Number of repetitions of a tile allowed before it is marked as overused" help="Typically this is 256 for tileSize 12, 1024 for tileSize 11, 4096 for tileSize 10. Also affected by stepSize. When stepSize is halved repMatch is doubled to compensate" />
96 <conditional name="mask_type">
97 <param argument="-mask" type="select" label="Mask out repeats" help="Alignments won't be started in masked region but may extend through it in nucleotide searches. Masked areas are ignored entirely in protein or translated searches. Default is lower">
98 <option value="lower" selected="true">lower - mask out lower-cased sequence</option>
99 <option value="upper">upper - mask out upper-cased sequence</option>
100 <option value="out">out - mask according to database.out RepeatMasker .out file</option>
101 <option value="file.out">file.out - mask database according to RepeatMasker file.out</option>
60 </param> 102 </param>
61 <param type="select" name="noHead" format="text" label="Suppresses .psl header (so it's just a tab-separated file)." > 103 <when value="lower" />
62 <option value="yes" selected="true">Yes, suppresses .psl header</option> 104 <when value="upper" />
63 <option value="no">No, do not suppresses .psl header</option> 105 <when value="out" />
64 </param> 106 <when value="file.out">
65 <conditional name="mask_type"> 107 <param name="mask_file" type="data" format="txt" label="RepeatMasker file.out" />
66 <param name="mask" type="select" label="Mask out repeats" help="Alignments won't be started in masked region 108 </when>
67 but may extend through it in nucleotide searches. Masked areas 109 </conditional>
68 are ignored entirely in protein or translated searches. Default is lower" argument="-mask"> 110 <param argument="-dots" type="integer" value="" optional="true" label="Output a dot every N sequences in log" help="Dots show program's progress" />
69 <option value="lower" selected="true">lower - mask out lower-cased sequence</option> 111 <param argument="-trimT" type="boolean" truevalue="-trimT" falsevalue="" label="Trim leading poly-T" />
70 <option value="upper">upper - mask out upper-cased sequence</option> 112 <param argument="-noTrimA" type="boolean" truevalue="-noTrimA" falsevalue="" label="Don't trim trailing poly-A" />
71 <option value="out">out - mask according to database.out RepeatMasker .out file</option> 113 <param argument="-trimHardA" type="boolean" truevalue="-trimHardA" falsevalue="" label="Remove poly-A tail from qSize and alignments in .psl output" />
72 <option value="file.out">file.out - mask database according to RepeatMasker file.out</option> 114 <param argument="-fastMap" type="boolean" truevalue="-fastMap" falsevalue="" label="Run for fast DNA/DNA remapping" help="It does not allow introns and require high %ID. Query sizes must not exceed 5000" />
73 </param> 115 <param argument="-fine" type="boolean" truevalue="-fine" falsevalue="" label="Refine search for small initial and terminal exons" help="For high-quality mRNAs. Not recommended for ESTs" />
74 <when value="lower" /> 116 <param argument="-maxIntron" type="integer" value="750000" optional="true" label="Maximum intron size" />
75 <when value="upper" /> 117 <param argument="-extendThroughN" type="boolean" truevalue="-extendThroughN" falsevalue="" label="Allow extension of alignment through large blocks of N's" />
76 <when value="out" /> 118 <param name="out" type="select" label="Select output file format (-out)">
77 <when value="file.out"> 119 <option value="psl">Tab-separated format, no sequence (psl)</option>
78 <param name="mask_file" type="data" format="txt" label="RepeatMasker file.out" /> 120 <option value="psl -noHead">Tab-separated format, no sequence, no header (psl -noHead)</option>
79 </when> 121 <option value="axt">Blastz-associated axt format (axt)</option>
80 </conditional> 122 <option value="maf">Multiz-associated maf format (maf)</option>
81 </inputs> 123 <option value="sim4">Similar to sim4 format (sim4)</option>
82 <outputs> 124 <option value="wublast">Similar to WU-BLAST format (wublast)</option>
83 <data format="psl" name="output_sorted" label="${tool.name} on ${on_string}"></data> 125 <option value="blast">Similar to NCBI BLAST format (blast)</option>
84 </outputs> 126 <option value="blast8">NCBI BLAST tabular format (blast8)</option>
85 <tests> 127 <option value="blast9">NCBI BLAST tabular format with comments (blast9)</option>
86 <!-- test on query of GenBank RefSeq records for Gallus gallus and database of Amazona vittata --> 128 </param>
87 <test> 129 </inputs>
130 <outputs>
131 <data name="output" format="tabular" label="${tool.name} on ${on_string}">
132 <change_format>
133 <when input="out" value="axt" format="axt" />
134 <when input="out" value="maf" format="maf" />
135 <when input="out" value="sim4" format="txt" />
136 <when input="out" value="wublast" format="tabular" />
137 <when input="out" value="blast" format="tabular" />
138 </change_format>
139 </data>
140 </outputs>
141 <tests>
142 <!-- test on query of GenBank RefSeq records for Gallus gallus and database of Amazona vittata -->
143 <test>
88 <param name="reference_source_selector" value="history" /> 144 <param name="reference_source_selector" value="history" />
89 <param name="database" value="amaVit1_Gallus/amaVit1.fa" /> 145 <param name="database" value="amaVit1_Gallus/amaVit1.fa" />
90 <param name="query" value="amaVit1_Gallus/Gallus_gallus_RefSeq.fa" /> 146 <param name="query" value="amaVit1_Gallus/Gallus_gallus_RefSeq.fa" />
91 <param name="database_type" value="dnax" /> 147 <param name="database_type" value="dnax" />
92 <param name="query_type" value="rnax" /> 148 <param name="query_type" value="rnax" />
93 <param name="noHead" value="yes" />
94 <param name="mask" value="lower" /> 149 <param name="mask" value="lower" />
95 <output name="output_sorted" value="amaVit1_Gallus/amaVit1_Gallus_gallus.psl" /> 150 <param name="out" value="psl -noHead" />
96 </test> 151 <output name="output" value="amaVit1_Gallus/amaVit1_Gallus_gallus_sorted.psl" sort="true"/>
97 <!-- test on query of partial mRNA of Drosophila melanogaster and the database of Drosophila biamipes dot chromosome --> 152 </test>
98 <test> 153 <!-- test on query of partial mRNA of Drosophila melanogaster and the database of Drosophila biamipes dot chromosome -->
154 <test>
99 <param name="reference_source_selector" value="history" /> 155 <param name="reference_source_selector" value="history" />
100 <param name="database" value="dbia3/dbia3.fa" /> 156 <param name="database" value="dbia3/dbia3.fa" />
101 <param name="query" value="dbia3/dmel-transcript.fa" /> 157 <param name="query" value="dbia3/dmel-transcript.fa" />
102 <param name="database_type" value="dnax" /> 158 <param name="database_type" value="dnax" />
103 <param name="query_type" value="rnax" /> 159 <param name="query_type" value="rnax" />
104 <param name="noHead" value="yes" />
105 <param name="mask" value="lower" /> 160 <param name="mask" value="lower" />
106 <output name="output_sorted" value="dbia3/dbia3.sorted.psl" /> 161 <param name="out" value="psl -noHead" />
107 </test> 162 <param name="maxIntron" value="" />
108 <!-- test on the database masked by repeat masker --> 163 <output name="output" value="dbia3/dbia3.sorted.psl" sort="true"/>
109 <test> 164 </test>
165 <!-- test on the database masked by repeat masker -->
166 <test>
110 <param name="reference_source_selector" value="history" /> 167 <param name="reference_source_selector" value="history" />
111 <param name="database" value="dbia3/dbia3_masked.2bit" /> 168 <param name="database" value="dbia3/dbia3_masked.2bit" />
112 <param name="query" value="dbia3/dmel-transcript.fa" /> 169 <param name="query" value="dbia3/dmel-transcript.fa" />
113 <param name="database_type" value="dnax" /> 170 <param name="database_type" value="dnax" />
114 <param name="query_type" value="rnax" /> 171 <param name="query_type" value="rnax" />
115 <param name="noHead" value="yes" /> 172 <param name="oneOff" value="false" />
173 <param name="minScore" value="30" />
174 <param name="maxGap" value="2" />
175 <param name="trimT" value="false" />
176 <param name="noTrimA" value="false" />
177 <param name="fine" value="false" />
178 <param name="maxIntron" value="750000" />
179 <param name="extendThroughN" value="false" />
116 <param name="mask" value="file.out" /> 180 <param name="mask" value="file.out" />
117 <param name="mask_file" value="dbia3/dbia3_RM.out" /> 181 <param name="mask_file" value="dbia3/dbia3_RM.out" />
118 <output name="output_sorted" value="dbia3/dbia3_masked.sorted.psl" /> 182 <param name="out" value="psl -noHead" />
119 </test> 183 <output name="output" value="dbia3/dbia3_masked.sorted.psl"/>
120 184 </test>
121 </tests> 185 </tests>
122 <help> 186 <help>
123 <![CDATA[ 187 <![CDATA[
124 BLAT 188 BLAT
125 ==== 189 ====
126 BLAT is a bioinformatics software a tool which performs rapid mRNA/DNA and cross-species protein alignments. 190 BLAT is a bioinformatics software a tool which performs rapid mRNA/DNA and cross-species protein alignments.
127 191
128 blat (version: v340)- Standalone blat sequence search command line tool. 192 blat (version: v36)- Standalone blat sequence search command line tool.
129 ------------------------------------------------------------------------- 193 -------------------------------------------------------------------------
130 194
131 usage: 195 usage:
132 ++++++ 196 ++++++
133 197
137 database and query are each either a .fa, .nib or .2bit file, 201 database and query are each either a .fa, .nib or .2bit file,
138 or a list of these files with one file name per line. 202 or a list of these files with one file name per line.
139 -ooc=11.ooc tells the program to load over-occurring 11-mers from 203 -ooc=11.ooc tells the program to load over-occurring 11-mers from
140 an external file. This will increase the speed 204 an external file. This will increase the speed
141 by a factor of 40 in many cases, but is not required. 205 by a factor of 40 in many cases, but is not required.
142 output.psl is the name of the output file. 206 output.psl is the name of the output file.
143 207
144 documentation: 208 documentation:
145 ++++++++++++++ 209 ++++++++++++++
146 210
147 See Blat documentation (http://genome.ucsc.edu/goldenPath/help/blatSpec.html) 211 See Blat documentation (http://genome.ucsc.edu/goldenPath/help/blatSpec.html)
148 212
149 Source code: 213 Source code:
150 ++++++++++++ 214 ++++++++++++
151 215
152 http://hgdownload.cse.ucsc.edu/admin/exe/ 216 http://hgdownload.cse.ucsc.edu/admin/exe/
153 217
154 ]]></help> 218 ]]></help>
155 <citations> 219 <citations>
156 <citation type="doi">10.1101/gr.229202</citation> 220 <citation type="doi">10.1101/gr.229202</citation>
157 </citations> 221 </citations>
158 </tool> 222 </tool>
159
160
161
162
163