Mercurial > repos > yating-l > ucsc_blat
comparison blat.xml @ 10:c449963debd5 draft
planemo upload commit c5f669e334bf65c1158855bd1eef88df78a8028c
author | iuc |
---|---|
date | Mon, 21 Nov 2022 11:12:14 +0000 |
parents | a9d863528f48 |
children | 2a89f630fa85 |
comparison
equal
deleted
inserted
replaced
9:a9d863528f48 | 10:c449963debd5 |
---|---|
1 <?xml version="1.0"?> | 1 <tool id="ucsc_blat" name="UCSC BLAT Alignment Tool" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@"> |
2 <tool id="ucsc_blat" name="UCSC BLAT Alignment Tool" version="1.2"> | 2 <description>BLAST-like sequence alignment tool</description> |
3 <description>Standalone blat sequence search command line tool</description> | 3 <macros> |
4 <token name="@TOOL_VERSION@">377</token> | |
5 <token name="@VERSION_SUFFIX@">0</token> | |
6 </macros> | |
7 <xrefs> | |
8 <xref type="bio.tools">blat</xref> | |
9 </xrefs> | |
4 <requirements> | 10 <requirements> |
5 <requirement type="package" version="1.0">ucsc_tools_340_for_BLAT</requirement> | 11 <requirement type="package" version="@TOOL_VERSION@">ucsc-blat</requirement> |
6 </requirements> | 12 </requirements> |
7 <command detect_errors="exit_code"><![CDATA[ | 13 <command detect_errors="exit_code"><![CDATA[ |
8 #if str($reference_source.reference_source_selector) == "history": | 14 #if str($reference_source.reference_source_selector) == "history": |
9 #set $reference_fasta_filename = "localref.fa" | 15 ## blat depends on file extension |
10 ln -s '${reference_source.database}' '${reference_fasta_filename}' && | 16 #if $reference_source.database.is_of_type("fasta"): |
11 #else: | 17 #set $reference_fasta_filename = "localref.fa" |
12 #set $reference_fasta_filename = str($reference_source.database.fields.path) | 18 #elif $reference_source.database.is_of_type("twobit"): |
13 #end if | 19 #set $reference_fasta_filename = "localref.2bit" |
14 blat | 20 #else |
15 #if $noHead == "yes" | 21 #set $reference_fasta_filename = "localref" |
16 -noHead | 22 #end if |
17 #end if | 23 ln -s '$reference_source.database' '$reference_fasta_filename' && |
18 -q=$query_type | 24 #else: |
19 -t=$database_type | 25 #set $reference_fasta_filename = str($reference_source.database.fields.path) |
20 #if $mask_type.mask == "file.out": | 26 #end if |
21 -mask=$mask_type.mask_file | 27 |
22 #else: | 28 blat |
23 -mask=$mask_type.mask | 29 -q=$query_type |
24 #end if | 30 -t=$database_type |
25 '$reference_fasta_filename' | 31 $oneOff |
26 '${query}' | 32 #if str($minScore) |
27 output | 33 -minScore=$minScore |
28 && sort -k 10,10 -k 12,12n output > '${output_sorted}' | 34 #end if |
29 ]]></command> | 35 -maxGap=$maxGap |
30 <inputs> | 36 #if str($repMatch) |
31 <conditional name="reference_source"> | 37 -repMatch=$repMatch |
32 <param name="reference_source_selector" type="select" label="Choose the source for the database"> | 38 #end if |
33 <option value="cached">Locally cached</option> | 39 #if $mask_type.mask == "file.out": |
34 <option value="history">History</option> | 40 -mask='$mask_type.mask_file' |
35 </param> | 41 #else: |
36 <when value="cached"> | 42 -mask=$mask_type.mask |
37 <param name="database" type="select" label="Select database"> | 43 #end if |
38 <options from_data_table="all_fasta"> | 44 #if str($dots) |
39 <filter type="sort_by" column="2" /> | 45 -dots=$dots |
40 </options> | 46 #end if |
41 <validator type="no_options" message="A built-in database is not available" /> | 47 $trimT |
42 </param> | 48 $noTrimA |
43 </when> | 49 $trimHardA |
44 <when value="history"> | 50 $fastMap |
45 <param name="database" type="data" format="fasta,twobit" label="Using database file, either a .fa, .nib or .2bit file" /> | 51 $fine |
46 </when> | 52 #if str($maxIntron) |
47 </conditional> | 53 -maxIntron=$maxIntron |
48 <param type="data" name="query" format="fasta,twobit" label="Query data, either a .fa, .nib or .2bit file"/> | 54 #end if |
49 <param type="select" name="database_type" format="text" multiple="false" label="database type" help="Choose your database type, the default is dnax" argument="-t"> | 55 $extendThroughN |
50 <option value="dna">dna - DNA sequence</option> | 56 '$reference_fasta_filename' |
51 <option value="prot">prot - protein sequence</option> | 57 '$query' |
52 <option value="dnax" selected="true">dnax - DNA sequence translated in six frames to protein</option> | 58 -out=$out |
59 '$output' | |
60 ]]></command> | |
61 <inputs> | |
62 <conditional name="reference_source"> | |
63 <param name="reference_source_selector" type="select" label="Choose the source for the database"> | |
64 <option value="cached">Locally cached</option> | |
65 <option value="history">History</option> | |
53 </param> | 66 </param> |
54 <param type="select" name="query_type" format="text" multiple="false" label="query type" help="Choose your query type, the default is rnax" argument="-q"> | 67 <when value="cached"> |
55 <option value="dna">dna - DNA sequence </option> | 68 <param name="database" type="select" label="Select database"> |
56 <option value="rna">rna - RNA sequence</option> | 69 <options from_data_table="all_fasta"> |
57 <option value="prot">prot - protein sequence</option> | 70 <filter type="sort_by" column="2" /> |
58 <option value="dnax">dnax - DNA sequence translated in six frames to protein</option> | 71 </options> |
59 <option value="rnax" selected="true">rnax - DNA sequence translated in three frames to protein</option> | 72 <validator type="no_options" message="A built-in database is not available" /> |
73 </param> | |
74 </when> | |
75 <when value="history"> | |
76 <param name="database" type="data" format="fasta, twobit" label="Using database file, either a .fa, .nib or .2bit file" /> | |
77 </when> | |
78 </conditional> | |
79 <param name="query" type="data" format="fasta, twobit" label="Query data, either a .fa, .nib or .2bit file"/> | |
80 <param argument="-t" name="database_type" type="select" format="txt" multiple="false" label="database type" help="Choose your database type, the default is dnax"> | |
81 <option value="dna">dna - DNA sequence</option> | |
82 <option value="prot">prot - protein sequence</option> | |
83 <option value="dnax" selected="true">dnax - DNA sequence translated in six frames to protein</option> | |
84 </param> | |
85 <param argument="-q" name="query_type" type="select" format="txt" multiple="false" label="query type" help="Choose your query type, the default is rnax"> | |
86 <option value="dna">dna - DNA sequence </option> | |
87 <option value="rna">rna - RNA sequence</option> | |
88 <option value="prot">prot - protein sequence</option> | |
89 <option value="dnax">dnax - DNA sequence translated in six frames to protein</option> | |
90 <option value="rnax" selected="true">rnax - DNA sequence translated in three frames to protein</option> | |
91 </param> | |
92 <param argument="-oneOff" type="boolean" truevalue="-oneOff=1" falsevalue="" label="If set, this allows one mismatch in tile and still triggers an alignments" /> | |
93 <param argument="-minScore" type="integer" value="30" label="Minimum score" help="It is the matches minus the mismatches minus some sort of gap penalty" /> | |
94 <param argument="-maxGap" type="integer" value="2" min="0" max="3" label="Maximum gap between tiles in a clump" help="Usually set from 0 to 3. Only relevant for minMatch > 1" /> | |
95 <param argument="-repMatch" type="integer" value="" optional="true" label="Number of repetitions of a tile allowed before it is marked as overused" help="Typically this is 256 for tileSize 12, 1024 for tileSize 11, 4096 for tileSize 10. Also affected by stepSize. When stepSize is halved repMatch is doubled to compensate" /> | |
96 <conditional name="mask_type"> | |
97 <param argument="-mask" type="select" label="Mask out repeats" help="Alignments won't be started in masked region but may extend through it in nucleotide searches. Masked areas are ignored entirely in protein or translated searches. Default is lower"> | |
98 <option value="lower" selected="true">lower - mask out lower-cased sequence</option> | |
99 <option value="upper">upper - mask out upper-cased sequence</option> | |
100 <option value="out">out - mask according to database.out RepeatMasker .out file</option> | |
101 <option value="file.out">file.out - mask database according to RepeatMasker file.out</option> | |
60 </param> | 102 </param> |
61 <param type="select" name="noHead" format="text" label="Suppresses .psl header (so it's just a tab-separated file)." > | 103 <when value="lower" /> |
62 <option value="yes" selected="true">Yes, suppresses .psl header</option> | 104 <when value="upper" /> |
63 <option value="no">No, do not suppresses .psl header</option> | 105 <when value="out" /> |
64 </param> | 106 <when value="file.out"> |
65 <conditional name="mask_type"> | 107 <param name="mask_file" type="data" format="txt" label="RepeatMasker file.out" /> |
66 <param name="mask" type="select" label="Mask out repeats" help="Alignments won't be started in masked region | 108 </when> |
67 but may extend through it in nucleotide searches. Masked areas | 109 </conditional> |
68 are ignored entirely in protein or translated searches. Default is lower" argument="-mask"> | 110 <param argument="-dots" type="integer" value="" optional="true" label="Output a dot every N sequences in log" help="Dots show program's progress" /> |
69 <option value="lower" selected="true">lower - mask out lower-cased sequence</option> | 111 <param argument="-trimT" type="boolean" truevalue="-trimT" falsevalue="" label="Trim leading poly-T" /> |
70 <option value="upper">upper - mask out upper-cased sequence</option> | 112 <param argument="-noTrimA" type="boolean" truevalue="-noTrimA" falsevalue="" label="Don't trim trailing poly-A" /> |
71 <option value="out">out - mask according to database.out RepeatMasker .out file</option> | 113 <param argument="-trimHardA" type="boolean" truevalue="-trimHardA" falsevalue="" label="Remove poly-A tail from qSize and alignments in .psl output" /> |
72 <option value="file.out">file.out - mask database according to RepeatMasker file.out</option> | 114 <param argument="-fastMap" type="boolean" truevalue="-fastMap" falsevalue="" label="Run for fast DNA/DNA remapping" help="It does not allow introns and require high %ID. Query sizes must not exceed 5000" /> |
73 </param> | 115 <param argument="-fine" type="boolean" truevalue="-fine" falsevalue="" label="Refine search for small initial and terminal exons" help="For high-quality mRNAs. Not recommended for ESTs" /> |
74 <when value="lower" /> | 116 <param argument="-maxIntron" type="integer" value="750000" optional="true" label="Maximum intron size" /> |
75 <when value="upper" /> | 117 <param argument="-extendThroughN" type="boolean" truevalue="-extendThroughN" falsevalue="" label="Allow extension of alignment through large blocks of N's" /> |
76 <when value="out" /> | 118 <param name="out" type="select" label="Select output file format (-out)"> |
77 <when value="file.out"> | 119 <option value="psl">Tab-separated format, no sequence (psl)</option> |
78 <param name="mask_file" type="data" format="txt" label="RepeatMasker file.out" /> | 120 <option value="psl -noHead">Tab-separated format, no sequence, no header (psl -noHead)</option> |
79 </when> | 121 <option value="axt">Blastz-associated axt format (axt)</option> |
80 </conditional> | 122 <option value="maf">Multiz-associated maf format (maf)</option> |
81 </inputs> | 123 <option value="sim4">Similar to sim4 format (sim4)</option> |
82 <outputs> | 124 <option value="wublast">Similar to WU-BLAST format (wublast)</option> |
83 <data format="psl" name="output_sorted" label="${tool.name} on ${on_string}"></data> | 125 <option value="blast">Similar to NCBI BLAST format (blast)</option> |
84 </outputs> | 126 <option value="blast8">NCBI BLAST tabular format (blast8)</option> |
85 <tests> | 127 <option value="blast9">NCBI BLAST tabular format with comments (blast9)</option> |
86 <!-- test on query of GenBank RefSeq records for Gallus gallus and database of Amazona vittata --> | 128 </param> |
87 <test> | 129 </inputs> |
130 <outputs> | |
131 <data name="output" format="tabular" label="${tool.name} on ${on_string}"> | |
132 <change_format> | |
133 <when input="out" value="axt" format="axt" /> | |
134 <when input="out" value="maf" format="maf" /> | |
135 <when input="out" value="sim4" format="txt" /> | |
136 <when input="out" value="wublast" format="tabular" /> | |
137 <when input="out" value="blast" format="tabular" /> | |
138 </change_format> | |
139 </data> | |
140 </outputs> | |
141 <tests> | |
142 <!-- test on query of GenBank RefSeq records for Gallus gallus and database of Amazona vittata --> | |
143 <test> | |
88 <param name="reference_source_selector" value="history" /> | 144 <param name="reference_source_selector" value="history" /> |
89 <param name="database" value="amaVit1_Gallus/amaVit1.fa" /> | 145 <param name="database" value="amaVit1_Gallus/amaVit1.fa" /> |
90 <param name="query" value="amaVit1_Gallus/Gallus_gallus_RefSeq.fa" /> | 146 <param name="query" value="amaVit1_Gallus/Gallus_gallus_RefSeq.fa" /> |
91 <param name="database_type" value="dnax" /> | 147 <param name="database_type" value="dnax" /> |
92 <param name="query_type" value="rnax" /> | 148 <param name="query_type" value="rnax" /> |
93 <param name="noHead" value="yes" /> | |
94 <param name="mask" value="lower" /> | 149 <param name="mask" value="lower" /> |
95 <output name="output_sorted" value="amaVit1_Gallus/amaVit1_Gallus_gallus.psl" /> | 150 <param name="out" value="psl -noHead" /> |
96 </test> | 151 <output name="output" value="amaVit1_Gallus/amaVit1_Gallus_gallus_sorted.psl" sort="true"/> |
97 <!-- test on query of partial mRNA of Drosophila melanogaster and the database of Drosophila biamipes dot chromosome --> | 152 </test> |
98 <test> | 153 <!-- test on query of partial mRNA of Drosophila melanogaster and the database of Drosophila biamipes dot chromosome --> |
154 <test> | |
99 <param name="reference_source_selector" value="history" /> | 155 <param name="reference_source_selector" value="history" /> |
100 <param name="database" value="dbia3/dbia3.fa" /> | 156 <param name="database" value="dbia3/dbia3.fa" /> |
101 <param name="query" value="dbia3/dmel-transcript.fa" /> | 157 <param name="query" value="dbia3/dmel-transcript.fa" /> |
102 <param name="database_type" value="dnax" /> | 158 <param name="database_type" value="dnax" /> |
103 <param name="query_type" value="rnax" /> | 159 <param name="query_type" value="rnax" /> |
104 <param name="noHead" value="yes" /> | |
105 <param name="mask" value="lower" /> | 160 <param name="mask" value="lower" /> |
106 <output name="output_sorted" value="dbia3/dbia3.sorted.psl" /> | 161 <param name="out" value="psl -noHead" /> |
107 </test> | 162 <param name="maxIntron" value="" /> |
108 <!-- test on the database masked by repeat masker --> | 163 <output name="output" value="dbia3/dbia3.sorted.psl" sort="true"/> |
109 <test> | 164 </test> |
165 <!-- test on the database masked by repeat masker --> | |
166 <test> | |
110 <param name="reference_source_selector" value="history" /> | 167 <param name="reference_source_selector" value="history" /> |
111 <param name="database" value="dbia3/dbia3_masked.2bit" /> | 168 <param name="database" value="dbia3/dbia3_masked.2bit" /> |
112 <param name="query" value="dbia3/dmel-transcript.fa" /> | 169 <param name="query" value="dbia3/dmel-transcript.fa" /> |
113 <param name="database_type" value="dnax" /> | 170 <param name="database_type" value="dnax" /> |
114 <param name="query_type" value="rnax" /> | 171 <param name="query_type" value="rnax" /> |
115 <param name="noHead" value="yes" /> | 172 <param name="oneOff" value="false" /> |
173 <param name="minScore" value="30" /> | |
174 <param name="maxGap" value="2" /> | |
175 <param name="trimT" value="false" /> | |
176 <param name="noTrimA" value="false" /> | |
177 <param name="fine" value="false" /> | |
178 <param name="maxIntron" value="750000" /> | |
179 <param name="extendThroughN" value="false" /> | |
116 <param name="mask" value="file.out" /> | 180 <param name="mask" value="file.out" /> |
117 <param name="mask_file" value="dbia3/dbia3_RM.out" /> | 181 <param name="mask_file" value="dbia3/dbia3_RM.out" /> |
118 <output name="output_sorted" value="dbia3/dbia3_masked.sorted.psl" /> | 182 <param name="out" value="psl -noHead" /> |
119 </test> | 183 <output name="output" value="dbia3/dbia3_masked.sorted.psl"/> |
120 | 184 </test> |
121 </tests> | 185 </tests> |
122 <help> | 186 <help> |
123 <![CDATA[ | 187 <![CDATA[ |
124 BLAT | 188 BLAT |
125 ==== | 189 ==== |
126 BLAT is a bioinformatics software a tool which performs rapid mRNA/DNA and cross-species protein alignments. | 190 BLAT is a bioinformatics software a tool which performs rapid mRNA/DNA and cross-species protein alignments. |
127 | 191 |
128 blat (version: v340)- Standalone blat sequence search command line tool. | 192 blat (version: v36)- Standalone blat sequence search command line tool. |
129 ------------------------------------------------------------------------- | 193 ------------------------------------------------------------------------- |
130 | 194 |
131 usage: | 195 usage: |
132 ++++++ | 196 ++++++ |
133 | 197 |
137 database and query are each either a .fa, .nib or .2bit file, | 201 database and query are each either a .fa, .nib or .2bit file, |
138 or a list of these files with one file name per line. | 202 or a list of these files with one file name per line. |
139 -ooc=11.ooc tells the program to load over-occurring 11-mers from | 203 -ooc=11.ooc tells the program to load over-occurring 11-mers from |
140 an external file. This will increase the speed | 204 an external file. This will increase the speed |
141 by a factor of 40 in many cases, but is not required. | 205 by a factor of 40 in many cases, but is not required. |
142 output.psl is the name of the output file. | 206 output.psl is the name of the output file. |
143 | 207 |
144 documentation: | 208 documentation: |
145 ++++++++++++++ | 209 ++++++++++++++ |
146 | 210 |
147 See Blat documentation (http://genome.ucsc.edu/goldenPath/help/blatSpec.html) | 211 See Blat documentation (http://genome.ucsc.edu/goldenPath/help/blatSpec.html) |
148 | 212 |
149 Source code: | 213 Source code: |
150 ++++++++++++ | 214 ++++++++++++ |
151 | 215 |
152 http://hgdownload.cse.ucsc.edu/admin/exe/ | 216 http://hgdownload.cse.ucsc.edu/admin/exe/ |
153 | 217 |
154 ]]></help> | 218 ]]></help> |
155 <citations> | 219 <citations> |
156 <citation type="doi">10.1101/gr.229202</citation> | 220 <citation type="doi">10.1101/gr.229202</citation> |
157 </citations> | 221 </citations> |
158 </tool> | 222 </tool> |
159 | |
160 | |
161 | |
162 | |
163 |