Mercurial > repos > devteam > tophat2
annotate tophat2_wrapper.xml @ 8:758594ed0364 draft
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
author | devteam |
---|---|
date | Mon, 09 May 2016 10:33:50 -0400 |
parents | 4eb3c3beb9c7 |
children | 0849fa93eadb |
rev | line source |
---|---|
8
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
1 <tool id="tophat2" name="TopHat" version="2.1.0"> |
0 | 2 <!-- Wrapper compatible with Tophat version 2.0.0+ --> |
3 <description>Gapped-read mapper for RNA-seq data</description> | |
8
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
4 <macros> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
5 <import>tophat_macros.xml</import> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
6 <xml name="paired_parameters"> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
7 <param name="mate_inner_distance" type="integer" value="300" label="Mean Inner Distance between Mate Pairs" help="-r/--mate-inner-dist; This is the expected (mean) inner distance between mate pairs. For example, for paired end runs with fragments selected at 300bp, where each end is 50bp, you should set -r to be 200. The default is 50bp."/> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
8 <param name="mate_std_dev" type="integer" value="20" label="Std. Dev for Distance between Mate Pairs" help="--mate-std-dev; The standard deviation for the distribution on inner distances between mate pairs. The default is 20bp."/> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
9 <!-- Discordant pairs. --> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
10 <param name="report_discordant_pairs" type="select" label="Report discordant pair alignments?" help="--no-discordant"> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
11 <option value="No">No</option> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
12 <option selected="True" value="Yes">Yes</option> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
13 </param> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
14 </xml> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
15 <macro name="dbKeyActions"> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
16 <actions> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
17 <conditional name="refGenomeSource.genomeSource"> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
18 <when value="indexed"> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
19 <action type="metadata" name="dbkey"> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
20 <option type="from_data_table" name="tophat2_indexes" column="1" offset="0"> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
21 <filter type="param_value" column="0" value="#" compare="startswith" keep="False"/> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
22 <filter type="param_value" ref="refGenomeSource.index" column="0"/> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
23 </option> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
24 </action> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
25 </when> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
26 <when value="history"> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
27 <action type="metadata" name="dbkey"> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
28 <option type="from_param" name="refGenomeSource.ownFile" param_attribute="dbkey" /> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
29 </action> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
30 </when> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
31 </conditional> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
32 </actions> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
33 </macro> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
34 </macros> |
0 | 35 <requirements> |
5
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
36 <requirement type="package" version="2.2.5">bowtie2</requirement> |
8
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
37 <requirement type="package" version="2.1.0">tophat</requirement> |
0 | 38 </requirements> |
8
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
39 <stdio> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
40 <regex match="Exception|Error" source="both" level="fatal" description="Tool execution failed"/> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
41 <regex match=".*" source="both" level="log" description="tool progress"/> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
42 </stdio> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
43 <version_command>tophat2 --version</version_command> |
0 | 44 |
45 <command> | |
46 ## | |
47 ## Set path to index, building the reference if necessary. | |
48 ## | |
49 | |
50 #set index_path = '' | |
51 #if $refGenomeSource.genomeSource == "history": | |
52 bowtie2-build "$refGenomeSource.ownFile" genome ; ln -s "$refGenomeSource.ownFile" genome.fa ; | |
53 #set index_path = 'genome' | |
54 #else: | |
55 #set index_path = $refGenomeSource.index.fields.path | |
56 #end if | |
57 | |
58 ## | |
59 ## Run tophat. | |
60 ## | |
61 | |
62 tophat2 | |
7
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
63 |
0 | 64 ## Use the number of job slots provided via GALAXY_SLOTS, falling back to 4 threads when it is unset. |
65 --num-threads \${GALAXY_SLOTS:-4} | |
66 | |
67 ## Set params. | |
68 #if $params.settingsType == "full": | |
69 --read-mismatches $params.read_mismatches | |
70 #if str($params.bowtie_n) == "Yes": | |
71 --bowtie-n | |
72 #end if | |
7
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
73 |
0 | 74 --read-edit-dist $params.read_edit_dist |
75 --read-realign-edit-dist $params.read_realign_edit_dist | |
76 -a $params.anchor_length | |
77 -m $params.splice_mismatches | |
78 -i $params.min_intron_length | |
79 -I $params.max_intron_length | |
80 -g $params.max_multihits | |
81 --min-segment-intron $params.min_segment_intron | |
82 --max-segment-intron $params.max_segment_intron | |
83 --segment-mismatches $params.seg_mismatches | |
84 --segment-length $params.seg_length | |
85 --library-type $params.library_type | |
7
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
86 |
0 | 87 ## Indel search. |
88 #if $params.indel_search.allow_indel_search == "Yes": | |
89 ## --allow-indels | |
90 --max-insertion-length $params.indel_search.max_insertion_length | |
91 --max-deletion-length $params.indel_search.max_deletion_length | |
92 #else: | |
93 --no-novel-indels | |
94 #end if | |
95 | |
96 ## Supplying junctions parameters. | |
97 #if $params.own_junctions.use_junctions == "Yes": | |
98 #if $params.own_junctions.gene_model_ann.use_annotations == "Yes": | |
99 -G $params.own_junctions.gene_model_ann.gene_annotation_model | |
100 #end if | |
101 #if $params.own_junctions.raw_juncs.use_juncs == "Yes": | |
102 -j $params.own_junctions.raw_juncs.raw_juncs | |
103 #end if | |
104 #if str($params.own_junctions.no_novel_juncs) == "Yes": | |
105 --no-novel-juncs | |
106 #end if | |
107 #end if | |
108 | |
109 #if $params.coverage_search.use_search == "Yes": | |
110 --coverage-search | |
111 --min-coverage-intron $params.coverage_search.min_coverage_intron | |
112 --max-coverage-intron $params.coverage_search.max_coverage_intron | |
8
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
113 #elif $params.coverage_search.use_search == "No" |
0 | 114 --no-coverage-search |
115 #end if | |
7
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
116 |
0 | 117 #if str($params.microexon_search) == "Yes": |
118 --microexon-search | |
119 #end if | |
7
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
120 |
0 | 121 #if $params.fusion_search.do_search == "Yes": |
122 --fusion-search | |
123 --fusion-anchor-length $params.fusion_search.anchor_len | |
124 --fusion-min-dist $params.fusion_search.min_dist | |
125 --fusion-read-mismatches $params.fusion_search.read_mismatches | |
126 --fusion-multireads $params.fusion_search.multireads | |
127 --fusion-multipairs $params.fusion_search.multipairs | |
128 --fusion-ignore-chromosomes "$params.fusion_search.ignore_chromosomes" | |
129 #end if | |
7
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
130 |
0 | 131 #if $params.bowtie2_settings.b2_settings == "Yes": |
132 #if $params.bowtie2_settings.preset.b2_preset == "Yes": | |
133 --b2-$params.bowtie2_settings.preset.b2_preset_select | |
7
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
134 #end if |
0 | 135 #end if |
7
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
136 |
0 | 137 #end if |
138 | |
139 ## Read group information. | |
140 #if $readGroup.specReadGroup == "yes" | |
141 --rg-id "$readGroup.rgid" | |
142 --rg-library "$readGroup.rglb" | |
143 --rg-platform "$readGroup.rgpl" | |
144 --rg-sample "$readGroup.rgsm" | |
145 #end if | |
146 | |
147 ## Set index path, inputs and parameters specific to paired data. | |
2 | 148 #if $singlePaired.sPaired != "single" |
0 | 149 -r $singlePaired.mate_inner_distance |
150 --mate-std-dev=$singlePaired.mate_std_dev | |
7
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
151 |
0 | 152 #if str($singlePaired.report_discordant_pairs) == "No": |
153 --no-discordant | |
154 #end if | |
155 | |
2 | 156 #if $singlePaired.sPaired == "paired" |
157 ${index_path} "$singlePaired.input1" "$singlePaired.input2" | |
158 #else | |
159 ${index_path} "$singlePaired.input.forward" "$singlePaired.input.reverse" | |
160 #end if | |
0 | 161 #else |
2 | 162 ${index_path} "$singlePaired.input1" |
0 | 163 #end if |
164 </command> | |
7
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
165 |
0 | 166 <inputs> |
167 <conditional name="singlePaired"> | |
5
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
168 <param name="sPaired" type="select" label="Is this single-end or paired-end data?"> |
0 | 169 <option value="single">Single-end</option> |
2 | 170 <option value="paired">Paired-end (as individual datasets)</option> |
171 <option value="paired_collection">Paired-end (as collection)</option> | |
0 | 172 </param> |
173 <when value="single"> | |
5
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
174 <param format="fastqsanger" name="input1" type="data" label="RNA-Seq FASTQ file" help="Must have Sanger-scaled quality values with ASCII offset 33"/> |
0 | 175 </when> |
176 <when value="paired"> | |
5
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
177 <param format="fastqsanger" name="input1" type="data" label="RNA-Seq FASTQ file, forward reads" help="Must have Sanger-scaled quality values with ASCII offset 33" /> |
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
178 <param format="fastqsanger" name="input2" type="data" label="RNA-Seq FASTQ file, reverse reads" help="Must have Sanger-scaled quality values with ASCII offset 33" /> |
2 | 179 <expand macro="paired_parameters" /> |
180 </when> | |
181 <when value="paired_collection"> | |
5
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
182 <param format="fastqsanger" name="input" type="data_collection" collection_type="paired" label="RNA-Seq FASTQ paired reads" help="Must have Sanger-scaled quality values with ASCII offset 33" /> |
2 | 183 <expand macro="paired_parameters" /> |
0 | 184 </when> |
185 </conditional> | |
186 <expand macro="refGenomeSourceConditional"> | |
187 <options from_data_table="tophat2_indexes"> | |
188 <filter type="sort_by" column="2"/> | |
189 <validator type="no_options" message="No genomes are available for the selected input dataset"/> | |
190 </options> | |
191 </expand> | |
192 <conditional name="params"> | |
193 <param name="settingsType" type="select" label="TopHat settings to use" help="You can use the default settings or set custom values for any of Tophat's parameters."> | |
194 <option value="preSet">Use Defaults</option> | |
195 <option value="full">Full parameter list</option> | |
196 </param> | |
197 <when value="preSet" /> | |
198 <!-- Full/advanced params. --> | |
199 <when value="full"> | |
5
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
200 <param name="read_realign_edit_dist" type="integer" value="1000" label="Max realign edit distance" help="--read-realign-edit-dist; Some of the reads spanning multiple exons may be mapped incorrectly as a contiguous alignment to the genome even though the correct alignment should be a spliced one - this can happen in the presence of processed pseudogenes that are rarely (if at all) transcribed or expressed. This option can direct TopHat to re-align reads for which the edit distance of an alignment obtained in a previous mapping step is above or equal to this option value. If you set this option to 0, TopHat will map every read in all the mapping steps (transcriptome if you provided gene annotations, genome, and finally splice variants detected by TopHat), reporting the best possible alignment found in any of these mapping steps. This may greatly increase the mapping accuracy at the expense of an increase in running time. The default value for this option is set such that TopHat will not try to realign reads already mapped in earlier steps." /> |
0 | 201 |
5
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
202 <param name="read_edit_dist" type="integer" value="2" label="Max edit distance" help="--read-edit-dist; Final read alignments with an edit distance greater than this value are discarded." /> |
0 | 203 |
5
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
204 <param name="library_type" type="select" label="Library Type" help="--library-type; TopHat will treat the reads as strand specific. Every read alignment will have an XS attribute tag. Consider supplying library type options below to select the correct RNA-seq protocol."> |
0 | 205 <option value="fr-unstranded">FR Unstranded</option> |
206 <option value="fr-firststrand">FR First Strand</option> | |
207 <option value="fr-secondstrand">FR Second Strand</option> | |
208 </param> | |
5
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
209 <param name="read_mismatches" type="integer" value="2" label="Final read mismatches" help="--read-mismatches; Final read alignments having more than this many mismatches are discarded." /> |
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
210 <param name="bowtie_n" type="select" label="Use bowtie -n mode" help="--bowtie-n; TopHat uses &quot;-v&quot; in Bowtie for initial read mapping (the default), but with this option, &quot;-n&quot; is used instead. Read segments are always mapped using &quot;-v&quot; option."> |
0 | 211 <option selected="true" value="No">No</option> |
212 <option value="Yes">Yes</option> | |
213 </param> | |
5
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
214 <param name="anchor_length" type="integer" value="8" label="Anchor length (at least 3)" help="-a/--min-anchor-length; TopHat will report junctions spanned by reads with at least this many bases on each side of the junction. Note that individual spliced alignments may span a junction with fewer than this many bases on one side. However, every junction involved in spliced alignments is supported by at least one read with this many bases on each side. This must be at least 3 and the default is 8." /> |
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
215 <param name="splice_mismatches" type="integer" value="0" label="Maximum number of mismatches that can appear in the anchor region of spliced alignment" help="-m/--splice-mismatches; The default is 0."/> |
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
216 <param name="min_intron_length" type="integer" value="70" label="The minimum intron length" help="-i/--min-intron-length; TopHat will ignore donor/acceptor pairs closer than this many bases apart. The default is 70." /> |
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
217 <param name="max_intron_length" type="integer" value="500000" label="The maximum intron length" help="-I/--max-intron-length; When searching for junctions ab initio, TopHat will ignore donor/acceptor pairs farther than this many bases apart, except when such a pair is supported by a split segment alignment of a long read. The default is 500000." /> |
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
218 |
0 | 219 <expand macro="indel_searchConditional" /> |
5
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
220 |
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
221 <param name="max_multihits" type="integer" value="20" label="Maximum number of alignments to be allowed" help="-g/--max-multihits; Instructs TopHat to allow up to this many alignments to the reference for a given read, and choose the alignments based on their alignment scores if there are more than this number. The default is 20 for read mapping. Unless you use --report-secondary-alignments, TopHat will report the alignments with the best alignment score. If there are more alignments with the same score than this number, TopHat will randomly report only this many alignments. In case of using --report-secondary-alignments, TopHat will try to report alignments up to this option value, and TopHat may randomly output some of the alignments with the same score to meet this number."/> |
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
222 <param name="min_segment_intron" type="integer" value="50" label="Minimum intron length that may be found during split-segment (default) search" help="--min-segment-intron; The minimum intron length that may be found during split-segment search. The default is 50."/> |
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
223 <param name="max_segment_intron" type="integer" value="500000" label="Maximum intron length that may be found during split-segment (default) search" help="--max-segment-intron; The maximum intron length that may be found during split-segment search. The default is 500000."/> |
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
224 <param name="seg_mismatches" type="integer" min="0" max="3" value="2" label="Number of mismatches allowed in each segment alignment for reads mapped independently" help="--segment-mismatches; Read segments are mapped independently, allowing up to this many mismatches in each segment alignment. The default is 2."/> |
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
225 <param name="seg_length" type="integer" value="25" label="Minimum length of read segments" help="--segment-length; Each read is cut up into segments, each at least this long. These segments are mapped independently. The default is 25."/> |
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
226 <param name="output_unmapped" type="boolean" truevalue="true" falsevalue="false" checked="false" label="Output unmapped reads" help="If checked, a BAM with the unmapped reads will be added to the history" /> |
0 | 227 <!-- Options for supplying own junctions. --> |
228 <expand macro="own_junctionsConditional" /> | |
229 <!-- Coverage search. --> | |
230 <conditional name="coverage_search"> | |
8
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
231 <param name="use_search" type="select" label="Use coverage-based search for junctions" help="Select 'Auto' to let TopHat decide when to enable coverage search (e.g. disable it for reads 75bp or longer). Select 'Yes' to enforce maximum sensitivity and to specify minimum and maximum intron length"> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
232 <option selected="true" value="auto">Auto</option> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
233 <option value="No">No (--no-coverage-search)</option> |
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
234 <option value="Yes">Yes (--coverage-search)</option> |
0 | 235 </param> |
8
758594ed0364
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/tophat2 commit 1dbddfa19e12087e6e9fc177a088cdbf7ab9b414
devteam
parents:
7
diff
changeset
|
236 <when value="auto" /> |
0 | 237 <when value="Yes"> |
5
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
238 <param name="min_coverage_intron" type="integer" value="50" label="Minimum intron length that may be found during coverage search" help="--min-coverage-intron; The minimum intron length that may be found during coverage search. The default is 50."/> |
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
239 <param name="max_coverage_intron" type="integer" value="20000" label="Maximum intron length that may be found during coverage search" help="--max-coverage-intron; The maximum intron length that may be found during coverage search. The default is 20000."/> |
0 | 240 </when> |
241 <when value="No" /> | |
242 </conditional> | |
7
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
243 |
0 | 244 <!-- Microexon search params --> |
5
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
245 <param name="microexon_search" type="select" label="Use Microexon Search" help="--microexon-search; With this option, the pipeline will attempt to find alignments incident to microexons. Works only for reads 50bp or longer."> |
0 | 246 <option value="No">No</option> |
247 <option value="Yes">Yes</option> | |
248 </param> | |
7
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
249 |
0 | 250 <!-- Fusion mapping. --> |
251 <conditional name="fusion_search"> | |
5
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
252 <param name="do_search" type="select" label="Do Fusion Search" help="Reads can be aligned to potential fusion transcripts if the --fusion-search option is specified. The fusion alignments are reported in SAM format using custom fields XF and XP (see the output format) and some additional information about fusions will be reported (see fusions.out). Once mapping is done, you can run tophat-fusion-post to filter out fusion transcripts (see the TopHat-Fusion website for more details)."> |
0 | 253 <option selected="true" value="No">No</option> |
254 <option value="Yes">Yes</option> | |
255 </param> | |
256 <when value="No" /> | |
257 <when value="Yes"> | |
5
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
258 <param name="anchor_len" type="integer" value="20" label="Anchor Length" help="--fusion-anchor-length; A 'supporting' read must map to both sides of a fusion by at least this many bases. The default is 20."/> |
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
259 <param name="min_dist" type="integer" value="10000000" label="Minimum Distance" help="--fusion-min-dist; For intra-chromosomal fusions, TopHat-Fusion tries to find fusions separated by at least this distance. The default is 10000000."/> |
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
260 <param name="read_mismatches" type="integer" value="2" label="Read Mismatches" help="--fusion-read-mismatches; Reads support fusions if they map across fusion with at most this many mismatches. The default is 2."/> |
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
261 <param name="multireads" type="integer" value="2" label="Multireads" help="--fusion-multireads; Reads that map to more than this many places will be ignored. It may be possible that a fusion is supported by reads (or pairs) that map to multiple places. The default is 2."/> |
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
262 <param name="multipairs" type="integer" value="2" label="Multipairs" help="--fusion-multipairs; Pairs that map to more than this many places will be ignored. The default is 2."/> |
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
263 <param name="ignore_chromosomes" type="text" value='' label="Ignore Chromosomes" help="--fusion-ignore-chromosomes; Ignore some chromosomes such as chrM when detecting fusion break points."/> |
0 | 264 </when> |
265 </conditional> | |
7
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
266 |
0 | 267 <!-- Bowtie2 settings. --> |
268 <conditional name="bowtie2_settings"> | |
269 <param name="b2_settings" type="select" label="Set Bowtie2 settings"> | |
270 <option selected="true" value="No">No</option> | |
271 <option value="Yes">Yes</option> | |
272 </param> | |
273 <when value="No" /> | |
274 <when value="Yes"> | |
275 <conditional name="preset"> | |
276 <param name="b2_preset" type="select" label="Use Preset options"> | |
277 <option selected="true" value="Yes">Yes</option> | |
278 <option value="No">No</option> | |
279 </param> | |
280 <when value="Yes"> | |
281 <param name="b2_preset_select" type="select" label="Preset option"> | |
282 <option value="very-fast">Very fast</option> | |
283 <option value="fast">Fast</option> | |
284 <option selected="true" value="sensitive">Sensitive</option> | |
285 <option value="very-sensitive">Very sensitive</option> | |
286 </param> | |
287 </when> | |
288 <!-- TODO: --> | |
289 <when value="No" /> | |
290 </conditional> | |
291 </when> | |
292 </conditional> | |
293 </when> <!-- full --> | |
294 </conditional> <!-- params --> | |
295 <conditional name="readGroup"> | |
296 <param name="specReadGroup" type="select" label="Specify read group?"> | |
297 <option value="yes">Yes</option> | |
298 <option value="no" selected="True">No</option> | |
299 </param> | |
300 <when value="yes"> | |
7
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
301 <param name="rgid" type="text" label="Read group identifier (ID). Each @RG line must have a unique ID. The value of ID is used in the RG tags of alignment records. Must be unique among all read groups in header section." help="Required if RG specified. Read group IDs may be modified when merging SAM files in order to handle collisions." /> |
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
302 <param name="rglb" type="text" label="Library name (LB)" help="Required if RG specified" /> |
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
303 <param name="rgpl" type="text" label="Platform/technology used to produce the reads (PL)" help="Required if RG specified. Valid values : CAPILLARY, LS454, ILLUMINA, SOLID, HELICOS, IONTORRENT and PACBIO" /> |
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
304 <param name="rgsm" type="text" label="Sample (SM)" help="Required if RG specified. Use pool name where a pool is being sequenced" /> |
0 | 305 </when> |
306 <when value="no" /> | |
307 </conditional> <!-- readGroup --> | |
308 </inputs> | |
309 | |
310 <outputs> | |
311 <data format="txt" name="align_summary" label="${tool.name} on ${on_string}: align_summary" from_work_dir="tophat_out/align_summary.txt"/> | |
312 <data format="tabular" name="fusions" label="${tool.name} on ${on_string}: fusions" from_work_dir="tophat_out/fusions.out"> | |
313 <filter>(params['settingsType'] == 'full' and params['fusion_search']['do_search'] == 'Yes')</filter> | |
314 </data> | |
315 <data format="bed" name="insertions" label="${tool.name} on ${on_string}: insertions" from_work_dir="tophat_out/insertions.bed"> | |
316 <expand macro="dbKeyActions" /> | |
317 </data> | |
318 <data format="bed" name="deletions" label="${tool.name} on ${on_string}: deletions" from_work_dir="tophat_out/deletions.bed"> | |
319 <expand macro="dbKeyActions" /> | |
320 </data> | |
321 <data format="bed" name="junctions" label="${tool.name} on ${on_string}: splice junctions" from_work_dir="tophat_out/junctions.bed"> | |
322 <expand macro="dbKeyActions" /> | |
323 </data> | |
324 <data format="bam" name="accepted_hits" label="${tool.name} on ${on_string}: accepted_hits" from_work_dir="tophat_out/accepted_hits.bam"> | |
325 <expand macro="dbKeyActions" /> | |
326 </data> | |
5
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
327 <data format="bam" name="unmapped" label="${tool.name} on ${on_string}: unmapped" from_work_dir="tophat_out/unmapped.bam"> |
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
328 <filter>(params['settingsType'] == 'full' and params['output_unmapped'])</filter> |
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
329 <expand macro="dbKeyActions" /> |
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
330 </data> |
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
331 |
0 | 332 </outputs> |
333 | |
334 <tests> | |
335 <!-- Test base-space single-end reads with pre-built index and preset parameters --> | |
336 <test> | |
337 <!-- TopHat commands: | |
338 tophat2 -o tmp_dir -p 1 tophat_in1 test-data/tophat_in2.fastqsanger | |
339 Rename the files in tmp_dir appropriately | |
340 --> | |
341 <param name="sPaired" value="single" /> | |
342 <param name="input1" ftype="fastqsanger" value="tophat_in2.fastqsanger" /> | |
343 <param name="genomeSource" value="indexed" /> | |
344 <param name="index" value="tophat_test" /> | |
345 <param name="settingsType" value="preSet" /> | |
5
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
346 <param name="specReadGroup" value="no" /> |
0 | 347 <output name="junctions" file="tophat2_out1j.bed" /> |
348 <output name="accepted_hits" file="tophat_out1h.bam" compare="sim_size" /> | |
349 </test> | |
350 <!-- Test using base-space test data: paired-end reads, index from history. --> | |
351 <test> | |
352 <!-- TopHat commands: | |
353 bowtie2-build -f test-data/tophat_in1.fasta tophat_in1 | |
354 tophat2 -o tmp_dir -p 1 -r 20 tophat_in1 test-data/tophat_in2.fastqsanger test-data/tophat_in3.fastqsanger | |
355 Rename the files in tmp_dir appropriately | |
356 --> | |
357 <param name="sPaired" value="paired" /> | |
358 <param name="input1" ftype="fastqsanger" value="tophat_in2.fastqsanger" /> | |
359 <param name="input2" ftype="fastqsanger" value="tophat_in3.fastqsanger" /> | |
360 <param name="genomeSource" value="history" /> | |
361 <param name="ownFile" ftype="fasta" value="tophat_in1.fasta" /> | |
362 <param name="mate_inner_distance" value="20" /> | |
363 <param name="settingsType" value="preSet" /> | |
5
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
364 <param name="specReadGroup" value="no" /> |
0 | 365 <output name="junctions" file="tophat2_out2j.bed" /> |
366 <output name="accepted_hits" file="tophat_out2h.bam" compare="sim_size" /> | |
367 </test> | |
2 | 368 <test> |
369 <!-- Same test as above but with a collection. --> | |
370 <param name="sPaired" value="paired_collection" /> | |
371 <param name="input"> | |
372 <collection type="paired"> | |
373 <element name="forward" value="tophat_in2.fastqsanger" ftype="fastqsanger" /> | |
374 <element name="reverse" value="tophat_in3.fastqsanger" ftype="fastqsanger" /> | |
375 </collection> | |
376 </param> | |
377 <param name="genomeSource" value="history" /> | |
378 <param name="ownFile" ftype="fasta" value="tophat_in1.fasta" /> | |
379 <param name="mate_inner_distance" value="20" /> | |
380 <param name="settingsType" value="preSet" /> | |
5
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
381 <param name="specReadGroup" value="no" /> |
2 | 382 <output name="junctions" file="tophat2_out2j.bed" /> |
383 <output name="accepted_hits" file="tophat_out2h.bam" compare="sim_size" /> | |
384 </test> | |
0 | 385 <!-- Test base-space single-end reads with user-supplied reference fasta and full parameters --> |
386 <test> | |
7
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
387 <!-- TopHat commands: |
0 | 388 bowtie2-build -f test-data/tophat_in1.fasta tophat_in1 |
389 tophat2 -o tmp_dir -p 1 -a 8 -m 0 -i 70 -I 500000 -g 40 +coverage-search +min-coverage-intron 50 +max-coverage-intron 20000 +segment-mismatches 2 +segment-length 25 +microexon-search tophat_in1 test-data/tophat_in2.fastqsanger | |
390 Replace the + with double-dash | |
391 Rename the files in tmp_dir appropriately | |
392 --> | |
2 | 393 <conditional name="singlePaired"> |
394 <param name="sPaired" value="single"/> | |
395 <param name="input1" ftype="fastqsanger" value="tophat_in2.fastqsanger"/> | |
396 </conditional> | |
0 | 397 <param name="genomeSource" value="history"/> |
398 <param name="ownFile" value="tophat_in1.fasta"/> | |
2 | 399 <conditional name="params"> |
400 <param name="settingsType" value="full"/> | |
401 <param name="library_type" value="FR Unstranded"/> | |
402 <param name="read_mismatches" value="2"/> | |
403 <param name="bowtie_n" value="No"/> | |
404 <param name="anchor_length" value="8"/> | |
405 <param name="splice_mismatches" value="0"/> | |
406 <param name="min_intron_length" value="70"/> | |
407 <param name="max_intron_length" value="500000"/> | |
408 <param name="max_multihits" value="40"/> | |
409 <param name="min_segment_intron" value="50" /> | |
410 <param name="max_segment_intron" value="500000" /> | |
411 <param name="seg_mismatches" value="2"/> | |
412 <param name="seg_length" value="25"/> | |
413 <conditional name="indel_search"> | |
414 <param name="allow_indel_search" value="Yes"/> | |
415 <param name="max_insertion_length" value="3"/> | |
416 <param name="max_deletion_length" value="3"/> | |
417 </conditional> | |
418 <conditional name="own_junctions"> | |
419 <param name="use_junctions" value="Yes" /> | |
420 <conditional name="gene_model_ann"> | |
421 <param name="use_annotations" value="No" /> | |
422 </conditional> | |
423 <conditional name="raw_juncs"> | |
424 <param name="use_juncs" value="No" /> | |
425 </conditional> | |
426 <conditional name="no_novel_juncs"> | |
427 <param name="no_novel_juncs" value="No" /> | |
428 </conditional> | |
429 </conditional> | |
430 <conditional name="coverage_search"> | |
431 <param name="use_search" value="Yes" /> | |
432 <param name="min_coverage_intron" value="50" /> | |
433 <param name="max_coverage_intron" value="20000" /> | |
434 </conditional> | |
435 <param name="microexon_search" value="Yes" /> | |
436 <conditional name="bowtie2_settings"> | |
437 <param name="b2_settings" value="No" /> | |
438 </conditional> | |
439 <!-- Fusion search params --> | |
440 <conditional name="fusion_search"> | |
441 <param name="do_search" value="Yes" /> | |
442 <param name="anchor_len" value="21" /> | |
443 <param name="min_dist" value="10000021" /> | |
444 <param name="read_mismatches" value="3" /> | |
445 <param name="multireads" value="4" /> | |
446 <param name="multipairs" value="5" /> | |
447 <param name="ignore_chromosomes" value="chrM"/> | |
448 </conditional> | |
449 </conditional> | |
450 <conditional name="readGroup"> | |
5
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
451 <param name="specReadGroup" value="no" /> |
2 | 452 </conditional> |
0 | 453 <output name="insertions" file="tophat_out3i.bed" /> |
454 <output name="deletions" file="tophat_out3d.bed" /> | |
455 <output name="junctions" file="tophat2_out3j.bed" /> | |
456 <output name="accepted_hits" file="tophat_out3h.bam" compare="sim_size" /> | |
457 </test> | |
458 <!-- Test base-space paired-end reads with user-supplied reference fasta and full parameters --> | |
459 <test> | |
460 <!-- TopHat commands: | |
461 tophat2 -o tmp_dir -r 20 -p 1 -a 8 -m 0 -i 70 -I 500000 -g 40 +coverage-search +min-coverage-intron 50 +max-coverage-intron 20000 +segment-mismatches 2 +segment-length 25 +microexon-search +report_discordant_pairs tophat_in1 test-data/tophat_in2.fastqsanger test-data/tophat_in3.fastqsanger | |
462 Replace the + with double-dash | |
463 Rename the files in tmp_dir appropriately | |
464 --> | |
7
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
465 <conditional name="singlePaired"> |
2 | 466 <param name="sPaired" value="paired"/> |
467 <param name="input1" ftype="fastqsanger" value="tophat_in2.fastqsanger"/> | |
468 <param name="input2" ftype="fastqsanger" value="tophat_in3.fastqsanger"/> | |
469 <param name="mate_inner_distance" value="20"/> | |
470 <param name="report_discordant_pairs" value="Yes" /> | |
471 </conditional> | |
0 | 472 <param name="genomeSource" value="indexed"/> |
473 <param name="index" value="tophat_test"/> | |
2 | 474 <conditional name="params"> |
475 <param name="settingsType" value="full"/> | |
476 <param name="library_type" value="FR Unstranded"/> | |
477 <param name="read_mismatches" value="5"/> | |
478 <!-- Error: the read mismatches (5) and the read gap length (2) should be less than or equal to the read edit dist (2) --> | |
479 <param name="read_edit_dist" value="5" /> | |
480 <param name="bowtie_n" value="Yes"/> | |
481 <param name="mate_std_dev" value="20"/> | |
482 <param name="anchor_length" value="8"/> | |
483 <param name="splice_mismatches" value="0"/> | |
484 <param name="min_intron_length" value="70"/> | |
485 <param name="max_intron_length" value="500000"/> | |
486 <param name="max_multihits" value="40"/> | |
487 <param name="min_segment_intron" value="50" /> | |
488 <param name="max_segment_intron" value="500000" /> | |
489 <param name="seg_mismatches" value="2"/> | |
490 <param name="seg_length" value="25"/> | |
491 <conditional name="indel_search"> | |
492 <param name="allow_indel_search" value="No"/> | |
493 </conditional> | |
494 <conditional name="own_junctions"> | |
495 <param name="use_junctions" value="Yes" /> | |
496 <conditional name="gene_model_ann"> | |
497 <param name="use_annotations" value="No" /> | |
498 </conditional> | |
499 <conditional name="raw_juncs"> | |
500 <param name="use_juncs" value="No" /> | |
501 </conditional> | |
502 <conditional name="no_novel_juncs"> | |
503 <param name="no_novel_juncs" value="No" /> | |
504 </conditional> | |
505 </conditional> | |
506 <conditional name="coverage_search"> | |
507 <param name="use_search" value="No" /> | |
508 </conditional> | |
509 <param name="microexon_search" value="Yes" /> | |
510 <conditional name="bowtie2_settings"> | |
511 <param name="b2_settings" value="No" /> | |
512 </conditional> | |
513 <!-- Fusion search params --> | |
514 <conditional name="fusion_search"> | |
7
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
515 <param name="do_search" value="Yes" /> |
2 | 516 <param name="anchor_len" value="21" /> |
517 <param name="min_dist" value="10000021" /> | |
518 <param name="read_mismatches" value="3" /> | |
519 <param name="multireads" value="4" /> | |
520 <param name="multipairs" value="5" /> | |
521 <param name="ignore_chromosomes" value="chrM"/> | |
522 </conditional> | |
523 </conditional> | |
524 <conditional name="readGroup"> | |
5
5c5517d2a9e9
planemo upload commit a52cc16ed8d0d60e99742b55fccbdedcbb64b82c
devteam
parents:
3
diff
changeset
|
525 <param name="specReadGroup" value="no" /> |
2 | 526 </conditional> |
0 | 527 <output name="junctions" file="tophat2_out4j.bed" /> |
528 <output name="accepted_hits" file="tophat_out4h.bam" compare="sim_size" /> | |
529 </test> | |
530 </tests> | |
531 <help> | |
7
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
532 **TopHat Overview** |
0 | 533 |
7
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
534 TopHat_ is a fast splice junction mapper for RNA-Seq reads. It aligns RNA-Seq reads to mammalian-sized genomes using the ultra high-throughput short read aligner Bowtie(2), and then analyzes the mapping results to identify splice junctions between exons. |
0 | 535 |
7
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
536 .. _TopHat: http://ccb.jhu.edu/software/tophat/ |
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
537 |
0 | 538 ------ |
539 | |
540 **Know what you are doing** | |
541 | |
542 .. class:: warningmark | |
543 | |
544 There is no such thing (yet) as an automated gearshift in splice junction identification. It is all like stick-shift driving in San Francisco. In other words, running this tool with default parameters will probably not give you meaningful results. A way to deal with this is to **understand** the parameters by carefully reading the `documentation`__ and experimenting. Fortunately, Galaxy makes experimenting easy. | |
545 | |
1
ae06af1118dc
Update Tophat URLs in help text.
Nate Coraor <nate@bx.psu.edu>
parents:
0
diff
changeset
|
546 .. __: http://ccb.jhu.edu/software/tophat/manual.shtml |
0 | 547 |
548 ------ | |
549 | |
550 **Input formats** | |
551 | |
7
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
552 TopHat accepts files in Sanger FASTQ format. Use the FASTQ Groomer to prepare your files. |
0 | 553 |
554 ------ | |
555 | |
556 **Outputs** | |
557 | |
7
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
558 TopHat produces two output files: |
0 | 559 |
560 - junctions -- A UCSC BED_ track of junctions reported by TopHat. Each junction consists of two connected BED blocks, where each block is as long as the maximal overhang of any read spanning the junction. The score is the number of alignments spanning the junction. | |
561 - accepted_hits -- A list of read alignments in BAM_ format. | |
562 | |
563 .. _BED: http://genome.ucsc.edu/FAQ/FAQformat.html#format1 | |
564 .. _BAM: http://samtools.sourceforge.net/ | |
565 | |
566 This tool also reports insertions and deletions, both of which are in BED format, and an alignment summary. Two other possible outputs, depending on the options you choose, are fusions and unmapped reads. | |
567 | |
568 ------- | |
569 | |
7
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
570 **TopHat settings** |
0 | 571 |
7
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
572 All of the options have a default value. You can change any of them. Some of the options in TopHat have been implemented here. |
0 | 573 |
574 ------ | |
575 | |
7
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
576 **TopHat parameter list** |
0 | 577 |
7
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
578 This is a list of implemented TopHat options:: |
0 | 579 |
7
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
580 -r This is the expected (mean) inner distance between mate pairs. For example, for paired end runs with fragments |
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
581 selected at 300bp, where each end is 50bp, you should set -r to be 200. The default is 50bp; set this parameter |
0 | 582 to match your library for paired end runs. |
583 --mate-std-dev INT The standard deviation for the distribution on inner distances between mate pairs. The default is 20bp. | |
7
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
584 -a/--min-anchor-length INT The "anchor length". TopHat will report junctions spanned by reads with at least this many bases on each side of the junction. Note that individual spliced |
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
585 alignments may span a junction with fewer than this many bases on one side. However, every junction involved in spliced alignments is supported by at least one |
0 | 586 read with this many bases on each side. This must be at least 3 and the default is 8. |
587 -m/--splice-mismatches INT The maximum number of mismatches that may appear in the "anchor" region of a spliced alignment. The default is 0. | |
588 -i/--min-intron-length INT The minimum intron length. TopHat will ignore donor/acceptor pairs closer than this many bases apart. The default is 70. | |
589 -I/--max-intron-length INT The maximum intron length. When searching for junctions ab initio, TopHat will ignore donor/acceptor pairs farther than this many bases apart, except when such a pair is supported by a split segment alignment of a long read. The default is 500000. | |
7
4eb3c3beb9c7
planemo upload commit 4ec9eb1570ea116d83f5464a786af6e14fb5b57d
devteam
parents:
5
diff
changeset
|
590 -g/--max-multihits INT Instructs TopHat to allow up to this many alignments to the reference for a given read, and suppresses all alignments for reads with more than this many |
0 | 591 alignments. The default is 40. |
592 -G/--GTF [GTF 2.2 file] Supply TopHat with a list of gene model annotations. TopHat will use the exon records in this file to build a set of known splice junctions for each gene, and will attempt to align reads to these junctions even if they would not normally be covered by the initial mapping. | |
593 -j/--raw-juncs [juncs file] Supply TopHat with a list of raw junctions. Junctions are specified one per line, in a tab-delimited format. Records look like: [chrom] [left] [right] [+/-], left and right are zero-based coordinates, and specify the last character of the left sequence to be spliced to the first character of the right sequence, inclusive. | |
594 --no-novel-juncs Only look for junctions indicated in the supplied GFF file. (ignored without -G) | |
595 --no-coverage-search Disables the coverage based search for junctions. | |
596 --coverage-search Enables the coverage based search for junctions. Use when coverage search is disabled by default (such as for reads 75bp or longer), for maximum sensitivity. | |
597 --microexon-search With this option, the pipeline will attempt to find alignments incident to microexons. Works only for reads 50bp or longer. | |
598 --segment-mismatches Read segments are mapped independently, allowing up to this many mismatches in each segment alignment. The default is 2. | |
599 --segment-length Each read is cut up into segments, each at least this long. These segments are mapped independently. The default is 25. | |
600 --min-coverage-intron The minimum intron length that may be found during coverage search. The default is 50. | |
601 --max-coverage-intron The maximum intron length that may be found during coverage search. The default is 20000. | |
602 --min-segment-intron The minimum intron length that may be found during split-segment search. The default is 50. | |
603 --max-segment-intron The maximum intron length that may be found during split-segment search. The default is 500000. | |
604 </help> | |
2 | 605 <citations> |
606 <citation type="doi">10.1186/gb-2013-14-4-r36</citation> | |
607 </citations> | |
0 | 608 </tool> |