Mercurial > repos > charles-bernard > alfa
comparison ALFA/alfa_wrapper.xml @ 22:1714165f5df0 draft
Uploaded
author | charles-bernard |
---|---|
date | Thu, 27 Oct 2016 04:42:59 -0400 |
parents | a74f6350f32e |
children | 887c6cb328e9 |
comparison
equal
deleted
inserted
replaced
21:728294cecd96 | 22:1714165f5df0 |
---|---|
6 <requirement type="package" version="2.24">bedtools</requirement> | 6 <requirement type="package" version="2.24">bedtools</requirement> |
7 <requirement type="package" version="1.2">samtools</requirement> | 7 <requirement type="package" version="1.2">samtools</requirement> |
8 <requirement type="package" version="1.4">matplotlib</requirement> | 8 <requirement type="package" version="1.4">matplotlib</requirement> |
9 </requirements> | 9 </requirements> |
10 | 10 |
11 <command interpreter="bash"> | 11 <command interpreter="python"> |
12 alfa_wrapper.sh $__root_dir__ $__tool_directory__ $ALFA_config $logReport | 12 <![CDATA[ |
13 </command> | 13 ALFA_wrapper.py |
14 | 14 |
15 --project_name "${projectName}" | |
16 | |
17 ##__INPUT 1__## | |
18 #if str ( $annotation.annotationSource['annotationSourceSelection'] ) == "index" | |
19 --index $annotation.annotationSource['strandedIndex'] $annotation.annotationSource['unstrandedIndex'] | |
20 #else if str ( $annotation.annotationSource['annotationSourceSelection'] ) == "built_in_index" | |
21 --bi_index $annotation.annotationSource.built_in_index_prefix.fields.prefix | |
22 #else | |
23 --annotation $annotation.annotationSource['annotationFile'] | |
24 #end if | |
25 | |
26 ##__INPUT 2__## | |
27 --reads_format $reads.readsType['readsTypeSelection'] | |
28 --reads | |
29 #for $i, $r in enumerate ( $reads.readsType['readsList'] ) | |
30 __fname__$r.readsFile | |
31 __label__$r.readsLabel | |
32 #end for | |
33 --strandness $reads['strandness'] | |
34 | |
35 ##__OUTPUT FILES__## | |
36 #if str ( $outputFiles['plot'] ) == "True" | |
37 #if str ( $outputOptions['plotFormat'] ) == "pdf" | |
38 --output_pdf $outputPdf | |
39 #else if str ( $outputOptions['plotFormat'] ) == "png" | |
40 --output_png $outputCategoriesPng $outputBiotypesPng | |
41 #else | |
42 --output_svg $outputCategoriesSvg $outputBiotypesSvg | |
43 #end if | |
44 #end if | |
45 #if str ( $outputFiles['countFile'] ) == "True" | |
46 --output_count $outputCountFile | |
47 #end if | |
48 #if str ( $outputFiles['index'] ) == "True" | |
49 --output_index $outputStrandedIndex $outputUnstrandedIndex | |
50 #end if | |
51 | |
52 ##__OUTPUT OPTIONS__## | |
53 --categories_depth $outputOptions['categoriesDepth'] | |
54 #if str ( $outputFiles['plot'] ) == "True" | |
55 --plot_format $outputOptions['plotFormat'] | |
56 #if str ( $outputOptions.plotThreshold['plotThresholdChoice'] ) == "True" | |
57 --threshold $outputOptions.plotThreshold.yMin $outputOptions.plotThreshold.yMax | |
58 #end if | |
59 #end if | |
60 | |
61 --log_report $logReport | |
62 --galaxy_root $__root_dir__ | |
63 --tool_dir $__tool_directory__ | |
64 ]]> | |
65 </command> | |
15 <inputs> | 66 <inputs> |
16 <param name="projectName" value="ALFA" type="text" size="20" label="Project Name"> | 67 <param name="projectName" value="ALFA" type="text" size="20" label="Project Name"> |
17 <validator type="empty_field" message="Please, specify a name for your project."/> | 68 <validator type="empty_field" message="Please, specify a name for your project."/> |
18 </param> | 69 </param> |
19 | 70 |
27 <when value="personal_gtf"> | 78 <when value="personal_gtf"> |
28 <param name="annotationFile" type="data" format="Gff, Gtf" label="Select your personal annotation file (GTF format)"> | 79 <param name="annotationFile" type="data" format="Gff, Gtf" label="Select your personal annotation file (GTF format)"> |
29 </param> | 80 </param> |
30 </when> | 81 </when> |
31 <when value="index"> | 82 <when value="index"> |
32 <param name="strandedIndex" type="data" format="index" label="Select your ALFA stranded index file (index format)"/> | 83 <param name="strandedIndex" type="data" format="index" label="Select your ALFA Stranded index file (index format)"/> |
33 <param name="unstrandedIndex" type="data" format="index" label="Select your ALFA Unstranded index file (index format)"/> | 84 <param name="unstrandedIndex" type="data" format="index" label="Select your ALFA Unstranded index file (index format)"/> |
34 </when> | 85 </when> |
35 <when value="built_in_index"> | 86 <when value="built_in_index"> |
36 <param name="built_in_index_prefix" type="select" label="Select Genome"> | 87 <param name="built_in_index_prefix" type="select" label="Select Genome"> |
37 <options from_data_table="alfa_indexes"> | 88 <options from_data_table="alfa_indexes"> |
72 <param name="plot" type="boolean" truevalue="True" falsevalue="False" checked="True" label="Categories and Biotypes Histograms" help="Plot the nucleotides distribution of the reads per genomic categories and biotypes"/> | 123 <param name="plot" type="boolean" truevalue="True" falsevalue="False" checked="True" label="Categories and Biotypes Histograms" help="Plot the nucleotides distribution of the reads per genomic categories and biotypes"/> |
73 <param name="countFile" type="boolean" truevalue="True" falsevalue="False" checked="True" label="Categories Count File" help="Edit the exact count of nucleotides in the reads per genomic categories and biotypes"/> | 124 <param name="countFile" type="boolean" truevalue="True" falsevalue="False" checked="True" label="Categories Count File" help="Edit the exact count of nucleotides in the reads per genomic categories and biotypes"/> |
74 <param name="index" type="boolean" truevalue="True" falsevalue="False" checked="False" label ="Indexes" help="Print the resulting stranded and unstranded indexes from the gtf input file (useful if you plan to run ALFA again with this annotated sequence)"/> | 125 <param name="index" type="boolean" truevalue="True" falsevalue="False" checked="False" label ="Indexes" help="Print the resulting stranded and unstranded indexes from the gtf input file (useful if you plan to run ALFA again with this annotated sequence)"/> |
75 </section> | 126 </section> |
76 | 127 |
77 <section name="outputOptions" title="ADVANCED OPTIONS" expanded="False"> | 128 <section name="outputOptions" title="ADVANCED SETTINGS" expanded="False"> |
78 <param name="categoriesDepth" type="select" label="Categories to Display"> | 129 <param name="categoriesDepth" type="select" label="Categories to Display"> |
79 <option value="1">gene | intergenic</option> | 130 <option value="1">gene | intergenic</option> |
80 <option value="2">exon | intron | intergenic</option> | 131 <option value="2">exon | intron | intergenic</option> |
81 <option value="3" selected="true">5’-UTR | CDS | 3’-UTR | intron | intergenic</option> | 132 <option value="3" selected="true">5’-UTR | CDS | 3’-UTR | intron | intergenic</option> |
82 <option value="4">5’-UTR | start_codon | CDS | stop_codon | 3’-UTR | intron | intergenic</option> | 133 <option value="4">5’-UTR | start_codon | CDS | stop_codon | 3’-UTR | intron | intergenic</option> |
90 <param name="plotThresholdChoice" type="boolean" truevalue="True" falsevalue="False" checked="false" label="Plot Options: Modify y axis range of the normalized counts of bio-features" help="Ignore if you did not choose the histograms output file"/> | 141 <param name="plotThresholdChoice" type="boolean" truevalue="True" falsevalue="False" checked="false" label="Plot Options: Modify y axis range of the normalized counts of bio-features" help="Ignore if you did not choose the histograms output file"/> |
91 <when value="True"> | 142 <when value="True"> |
92 <param name="yMin" type="float" value="-2.0" label="y min"/> | 143 <param name="yMin" type="float" value="-2.0" label="y min"/> |
93 <param name="yMax" type="float" value="2.0" label="y max"/> | 144 <param name="yMax" type="float" value="2.0" label="y max"/> |
94 </when> | 145 </when> |
146 <when value="False"></when> | |
95 </conditional> | 147 </conditional> |
96 </section> | 148 </section> |
97 </inputs> | 149 </inputs> |
98 | 150 |
99 <outputs> | 151 <outputs> |
121 </data> | 173 </data> |
122 <data name="outputUnstrandedIndex" format="txt" label="${projectName}-Unstranded Index"> | 174 <data name="outputUnstrandedIndex" format="txt" label="${projectName}-Unstranded Index"> |
123 <filter>outputFiles['index'] is True</filter> | 175 <filter>outputFiles['index'] is True</filter> |
124 </data> | 176 </data> |
125 </outputs> | 177 </outputs> |
126 | |
127 <configfiles> | |
128 <configfile name="ALFA_config"> | |
129 projectName=$projectName | |
130 | |
131 ##__INPUT 1__## | |
132 annotationSource=$annotation.annotationSource['annotationSourceSelection'] | |
133 #if str ( $annotation.annotationSource['annotationSourceSelection'] ) == "index" | |
134 annotationFile=None | |
135 strandedIndex=$annotation.annotationSource['strandedIndex'] | |
136 unstrandedIndex=$annotation.annotationSource['unstrandedIndex'] | |
137 #else if str ( $annotation.annotationSource['annotationSourceSelection'] ) == "built_in_index" | |
138 annotationFile=None | |
139 built_in_index_prefix=$annotation.annotationSource.built_in_index_prefix.fields.prefix | |
140 #else | |
141 annotationFile=$annotation.annotationSource['annotationFile'] | |
142 strandedIndex=None | |
143 unstrandedIndex=None | |
144 #end if | |
145 | |
146 ##__INPUT 2__## | |
147 readsType=$reads.readsType['readsTypeSelection'] | |
148 #for $i, $r in enumerate ( $reads.readsType['readsList'] ) | |
149 readsFile[$i]=$r.readsFile | |
150 readsLabel[$i]=$r.readsLabel | |
151 #end for | |
152 strandness=$reads['strandness'] | |
153 | |
154 ##__OUTPUT FILES__## | |
155 plotChoice=$outputFiles['plot'] | |
156 countFileChoice=$outputFiles['countFile'] | |
157 indexChoice=$outputFiles['index'] | |
158 | |
159 outputPdf=$outputPdf | |
160 outputCategoriesPng=$outputCategoriesPng | |
161 outputBiotypesPng=$outputBiotypesPng | |
162 outputCategoriesSvg=$outputCategoriesSvg | |
163 outputBiotypesSvg=$outputBiotypesSvg | |
164 outputCountFile=$outputCountFile | |
165 outputStrandedIndex=$outputStrandedIndex | |
166 outputUnstrandedIndex=$outputUnstrandedIndex | |
167 | |
168 ##__OUTPUT OPTIONS__## | |
169 categoriesDepth=$outputOptions['categoriesDepth'] | |
170 plotFormat=$outputOptions['plotFormat'] | |
171 plotThresholdChoice=$outputOptions.plotThreshold['plotThresholdChoice'] | |
172 #if str ( $outputOptions.plotThreshold['plotThresholdChoice'] ) == "True" | |
173 yMin=$outputOptions.plotThreshold.yMin | |
174 yMax=$outputOptions.plotThreshold.yMax | |
175 #else | |
176 yMin=None | |
177 yMax=None | |
178 #end if | |
179 </configfile> | |
180 </configfiles> | |
181 | 178 |
182 <tests> | 179 <tests> |
183 <test> | 180 <test> |
184 <param name="alfa_toy" /> | 181 <param name="alfa_toy" /> |
185 <section name="annotation"> | 182 <section name="annotation"> |
219 </assert_stdout> | 216 </assert_stdout> |
220 </test> | 217 </test> |
221 </tests> | 218 </tests> |
222 | 219 |
223 <help> | 220 <help> |
221 <![CDATA[ | |
222 **What it does** | |
223 | |
224 | |
225 | ALFA provides a global overview of features distribution composing New Generation Sequencing dataset(s). | |
226 | | |
227 | Given a set of aligned reads (BAM files) and an annotation file (GTF format), the tool produces plots of the raw and normalized distributions of those reads among genomic categories (stop codon, 5'-UTR, CDS, intergenic, etc.) and biotypes (protein coding genes, miRNA, tRNA, etc.). Whatever the sequencing technique, whatever the organism. | |
228 | |
229 ---- | |
230 | |
224 **ALFA acronym** | 231 **ALFA acronym** |
225 | 232 |
226 - Annotation.Landscape.For.Aligned reads | 233 - Annotation.Landscape.For.Aligned reads |
227 | 234 |
228 ---- | 235 ---- |
229 | 236 |
230 **What it does** | |
231 | |
232 | ALFA provides a global overview of features distribution composing New Generation Sequencing dataset(s). | |
233 | | |
234 | Given a set of aligned reads (BAM files) and an annotation file (GTF format), the tool produces plots of the raw and normalized distributions of those reads among genomic categories (stop codon, 5'-UTR, CDS, intergenic, etc.) and biotypes (protein coding genes, miRNA, tRNA, etc.). Whatever the sequencing technique, whatever the organism. | |
235 | |
236 ---- | |
237 | |
238 **Official documentation of the tool** | 237 **Official documentation of the tool** |
239 | 238 |
240 | 239 |
241 - https://github.com/biocompibens/ALFA | 240 - https://github.com/biocompibens/ALFA |
242 | 241 |
248 | 247 |
249 ---- | 248 ---- |
250 | 249 |
251 **Nota Bene** | 250 **Nota Bene** |
252 | 251 |
253 1. **Input 1: Annotation File** | 252 * **Input 1: Annotation File** |
254 | 253 |
255 | 254 |
256 | ALFA requires as first input an annotation file (sequence, genome...) in gtf format in order to generate indexes that will be used in a 2nd step of the program. | 255 | ALFA requires as first input an annotation file (sequence, genome...) in gtf format in order to generate alfa indexes needed in a second round of the program. |
257 | Indexes are files which list all the coordinates of all categories (stop codon, 5'-UTR, CDS, intergenic...) and biotypes (protein coding genes, miRNA, tRNA, ...) encountered in the annotated sequence. | 256 | Indexes are files which list all the coordinates of the categories (stop codon, 5'-UTR, CDS, intergenic...) and biotypes (protein coding genes, miRNA, tRNA, ...) encountered in the annotated sequence. |
257 | | |
258 | 258 |
259 .. class:: warningmark | 259 .. class:: warningmark |
260 | 260 |
261 Gtf File must be sorted. | 261 | Gtf File must be sorted. |
262 | 262 | |
263 .. class:: infomark | 263 |
264 | 264 .. class:: infomark |
265 Generation of indexes from an annotation file may be time consuming (i.e ~10min for the human genome). Thus, ALFA allows the user to submit directly indexes generated in previous runs. | 265 |
266 | 266 | Generation of indexes from an annotation file might be time consuming (i.e ~10min for the human genome). Thus, ALFA allows the user to submit directly indexes generated in previous runs. |
267 2. **Input 2: Reads** | 267 | |
268 | 268 |
269 | ALFA requires as second input a single or a set of mapped reads file(s) in either bam or bedgraph format. These files are required to intersect the coordinates of the mapped reads with the associated categories and biotypes on the annotated sequence. | 269 .. class:: infomark |
270 | |
271 | ALFA also allows to use built-in indexes to save even more computational time. In order to generate these built-in indexes, install the data manager tool 'data_manager_build_alfa_indexes' available on the toolshed. | |
272 | |
273 * **Input 2: Reads** | |
274 | |
275 | ALFA requires as second input a single or a set of mapped reads file(s) in either bam or bedgraph format. The coordinates of the mapped reads will be intersected with the according categories and biotypes mentioned in the indexes. | |
270 | The strandness option determines which strand of the annotated sequence will be taken into account during this intersection. | 276 | The strandness option determines which strand of the annotated sequence will be taken into account during this intersection. |
271 | 277 | |
272 .. class:: warningmark | 278 |
273 | 279 .. class:: warningmark |
274 Bam or Bedgraph file(s) must be sorted. | 280 |
275 | 281 | Bam or Bedgraph file(s) must be sorted. |
276 <!-- | 282 | |
277 .. class:: warningmark | 283 |
278 | 284 .. class:: warningmark |
279 For oriented reads (either matching the forward strand or the reverse strand), 'forward' or 'reverse' strandness must be selected. | 285 |
280 | 286 | Chromosome names in reads and in annotation file (gtf or indexes) must be the same for the intersection to occur |
281 .. class:: warningmark | 287 | |
282 | 288 |
283 For paired-end or non-oriented reads, 'unstranded' strandness must be selected. | 289 * **Output files** |
284 --> | |
285 | |
286 3. **Output files** | |
287 | 290 |
288 | The result of the intersection is a count file displaying the count of nucleotides in the reads for each genomic categories and biotypes. From this count file, plots of the raw and normalized distributions of the reads among these categories are generated. | 291 | The result of the intersection is a count file displaying the count of nucleotides in the reads for each genomic categories and biotypes. From this count file, plots of the raw and normalized distributions of the reads among these categories are generated. |
289 | In the output files section, the user can choose what kind of files he desires as ALFA output. Categories Count File and Plots are proposed by default. | 292 | In the output files section, the user can choose what kind of files he desires as ALFA output. Categories Count File and Plots are proposed by default. |
290 | 293 | |
291 .. class:: infomark | 294 |
292 | 295 .. class:: infomark |
293 The user can also select the 'indexes' option as output. This option is interesting if you plan to run ALFA again with the same submitted annotation file. *See Nota Bene/Input 1: Annotation File for more information.* | 296 |
294 | 297 | The user can also select the 'indexes' option as output. This option is interesting if you plan to run ALFA again with the same submitted annotation file. *See Nota Bene/Input 1: Annotation File for more information.* |
295 | 298 | |
296 - `How the plots look like`_ | 299 |
297 | 300 - `How the plots look like`_ |
298 .. _How the plots look like: https://github.com/biocompibens/ALFA#plots | 301 |
299 | 302 .. _How the plots look like: https://github.com/biocompibens/ALFA#plots |
300 - `How they are generated`_ | 303 |
301 | 304 | |
302 .. _How they are generated: https://github.com/biocompibens/ALFA#detailed-example | 305 |
306 - `How they are generated`_ | |
307 | |
308 .. _How they are generated: https://github.com/biocompibens/ALFA#detailed-example | |
303 | 309 |
304 ---- | 310 ---- |
305 | 311 |
306 **ALFA Developpers** | 312 **ALFA Developpers** |
307 | 313 |
308 | Benoît Noël and Mathieu Bahin: *compbio team, Institut de Biologie de l'Ecole Normale Supérieure de Paris* | 314 | Benoît Noël and Mathieu Bahin: *compbio team, Institut de Biologie de l'Ecole Normale Supérieure de Paris* |
309 | 315 |
310 | 316 ]]> |
311 </help> | 317 </help> |
312 | 318 |
313 <citations> | 319 <citations> |
314 <citation type="bibtex">@MISC{ | 320 <citation type="bibtex">@MISC{ |
315 author="Benoît Noël and Mathieu Bahin" | 321 author="Benoît Noël and Mathieu Bahin" |