annotate prepare.xml @ 0:e01de823e919 draft default tip

Uploaded
author biotechcoder
date Fri, 01 May 2015 05:41:51 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
1 <tool id="riboseqr_prepare_input" name="Prepare riboSeqR input" version="0.4.0">
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
2 <description>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
3 (Step 1) Prepare alignment file (SAM format, Ribo-Seq or RNA-Seq alignments)
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
4 for riboSeqR analysis.
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
5 </description>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
6 <requirements>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
7 <requirement type="R-module">riboSeqR</requirement>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
8 </requirements>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
9 <command interpreter="python">riboseqr/prepare.py
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
10 #set $files_ribo = []
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
11 #set $files_rna = []
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
12 #set $replicates = []
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
13
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
14 #for $i, $s in enumerate($rnaseq.datasets)
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
15 #silent $replicates.append($s.replicate_name.value)
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
16 #silent $files_ribo.append($s.ribo_files.file_name)
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
17 #try:
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
18 #silent $s.rna_files
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
19 #except:
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
20 #pass
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
21 #else:
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
22 #silent $files_rna.append($s.rna_files.file_name)
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
23 #end try
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
24 #end for
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
25
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
26 #set $ribofiles = ", ".join($files_ribo)
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
27 #set $rnafiles = ", ".join($files_rna)
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
28 #set $replicate_names = ", ".join($replicates)
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
29
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
30 --ribo_files "$ribofiles"
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
31 --rna_files "$rnafiles"
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
32 --replicate_names "$replicate_names"
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
33 --seqnames "$seqnames"
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
34 --rdata_save "$rdata_save"
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
35 --sam_format
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
36 --html_file "$html_file"
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
37 --output_path "$html_file.files_path"
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
38 </command>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
39 <inputs>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
40 <conditional name="rnaseq">
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
41 <param name="have-rnaseq" type="boolean" truevalue="checked"
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
42 falsevalue="unchecked" label="Have RNA-Seq data?"/>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
43 <when value="checked">
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
44 <repeat name="datasets" title="Ribo and RNA-Seq alignment"
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
45 default="1">
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
46 <param type="text" name="replicate_name" size="20"
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
47 label="Provide a common name for each replicate group"
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
48 value=""/>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
49 <param format="sam" name="ribo_files" type="data"
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
50 label="Ribo-Seq alignment file (SAM)"
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
51 multiple="false"/>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
52 <param format="sam" name="rna_files" type="data"
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
53 label="RNA-Seq alignment file (SAM)"
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
54 multiple="false"/>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
55 </repeat>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
56 </when>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
57 <when value="unchecked">
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
58 <repeat name="datasets" title="Ribo-Seq alignment" default="1">
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
59 <param type="text" name="replicate_name" size="20"
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
60 label="Provide a common name for each replicate group"
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
61 value=""/>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
62 <param format="sam" name="ribo_files" type="data"
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
63 label="Ribo-Seq alignment file (SAM)"
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
64 multiple="false">
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
65 </param>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
66 </repeat>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
67 </when>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
68 </conditional>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
69 <param name="seqnames" type="text" area="True" label="Transcript (seqname)
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
70 names to be read" size="3x60"
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
71 help="[Optional] - only the mapped footprints for these transcripts will be
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
72 used in further riboSeqR analysis. Multiple transcript names should
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
73 be separated by commas. There should be no quotes around transcript names.">
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
74 <sanitizer>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
75 <valid>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
76 <add value="|"/>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
77 </valid>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
78 </sanitizer>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
79 </param>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
80 </inputs>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
81 <outputs>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
82 <data format="rda" name="rdata_save"
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
83 label="Prepare riboSeqR input (R data file)"/>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
84 <data format="html" name="html_file"
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
85 label="Prepare riboSeqR input (HTML report)"/>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
86 </outputs>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
87 <tests>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
88 <test>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
89 <param name="ribo_files" value="12hRPF.sam" />
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
90 <output name="html_file" file="Prepare_riboSeqR_input_(HTML_report).html">
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
91 <extra_files type="file" name="RiboSeq file 1" value="RiboSeq file 1"/>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
92 </output>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
93 </test>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
94 </tests>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
95 <help>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
96 About
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
97 -----
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
98 This tool can be used to prepare input data for riboSeqR from SAM
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
99 format alignments of Ribo-Seq or RNA-Seq data to a reference transcriptome. You can
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
100 do this alignment manually using bowtie or the
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
101 "Transcriptome Mapping" -> "Align to transcriptome using Bowtie"
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
102 tool on RiboGalaxy_.
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
103
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
104 The required input format for riboSeqR_ is described in the
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
105 **"Getting Data"** section of the documentation_.
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
106
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
107 riboSeqR version: **1.0.4**.
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
108
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
109 How to use?
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
110 -----------
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
111 Inputs
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
112 ......
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
113 Select SAM format Ribo-Seq alignment files in the input section.
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
114
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
115 If you have RNA-Seq data, these can be included if the **"Have RNA-Seq data?"**
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
116 option is checked.
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
117
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
118 Outputs
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
119 .......
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
120 The following files will be generated on completion:
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
121
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
122 #. Prepare riboSeqR input (HTML report) - An HTML file with links to all other
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
123 output files.
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
124
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
125 * Generated riboSeqR format input files of Ribo-Seq and RNA-Seq data (if provided).
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
126 These files are plain text and lines have the following information -
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
127 strand, transcript name, alignment position, sequence.
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
128
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
129 Please note that alignment positions are converted to be **0-indexed**.
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
130
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
131 * R script used in this session.
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
132
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
133 #. Prepare riboSeqR input (R data file) - used as input for the next step -
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
134 *Triplet Periodicity*.
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
135
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
136 How are the SAM alignments processed?
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
137 .....................................
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
138 #. Lines starting with ``@`` are ignored.
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
139 #. Lines with ``FLAG=0`` are treated as successful alignments. These are
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
140 considered for the next step.
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
141 #. Alignment start positions are read from ``column 4``. These are decremented by
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
142 1 as SAM alignments are 1-indexed.
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
143 #. riboSeqR input file is written with the strand (``+``), transcript name,
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
144 alignment start and the aligned sequence.
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
145
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
146 riboSeqR functions used
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
147 .......................
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
148 readRibodata.
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
149
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
150 For a detailed description of the functions and the options used, please consult
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
151 the riboSeqR documentation.
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
152
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
153 Links
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
154 .....
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
155 * `Bioconductor package information on riboSeqR`__
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
156 * riboSeqR - `Reference manual`_
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
157 * riboSeqR - `Introduction and workflow example`_
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
158
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
159 .. _RiboGalaxy: http://ribogalaxy.ucc.ie
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
160
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
161 .. _riboSeqR: http://bioconductor.org/packages/3.0/bioc/html/riboSeqR.html
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
162
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
163 __ riboSeqR_
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
164
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
165 .. _manual: http://bioconductor.org/packages/3.0/bioc/manuals/riboSeqR/man/riboSeqR.pdf
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
166
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
167 .. _`Reference manual`: manual_
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
168
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
169 .. _documentation: http://bioconductor.org/packages/3.0/bioc/vignettes/riboSeqR/inst/doc/riboSeqR.pdf
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
170
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
171 .. _`Introduction and workflow example`: documentation_
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
172
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
173 </help>
e01de823e919 Uploaded
biotechcoder
parents:
diff changeset
174 </tool>