comparison cuffnorm_wrapper.xml @ 0:a26af05ac218 draft

Uploaded
author devteam
date Fri, 19 Dec 2014 12:00:45 -0500
parents
children 7d4c2097aac5
comparison
equal deleted inserted replaced
-1:000000000000 0:a26af05ac218
1 <tool id="cuffnorm" name="Cuffnorm" version="@VERSION@.0">
2 <description>Create normalized expression levels</description>
3 <expand macro="requirements" />
4 <expand macro="stdio" />
5 <macros>
6 <import>cuff_macros.xml</import>
7 </macros>
8 <version_command>cuffnorm 2>&amp;1 | head -n 1</version_command>
9 <command>
10 cuffnorm
11 --no-update-check
12 --num-threads="\${GALAXY_SLOTS:-4}"
13 --library-norm-method=$library_norm_method
14 --output-format=$output_format
15
16 @CONDITION_LABELS@
17
18 ## Set advanced parameters for cuffnorm
19 #if $advanced_settings.sAdvanced == "Yes":
20 #if str($advanced_settings.library_type) != 'auto':
21 --library-type=$advanced_settings.library_type
22 #end if
23 $advanced_settings.hits_norm
24 #end if
25 ## Inputs.
26 $gtf_input
27
28 @CONDITION_SAMPLES@
29 </command>
30 <inputs>
31 <param format="gtf,gff3" name="gtf_input" type="data" label="Transcripts" help="A transcript GFF3 or GTF file produced by cufflinks, cuffcompare, or other source."/>
32 <expand macro="condition_inputs" />
33 <param name="library_norm_method" type="select" label="Library normalization method">
34 <option value="geometric" selected="True">geometric</option>
35 <option value="classic-fpkm">classic-fpkm</option>
36 <option value="quartile">quartile</option>
37 </param>
38 <!-- Not placed on the command line; only read by the output filters to decide whether read group / attribute datasets are kept. -->
39 <param name="include_read_group_files" type="select" label="Include Read_Group/Attribute Datasets"
40 help="Read group/attribute datasets provide information on replicates. Only one of the two kinds is provided, depending on the output format.">
41 <option value="No" selected="true">No</option>
42 <option value="Yes">Yes</option>
43 </param>
44 <!-- Passed to cuffnorm as the output-format option and read by the output filters to select which set of datasets is kept. -->
45 <param name="output_format" type="select" label="Output format"
46 help="By default, Cuffnorm reports expression levels in the 'simple-table' tab-delimited text files. The program also reports information about your samples and about the genes, transcripts, TSS groups, and CDS groups as tab delimited text files. Note that these files have a different format than the files used by Cuffdiff. However, you can direct Cuffnorm to report its output in the same format as used by Cuffdiff if you wish" >
47 <option value="simple-table" selected="True">Simple Table</option>
48 <option value="cuffdiff">Cuffdiff format</option>
49 </param>
50 <!-- The parameters in the "Yes" branch are only added to the command line when sAdvanced is "Yes". -->
51 <conditional name="advanced_settings">
52 <param name="sAdvanced" type="select" label="Set Advanced Cuffnorm parameters? ">
53 <option value="No" selected="True">No</option>
54 <option value="Yes">Yes</option>
55 </param>
56 <when value="No"></when>
57 <when value="Yes">
58 <param type="select" name="library_type" label="Library prep used for input reads" help="">
59 <option value="auto" selected="True">Auto Detect</option>
60 <option value="ff-firststrand">ff-firststrand</option>
61 <option value="ff-secondstrand">ff-secondstrand</option>
62 <option value="ff-unstranded">ff-unstranded</option>
63 <option value="fr-firststrand">fr-firststrand</option>
64 <option value="fr-secondstrand">fr-secondstrand</option>
65 <option value="fr-unstranded" >fr-unstranded</option>
66 <option value="transfrags">transfrags</option>
67 </param>
68 <param name="hits_norm" type="select" label="Hits included in normalization" help="All Hits: With this option, Cufflinks counts all fragments, including those not compatible with any reference transcript, towards the number of mapped fragments used in the FPKM denominator. Compatible Hits: With this option, Cufflinks counts only those fragments compatible with some reference transcript towards the number of mapped fragments used in the FPKM denominator. Using this mode is generally recommended in Cuffdiff to reduce certain types of bias caused by differential amounts of ribosomal reads which can create the impression of falsely differentially expressed genes. It is active by default." >
69 <option value="--compatible-hits-norm" selected="True">Compatible Hits</option>
70 <option value="--total-hits-norm">All Hits</option>
71 </param>
72 </when>
73 </conditional>
74 </inputs>
75
76 <outputs>
77 <!-- Optional read group / attr datasets. -->
78 <!-- cuffdiff format: each dataset is kept only when include_read_group_files is 'Yes' and output_format is 'cuffdiff'. -->
79 <data format="tabular" name="isoforms_read_group" label="${tool.name} on ${on_string}: isoforms read group tracking" from_work_dir="isoforms.read_group_tracking" >
80 <filter>(include_read_group_files == 'Yes')</filter>
81 <filter>(output_format == 'cuffdiff')</filter>
82 </data>
83 <data format="tabular" name="genes_read_group" label="${tool.name} on ${on_string}: genes read group tracking" from_work_dir="genes.read_group_tracking" >
84 <filter>(include_read_group_files == 'Yes')</filter>
85 <filter>(output_format == 'cuffdiff')</filter>
86 </data>
87 <data format="tabular" name="cds_read_group" label="${tool.name} on ${on_string}: CDs read group tracking" from_work_dir="cds.read_group_tracking" >
88 <filter>(include_read_group_files == 'Yes')</filter>
89 <filter>(output_format == 'cuffdiff')</filter>
90 </data>
91 <data format="tabular" name="tss_groups_read_group" label="${tool.name} on ${on_string}: TSS groups read group tracking" from_work_dir="tss_groups.read_group_tracking" >
92 <filter>(include_read_group_files == 'Yes')</filter>
93 <filter>(output_format == 'cuffdiff')</filter>
94 </data>
95 <data format="txt" name="read_groups_info" label="${tool.name} on ${on_string}: Read Groups" from_work_dir="read_groups.info" >
96 <filter>(include_read_group_files == 'Yes')</filter>
97 <filter>(output_format == 'cuffdiff')</filter>
98 </data>
99 <!-- simple-table format: attribute tables, kept only when include_read_group_files is 'Yes' and output_format is 'simple-table'. Output names must be unique within the tool, so these use the *_attr suffix. -->
100 <data format="tabular" name="isoforms_attr" label="${tool.name} on ${on_string}: isoforms attribute table" from_work_dir="isoforms.attr_table" >
101 <filter>(include_read_group_files == 'Yes')</filter>
102 <filter>(output_format == 'simple-table')</filter>
103 </data>
104 <data format="tabular" name="genes_attr" label="${tool.name} on ${on_string}: genes attribute table" from_work_dir="genes.attr_table" >
105 <filter>(include_read_group_files == 'Yes')</filter>
106 <filter>(output_format == 'simple-table')</filter>
107 </data>
108 <data format="tabular" name="cds_attr" label="${tool.name} on ${on_string}: CDS attribute table" from_work_dir="cds.attr_table" >
109 <filter>(include_read_group_files == 'Yes')</filter>
110 <filter>(output_format == 'simple-table')</filter>
111 </data>
112 <data format="tabular" name="tss_groups_attr" label="${tool.name} on ${on_string}: TSS groups attribute table" from_work_dir="tss_groups.attr_table" >
113 <filter>(include_read_group_files == 'Yes')</filter>
114 <filter>(output_format == 'simple-table')</filter>
115 </data>
116
117 <!-- Cuffdiff format datasets: FPKM and count tracking files for CDS, TSS groups, genes, and isoforms. Each is kept only when output_format is 'cuffdiff'. -->
118 <data format="tabular" name="cds_fpkm_tracking" label="${tool.name} on ${on_string}: CDS FPKM tracking" from_work_dir="cds.fpkm_tracking" >
119 <filter>(output_format == 'cuffdiff')</filter>
120 </data>
121 <data format="tabular" name="cds_count_tracking" label="${tool.name} on ${on_string}: CDS count tracking" from_work_dir="cds.count_tracking" >
122 <filter>(output_format == 'cuffdiff')</filter>
123 </data>
124 <data format="tabular" name="tss_groups_fpkm_tracking" label="${tool.name} on ${on_string}: TSS groups FPKM tracking" from_work_dir="tss_groups.fpkm_tracking" >
125 <filter>(output_format == 'cuffdiff')</filter>
126 </data>
127 <data format="tabular" name="tss_groups_count_tracking" label="${tool.name} on ${on_string}: TSS groups count tracking" from_work_dir="tss_groups.count_tracking" >
128 <filter>(output_format == 'cuffdiff')</filter>
129 </data>
130 <data format="tabular" name="genes_fpkm_tracking" label="${tool.name} on ${on_string}: gene FPKM tracking" from_work_dir="genes.fpkm_tracking" >
131 <filter>(output_format == 'cuffdiff')</filter>
132 </data>
133 <data format="tabular" name="genes_count_tracking" label="${tool.name} on ${on_string}: gene count tracking" from_work_dir="genes.count_tracking" >
134 <filter>(output_format == 'cuffdiff')</filter>
135 </data>
136 <data format="tabular" name="isoforms_fpkm_tracking" label="${tool.name} on ${on_string}: transcript FPKM tracking" from_work_dir="isoforms.fpkm_tracking" >
137 <filter>(output_format == 'cuffdiff')</filter>
138 </data>
139 <data format="tabular" name="isoforms_count_tracking" label="${tool.name} on ${on_string}: transcript count tracking" from_work_dir="isoforms.count_tracking" >
140 <filter>(output_format == 'cuffdiff')</filter>
141 </data>
142 <!-- Simple-table format datasets: FPKM and count tables for CDS, TSS groups, genes, and isoforms. Each is kept only when output_format is 'simple-table'. -->
143 <data format="tabular" name="cds_fpkm_table" label="${tool.name} on ${on_string}: CDS FPKM table" from_work_dir="cds.fpkm_table" >
144 <filter>(output_format == 'simple-table')</filter>
145 </data>
146 <data format="tabular" name="cds_count_table" label="${tool.name} on ${on_string}: CDS count table" from_work_dir="cds.count_table" >
147 <filter>(output_format == 'simple-table')</filter>
148 </data>
149 <data format="tabular" name="tss_groups_fpkm_table" label="${tool.name} on ${on_string}: TSS groups FPKM table" from_work_dir="tss_groups.fpkm_table" >
150 <filter>(output_format == 'simple-table')</filter>
151 </data>
152 <data format="tabular" name="tss_groups_count_table" label="${tool.name} on ${on_string}: TSS groups count table" from_work_dir="tss_groups.count_table" >
153 <filter>(output_format == 'simple-table')</filter>
154 </data>
155 <data format="tabular" name="genes_fpkm_table" label="${tool.name} on ${on_string}: gene FPKM table" from_work_dir="genes.fpkm_table" >
156 <filter>(output_format == 'simple-table')</filter>
157 </data>
158 <data format="tabular" name="genes_count_table" label="${tool.name} on ${on_string}: gene count table" from_work_dir="genes.count_table" >
159 <filter>(output_format == 'simple-table')</filter>
160 </data>
161 <data format="tabular" name="isoforms_fpkm_table" label="${tool.name} on ${on_string}: transcript FPKM table" from_work_dir="isoforms.fpkm_table" >
162 <filter>(output_format == 'simple-table')</filter>
163 </data>
164 <data format="tabular" name="isoforms_count_table" label="${tool.name} on ${on_string}: transcript count table" from_work_dir="isoforms.count_table" >
165 <filter>(output_format == 'simple-table')</filter>
166 </data>
167 </outputs>
168 <tests>
169 <test>
170 <!--
171 NOTE: this test element is an empty placeholder. As of version 0.0.6 of the wrapper, tests cannot be
172 run because multiple inputs to a repeat element are not supported.
173 -->
174 </test>
175 </tests>
176
177 <help>
178 **Cuffnorm Overview**
179
180 Cuffnorm is part of Cufflinks_. Running Cuffnorm is very similar to running Cuffdiff. Cuffnorm takes a GTF2/GFF3 file of transcripts as input, along with two or more SAM, BAM, or CXB files for two or more samples. It produces a number of output files that contain expression levels and normalized fragment counts at the level of transcripts, primary transcripts, and genes. It also tracks changes in the relative abundance of transcripts sharing a common transcription start site, and in the relative abundances of the primary transcripts of each gene. Tracking the former allows one to see changes in splicing, and the latter lets one see changes in relative promoter use within a gene. Please cite: Trapnell C, Williams BA, Pertea G, Mortazavi AM, Kwan G, van Baren MJ, Salzberg SL, Wold B, Pachter L. Transcript assembly and abundance estimation from RNA-Seq reveals thousands of new transcripts and switching among isoforms. Nature Biotechnology doi:10.1038/nbt.1621
181
182 .. _Cufflinks: http://cole-trapnell-lab.github.io/cufflinks/
183
184 ------
185
186 **Know what you are doing**
187
188 .. class:: warningmark
189
190 There is no such thing (yet) as an automated gearshift in expression analysis. It is all like stick-shift driving in San Francisco. In other words, running this tool with default parameters will probably not give you meaningful results. A way to deal with this is to **understand** the parameters by carefully reading the `documentation`__ and experimenting. Fortunately, Galaxy makes experimenting easy.
191
192 .. __: http://cole-trapnell-lab.github.io/cufflinks/cuffnorm/
193
194 ------
195
196 **Input format**
197
198 Cuffnorm takes a GTF or GFF3 file of transcripts (produced by Cufflinks, Cuffcompare, or another source) as input, along with two or more SAM, BAM, or CXB files containing the fragment alignments for two or more samples.
199
200 ------
201
202 **Outputs**
203
204 Cuffnorm outputs a set of files containing normalized expression levels for each gene, transcript, TSS group, and CDS group in the experiment. It does not perform differential expression analysis. To assess the significance of changes in expression for genes and transcripts between conditions, use Cuffdiff. Cuffnorm's output files are useful when you have many samples and you simply want to cluster them or plot expression levels of genes important in your study.
205 By default, Cuffnorm reports expression levels in the "simple-table" tab-delimited text files. The program also reports information about your samples and about the genes, transcripts, TSS groups, and CDS groups as tab delimited text files. Note that these files have a different format than the files used by Cuffdiff. However, you can direct Cuffnorm to report its output in the same format as used by Cuffdiff if you wish. Simply supply the option --output-format cuffdiff at the command line.
206 Cuffnorm will report both FPKM values and normalized estimates for the number of fragments that originate from each gene, transcript, TSS group, and CDS group. Note that because these counts are already normalized to account for differences in library size, they should not be used with downstream differential expression tools that require raw counts as input.
207 To see the details of the simple table format used by Cuffnorm, refer to the simple table expression format, simple table sample attribute format, and simple table feature (e.g. gene) attribute format sections below.
208
209 -------
210
211 **Settings**
212
213 All of the options have a default value. You can change any of them. Most of the options in Cuffnorm have been implemented here.
214
215 ------
216
217 **Cuffnorm parameter list**
218
219 This is a list of implemented Cuffnorm options::
220
221 --library-norm-method Library Normalization method : Geometric (default), classic-fpkm, quartile
222 --library-type ff-firststrand,ff-secondstrand,ff-unstranded,fr-firststrand,fr-secondstrand,fr-unstranded,transfrags
223 --compatible-hits-norm With this option, Cufflinks counts only those fragments compatible with some reference transcript towards the number of mapped fragments used in the FPKM denominator. Using this mode is generally recommended in Cuffdiff to reduce certain types of bias caused by differential amounts of ribosomal reads which can create the impression of falsely differentially expressed genes.
224 --total-hits-norm With this option, Cufflinks counts all fragments, including those not compatible with any reference transcript, towards the number of mapped fragments used in the FPKM denominator
225 </help>
226 <citations>
227 <citation type="doi">10.1038/nbt.1621</citation>
228 </citations>
229 </tool>