comparison abims_xcms_group.xml @ 0:f3f97841564f draft

Uploaded
author lecorguille
date Fri, 07 Aug 2015 11:02:28 -0400
parents
children ed149026836e
comparison
equal deleted inserted replaced
-1:000000000000 0:f3f97841564f
1 <tool id="abims_xcms_group" name="xcms.group" version="2.0.2">
2
3 <description>Group peaks together across samples using overlapping m/z bins and calculation of smoothed peak distributions in chromatographic time.</description>
4
5 <requirements>
6 <requirement type="package" version="3.1.2">R</requirement>
7 <requirement type="binary">Rscript</requirement>
8 <requirement type="package" version="1.44.0">xcms</requirement>
9 <requirement type="package" version="2.1">xcms_w4m_script</requirement>
10 </requirements>
11
12 <stdio>
13 <exit_code range="1:" level="fatal" />
14 </stdio>
15
16 <command>
17 xcms.r
18 xfunction group image $image method $methods.method sleep 0.001
19 #if $methods.method == "density":
20 ## minsamp $methods.minsamp
21 minfrac $methods.minfrac
22 bw $methods.bw
23 mzwid $methods.mzwid
24 #if $methods.density_options.option == "show":
25 max $methods.density_options.max
26 #end if
27 #elif $methods.method == "mzClust":
28 mzppm $methods.mzppm
29 mzabs $methods.mzabs
30 minfrac $methods.minfrac
31 ## minsamp $methods.minsamp
32 #else:
33 mzVsRTbalance $methods.mzVsRTbalance
34 mzCheck $methods.mzCheck
35 rtCheck $methods.rtCheck
36 kNN $methods.kNN
37 #end if
38 &amp;&amp; (
39 mv group.RData $xsetRData;
40 mv Rplots.pdf $rplotsPdf
41 );
42 cat xset.log
43 </command>
44
45 <inputs>
46 <param name="image" type="data" format="rdata.xcms.raw,rdata.xcms.group,rdata.xcms.retcor,rdata" label="xset RData file" help="output file from another function xcms (xcmsSet, retcor etc.)" />
47 <conditional name="methods">
48 <param name="method" type="select" label="Method to use for grouping" help="[method] See the help section below">
49 <option value="density" selected="true">density</option>
50 <option value="mzClust" >mzClust</option>
51 <option value="nearest" >nearest</option>
52 </param>
53 <when value="density">
54 <param name="bw" type="integer" value="30" label="Bandwidth" help="[bw] bandwidth (standard deviation or half width at half maximum) of gaussian smoothing kernel to apply to the peak density chromatogram" />
55 <param name="minfrac" type="float" value="0.5" label="Minimum fraction of samples necessary" help="[minfrac] in at least one of the sample groups for it to be a valid group" />
56 <param name="mzwid" type="float" value="0.25" label="Width of overlapping m/z slices" help="[mzwid] to use for creating peak density chromatograms and grouping peaks across samples " />
57 <!--
58 <param name="minsamp" type="hidden" value="1" label="minsamp" help="minimum number of samples necessary in at least one of the sample groups for it to be a valid group " />
59 -->
60 <conditional name="density_options">
61 <param name="option" type="select" label="Advanced options">
62 <option value="show">show</option>
63 <option value="hide" selected="true">hide</option>
64 </param>
65 <when value="show">
66 <param name="max" type="integer" value="5" label="Maximum number of groups to identify in a single m/z slice" help="[max]" />
67 </when>
68 <when value="hide">
69 </when>
70 </conditional>
71
72 </when>
73 <when value="mzClust">
74 <param name="mzppm" type="integer" value="20 " label="Relative error used for clustering/grouping in ppm" help="[mzppm]" />
75 <param name="mzabs" type="float" value="0" label="Absolute error used for clustering/grouping" help="[mzabs]" />
76 <param name="minfrac" type="float" value="0" label="Minimum fraction of each class in one bin" help="[minfrac] minimum fraction of samples necessary in at least one of the sample groups for it to be a valid group" />
77 <!--
78 <param name="minsamp" type="hidden" value="1" label="minsamp" help="minimum number of samples necessary in at least one of the sample groups for it to be a valid group " />
79 -->
80 </when>
81 <when value="nearest">
82 <param name="mzVsRTbalance" type="integer" value="10 " label="Multiplicator for mz value before calculating the (euclidean) distance between two peaks." help="[mzVsRTbalance]" />
83 <param name="mzCheck" type="float" value="0.2" label="Maximum tolerated distance for mz" help="[mzCheck]" />
84 <param name="rtCheck" type="integer" value="15" label="Maximum tolerated distance for RT" help="[rtCheck]" />
85 <param name="kNN" type="integer" value="10" label="Number of nearest Neighbours to check" help="[kNN]" />
86 </when>
87 </conditional>
88 <!--
89 <param name="sleepy" type="float" value="0.001" label="sleep" help="seconds to pause between plotting successive steps of the peak grouping algorithm. peaks are plotted as points showing relative intensity. identified groups are flanked by dotted vertical lines">
90 <validator type="in_range" message="Must be more than 0" min="0.001" max="inf"/>
91 </param>
92 -->
93
94 </inputs>
95
96 <outputs>
97 <data name="xsetRData" format="rdata.xcms.group" label="${image.name[:-6]}.group.RData"/>
98 <data name="rplotsPdf" format="pdf" label="${image.name[:-6]}.group.Rplots.pdf"/>
99 </outputs>
100
101 <tests>
102 <test>
103 <param name="image" value="xset.RData"/>
104 <param name="methods.method" value="density"/>
105 <param name="methods.bw" value="5"/>
106 <param name="methods.minfrac" value="0.3"/>
107 <param name="methods.mzwid" value="0.01"/>
108 <param name="methods.density_options.option" value="show"/>
109 <param name="methods.density_options.max" value="50"/>
110 <output name="xsetRData" file="xset.group.RData" />
111 <output name="rplotsPdf" file="xset.group.Rplots.pdf" />
112
113 </test>
114 </tests>
115
116 <help>
117
118 .. class:: infomark
119
120 **Authors** Colin A. Smith csmith@scripps.edu, Ralf Tautenhahn rtautenh@gmail.com, Steffen Neumann sneumann@ipb-halle.de, Paul Benton hpaul.benton08@imperial.ac.uk and Christopher Conley cjconley@ucdavis.edu
121
122 **Galaxy integration** ABiMS TEAM - UPMC/CNRS - Station biologique de Roscoff and Yann Guitton yann.guitton@univ-nantes.fr - part of Workflow4Metabolomics.org [W4M]
123
124 | Contact support@workflow4metabolomics.org for any questions or concerns about the Galaxy implementation of this tool.
125
126
127
128 ---------------------------------------------------
129
130 ==========
131 Xcms.Group
132 ==========
133
134 -----------
135 Description
136 -----------
137
138 After peak identification with xcmsSet, this tool groups the peaks which represent the same analyte across samples using overlapping m/z bins and calculation of smoothed peak distributions in chromatographic time. Allows rejection of features, which are only partially detected within the replicates of a sample class.
139
140
141
142 -----------------
143 Workflow position
144 -----------------
145
146 **Upstream tools**
147
148 ========================= ================= =================== ==========
149 Name output file format parameter
150 ========================= ================= =================== ==========
151 xcms.xcmsSet xset.RData rdata.xcms.raw RData file
152 ------------------------- ----------------- ------------------- ----------
153 xcms.retcor xset.RData rdata.xcms.retcor RData file
154 ========================= ================= =================== ==========
155
156
157 **Downstream tools**
158
159 +---------------------------+--------------------------------------+
160 | Name | Output file | Format |
161 +===========================+=================+====================+
162 |xcms.retcor | xset.RData | rdata.xcms.group |
163 +---------------------------+--------------------------------------+
164 |xcms.fillPeaks | xset.RData | rdata.xcms.group |
165 +---------------------------+--------------------------------------+
166
167 The output file is an xcmsSet.RData file. You can continue your analysis using it in **xcms.retcor** tool as an next step and then **xcms.fillPeaks**.
168
169 **General schema of the metabolomic workflow**
170
171 .. image:: xcms_group_workflow.png
172
173
174 -----------
175 Input files
176 -----------
177
178 +---------------------------+-----------------------+
179 | Parameter : num + label | Format |
180 +===========================+=======================+
181 | 1 : RData file | rdata.xcms.group |
182 +---------------------------+-----------------------+
183
184
185 ----------
186 Parameters
187 ----------
188
189 Method to use for grouping
190 --------------------------
191
192 **mzClust**
193
194 | Runs high resolution alignment on single spectra samples stored in the RData file generated by the **xcmsSet tool**.
195
196 **density**
197
198 | Groups peaks together across samples using overlapping m/z bins and calculation of smoothed peak distributions in chromatographic time.
199
200 **nearest**
201
202 | Groups peaks together across samples by creating a master peak list and assigning corresponding peaks from all samples. It is inspired by the alignment algorithm of mzMine.
203
204
205 ------------
206 Output files
207 ------------
208
209 xset.group.Rplots.pdf
210
211 xset.group.RData: rdata.xcms.group format
212
213 | Rdata file that will be necessary in the third and fourth step of the workflow (xcms.retcor and xcms.fillpeaks).
214
215
216 ------
217
218 .. class:: infomark
219
220 The output file is an xset.group.RData file. You can continue your analysis using it in **xcms.retcor** tool.
221
222
223 ---------------------------------------------------
224
225
226 ---------------
227 Working example
228 ---------------
229
230 Input files
231 -----------
232
233 | RData file -> **xset.RData**
234
235 Parameters
236 ----------
237
238 | Method -> **density**
239 | bw -> **5**
240 | minfrac -> **0.3**
241 | mzwid -> **0.01**
242 | Advanced options: **show**
243 | max -> **50**
244
245
246 Output files
247 ------------
248
249 | **1) xset.RData: RData file**
250
251 | **2) Example of an xset.group.Rplots pdf file**
252
253 .. image:: xcms_group.png
254 :width: 700
255
256
257 </help>
258
259
260 <citations>
261 <citation type="doi">10.1021/ac051437y</citation>
262 <citation type="doi">10.1093/bioinformatics/btu813</citation>
263 </citations>
264
265
266 </tool>