Mercurial > repos > lecorguille > xcms_group
comparison abims_xcms_group.xml @ 14:833d2c821d9c draft
planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 9f72e947d9c241d11221cad561f3525d27231857
author | lecorguille |
---|---|
date | Tue, 18 Sep 2018 16:11:06 -0400 |
parents | 13558e8a4778 |
children | 95e689b7f27f |
comparison
equal
deleted
inserted
replaced
13:13558e8a4778 | 14:833d2c821d9c |
---|---|
1 <tool id="abims_xcms_group" name="xcms.group" version="2.1.1"> | 1 <tool id="abims_xcms_group" name="xcms groupChromPeaks (group)" version="@WRAPPER_VERSION@.0"> |
2 | 2 |
3 <description>Group peaks together across samples using overlapping m/z bins and calculation of smoothed peak distributions in chromatographic time.</description> | 3 <description>Perform the correspondence, the grouping of chromatographic peaks within and between samples.</description> |
4 | 4 |
5 <macros> | 5 <macros> |
6 <import>macros.xml</import> | 6 <import>macros.xml</import> |
7 <import>macros_xcms.xml</import> | |
7 </macros> | 8 </macros> |
8 | 9 |
9 <expand macro="requirements"/> | 10 <expand macro="requirements"/> |
10 <expand macro="stdio"/> | 11 <expand macro="stdio"/> |
11 | 12 |
12 <command><![CDATA[ | 13 <command><![CDATA[ |
13 @COMMAND_XCMS_SCRIPT@ | 14 @COMMAND_RSCRIPT@/xcms_group.r |
14 xfunction group | |
15 image '$image' | 15 image '$image' |
16 | 16 |
17 xsetRdataOutput '$xsetRData' | |
18 rplotspdf '$rplotsPdf' | |
19 | |
20 method $methods.method | 17 method $methods.method |
21 #if $methods.method == "density": | 18 #if $methods.method == "PeakDensity": |
22 ## minsamp $methods.minsamp | |
23 minfrac $methods.minfrac | |
24 bw $methods.bw | 19 bw $methods.bw |
25 mzwid $methods.mzwid | 20 minFraction $methods.minFraction |
26 sleep 0.001 | 21 minSamples $methods.minSamples |
27 #if $methods.density_options.option == "show": | 22 binSize $methods.binSize |
28 max $methods.density_options.max | 23 ## Advanced |
29 #end if | 24 maxFeatures $methods.PeakDensityAdv.maxFeatures |
30 #elif $methods.method == "mzClust": | 25 #elif $methods.method == "MzClust": |
31 mzppm $methods.mzppm | 26 ppm $methods.ppm |
32 mzabs $methods.mzabs | 27 absMz $methods.absMz |
33 minfrac $methods.minfrac | 28 minFraction $methods.minFraction |
34 ## minsamp $methods.minsamp | 29 minSamples $methods.minSamples |
35 #else: | 30 #else: |
36 mzVsRTbalance $methods.mzVsRTbalance | 31 mzVsRtBalance $methods.mzVsRtBalance |
37 mzCheck $methods.mzCheck | 32 absMz $methods.absMz |
38 rtCheck $methods.rtCheck | 33 absRt $methods.absRt |
39 kNN $methods.kNN | 34 kNN $methods.kNN |
40 #end if | 35 #end if |
41 | 36 |
42 @COMMAND_PEAKLIST@ | 37 @COMMAND_PEAKLIST@ |
43 | 38 |
39 @COMMAND_FILE_LOAD@ | |
40 | |
44 @COMMAND_LOG_EXIT@ | 41 @COMMAND_LOG_EXIT@ |
45 ]]></command> | 42 ]]></command> |
46 | 43 |
47 <inputs> | 44 <inputs> |
48 <param name="image" type="data" format="rdata.xcms.raw,rdata.xcms.group,rdata.xcms.retcor,rdata" label="xset RData file" help="output file from another function xcms (xcmsSet, retcor etc.)" /> | 45 <param name="image" type="data" format="rdata.xcms.findchrompeaks,rdata.xcms.group,rdata.xcms.retcor,rdata" label="@INPUT_IMAGE_LABEL@" help="@INPUT_IMAGE_HELP@ from: findChromPeaks, groupChromPeaks or adjustRtime" /> |
49 <conditional name="methods"> | 46 <conditional name="methods"> |
50 <param name="method" type="select" label="Method to use for grouping" help="[method] See the help section below"> | 47 <param name="method" type="select" label="Method to use for grouping" help="See the help section below"> |
51 <option value="density" selected="true">density</option> | 48 <option value="PeakDensity" selected="true">PeakDensity - peak grouping based on time dimension peak densities</option> |
52 <option value="mzClust" >mzClust</option> | 49 <option value="MzClust">MzClust - high resolution peak grouping for single spectra (direct infusion) MS data</option> |
53 <option value="nearest" >nearest</option> | 50 <option value="NearestPeaks">NearestPeaks - chromatographic peak grouping based on their proximity in the mz-rt space</option> |
54 </param> | 51 </param> |
55 <when value="density"> | 52 <when value="PeakDensity"> |
56 <param name="bw" type="float" value="30" label="Bandwidth" help="[bw] bandwidth (standard deviation or half width at half maximum) of gaussian smoothing kernel to apply to the peak density chromatogram" /> | 53 <param argument="bw" type="float" value="30" label="Bandwidth" help="bandwidth (standard deviation or half width at half maximum) of gaussian smoothing kernel to apply to the peak density chromatogram" /> |
57 <param name="minfrac" type="float" value="0.5" label="Minimum fraction of samples necessary" help="[minfrac] in at least one of the sample groups for it to be a valid group" /> | 54 <param argument="minFraction" type="float" value="0.5" label="Minimum fraction of samples" help="in at least one sample group in which the peaks have to be present to be considered as a peak group (feature)" /> |
58 <param name="mzwid" type="float" value="0.25" label="Width of overlapping m/z slices" help="[mzwid] to use for creating peak density chromatograms and grouping peaks across samples " /> | 55 <param argument="minSamples" type="integer" value="1" label="Minimum number of samples" help="in at least one sample group in which the peaks have to be detected to be considered a peak group (feature)" /> |
59 <!-- | 56 <param argument="binSize" type="float" value="0.25" label="Width of overlapping m/z slices" help="to use for creating peak density chromatograms and grouping peaks across samples (previously mzdiff)" /> |
60 <param name="minsamp" type="hidden" value="1" label="minsamp" help="minimum number of samples necessary in at least one of the sample groups for it to be a valid group " /> | 57 |
61 --> | 58 <section name="PeakDensityAdv" title="Advanced Options" expanded="False"> |
62 <conditional name="density_options"> | 59 <param argument="maxFeatures" type="integer" value="50" label="Maximum number of groups to identify in a single m/z slice" /> |
63 <param name="option" type="select" label="Advanced options"> | 60 </section> |
64 <option value="show">show</option> | |
65 <option value="hide" selected="true">hide</option> | |
66 </param> | |
67 <when value="show"> | |
68 <param name="max" type="integer" value="50" label="Maximum number of groups to identify in a single m/z slice" help="[max]" /> | |
69 </when> | 61 </when> |
70 <when value="hide"> | 62 <when value="MzClust"> |
63 <param argument="ppm" type="integer" value="20" label="Relative mz error for clustering/grouping in ppm" /> | |
64 <param argument="absMz" type="float" value="0" label="Absolute mz error for clustering/grouping" /> | |
65 <param argument="minFraction" type="float" value="0.5" label="Minimum fraction of samples" help="in at least one sample group in which the peaks have to be present to be considered as a peak group (feature)" /> | |
66 <param argument="minSamples" type="integer" value="1" label="Minimum number of samples" help="in at least one sample group in which the peaks have to be detected to be considered a peak group (feature)" /> | |
67 </when> | |
68 <when value="NearestPeaks"> | |
69 <param argument="mzVsRtBalance" type="integer" value="10" label="Factor by which mz values are multiplied before calculating the (euclician) distance between two peaks" /> | |
70 <param argument="absMz" type="float" value="0.2" label="Maximum tolerated distance for mz values" /> | |
71 <param argument="absRt" type="integer" value="15" label="Maximum tolerated distance for RT values" /> | |
72 <param argument="kNN" type="integer" value="10" label="Number of nearest Neighbours to check" /> | |
71 </when> | 73 </when> |
72 </conditional> | 74 </conditional> |
73 | 75 |
74 </when> | |
75 <when value="mzClust"> | |
76 <param name="mzppm" type="integer" value="20 " label="Relative error used for clustering/grouping in ppm" help="[mzppm]" /> | |
77 <param name="mzabs" type="float" value="0" label="Absolute error used for clustering/grouping" help="[mzabs]" /> | |
78 <param name="minfrac" type="float" value="0" label="Minimum fraction of each class in one bin" help="[minfrac] minimum fraction of samples necessary in at least one of the sample groups for it to be a valid group" /> | |
79 <!-- | |
80 <param name="minsamp" type="hidden" value="1" label="minsamp" help="minimum number of samples necessary in at least one of the sample groups for it to be a valid group " /> | |
81 --> | |
82 </when> | |
83 <when value="nearest"> | |
84 <param name="mzVsRTbalance" type="integer" value="10 " label="Multiplicator for mz value before calculating the (euclidean) distance between two peaks." help="[mzVsRTbalance]" /> | |
85 <param name="mzCheck" type="float" value="0.2" label="Maximum tolerated distance for mz" help="[mzCheck]" /> | |
86 <param name="rtCheck" type="integer" value="15" label="Maximum tolerated distance for RT" help="[rtCheck]" /> | |
87 <param name="kNN" type="integer" value="10" label="Number of nearest Neighbours to check" help="[kNN]" /> | |
88 </when> | |
89 </conditional> | |
90 <!-- | |
91 <param name="sleepy" type="float" value="0.001" label="sleep" help="seconds to pause between plotting successive steps of the peak grouping algorithm. peaks are plotted as points showing relative intensity. identified groups are flanked by dotted vertical lines"> | |
92 <validator type="in_range" message="Must be more than 0" min="0.001" max="inf"/> | |
93 </param> | |
94 --> | |
95 | |
96 <expand macro="input_peaklist"/> | 76 <expand macro="input_peaklist"/> |
77 | |
78 <expand macro="input_file_load"/> | |
97 </inputs> | 79 </inputs> |
98 | 80 |
99 <outputs> | 81 <outputs> |
100 <data name="xsetRData" format="rdata.xcms.group" label="${image.name[:-6]}.group.RData"/> | 82 <data name="xsetRData" format="rdata.xcms.group" label="${image.name[:-6]}.groupChromPeaks.RData" from_work_dir="group.RData"/> |
101 <data name="rplotsPdf" format="pdf" label="${image.name[:-6]}.group.Rplots.pdf"/> | 83 <data name="plotChromPeakDensity" format="pdf" label="${image.name[:-6]}.groupChromPeaks.plotChromPeakDensity.pdf" from_work_dir="plotChromPeakDensity.pdf"/> |
102 <expand macro="output_peaklist" function="group"/> | 84 <expand macro="output_peaklist" function="group"/> |
103 <data name="log" format="txt" label="xset.log.txt" hidden="true" /> | |
104 </outputs> | 85 </outputs> |
105 | 86 |
106 <tests> | 87 <tests> |
107 <!--<test> | 88 <!-- from xcmsSet |
108 <param name="image" value="xset.RData"/> | 89 <test> |
109 <param name="methods|method" value="density"/> | 90 <param name="image" value="faahKO-single-class.xset.merged.RData" ftype="rdata"/> |
110 <param name="methods|bw" value="5"/> | 91 <conditional name="methods"> |
111 <param name="methods|minfrac" value="0.3"/> | 92 <param name="method" value="PeakDensity"/> |
112 <param name="methods|mzwid" value="0.01"/> | 93 <param name="bw" value="5"/> |
113 <param name="methods|density_options|option" value="show"/> | 94 <param name="minFraction" value="0.3"/> |
114 <param name="methods|density_options|max" value="50"/> | 95 <param name="binSize" value="0.01"/> |
115 <output name="log"> | 96 <section name="PeakDensityAdv"> |
116 <assert_contents> | 97 <param name="maxFeatures" value="50"/> |
117 <has_text text="object with 4 samples" /> | 98 </section> |
118 <has_text text="Time range: 0.7-1139.7 seconds (0-19 minutes)" /> | 99 </conditional> |
119 <has_text text="Mass range: 50.0021-999.9863 m/z" /> | 100 <conditional name="peaklist"> |
120 <has_text text="Peaks: 59359 (about 14840 per sample)" /> | 101 <param name="peaklistBool" value="true" /> |
121 <has_text text="Peak Groups: 48998" /> | 102 <param name="convertRTMinute" value="false" /> |
122 <has_text text="Sample classes: bio, blank" /> | 103 <param name="numDigitsMZ" value="4" /> |
123 </assert_contents> | 104 <param name="numDigitsRT" value="1" /> |
124 </output> | 105 <param name="naTOzero" value="false" /> |
106 </conditional> | |
107 <expand macro="test_file_load_single"/> | |
108 <assert_stdout> | |
109 <has_text text="bw: 5" /> | |
110 <has_text text="minFraction: 0.3" /> | |
111 <has_text text="maxFeatures: 50" /> | |
112 <has_text text="object with 4 samples" /> | |
113 <has_text text="Time range: 2506.1-4477.9 seconds (41.8-74.6 minutes)" /> | |
114 <has_text text="Mass range: 200.1-600 m/z" /> | |
115 <has_text text="Peaks: 9251 (about 2313 per sample)" /> | |
116 <has_text text="Peak Groups: 8372" /> | |
117 <has_text text="Sample classes: KO, WT" /> | |
118 </assert_stdout> | |
119 <output name="variableMetadata" file="faahKO.xset.group.variableMetadata.tsv" /> | |
120 <output name="dataMatrix" file="faahKO.xset.group.dataMatrix.tsv" /> | |
125 </test>--> | 121 </test>--> |
126 <test> | 122 <!-- DISABLE FOR TRAVIS |
127 <param name="image" value="faahKO.xset.RData"/> | 123 <test> |
128 <param name="methods|method" value="density"/> | 124 <param name="image" value="faahKO-single.xset.merged.RData" ftype="rdata"/> |
129 <param name="methods|bw" value="5"/> | 125 <conditional name="methods"> |
130 <param name="methods|minfrac" value="0.3"/> | 126 <param name="method" value="PeakDensity"/> |
131 <param name="methods|mzwid" value="0.01"/> | 127 <param name="bw" value="5"/> |
132 <param name="methods|density_options|option" value="show"/> | 128 <param name="minFraction" value="0.3"/> |
133 <param name="methods|density_options|max" value="50"/> | 129 <param name="binSize" value="0.01"/> |
130 <conditional name="density_options"> | |
131 <param name="option" value="show"/> | |
132 <param name="maxFeatures" value="50"/> | |
133 </conditional> | |
134 </conditional> | |
135 <expand macro="test_file_load_single"/> | |
136 <assert_stdout> | |
137 <has_text text="object with 4 samples" /> | |
138 <has_text text="Time range: 2506.1-4477.9 seconds (41.8-74.6 minutes)" /> | |
139 <has_text text="Mass range: 200.1-600 m/z" /> | |
140 <has_text text="Peaks: 9251 (about 2313 per sample)" /> | |
141 <has_text text="Peak Groups: 611" /> | |
142 <has_text text="Sample classes: ." /> | |
143 </assert_stdout> | |
144 </test> | |
145 --> | |
146 <!-- DISABLE FOR TRAVIS Zip from xcmsSet | |
147 <test> | |
148 <param name="image" value="faahKO.xset.RData" ftype="rdata"/> | |
149 <conditional name="methods"> | |
150 <param name="method" value="PeakDensity"/> | |
151 <param name="bw" value="5"/> | |
152 <param name="minFraction" value="0.3"/> | |
153 <param name="binSize" value="0.01"/> | |
154 <conditional name="density_options"> | |
155 <param name="option" value="show"/> | |
156 <param name="maxFeatures" value="50"/> | |
157 </conditional> | |
158 </conditional> | |
134 <conditional name="peaklist"> | 159 <conditional name="peaklist"> |
135 <param name="convertRTMinute" value="false" /> | 160 <param name="convertRTMinute" value="false" /> |
136 <param name="peaklistBool" value="true" /> | 161 <param name="peaklistBool" value="true" /> |
137 <param name="numDigitsMZ" value="4" /> | 162 <param name="numDigitsMZ" value="4" /> |
138 <param name="numDigitsRT" value="1" /> | 163 <param name="numDigitsRT" value="1" /> |
139 </conditional> | 164 <param name="naTOzero" value="false" /> |
140 <output name="log"> | 165 </conditional> |
141 <assert_contents> | 166 <expand macro="test_file_load_zip"/> |
142 <has_text text="object with 4 samples" /> | 167 <assert_stdout> |
143 <has_text text="Time range: 2506.1-4477.9 seconds (41.8-74.6 minutes)" /> | 168 <has_text text="object with 4 samples" /> |
144 <has_text text="Mass range: 200.1-600 m/z" /> | 169 <has_text text="Time range: 2506.1-4477.9 seconds (41.8-74.6 minutes)" /> |
145 <has_text text="Peaks: 9251 (about 2313 per sample)" /> | 170 <has_text text="Mass range: 200.1-600 m/z" /> |
146 <has_text text="Peak Groups: 8275" /> | 171 <has_text text="Peaks: 9251 (about 2313 per sample)" /> |
147 <has_text text="Sample classes: KO, WT" /> | 172 <has_text text="Peak Groups: 8372" /> |
148 </assert_contents> | 173 <has_text text="Sample classes: KO, WT" /> |
149 </output> | 174 </assert_stdout> |
150 <output name="variableMetadata" file="faahKO.xset.group.variableMetadata.tsv" /> | 175 <output name="variableMetadata" file="faahKO.xset.group.variableMetadata.tsv" /> |
151 <output name="dataMatrix" file="faahKO.xset.group.dataMatrix.tsv" /> | 176 <output name="dataMatrix" file="faahKO.xset.group.dataMatrix.tsv" /> |
152 </test> | 177 </test> |
153 <test> | 178 --> |
154 <param name="image" value="faahKO-single-class.xset.merged.RData"/> | 179 |
155 <param name="methods|method" value="density"/> | 180 <!-- DISABLE FOR TRAVIS Zip from retcor |
156 <param name="methods|bw" value="5"/> | 181 <test> |
157 <param name="methods|minfrac" value="0.3"/> | 182 <param name="image" value="faahKO.xset.group.retcor.RData" ftype="rdata"/> |
158 <param name="methods|mzwid" value="0.01"/> | 183 <conditional name="methods"> |
159 <param name="methods|density_options|option" value="show"/> | 184 <param name="method" value="PeakDensity"/> |
160 <param name="methods|density_options|max" value="50"/> | 185 <param name="bw" value="5"/> |
161 <conditional name="peaklist"> | 186 <param name="minFraction" value="0.3"/> |
162 <param name="convertRTMinute" value="false" /> | 187 <param name="binSize" value="0.01"/> |
163 <param name="peaklistBool" value="true" /> | 188 <conditional name="density_options"> |
164 <param name="numDigitsMZ" value="4" /> | 189 <param name="option" value="show"/> |
165 <param name="numDigitsRT" value="1" /> | 190 <param name="maxFeatures" value="50"/> |
166 </conditional> | 191 </conditional> |
167 <output name="log"> | 192 </conditional> |
168 <assert_contents> | 193 <expand macro="test_file_load_zip"/> |
169 <has_text text="object with 4 samples" /> | 194 <assert_stdout> |
170 <has_text text="Time range: 2506.1-4477.9 seconds (41.8-74.6 minutes)" /> | 195 <has_text text="object with 4 samples" /> |
171 <has_text text="Mass range: 200.1-600 m/z" /> | 196 <has_text text="Time range: 2509.2-4480.3 seconds (41.8-74.7 minutes)" /> |
172 <has_text text="Peaks: 9251 (about 2313 per sample)" /> | 197 <has_text text="Mass range: 200.1-600 m/z" /> |
173 <has_text text="Peak Groups: 8275" /> | 198 <has_text text="Peaks: 9251 (about 2313 per sample)" /> |
174 <has_text text="Sample classes: KO, WT" /> | 199 <has_text text="Peak Groups: 8209" /> |
175 </assert_contents> | 200 <has_text text="Sample classes: KO, WT" /> |
176 </output> | 201 </assert_stdout> |
177 <output name="variableMetadata" file="faahKO.xset.group.variableMetadata.tsv" /> | 202 </test> |
178 <output name="dataMatrix" file="faahKO.xset.group.dataMatrix.tsv" /> | 203 --> |
179 </test> | 204 <!-- from retcor --> |
180 <test> | 205 <test> |
181 <param name="image" value="faahKO-single.xset.merged.RData"/> | 206 <param name="image" value="faahKO-single.xset.merged.group.retcor.RData" ftype="rdata"/> |
182 <param name="methods|method" value="density"/> | 207 <conditional name="methods"> |
183 <param name="methods|bw" value="5"/> | 208 <param name="method" value="PeakDensity"/> |
184 <param name="methods|minfrac" value="0.3"/> | 209 <param name="bw" value="5"/> |
185 <param name="methods|mzwid" value="0.01"/> | 210 <param name="minFraction" value="0.3"/> |
186 <param name="methods|density_options|option" value="show"/> | 211 <param name="binSize" value="0.01"/> |
187 <param name="methods|density_options|max" value="50"/> | 212 <section name="PeakDensityAdv"> |
188 <output name="log"> | 213 <param name="maxFeatures" value="50"/> |
189 <assert_contents> | 214 </section> |
190 <has_text text="object with 4 samples" /> | 215 </conditional> |
191 <has_text text="Time range: 2506.1-4477.9 seconds (41.8-74.6 minutes)" /> | 216 <expand macro="test_file_load_single"/> |
192 <has_text text="Mass range: 200.1-600 m/z" /> | 217 <assert_stdout> |
193 <has_text text="Peaks: 9251 (about 2313 per sample)" /> | 218 <has_text text="bw: 5" /> |
194 <has_text text="Peak Groups: 664" /> | 219 <has_text text="minFraction: 0.3" /> |
195 <has_text text="Sample classes: ." /> | 220 <has_text text="binSize: 0.01"/> |
196 </assert_contents> | 221 <has_text text="maxFeatures: 50" /> |
197 </output> | 222 <has_text text="object with 4 samples" /> |
198 </test> | 223 <has_text text="Time range: 2509.2-4480.3 seconds (41.8-74.7 minutes)" /> |
199 <test> | 224 <has_text text="Mass range: 200.1-600 m/z" /> |
200 <param name="image" value="MM-single.xset.merged.RData"/> | 225 <has_text text="Peaks: 9251 (about 2313 per sample)" /> |
201 <param name="methods|method" value="density"/> | 226 <has_text text="Peak Groups: 8209" /> |
202 <param name="methods|bw" value="5"/> | 227 <has_text text="Sample classes: KO, WT" /> |
203 <param name="methods|minfrac" value="0.3"/> | 228 </assert_stdout> |
204 <param name="methods|mzwid" value="0.01"/> | 229 </test> |
205 <param name="methods|density_options|option" value="show"/> | 230 <!-- DISABLE FOR TRAVIS |
206 <param name="methods|density_options|max" value="50"/> | 231 Test to test the different methods parameters |
207 <output name="log"> | 232 <test expect_failure="True"> |
208 <assert_contents> | 233 <param name="image" value="faahKO-single.xset.merged.group.retcor.RData" ftype="rdata"/> |
209 <has_text text="object with 2 samples" /> | 234 <conditional name="methods"> |
210 <has_text text="Time range: 19.7-307.3 seconds (0.3-5.1 minutes)" /> | 235 <param name="method" value="MzClust"/> |
211 <has_text text="Mass range: 117.0357-936.7059 m/z" /> | 236 <param name="ppm" value="21"/> |
212 <has_text text="Peaks: 236 (about 118 per sample)" /> | 237 <param name="absMz" value="0.1"/> |
213 <has_text text="Peak Groups: 236" /> | 238 </conditional> |
214 <has_text text="Sample classes: ." /> | 239 <expand macro="test_file_load_single"/> |
215 </assert_contents> | 240 <assert_stdout> |
216 </output> | 241 <has_text text="ppm: 21" /> |
217 </test> | 242 <has_text text="absMz: 0.1" /> |
218 <!--<test> | 243 </assert_stdout> |
219 <param name="image" value="xset.group.retcor.RData"/> | 244 </test> |
220 <param name="methods|method" value="density"/> | 245 <test> |
221 <param name="methods|bw" value="5"/> | 246 <param name="image" value="faahKO-single.xset.merged.group.retcor.RData" ftype="rdata"/> |
222 <param name="methods|minfrac" value="0.3"/> | 247 <conditional name="methods"> |
223 <param name="methods|mzwid" value="0.01"/> | 248 <param name="method" value="NearestPeaks"/> |
224 <param name="methods|density_options|option" value="show"/> | 249 <param name="mzVsRtBalance" value="11"/> |
225 <param name="methods|density_options|max" value="50"/> | 250 <param name="absMz" value="0.1"/> |
226 <output name="log"> | 251 </conditional> |
227 <assert_contents> | 252 <expand macro="test_file_load_single"/> |
228 <has_text text="object with 4 samples" /> | 253 <assert_stdout> |
229 <has_text text="Time range: 0.2-1140.1 seconds (0-19 minutes)" /> | 254 <has_text text="mzVsRtBalance: 11" /> |
230 <has_text text="Mass range: 50.0021-999.9863 m/z" /> | 255 <has_text text="absMz: 0.1" /> |
231 <has_text text="Peaks: 59359 (about 14840 per sample)" /> | 256 </assert_stdout> |
232 <has_text text="Peak Groups: 48958" /> | 257 </test> |
233 <has_text text="Sample classes: bio, blank" /> | 258 --> |
234 </assert_contents> | |
235 </output> | |
236 </test>--> | |
237 <test> | |
238 <param name="image" value="faahKO.xset.group.retcor.RData"/> | |
239 <param name="methods|method" value="density"/> | |
240 <param name="methods|bw" value="5"/> | |
241 <param name="methods|minfrac" value="0.3"/> | |
242 <param name="methods|mzwid" value="0.01"/> | |
243 <param name="methods|density_options|option" value="show"/> | |
244 <param name="methods|density_options|max" value="50"/> | |
245 <output name="log"> | |
246 <assert_contents> | |
247 <has_text text="object with 4 samples" /> | |
248 <has_text text="Time range: 2507.7-4481.7 seconds (41.8-74.7 minutes)" /> | |
249 <has_text text="Mass range: 200.1-600 m/z" /> | |
250 <has_text text="Peaks: 9251 (about 2313 per sample)" /> | |
251 <has_text text="Peak Groups: 8157" /> | |
252 <has_text text="Sample classes: KO, WT" /> | |
253 </assert_contents> | |
254 </output> | |
255 </test> | |
256 <test> | |
257 <param name="image" value="faahKO-single.xset.merged.group.retcor.RData"/> | |
258 <param name="methods|method" value="density"/> | |
259 <param name="methods|bw" value="5"/> | |
260 <param name="methods|minfrac" value="0.3"/> | |
261 <param name="methods|mzwid" value="0.01"/> | |
262 <param name="methods|density_options|option" value="show"/> | |
263 <param name="methods|density_options|max" value="50"/> | |
264 <output name="log"> | |
265 <assert_contents> | |
266 <has_text text="object with 4 samples" /> | |
267 <has_text text="Time range: 2507.7-4481.7 seconds (41.8-74.7 minutes)" /> | |
268 <has_text text="Mass range: 200.1-600 m/z" /> | |
269 <has_text text="Peaks: 9251 (about 2313 per sample)" /> | |
270 <has_text text="Peak Groups: 8157" /> | |
271 <has_text text="Sample classes: KO, WT" /> | |
272 </assert_contents> | |
273 </output> | |
274 </test> | |
275 </tests> | 259 </tests> |
276 | 260 |
277 <help><![CDATA[ | 261 <help><![CDATA[ |
278 | 262 |
279 @HELP_AUTHORS@ | 263 @HELP_AUTHORS@ |
280 | 264 |
281 ========== | 265 ==================== |
282 Xcms.Group | 266 xcms groupChromPeaks |
283 ========== | 267 ==================== |
284 | 268 |
285 ----------- | 269 ----------- |
286 Description | 270 Description |
287 ----------- | 271 ----------- |
288 | 272 |
289 After peak identification with xcmsSet, this tool groups the peaks which represent the same analyte across samples using overlapping m/z bins and calculation of smoothed peak distributions in chromatographic time. Allows rejection of features, which are only partially detected within the replicates of a sample class. | 273 After peak identification with xcmsSet, this tool groups the peaks which represent the same analyte across samples using overlapping m/z bins and calculation of smoothed peak distributions in chromatographic time. Allows rejection of features, which are only partially detected within the replicates of a sample class. |
290 | 274 |
291 | |
292 | |
293 ----------------- | 275 ----------------- |
294 Workflow position | 276 Workflow position |
295 ----------------- | 277 ----------------- |
296 | 278 |
297 **Upstream tools** | 279 **Upstream tools** |
298 | 280 |
299 ========================= ================= =================== ========== | 281 ==================================== ======================== ============================== |
300 Name output file format parameter | 282 Name Output file Format |
301 ========================= ================= =================== ========== | 283 ==================================== ======================== ============================== |
302 xcms.xcmsSet xset.RData rdata.xcms.raw RData file | 284 xcms.findChromPeaks Merger (single) xset.merged.RData rdata.xcms.findchrompeaks |
303 ------------------------- ----------------- ------------------- ---------- | 285 ------------------------------------ ------------------------ ------------------------------ |
304 xcms.xcmsSet Merger xset.RData rdata.xcms.raw RData file | 286 xcms.findChromPeaks (zip) ``*``.raw.xset.RData rdata.xcms.findchrompeaks |
305 ------------------------- ----------------- ------------------- ---------- | 287 ------------------------------------ ------------------------ ------------------------------ |
306 xcms.retcor xset.RData rdata.xcms.retcor RData file | 288 xcms.adjustRtime ``*``.adjustRtime.RData rdata.xcms.retcor |
307 ========================= ================= =================== ========== | 289 ==================================== ======================== ============================== |
308 | 290 |
309 | 291 |
310 **Downstream tools** | 292 **Downstream tools** |
311 | 293 |
312 +---------------------------+--------------------------------------+ | 294 =========================== =========================== ==================== |
313 | Name | Output file | Format | | 295 Name Output file Format |
314 +===========================+=================+====================+ | 296 =========================== =========================== ==================== |
315 |xcms.retcor | xset.RData | rdata.xcms.group | | 297 xcms.adjustRtime ``*``.groupChromPeaks.RData rdata.xcms.group |
316 +---------------------------+--------------------------------------+ | 298 --------------------------- --------------------------- -------------------- |
317 |xcms.fillPeaks | xset.RData | rdata.xcms.group | | 299 xcms.fillChromPeaks ``*``.groupChromPeaks.RData rdata.xcms.group |
318 +---------------------------+--------------------------------------+ | 300 =========================== =========================== ==================== |
319 | |
320 The output file is an xcmsSet.RData file. You can continue your analysis using it in **xcms.retcor** tool as an next step and then **xcms.fillPeaks**. | |
321 | 301 |
322 **General schema of the metabolomic workflow** | 302 **General schema of the metabolomic workflow** |
323 | 303 |
324 .. image:: xcms_group_workflow.png | 304 .. image:: xcms_group_workflow.png |
325 | 305 |
326 | 306 --------------------------------------------------- |
327 ----------- | |
328 Input files | |
329 ----------- | |
330 | |
331 +---------------------------+-----------------------+ | |
332 | Parameter : num + label | Format | | |
333 +===========================+=======================+ | |
334 | Or : RData file | rdata.xcms.raw | | |
335 +---------------------------+-----------------------+ | |
336 | Or : RData file | rdata.xcms.retcor | | |
337 +---------------------------+-----------------------+ | |
338 | |
339 | 307 |
340 ---------- | 308 ---------- |
341 Parameters | 309 Parameters |
342 ---------- | 310 ---------- |
343 | 311 |
344 Method to use for grouping | 312 Method to use for grouping |
345 -------------------------- | 313 -------------------------- |
346 | 314 |
347 **mzClust** | 315 **MzClust** |
348 | 316 |
349 | Runs high resolution alignment on single spectra samples stored in the RData file generated by the **xcmsSet tool**. | 317 | This method performs high resolution correspondence for single spectra samples. |
350 | 318 | See the MzClust_manual_ |
351 **density** | 319 |
352 | 320 **PeakDensity** |
353 | Groups peaks together across samples using overlapping m/z bins and calculation of smoothed peak distributions in chromatographic time. | 321 |
354 | 322 | This method performs performs correspondence (chromatographic peak grouping) based on the density (distribution) of identified peaks along the retention time axis within slices of overlapping mz ranges. All peaks (from the same or from different samples) being close on the retention time axis are grouped into a feature (peak group). |
355 **nearest** | 323 | See the PeakDensity_manual_ |
356 | 324 |
357 | Groups peaks together across samples by creating a master peak list and assigning corresponding peaks from all samples. It is inspired by the alignment algorithm of mzMine. | 325 **NearestPeaks** |
358 | 326 |
327 | This method is inspired by the grouping algorithm of mzMine [Katajamaa 2006] and performs correspondence based on proximity of peaks in the space spanned by retention time and mz values. The method creates first a master peak list consisting of all chromatographic peaks from the sample in which most peaks were identified, and starting from that, calculates distances to peaks from the sample with the next most number of peaks. If peaks are closer than the defined threshold they are grouped together. | |
328 | See the NearestPeaks_manual_ | |
329 | |
330 .. _MzClust_manual: https://rdrr.io/bioc/xcms/man/groupChromPeaks-mzClust.html#heading-2 | |
331 .. _PeakDensity_manual: https://rdrr.io/bioc/xcms/man/groupChromPeaks-density.html#heading-2 | |
332 .. _NearestPeaks_manual: https://rdrr.io/bioc/xcms/man/groupChromPeaks-nearest.html#heading-2 | |
333 | |
334 @HELP_XCMS_MANUAL@ | |
335 | |
336 @HELP_PEAKLIST@ | |
359 | 337 |
360 ------------ | 338 ------------ |
361 Output files | 339 Output files |
362 ------------ | 340 ------------ |
363 | 341 |
364 xset.group.Rplots.pdf | 342 xset.groupChromPeaks.RData: rdata.xcms.group format |
365 | 343 |
366 xset.group.RData: rdata.xcms.group format | 344 | RData file that will be necessary in the third and fourth step of the workflow (xcms.adjustRtime and xcms.fillChromPeaks). |
367 | 345 |
368 | Rdata file that will be necessary in the third and fourth step of the workflow (xcms.retcor and xcms.fillpeaks). | 346 xset.groupChromPeaks.plotChromPeakDensity.pdf |
369 | 347 |
370 | 348 | Density plot |
371 ------ | 349 |
372 | 350 @HELP_PEAKLIST_OUTPUT@ |
373 .. class:: infomark | |
374 | |
375 The output file is an xset.group.RData file. You can continue your analysis using it in **xcms.retcor** tool. | |
376 | |
377 | |
378 --------------------------------------------------- | |
379 | |
380 | |
381 --------------- | |
382 Working example | |
383 --------------- | |
384 | |
385 Input files | |
386 ----------- | |
387 | |
388 | RData file -> **xset.RData** | |
389 | |
390 Parameters | |
391 ---------- | |
392 | |
393 | Method -> **density** | |
394 | bw -> **5** | |
395 | minfrac -> **0.3** | |
396 | mzwid -> **0.01** | |
397 | Advanced options: **show** | |
398 | max -> **50** | |
399 | |
400 | |
401 Output files | |
402 ------------ | |
403 | |
404 | **1) xset.RData: RData file** | |
405 | |
406 | **2) Example of an xset.group.Rplots pdf file** | |
407 | |
408 .. image:: xcms_group.png | |
409 :width: 700 | |
410 | 351 |
411 | 352 |
412 --------------------------------------------------- | 353 --------------------------------------------------- |
413 | 354 |
414 Changelog/News | 355 Changelog/News |
415 -------------- | 356 -------------- |
416 | 357 |
358 **Version 3.0.0.0 - 08/03/2018** | |
359 | |
360 - UPGRADE: upgrade the xcms version from 1.46.0 to 3.0.0. So refactoring of a lot of underlying codes and methods. Some parameters may have been renamed. | |
361 | |
362 - NEW: a bunch of new options: PeakDensity.minSamples), MzClust.minSamples) | |
363 | |
364 - NEW: a new density plot | |
365 | |
366 - IMPROVEMENT: the advanced options are now in sections. It will allow you to access to all the parameters and to know their default values. | |
367 | |
368 | |
417 **Version 2.1.1 - 29/11/2017** | 369 **Version 2.1.1 - 29/11/2017** |
418 | 370 |
419 - BUGFIX: To avoid issues with accented letter in the parentFile tag of the mzXML files, we changed a hidden mechanim to LC_ALL=C | 371 - BUGFIX: To avoid issues with accented letter in the parentFile tag of the mzXML files, we changed a hidden mechanim to LC_ALL=C |
420 | 372 |
373 | |
421 **Version 2.1.0 - 07/02/2017** | 374 **Version 2.1.0 - 07/02/2017** |
422 | 375 |
423 - IMPROVEMENT: Add an option to export the peak list at this step without have to wait camara.annotate | 376 - IMPROVEMENT: Add an option to export the peak list at this step without have to wait camara.annotate |
424 | 377 |
425 - IMPROVEMENT: xcms.group can deal with merged individual data from "xcms.xcmsSet Merger" | 378 - IMPROVEMENT: xcms.group can deal with merged individual data from "xcms.xcmsSet Merger" |
426 | 379 |
427 - BUGFIX: the default value of "density" -> "Maximum number of groups to identify in a single m/z slice" which was of 5 have been changed to fix with the XMCS default values to 50 | 380 - BUGFIX: the default value of "density" -> "Maximum number of groups to identify in a single m/z slice" which was of 5 have been changed to fix with the XMCS default values to 50 |
428 | 381 |
382 | |
429 **Version 2.0.6 - 06/07/2016** | 383 **Version 2.0.6 - 06/07/2016** |
430 | 384 |
431 - UPGRADE: upgrate the xcms version from 1.44.0 to 1.46.0 | 385 - UPGRADE: upgrate the xcms version from 1.44.0 to 1.46.0 |
432 | 386 |
387 | |
433 **Version 2.0.5 - 04/04/2016** | 388 **Version 2.0.5 - 04/04/2016** |
434 | 389 |
435 - TEST: refactoring to pass planemo test using conda dependencies | 390 - TEST: refactoring to pass planemo test using conda dependencies |
436 | 391 |
437 | 392 |