Mercurial > repos > eschen42 > w4mclassfilter
comparison w4mclassfilter.xml @ 12:38f509903a0b draft
"planemo upload for repository https://github.com/HegemanLab/w4mclassfilter_galaxy_wrapper/tree/master commit b9712e554d16ed26f6c6d0c2e8cd74552b49f694"
author | eschen42 |
---|---|
date | Tue, 01 Oct 2019 16:57:58 -0400 |
parents | 9f5c0e23c205 |
children | c18040b6e8b9 |
comparison
equal
deleted
inserted
replaced
11:9f5c0e23c205 | 12:38f509903a0b |
---|---|
1 <tool id="w4mclassfilter" name="W4m Data Subset" version="0.98.11"> | 1 <tool id="w4mclassfilter" name="W4m Data Subset" version="0.98.13"> |
2 <description>Filter W4m data by values or metadata</description> | 2 <description>Filter W4m data by values or metadata</description> |
3 <!-- Here is the hyphenation standard that I *try* to apply consistently in my documentation: http://www.sandranoonan.com/dont-let-hyphenation-drive-crazy/ --> | 3 <!-- Here is the hyphenation standard that I *try* to apply consistently in my documentation: http://www.sandranoonan.com/dont-let-hyphenation-drive-crazy/ --> |
4 <requirements> | 4 <requirements> |
5 <!-- <requirement type="package" version="6.2">readline</requirement> --> | 5 <requirement type="package" version="3.6.1">r-base</requirement> |
6 <requirement type="package" version="3.4.1">r-base</requirement> | 6 <requirement type="package" version="1.1_5">r-batch</requirement> |
7 <requirement type="package" version="1.1_4">r-batch</requirement> | 7 <requirement type="package" version="0.98.13">w4mclassfilter</requirement> |
8 <requirement type="package" version="0.98.8">w4mclassfilter</requirement> | |
9 </requirements> | 8 </requirements> |
10 <command detect_errors="aggressive"><![CDATA[ | 9 <command detect_errors="aggressive"><![CDATA[ |
10 unset R_HOME; | |
11 Rscript $__tool_directory__/w4mclassfilter_wrapper.R | 11 Rscript $__tool_directory__/w4mclassfilter_wrapper.R |
12 dataMatrix_in '$dataMatrix_in' | 12 dataMatrix_in '$dataMatrix_in' |
13 sampleMetadata_in '$sampleMetadata_in' | 13 sampleMetadata_in '$sampleMetadata_in' |
14 variableMetadata_in '$variableMetadata_in' | 14 variableMetadata_in '$variableMetadata_in' |
15 sampleclassNames '$sampleclassNames' | 15 sampleclassNames '$sampleclassNames' |
16 inclusive '$inclusive' | 16 inclusive '$inclusive' |
17 wildcards '$wildcards' | 17 wildcards '$wildcards' |
18 classnameColumn '$classnameColumn' | 18 classnameColumn '$classnameColumn' |
19 samplenameColumn 'sampleMetadata' | 19 samplenameColumn 'sampleMetadata' |
20 variable_range_filter '$variableRangeFilter' | 20 variable_range_filter '$variableRangeFilter' |
21 transformation '$transformation' | 21 transformation '$transformation' |
22 dataMatrix_out '$dataMatrix_out' | 22 imputation '$imputation' |
23 sampleMetadata_out '$sampleMetadata_out' | 23 dataMatrix_out '$dataMatrix_out' |
24 variableMetadata_out '$variableMetadata_out' | 24 sampleMetadata_out '$sampleMetadata_out' |
25 variableMetadata_out '$variableMetadata_out' | |
25 ]]></command> | 26 ]]></command> |
26 <inputs> | 27 <inputs> |
27 <param name="dataMatrix_in" format="tabular" label="Data matrix file" type="data" | 28 <param name="dataMatrix_in" format="tabular" label="Data matrix file" type="data" |
28 help="variables ✖ samples" /> | 29 help="variables ✖ samples" /> |
29 <param name="sampleMetadata_in" format="tabular" label="Sample metadata file" type="data" | 30 <param name="sampleMetadata_in" format="tabular" label="Sample metadata file" type="data" |
93 help="'none' (the default) - do not transform data; 'log2' - log base 2 of data; 'log10' - log base 10 of data; in all cases, negative and missing values are imputed to zero"> | 94 help="'none' (the default) - do not transform data; 'log2' - log base 2 of data; 'log10' - log base 10 of data; in all cases, negative and missing values are imputed to zero"> |
94 <option value="none" selected="true">none</option> | 95 <option value="none" selected="true">none</option> |
95 <option value="log2">log2</option> | 96 <option value="log2">log2</option> |
96 <option value="log10">log10</option> | 97 <option value="log10">log10</option> |
97 </param> | 98 </param> |
99 <param name="imputation" label="Imputation of missing values" type="select" | |
100 help="'zero' (the default) - replace missing values with zero; 'center' - replace missing values with feature-median; 'none' - perform no imputation"> | |
101 <option value="zero" selected="true">zero</option> | |
102 <option value="center">center</option> | |
103 <option value="none">none</option> | |
104 </param> | |
98 </inputs> | 105 </inputs> |
99 <outputs> | 106 <outputs> |
100 <data name="dataMatrix_out" format="tabular" label="${dataMatrix_in.name}.subset" ></data> | 107 <data name="dataMatrix_out" format="tabular" label="${dataMatrix_in.name}.subset" ></data> |
101 <data name="sampleMetadata_out" format="tabular" label="${sampleMetadata_in.name}.subset" ></data> | 108 <data name="sampleMetadata_out" format="tabular" label="${sampleMetadata_in.name}.subset" ></data> |
102 <data name="variableMetadata_out" format="tabular" label="${variableMetadata_in.name}.subset" ></data> | 109 <data name="variableMetadata_out" format="tabular" label="${variableMetadata_in.name}.subset" ></data> |
108 <param name="sampleMetadata_in" value="input_sampleMetadata.tsv"/> | 115 <param name="sampleMetadata_in" value="input_sampleMetadata.tsv"/> |
109 <param name="variableMetadata_in" value="input_variableMetadata.tsv"/> | 116 <param name="variableMetadata_in" value="input_variableMetadata.tsv"/> |
110 <param name="classnameColumn" value="gender"/> | 117 <param name="classnameColumn" value="gender"/> |
111 <param name="sampleclassNames" value="M"/> | 118 <param name="sampleclassNames" value="M"/> |
112 <param name="wildcards" value="FALSE"/> | 119 <param name="wildcards" value="FALSE"/> |
113 <param name="inclusive" value="filter-in"/> | 120 <param name="inclusive" value="TRUE"/> |
114 <param name="variableRangeFilter" value="FEATMAX:6.30103:,mz:200:,rt::800"/> | 121 <param name="variableRangeFilter" value="FEATMAX:2e6:,mz:200:,rt::800"/> |
115 <param name="transformation" value="log10"/> | 122 <param name="transformation" value="none"/> |
116 <output name="dataMatrix_out"> | 123 <output name="dataMatrix_out"> |
117 <assert_contents> | 124 <assert_contents> |
118 <has_text text="5.87336711011293" /> | 125 <has_text text="747080" /> |
126 <not_has_text text="13420742" /> | |
127 <not_has_text text="47259" /> | |
119 </assert_contents> | 128 </assert_contents> |
120 </output> | 129 </output> |
121 <output name="sampleMetadata_out"> | 130 <output name="sampleMetadata_out"> |
122 <assert_contents> | 131 <assert_contents> |
132 <has_text text="HU_017" /> | |
133 <has_text text="HU_034" /> | |
134 <has_text text="HU_078" /> | |
135 <has_text text="HU_091" /> | |
136 <has_text text="HU_093" /> | |
137 <has_text text="HU_099" /> | |
138 <has_text text="HU_130" /> | |
139 <has_text text="HU_134" /> | |
140 <has_text text="HU_138" /> | |
123 <not_has_text text="HU_028" /> | 141 <not_has_text text="HU_028" /> |
124 <not_has_text text="HU_051" /> | 142 <not_has_text text="HU_051" /> |
125 <not_has_text text="HU_060" /> | 143 <not_has_text text="HU_060" /> |
126 <not_has_text text="HU_110" /> | 144 <not_has_text text="HU_110" /> |
127 <not_has_text text="HU_149" /> | 145 <not_has_text text="HU_149" /> |
129 <not_has_text text="HU_175" /> | 147 <not_has_text text="HU_175" /> |
130 <not_has_text text="HU_178" /> | 148 <not_has_text text="HU_178" /> |
131 <not_has_text text="HU_185" /> | 149 <not_has_text text="HU_185" /> |
132 <not_has_text text="HU_204" /> | 150 <not_has_text text="HU_204" /> |
133 <not_has_text text="HU_208" /> | 151 <not_has_text text="HU_208" /> |
134 <has_text text="HU_017" /> | |
135 <has_text text="HU_034" /> | |
136 <has_text text="HU_078" /> | |
137 <has_text text="HU_091" /> | |
138 <has_text text="HU_093" /> | |
139 <has_text text="HU_099" /> | |
140 <has_text text="HU_130" /> | |
141 <has_text text="HU_134" /> | |
142 <has_text text="HU_138" /> | |
143 </assert_contents> | 152 </assert_contents> |
144 </output> | 153 </output> |
145 <output name="variableMetadata_out"> | 154 <output name="variableMetadata_out"> |
146 <assert_contents> | 155 <assert_contents> |
156 <has_text text="HMDB00208" /> | |
157 <has_text text="HMDB01032" /> | |
158 <has_text text="HMDB01101.1" /> | |
159 <has_text text="HMDB13189" /> | |
147 <not_has_text text="HMDB00191" /> | 160 <not_has_text text="HMDB00191" /> |
148 <has_text text="HMDB00208" /> | |
149 <not_has_text text="HMDB00251" /> | 161 <not_has_text text="HMDB00251" /> |
150 <not_has_text text="HMDB00299" /> | 162 <not_has_text text="HMDB00299" /> |
151 <not_has_text text="HMDB00512" /> | 163 <not_has_text text="HMDB00512" /> |
152 <not_has_text text="HMDB00518" /> | 164 <not_has_text text="HMDB00518" /> |
153 <not_has_text text="HMDB00715" /> | 165 <not_has_text text="HMDB00715" /> |
154 <not_has_text text="HMDB00822" /> | 166 <not_has_text text="HMDB00822" /> |
155 <has_text text="HMDB01032" /> | |
156 <has_text text="HMDB01101.1" /> | |
157 <not_has_text text="HMDB03193" /> | 167 <not_has_text text="HMDB03193" /> |
158 <not_has_text text="HMDB04824" /> | 168 <not_has_text text="HMDB04824" /> |
159 <not_has_text text="HMDB10348" /> | 169 <not_has_text text="HMDB10348" /> |
160 <has_text text="HMDB13189" /> | |
161 <not_has_text text="HMDB59717" /> | 170 <not_has_text text="HMDB59717" /> |
162 </assert_contents> | 171 </assert_contents> |
163 </output> | 172 </output> |
164 </test> | 173 </test> |
165 <!-- test 2 --> | 174 <!-- test 2 --> |
166 <test> | 175 <test> |
167 <param name="dataMatrix_in" value="input_dataMatrix.tsv"/> | 176 <param name="dataMatrix_in" value="input_dataMatrix.tsv"/> |
168 <param name="sampleMetadata_in" value="input_sampleMetadata.tsv"/> | 177 <param name="sampleMetadata_in" value="input_sampleMetadata.tsv"/> |
169 <param name="variableMetadata_in" value="input_variableMetadata.tsv"/> | 178 <param name="variableMetadata_in" value="input_variableMetadata.tsv"/> |
170 <param name="classnameColumn" value="sampleMetadata"/> | |
171 <!-- test that hyphens in regular expressions work --> | 179 <!-- test that hyphens in regular expressions work --> |
172 <param name="sampleclassNames" value="HU_[0-9][0-9][0-9]"/> | 180 <param name="sampleclassNames" value="HU_[0-9][0-9][0-9]"/> |
181 <param name="inclusive" value="TRUE"/> | |
173 <param name="wildcards" value="FALSE"/> | 182 <param name="wildcards" value="FALSE"/> |
174 <param name="inclusive" value="filter-in"/> | 183 <param name="classnameColumn" value="sampleMetadata"/> |
175 <param name="variableRangeFilter" value="FEATMAX:20.93157:,mz:200:,rt::800"/> | 184 <!-- test that variableRangeFilter works with transformation --> |
176 <param name="transformation" value="log2"/> | 185 <param name="variableRangeFilter" value="FEATMAX:6.30103:,mz:200:,rt::800"/> |
177 <output name="dataMatrix_out"> | 186 <param name="transformation" value="log10"/> |
178 <assert_contents> | 187 <param name="imputation" value="zero"/> |
179 <has_text text="19.5109032146715" /> | 188 <output name="dataMatrix_out" md5="5644d2ea01d072ee1d0c40e29e9d0089"> |
189 <assert_contents> | |
190 <has_text text="5.8733671" /> | |
180 </assert_contents> | 191 </assert_contents> |
181 </output> | 192 </output> |
182 <output name="sampleMetadata_out"> | 193 <output name="sampleMetadata_out"> |
183 <assert_contents> | 194 <assert_contents> |
195 <has_text text="HU_017" /> | |
184 <has_text text="HU_028" /> | 196 <has_text text="HU_028" /> |
197 <has_text text="HU_034" /> | |
185 <has_text text="HU_051" /> | 198 <has_text text="HU_051" /> |
186 <has_text text="HU_060" /> | 199 <has_text text="HU_060" /> |
200 <has_text text="HU_078" /> | |
201 <has_text text="HU_091" /> | |
202 <has_text text="HU_093" /> | |
203 <has_text text="HU_099" /> | |
187 <has_text text="HU_110" /> | 204 <has_text text="HU_110" /> |
205 <has_text text="HU_130" /> | |
206 <has_text text="HU_134" /> | |
207 <has_text text="HU_138" /> | |
188 <has_text text="HU_149" /> | 208 <has_text text="HU_149" /> |
189 <has_text text="HU_152" /> | 209 <has_text text="HU_152" /> |
190 <has_text text="HU_175" /> | 210 <has_text text="HU_175" /> |
191 <has_text text="HU_178" /> | 211 <has_text text="HU_178" /> |
192 <has_text text="HU_185" /> | 212 <has_text text="HU_185" /> |
193 <not_has_text text="HU_204" /> | |
194 <has_text text="HU_208" /> | 213 <has_text text="HU_208" /> |
195 <has_text text="HU_017" /> | 214 <not_has_text text="HU_204" /> |
196 <has_text text="HU_034" /> | |
197 <has_text text="HU_078" /> | |
198 <has_text text="HU_091" /> | |
199 <has_text text="HU_093" /> | |
200 <has_text text="HU_099" /> | |
201 <has_text text="HU_130" /> | |
202 <has_text text="HU_134" /> | |
203 <has_text text="HU_138" /> | |
204 </assert_contents> | 215 </assert_contents> |
205 </output> | 216 </output> |
206 <output name="variableMetadata_out"> | 217 <output name="variableMetadata_out"> |
207 <assert_contents> | 218 <assert_contents> |
208 <has_text text="HMDB00191" /> | 219 <has_text text="HMDB00191" /> |
209 <has_text text="HMDB00208" /> | 220 <has_text text="HMDB00208" /> |
221 <has_text text="HMDB01032" /> | |
222 <has_text text="HMDB01101.1" /> | |
223 <has_text text="HMDB13189" /> | |
210 <not_has_text text="HMDB00251" /> | 224 <not_has_text text="HMDB00251" /> |
211 <not_has_text text="HMDB00299" /> | 225 <not_has_text text="HMDB00299" /> |
212 <not_has_text text="HMDB00512" /> | 226 <not_has_text text="HMDB00512" /> |
213 <not_has_text text="HMDB00518" /> | 227 <not_has_text text="HMDB00518" /> |
214 <not_has_text text="HMDB00715" /> | 228 <not_has_text text="HMDB00715" /> |
215 <not_has_text text="HMDB00822" /> | 229 <not_has_text text="HMDB00822" /> |
216 <has_text text="HMDB01032" /> | |
217 <has_text text="HMDB01101.1" /> | |
218 <not_has_text text="HMDB03193" /> | 230 <not_has_text text="HMDB03193" /> |
219 <not_has_text text="HMDB04824" /> | 231 <not_has_text text="HMDB04824" /> |
220 <not_has_text text="HMDB10348" /> | 232 <not_has_text text="HMDB10348" /> |
221 <has_text text="HMDB13189" /> | |
222 <not_has_text text="HMDB59717" /> | 233 <not_has_text text="HMDB59717" /> |
223 </assert_contents> | 234 </assert_contents> |
224 </output> | 235 </output> |
225 </test> | 236 </test> |
226 <!-- test 3 --> | 237 <!-- test 3 --> |
228 <param name="dataMatrix_in" value="input_dataMatrix.tsv"/> | 239 <param name="dataMatrix_in" value="input_dataMatrix.tsv"/> |
229 <param name="sampleMetadata_in" value="input_sampleMetadata.tsv"/> | 240 <param name="sampleMetadata_in" value="input_sampleMetadata.tsv"/> |
230 <param name="variableMetadata_in" value="input_variableMetadata.tsv"/> | 241 <param name="variableMetadata_in" value="input_variableMetadata.tsv"/> |
231 <param name="classnameColumn" value="gender"/> | 242 <param name="classnameColumn" value="gender"/> |
232 <param name="sampleclassNames" value="M"/> | 243 <param name="sampleclassNames" value="M"/> |
233 <param name="inclusive" value="filter-in"/> | 244 <param name="inclusive" value="TRUE"/> |
234 <param name="transformation" value="none"/> | 245 <param name="transformation" value="none"/> |
235 <output name="dataMatrix_out"> | 246 <output name="dataMatrix_out"> |
236 <assert_contents> | 247 <assert_contents> |
237 <not_has_text text="HU_028" /> | 248 <not_has_text text="HU_028" /> |
238 <not_has_text text="HU_051" /> | 249 <not_has_text text="HU_051" /> |
279 <param name="sampleMetadata_in" value="input_sampleMetadata.tsv"/> | 290 <param name="sampleMetadata_in" value="input_sampleMetadata.tsv"/> |
280 <param name="variableMetadata_in" value="input_variableMetadata.tsv"/> | 291 <param name="variableMetadata_in" value="input_variableMetadata.tsv"/> |
281 <param name="classnameColumn" value="gender"/> | 292 <param name="classnameColumn" value="gender"/> |
282 <param name="sampleclassNames" value="*"/> | 293 <param name="sampleclassNames" value="*"/> |
283 <param name="wildcards" value="TRUE"/> | 294 <param name="wildcards" value="TRUE"/> |
284 <param name="inclusive" value="filter-in"/> | 295 <param name="inclusive" value="TRUE"/> |
296 <param name="imputation" value="zero"/> | |
297 <output name="dataMatrix_out" md5="b2eac4946d3803a07606286b50451af4"> | |
298 <assert_contents> | |
299 <not_has_text text="NA" /> | |
300 </assert_contents> | |
301 </output> | |
285 <output name="sampleMetadata_out"> | 302 <output name="sampleMetadata_out"> |
286 <assert_contents> | 303 <assert_contents> |
287 <not_has_text text="HU_204" /> | 304 <not_has_text text="HU_204" /> |
288 <has_text text="HU_028" /> | 305 <has_text text="HU_028" /> |
289 <has_text text="HU_051" /> | 306 <has_text text="HU_051" /> |
313 <param name="sampleMetadata_in" value="input_sampleMetadata.tsv"/> | 330 <param name="sampleMetadata_in" value="input_sampleMetadata.tsv"/> |
314 <param name="variableMetadata_in" value="input_variableMetadata.tsv"/> | 331 <param name="variableMetadata_in" value="input_variableMetadata.tsv"/> |
315 <param name="classnameColumn" value="gender"/> | 332 <param name="classnameColumn" value="gender"/> |
316 <param name="sampleclassNames" value="M"/> | 333 <param name="sampleclassNames" value="M"/> |
317 <param name="wildcards" value="FALSE"/> | 334 <param name="wildcards" value="FALSE"/> |
318 <param name="inclusive" value="filter-in"/> | 335 <param name="inclusive" value="TRUE"/> |
319 <output name="sampleMetadata_out"> | 336 <output name="sampleMetadata_out"> |
320 <assert_contents> | 337 <assert_contents> |
321 <not_has_text text="HU_028" /> | 338 <not_has_text text="HU_028" /> |
322 <not_has_text text="HU_051" /> | 339 <not_has_text text="HU_051" /> |
323 <not_has_text text="HU_060" /> | 340 <not_has_text text="HU_060" /> |
347 <param name="sampleMetadata_in" value="input_sampleMetadata.tsv"/> | 364 <param name="sampleMetadata_in" value="input_sampleMetadata.tsv"/> |
348 <param name="variableMetadata_in" value="input_variableMetadata.tsv"/> | 365 <param name="variableMetadata_in" value="input_variableMetadata.tsv"/> |
349 <param name="classnameColumn" value="gender"/> | 366 <param name="classnameColumn" value="gender"/> |
350 <param name="sampleclassNames" value="M"/> | 367 <param name="sampleclassNames" value="M"/> |
351 <param name="wildcards" value="FALSE"/> | 368 <param name="wildcards" value="FALSE"/> |
352 <param name="inclusive" value="filter-in"/> | 369 <param name="inclusive" value="TRUE"/> |
353 <output name="variableMetadata_out"> | 370 <output name="variableMetadata_out"> |
354 <assert_contents> | 371 <assert_contents> |
355 <has_text text="HMDB03193" /> | 372 <has_text text="HMDB03193" /> |
356 <not_has_text text="HMDB00822" /> | 373 <not_has_text text="HMDB00822" /> |
357 <has_text text="HMDB01101" /> | 374 <has_text text="HMDB01101" /> |
377 <param name="sampleMetadata_in" value="input_sampleMetadata.tsv"/> | 394 <param name="sampleMetadata_in" value="input_sampleMetadata.tsv"/> |
378 <param name="variableMetadata_in" value="input_variableMetadata.tsv"/> | 395 <param name="variableMetadata_in" value="input_variableMetadata.tsv"/> |
379 <param name="classnameColumn" value="gender"/> | 396 <param name="classnameColumn" value="gender"/> |
380 <param name="sampleclassNames" value="M"/> | 397 <param name="sampleclassNames" value="M"/> |
381 <param name="wildcards" value="FALSE"/> | 398 <param name="wildcards" value="FALSE"/> |
382 <param name="inclusive" value="filter-in"/> | 399 <param name="inclusive" value="TRUE"/> |
383 <output name="variableMetadata_out"> | 400 <output name="variableMetadata_out"> |
384 <assert_contents> | 401 <assert_contents> |
385 <has_text text="HMDB03193" /> | 402 <has_text text="HMDB03193" /> |
386 <not_has_text text="HMDB00822" /> | 403 <not_has_text text="HMDB00822" /> |
387 <has_text text="HMDB01101" /> | 404 <has_text text="HMDB01101" /> |
407 <param name="sampleMetadata_in" value="input_sampleMetadata.tsv"/> | 424 <param name="sampleMetadata_in" value="input_sampleMetadata.tsv"/> |
408 <param name="variableMetadata_in" value="input_variableMetadata.tsv"/> | 425 <param name="variableMetadata_in" value="input_variableMetadata.tsv"/> |
409 <param name="classnameColumn" value="gender"/> | 426 <param name="classnameColumn" value="gender"/> |
410 <param name="sampleclassNames" value="[Mm],[fF]"/> | 427 <param name="sampleclassNames" value="[Mm],[fF]"/> |
411 <param name="wildcards" value="FALSE"/> | 428 <param name="wildcards" value="FALSE"/> |
412 <param name="inclusive" value="filter-in"/> | 429 <param name="inclusive" value="TRUE"/> |
413 <output name="sampleMetadata_out"> | 430 <output name="sampleMetadata_out"> |
414 <assert_contents> | 431 <assert_contents> |
415 <has_text text="HU_028" /> | 432 <has_text text="HU_028" /> |
416 <has_text text="HU_051" /> | 433 <has_text text="HU_051" /> |
417 <has_text text="HU_060" /> | 434 <has_text text="HU_060" /> |
441 <param name="sampleMetadata_in" value="input_sampleMetadata.tsv"/> | 458 <param name="sampleMetadata_in" value="input_sampleMetadata.tsv"/> |
442 <param name="variableMetadata_in" value="input_variableMetadata.tsv"/> | 459 <param name="variableMetadata_in" value="input_variableMetadata.tsv"/> |
443 <param name="classnameColumn" value=""/> | 460 <param name="classnameColumn" value=""/> |
444 <param name="sampleclassNames" value="M"/> | 461 <param name="sampleclassNames" value="M"/> |
445 <param name="wildcards" value="FALSE"/> | 462 <param name="wildcards" value="FALSE"/> |
446 <param name="inclusive" value="filter-in"/> | 463 <param name="inclusive" value="TRUE"/> |
447 <output name="sampleMetadata_out"> | 464 <output name="sampleMetadata_out"> |
448 <assert_contents> | 465 <assert_contents> |
449 <has_text text="HU_028" /> | 466 <has_text text="HU_028" /> |
450 <has_text text="HU_051" /> | 467 <has_text text="HU_051" /> |
451 <has_text text="HU_060" /> | 468 <has_text text="HU_060" /> |
467 <has_text text="HU_134" /> | 484 <has_text text="HU_134" /> |
468 <has_text text="HU_138" /> | 485 <has_text text="HU_138" /> |
469 </assert_contents> | 486 </assert_contents> |
470 </output> | 487 </output> |
471 </test> | 488 </test> |
489 <!-- test 10 - extends test4 with no imputation rather than zero imputation --> | |
490 <test> | |
491 <param name="dataMatrix_in" value="input_dataMatrix.tsv"/> | |
492 <param name="sampleMetadata_in" value="input_sampleMetadata.tsv"/> | |
493 <param name="variableMetadata_in" value="input_variableMetadata.tsv"/> | |
494 <param name="classnameColumn" value="gender"/> | |
495 <param name="sampleclassNames" value="*"/> | |
496 <param name="wildcards" value="TRUE"/> | |
497 <param name="inclusive" value="TRUE"/> | |
498 <param name="imputation" value="none"/> | |
499 <output name="dataMatrix_out" md5="cc9ab8bdb70b68b43b19b7327d285166"> | |
500 <assert_contents> | |
501 <not_has_text text="HU_204" /> | |
502 <has_text text="NA" /> | |
503 <has_text text="HU_028" /> | |
504 </assert_contents> | |
505 </output> | |
506 <output name="sampleMetadata_out"> | |
507 <assert_contents> | |
508 <not_has_text text="HU_204" /> | |
509 <has_text text="HU_028" /> | |
510 </assert_contents> | |
511 </output> | |
512 </test> | |
513 <!-- test 11 - extends test4 with center imputation rather than zero imputation --> | |
514 <test> | |
515 <param name="dataMatrix_in" value="input_dataMatrix.tsv"/> | |
516 <param name="sampleMetadata_in" value="input_sampleMetadata.tsv"/> | |
517 <param name="variableMetadata_in" value="input_variableMetadata.tsv"/> | |
518 <param name="classnameColumn" value="gender"/> | |
519 <param name="sampleclassNames" value="*"/> | |
520 <param name="wildcards" value="TRUE"/> | |
521 <param name="inclusive" value="TRUE"/> | |
522 <param name="imputation" value="center"/> | |
523 <output name="dataMatrix_out" md5="75a4802bb8887709e4d4dec8c2c3d3cf"> | |
524 <assert_contents> | |
525 <not_has_text text="HU_204" /> | |
526 <not_has_text text="NA" /> | |
527 <has_text text="HU_028" /> | |
528 </assert_contents> | |
529 </output> | |
530 <output name="sampleMetadata_out"> | |
531 <assert_contents> | |
532 <not_has_text text="HU_204" /> | |
533 <has_text text="HU_028" /> | |
534 </assert_contents> | |
535 </output> | |
536 </test> | |
472 </tests> | 537 </tests> |
473 <help><![CDATA[ | 538 <help><![CDATA[ |
474 | 539 |
475 | 540 |
476 **Author** Arthur Eschenlauer (University of Minnesota, esch0041@umn.edu) | 541 **Author** Arthur Eschenlauer (University of Minnesota, esch0041@umn.edu) |
529 - Features may be eliminated by specifying minimum or maximum value (or both) allowable in columns of variableMetadata. | 594 - Features may be eliminated by specifying minimum or maximum value (or both) allowable in columns of variableMetadata. |
530 - Features may be eliminated by “range of row-maximum for each feature”, i.e., by specifying minimum or maximum intensity (or both) allowable in each row of the dataMatrix (i.e., for the feature across all samples). | 595 - Features may be eliminated by “range of row-maximum for each feature”, i.e., by specifying minimum or maximum intensity (or both) allowable in each row of the dataMatrix (i.e., for the feature across all samples). |
531 | 596 |
532 This tool also performs several operations to address data issues that may impede downstream statistical analysis: | 597 This tool also performs several operations to address data issues that may impede downstream statistical analysis: |
533 | 598 |
534 - Missing values in dataMatrix are imputed to zero. | |
535 - The values in the dataMatrix may be log-transformed if desired. | |
536 - Samples that are missing from either sampleMetadata or dataMatrix are eliminated. | 599 - Samples that are missing from either sampleMetadata or dataMatrix are eliminated. |
537 - Features that are missing from either variableMetadata or dataMatrix are eliminated. | 600 - Features that are missing from either variableMetadata or dataMatrix are eliminated. |
538 - Features and samples that have zero variance are eliminated. | 601 - Features and samples that have zero variance are eliminated. |
539 - Samples and features are sorted alphabetically in rows and columns of dataMatrix and in rows of variableMetadata and sampleMetadata. | 602 - Samples and features are sorted alphabetically in rows and columns of dataMatrix and in rows of variableMetadata and sampleMetadata. |
540 - The names of the first columns of variableMetadata and sampleMetadata are set respectively to "variableMetadata" and "sampleMetadata". | 603 - The names of the first columns of variableMetadata and sampleMetadata are set respectively to "variableMetadata" and "sampleMetadata". |
604 - If desired, the values in the dataMatrix may be log-transformed. | |
605 - If desired, each missing value in dataMatrix is replaced with zero or the median value observed for the corresponding feature. | |
541 | 606 |
542 This tool may be applied several times sequentially, which may be useful for: | 607 This tool may be applied several times sequentially, which may be useful for: |
543 | 608 |
544 - analyzing subsets of samples for progressively smaller sets of treatment-levels, or | 609 - analyzing subsets of samples for progressively smaller sets of treatment-levels, or |
545 - choosing subsets of samples based on criteria in several columns of the sampleMetadata table. | 610 - choosing subsets of samples based on criteria in several columns of the sampleMetadata table. |
605 Variable-range filters (default = no filters) | 670 Variable-range filters (default = no filters) |
606 | comma-separated names of variable-range filters (see the 'Variable-range filters' section below) | 671 | comma-separated names of variable-range filters (see the 'Variable-range filters' section below) |
607 | | 672 | |
608 | 673 |
609 Data-transformation (default = '``none``') | 674 Data-transformation (default = '``none``') |
610 | '``none``' - do not transform data matrix values | 675 | '``none``' - Do not transform data matrix values. |
611 | '``log2``' - take the log base 2 of the values in the data matrix | 676 | '``log2``' - Take the log base 2 of the values in the data matrix. |
612 | '``log10``' - take the log base 10 of the values in the data matrix | 677 | '``log10``' - Take the log base 10 of the values in the data matrix. |
613 | In both cases, negative and missing values are imputed to zero. | 678 | |
679 | |
680 Data-imputation (default = '``zero``') | |
681 | '``none``' - Do not impute data matrix values. | |
682 | '``zero``' - Negative and missing values are imputed to zero. | |
683 | '``center``' - For each feature, negative and missing values are imputed to the median of other values. | |
614 | | 684 | |
615 | 685 |
616 | 686 |
617 ------------ | 687 ------------ |
618 Output files | 688 Output files |
706 - **If the "maximum" is less than the "minimum", then the range is exclusive** (e.g., "mz:800:200" means retain only features whose mz is NOT in the range 200-800) | 776 - **If the "maximum" is less than the "minimum", then the range is exclusive** (e.g., "mz:800:200" means retain only features whose mz is NOT in the range 200-800) |
707 - **If the name supplied in the first field is 'FEATMAX',** then the string is defining the minimum (and possibly, though less useful, maximum) intensity for each feature in the dataMatrix. For example, "FEATMAX:1e6:" would specify that any feature would be excluded if no sample had an intensity for that feature greater than 1000000. | 777 - **If the name supplied in the first field is 'FEATMAX',** then the string is defining the minimum (and possibly, though less useful, maximum) intensity for each feature in the dataMatrix. For example, "FEATMAX:1e6:" would specify that any feature would be excluded if no sample had an intensity for that feature greater than 1000000. |
708 | 778 |
709 - Note, however, that when the "maximum" is greater than the "minimum" for the FEATMAX range specification, then the specification is ignored. | 779 - Note, however, that when the "maximum" is greater than the "minimum" for the FEATMAX range specification, then the specification is ignored. |
710 | 780 |
781 ---------------------------------- | |
782 Data transformation and imputation | |
783 ---------------------------------- | |
784 | |
785 Data may optionally be log2- or log10-transformed. | |
786 | |
787 Negative intensity values are always substituted with zeros. | |
788 | |
789 Missing intensity data values may optionally be imputed. Missing values may be substituted with zeros (as may be appropriate for univariate analysis) or with the median for the feature (as may be appropriate for multivariate analysis). (Note that the median feature-intensity is computed for the samples *before* variable-range filters are applied.) | |
790 | |
711 ----------------------------------------------------------------------------- | 791 ----------------------------------------------------------------------------- |
712 | 792 |
713 ---------------- | 793 ---------------- |
714 WORKING EXAMPLES | 794 WORKING EXAMPLES |
715 ---------------- | 795 ---------------- |
716 | |
717 .. class:: infomark | |
718 | 796 |
719 ----------- | 797 ----------- |
720 Input Files | 798 Input Files |
721 ----------- | 799 ----------- |
722 | 800 |
728 | https://raw.githubusercontent.com/HegemanLab/w4mclassfilter_galaxy_wrapper/master/tools/w4mclassfilter/test-data/input_sampleMetadata.tsv | | 806 | https://raw.githubusercontent.com/HegemanLab/w4mclassfilter_galaxy_wrapper/master/tools/w4mclassfilter/test-data/input_sampleMetadata.tsv | |
729 +------------------------------------------------------------------------------------------------------------------------------------------------------+ | 807 +------------------------------------------------------------------------------------------------------------------------------------------------------+ |
730 | https://raw.githubusercontent.com/HegemanLab/w4mclassfilter_galaxy_wrapper/master/tools/w4mclassfilter/test-data/input_variableMetadata.tsv | | 808 | https://raw.githubusercontent.com/HegemanLab/w4mclassfilter_galaxy_wrapper/master/tools/w4mclassfilter/test-data/input_variableMetadata.tsv | |
731 +------------------------------------------------------------------------------------------------------------------------------------------------------+ | 809 +------------------------------------------------------------------------------------------------------------------------------------------------------+ |
732 | 810 |
733 .. class:: infomark | |
734 | |
735 ------------------------------- | 811 ------------------------------- |
736 Running Without Range-Filtering | 812 Running Without Range-Filtering |
737 ------------------------------- | 813 ------------------------------- |
738 | 814 |
739 This example retains only samples whose 'gender' attribute is 'M'. | 815 This example retains only samples whose 'gender' attribute is 'M'. |
740 | 816 |
741 **Input parameters** | 817 **Input parameters** |
742 | 818 |
743 +------------------------------------+-------------------------------+ | 819 +---------------------------------------------+-------------------------------+ |
744 | Input Parameter | Value | | 820 | Input Parameter | Value | |
745 +====================================+===============================+ | 821 +=============================================+===============================+ |
746 | Names of sample-classes | M | | 822 | Column that names the sample-class | gender | |
747 +------------------------------------+-------------------------------+ | 823 +---------------------------------------------+-------------------------------+ |
748 | Include named classes | filter-in | | 824 | Names of sample-classes | M | |
749 +------------------------------------+-------------------------------+ | 825 +---------------------------------------------+-------------------------------+ |
750 | Column that names the sample-class | gender | | 826 | Use 'wild-cards' or 'regular expressions' | wild-cards | |
751 +------------------------------------+-------------------------------+ | 827 +---------------------------------------------+-------------------------------+ |
752 | Variable range-filters | (Leave this field empty.) | | 828 | Exclude/include named classes | filter-in | |
753 +------------------------------------+-------------------------------+ | 829 +---------------------------------------------+-------------------------------+ |
754 | Data transformation | none | | 830 | Variable range-filters | (Leave this field empty.) | |
755 +------------------------------------+-------------------------------+ | 831 +---------------------------------------------+-------------------------------+ |
832 | Data transformation | none | | |
833 +---------------------------------------------+-------------------------------+ | |
834 | Missing-value imputation | center | | |
835 +---------------------------------------------+-------------------------------+ | |
756 | 836 |
757 **Expected outputs** | 837 **Expected outputs** |
758 | 838 |
759 +-------------------+-------------------------------------------------------------------------------------------------------------------------------------------------+ | 839 +-------------------+-------------------------------------------------------------------------------------------------------------------------------------------------+ |
760 | Expected Output | Download from URL | | 840 | Expected Output | Download from URL | |
764 | Sample metadata | https://raw.githubusercontent.com/HegemanLab/w4mclassfilter_galaxy_wrapper/master/tools/w4mclassfilter/test-data/expected_sampleMetadata.tsv | | 844 | Sample metadata | https://raw.githubusercontent.com/HegemanLab/w4mclassfilter_galaxy_wrapper/master/tools/w4mclassfilter/test-data/expected_sampleMetadata.tsv | |
765 +-------------------+-------------------------------------------------------------------------------------------------------------------------------------------------+ | 845 +-------------------+-------------------------------------------------------------------------------------------------------------------------------------------------+ |
766 | Variable metadata | https://raw.githubusercontent.com/HegemanLab/w4mclassfilter_galaxy_wrapper/master/tools/w4mclassfilter/test-data/expected_variableMetadata.tsv | | 846 | Variable metadata | https://raw.githubusercontent.com/HegemanLab/w4mclassfilter_galaxy_wrapper/master/tools/w4mclassfilter/test-data/expected_variableMetadata.tsv | |
767 +-------------------+-------------------------------------------------------------------------------------------------------------------------------------------------+ | 847 +-------------------+-------------------------------------------------------------------------------------------------------------------------------------------------+ |
768 | 848 |
769 .. class:: infomark | |
770 | |
771 ---------------------------- | 849 ---------------------------- |
772 Running With Range-Filtering | 850 Running With Range-Filtering |
773 ---------------------------- | 851 ---------------------------- |
774 | 852 |
775 This example retains only features whose mz is greater than 200, whose rt is less than 800, and whose maximum intensity across all samples is at least 2,000,000. | 853 This example retains only features whose mz is greater than 200, whose rt is less than 800, and whose maximum intensity across all samples is at least 2,000,000. |
776 This example retains all samples (except those having zero variance for all features), although it would be possible to filter on samples as well. | 854 This example retains all samples (except those having zero variance for all features), although it would be possible to filter on samples as well. |
777 | 855 |
778 **Input parameters** | 856 **Input parameters** |
779 | 857 |
780 +------------------------------------+------------------------------------+ | 858 +---------------------------------------------+-----------------------------------+ |
781 | Input Parameter | Value | | 859 | Input Parameter | Value | |
782 +====================================+====================================+ | 860 +=============================================+===================================+ |
783 | Names of sample-classes | (Leave this field empty.) | | 861 | Column that names the sample-class | sampleMetadata | |
784 +------------------------------------+------------------------------------+ | 862 +---------------------------------------------+-----------------------------------+ |
785 | Include named classes | filter-out | | 863 | Names of sample-classes | HU_13[48] | |
786 +------------------------------------+------------------------------------+ | 864 +---------------------------------------------+-----------------------------------+ |
787 | Column that names the sample-class | gender | | 865 | Use 'wild-cards' or 'regular expressions' | regular-expressions | |
788 +------------------------------------+------------------------------------+ | 866 +---------------------------------------------+-----------------------------------+ |
789 | Variable range-filters | FEATMAX:20.93157:,mz:200:,rt::800 | | 867 | Exclude/include named classes | filter-out | |
790 +------------------------------------+------------------------------------+ | 868 +---------------------------------------------+-----------------------------------+ |
791 | Data transformation | log2 | | 869 | Variable range-filters | FEATMAX:20.93157:,mz:200:,rt::800 | |
792 +------------------------------------+------------------------------------+ | 870 +---------------------------------------------+-----------------------------------+ |
871 | Data transformation | log2 | | |
872 +---------------------------------------------+-----------------------------------+ | |
873 | Missing-value imputation | zero | | |
874 +---------------------------------------------+-----------------------------------+ | |
793 | 875 |
794 **Expected outputs** | 876 **Expected outputs** |
795 | 877 |
796 +-------------------+---------------------------------------------------------------------------------------------------------------------------------------------------+ | 878 +-------------------+---------------------------------------------------------------------------------------------------------------------------------------------------+ |
797 | Expected Output | Download from URL | | 879 | Expected Output | Download from URL | |