# HG changeset patch # User eschen42 # Date 1520135894 18000 # Node ID d5cf23369d12f711557c0b6e1f43a65a6c884826 # Parent 582a8a42a93baaf4fa0e01b3564880444230844b planemo upload for repository https://github.com/HegemanLab/w4mclassfilter_galaxy_wrapper/tree/master commit 7b824bc01884125dc8bb2e4c9ef70fb0a6d88db1 diff -r 582a8a42a93b -r d5cf23369d12 README --- a/README Mon Jan 29 21:20:07 2018 -0500 +++ b/README Sat Mar 03 22:58:14 2018 -0500 @@ -1,7 +1,8 @@ Galaxy Wrapper for the w4mclassfilter R Package + -This is a planemo -oriented galaxy-tool-wrapper +This is a Galaxy tool-wrapper to wrap the w4mclassfilter R package for use with the Workflow4Metabolomics -flavor of Galaxy +flavor of Galaxy . +The tool is built with Planemo . diff -r 582a8a42a93b -r d5cf23369d12 test-data/rangefilter_dataMatrix.tsv --- a/test-data/rangefilter_dataMatrix.tsv Mon Jan 29 21:20:07 2018 -0500 +++ b/test-data/rangefilter_dataMatrix.tsv Sat Mar 03 22:58:14 2018 -0500 @@ -1,6 +1,6 @@ HU_017 HU_028 HU_034 HU_051 HU_060 HU_078 HU_091 HU_093 HU_099 HU_110 HU_130 HU_134 HU_138 HU_149 HU_152 HU_175 HU_178 HU_185 HU_208 -HMDB00191 560002 771533 575790 392284 888498 785428 645785 591569 960658 910201 639437 1092885 1409045 2292023 1246459 1945577 710519 773384 622898 -HMDB00208 747080 13420742 595872 1172376 7172632 3143654 4059767 1433702 5593888 5402629 2477288 3346077 4230072 7621236 8960828 10335722 7037373 1574738 2540044 -HMDB01032 2569205 26023086 1604999 430453 8103558 26222916 257139 675754 59906109 263055 31151730 18648127 14989438 1554658 20249262 5588731 871010 15920 44276 -HMDB01101.1 6877586 52217 3158 10789748 229568 4763576 3878773 976436 831937 608298 1605075 72021 442510 1107705 1464339 31250 2724553 72900 30689 -HMDB13189 2644620 727587 1661412 619181 136278 2755434 593863 837865 3526136 2003278 1608814 3446611 1941527 113937 3132404 2893445 2092753 1034666 841661 +HMDB00191 19.0950724540801 19.5573683394871 19.1351832076319 18.581538968171 19.7610090032025 19.5831195045026 19.3006944055142 19.1741869272827 19.8736633887651 19.7958256457729 19.2864427002132 20.0597101691826 20.4262862563728 21.1281900906526 20.2494039981067 20.8917666482316 19.438513703552 19.5608253922588 19.2486364146654 +HMDB00208 19.5109032146715 23.6779611010349 19.1846429313023 20.1610039089984 22.7740711828923 21.5840110083096 21.9529654992985 20.451313755289 22.4154199380002 22.3652301844309 21.2403301698498 21.6740392144135 22.0122507889717 22.8615935600174 23.0952006159265 23.3011358356974 22.746605551146 20.5866803867983 21.2764220576728 +HMDB01032 21.2928905785523 24.6332887213057 20.6141409677961 18.7154961966847 22.9501240553341 24.6443247870262 17.9721889132336 19.3661386209868 25.8361997953493 18.0050049466979 24.8928089492302 24.1525273990616 23.8374429574498 20.5681658146509 24.2713659930314 22.4140893053724 19.7323297568288 13.958552715431 15.4342372710269 +HMDB01101.1 22.7134708439962 15.6722319530667 11.6247954558602 23.3631578345615 17.8085620299575 22.183613575742 21.8871689158671 19.8971659609365 19.6661147561338 19.214418735272 20.6142092807528 16.1361300108053 18.7553505325418 20.079142288524 20.4818181509538 14.9315685693242 21.3775881248719 16.1536311941017 14.9054340159519 +HMDB13189 21.3346290086766 19.4727602406215 20.6639784491577 19.2400016764968 17.0561931543153 21.3938481405109 19.1797706242895 19.6763582845664 21.7496566885488 20.9339312108399 20.6175661105571 21.7167470481744 20.8887603396637 16.7978767996065 21.5788388647145 21.4643567902489 20.9969706149343 19.9807336965562 19.6828797432404 diff -r 582a8a42a93b -r d5cf23369d12 w4mclassfilter.xml --- a/w4mclassfilter.xml Mon Jan 29 21:20:07 2018 -0500 +++ b/w4mclassfilter.xml Sat Mar 03 22:58:14 2018 -0500 @@ -1,6 +1,7 @@ - - - Filter W4M data by sample class + + Filter W4m data by values or metadata + + @@ -23,8 +24,9 @@ inclusive '$inclusive' wildcards '$wildcards' classnameColumn '$classnameColumn' - samplenameColumn '$samplenameColumn' + samplenameColumn 'sampleMetadata' variable_range_filter '$variableRangeFilter' + transformation '$transformation' dataMatrix_out '$dataMatrix_out' sampleMetadata_out '$sampleMetadata_out' variableMetadata_out '$variableMetadata_out' @@ -34,12 +36,23 @@ - - - + + + + + + + + + + + + + + @@ -54,38 +67,43 @@ - - - + - + - + - + + + - + + + + + + - - - + + + @@ -93,12 +111,76 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + - - + + + + + + + @@ -149,8 +231,8 @@ - + @@ -199,7 +281,6 @@ - @@ -233,7 +314,6 @@ - @@ -267,7 +347,6 @@ - @@ -297,7 +376,6 @@ - @@ -327,7 +405,6 @@ - @@ -361,7 +438,6 @@ - @@ -402,7 +478,7 @@ **R package** -The *w4mclassfilter* package is available from the Hegeman lab github repository (https://github.com/HegemanLab/w4mclassfilter/releases). +The *w4mclassfilter* package (which is used by the W4m Data Subset tool) is available from the Hegeman lab github repository (https://github.com/HegemanLab/w4mclassfilter/releases). ----------------------------------------------------------------------------------------------------------------------------------------- @@ -413,44 +489,67 @@ --------------------------------------------------- -============================================== -Filter Workflow4Metabolomics data matrix files -============================================== +=========================================================== +"W4m Data Subset" - Filter Workflow4Metabolomics data files +=========================================================== + +---------- +Motivation +---------- + +GC-MS and LC-MS experiments seek to resolve as features chemicals that have distinct chromatographic retention-time ("rt") and (after ionization) mass-to-charge ratio ("m/z" or "mz"). +(If the MS protocol includes fragmentation, several features may result for each chemical.) +Data for a sample are collected as MS intensities, each of which is associated with a position on a 2D plane with dimensions of rt and m/z. +Ideally, features would be sufficiently reproducible among sample-runs to distinguish features that are commmon among samples from those that differ. + +The chromatographic retention-time for a chemical can vary from one chromatography run to the next. +Workflow4Metabolomics (W4m, [Giacomoni *et al.*, 2014, Guitton *et al.* 2017]) is a "flavor" of Galaxy that uses the XCMS preprocessing tools for "retention-time correction" to align features among samples. +Features may be better aligned if pooled samples and blanks are included. + +Multivariate statistical techniques may be used to discover clusters of similar samples (Th]]>é - + 10.1093/bioinformatics/btu813 - + 10.1016/j.biocel.2017.07.002 + + 10.1021/ac202450g 10.1021/ac051437y - + 10.1021/acs.jproteome.5b00354