annotate secimtools/principal_component_analysis.xml @ 0:b54326490b4d draft

Upload 21.3.4.2 release
author malex
date Mon, 08 Mar 2021 20:55:03 +0000
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
1 <tool id="secimtools_principal_component_analysis" name="Principal Component Analysis (PCA)" version="@WRAPPER_VERSION@">
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
2 <description>for visual summaries of the components.</description>
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
3 <macros>
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
4 <import>macros.xml</import>
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
5 </macros>
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
6 <expand macro="requirements" />
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
7 <command detect_errors="exit_code"><![CDATA[
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
8 principal_component_analysis.py
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
9 --input '$input'
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
10 --design '$design'
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
11 --ID '$uniqID'
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
12 --load_out '$loadings'
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
13 --score_out '$scores'
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
14 --summary_out '$summary'
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
15 --figure '$figures'
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
16 ## All substitutions are single-quoted so values with spaces or shell metacharacters stay one argument; --group is passed only when the user filled in the field.
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
17 #if $group
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
18 --group '$group'
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
19 #end if
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
20 ]]></command>
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
21 <inputs>
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
22 <param name="input" type="data" format="tabular" label="Wide Dataset" help="Input your tab-separated wide format dataset. If file is not tab separated see TIP below."/>
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
23 <param name="design" type="data" format="tabular" label="Design File" help="Input your design file (tab-separated). Note you need a 'sampleID' column. If not tab separated see TIP below."/>
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
24 <param name="uniqID" type="text" size="30" value="" label="Unique Feature ID" help="Name of the column in your wide dataset that has unique identifiers."/>
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
25 <param name="group" type="text" size="30" label="Group/Treatment [Optional]" help="Name of the column in your design file that contains group classifications."/>
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
26 </inputs>
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
27 <outputs>
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
28 <data format="tabular" name="loadings" label="${tool.name} on ${on_string}: loadings"/>
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
29 <data format="tabular" name="scores" label="${tool.name} on ${on_string}: scores"/>
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
30 <data format="tabular" name="summary" label="${tool.name} on ${on_string}: summary"/>
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
31 <data format="pdf" name="figures" label="${tool.name} on ${on_string}: scatter plots"/>
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
32 </outputs>
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
33 <tests>
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
34 <test>
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
35 <param name="input" value="ST000006_data.tsv"/>
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
36 <param name="design" value="ST000006_design.tsv"/>
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
37 <param name="uniqID" value="Retention_Index" />
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
38 <param name="group" value="White_wine_type_and_source" />
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
39 <output name="loadings" file="ST000006_principal_component_analysis_load_out.tsv" />
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
40 <output name="scores" file="ST000006_principal_component_analysis_score_out.tsv" />
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
41 <output name="summary" file="ST000006_principal_component_analysis_summary_out.tsv" />
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
42 <output name="figures" file="ST000006_principal_component_analysis_figure.pdf" compare="sim_size" delta="10000" />
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
43 </test>
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
44 </tests>
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
45 <help><![CDATA[
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
46
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
47 @TIP_AND_WARNING@
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
48
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
49 **Tool Description**
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
50
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
51 The tool performs principal component analysis (PCA) of the data.
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
52 Visual summaries are provided in the form of 2D and 3D scatter plots for the first three principal components.
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
53 Samples in the scatter plots are colored based on the group classification.
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
54
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
55 --------------------------------------------------------------------------------
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
56
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
57 **Note**
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
58
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
59 - This tool currently treats all variables as continuous numeric variables. Running the tool on categorical variables might result in incorrect results.
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
60 - Rows containing non-numeric (or missing) data in any of the chosen columns will be excluded from the analysis.
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
61
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
62 --------------------------------------------------------------------------------
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
63
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
64 **Input**
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
65
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
66 - Two input datasets are required.
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
67
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
68 @WIDE@
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
69
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
70 **NOTE:** The sample IDs must match the sample IDs in the Design File (below).
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
71 Extra columns will automatically be ignored.
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
72
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
73
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
74 @METADATA@
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
75
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
76 @UNIQID@
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
77
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
78 @GROUP_OPTIONAL@
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
79
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
80 --------------------------------------------------------------------------------
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
81
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
82 **Output**
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
83
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
84 Four different outputs are produced by the Principal Component Analysis tool:
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
85
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
86 (1) a TSV file containing eigenvectors/variable loadings
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
87 (2) a TSV file containing scores of input data on principal components
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
88 (3) a TSV file with the summary for each component
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
89 (4) and a PDF file of scatter plots of the first three principal components
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
90
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
91 There are a total of four scatter plots: three pairwise plots for the first three components and a single 3D plot of the first three components.
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
92
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
93 ]]></help>
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
94 <expand macro="citations"/>
b54326490b4d Upload 21.3.4.2 release
malex
parents:
diff changeset
95 </tool>