annotate SPIA.xml @ 1:401181d40d7a draft

Uploaded
author mora-lab
date Thu, 20 May 2021 08:52:23 +0000
parents
children 1928527cb55d
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
1
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
1 <tool id="SPIA" name="SPIA (Signaling Pathway Impact Analysis)" version="0.1.0" >
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
2 <description>A method based on over-representation and signaling perturbation accumulation to analyze KEGG signaling pathways.</description>
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
3
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
4 <requirements>
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
5 <requirement type="package" version="1.20.3">r-getopt</requirement>
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
6 <requirement type="package" version="2.42.0">bioconductor-SPIA</requirement>
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
7 <requirement type="package" version="2.14.0">bioconductor-chipenrich.data</requirement>
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
8 </requirements>
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
9
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
10 <command detect_errors="exit_code"><![CDATA[
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
11 Rscript '$__tool_directory__/SPIA.R'
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
12 -D '$input_data'
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
13 -O '$organism'
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
14 -R '$sigP_output'
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
15
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
16 -P '$adv.P_value_threshold'
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
17
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
18 -N '$adv.Number_bootstrap'
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
19 -C '$adv.method_combine_pvalue'
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
20 #if $adv.plot_perturbation=="True":
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
21 -W
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
22 -L '$SPIA_Perturbation_Plots'
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
23 #end if
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
24
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
25 #if $adv.pathwayId !="":
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
26 -I '$adv.pathwayId'
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
27 #end if
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
28
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
29 ]]></command>
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
30
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
31 <inputs>
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
32 <param type="data" name="input_data" format="csv" multiple="false" label="Input data" help="A csv file including the columns ENTREZ, logFC, and adj.P.Val"/>
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
33 <param type="text" name="organism" value="hsa" label="Organism" help="A three letter character designating the organism. Default is `hsa` (human). See a full list at https://www.genome.jp/kegg/catalog/org_list.html" />
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
34
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
35 <section name="adv" title="Advanced Options" expanded="false">
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
36 <param type="float" name="P_value_threshold" label="P value threshold to select DEgenes" value="0.05" min="0.00" max="1.00" help="Set a threshold value to define differentially expressed genes"/>
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
37 <param type="integer" name="Number_bootstrap" value="2000" min="100" label="Bootstrap iterations" help="Number of bootstrap iterations used to compute the P PERT value. Should be larger than 100. A recommended value is 2000." />
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
38 <param type="select" name="method_combine_pvalue" label="Method to combine P values" help="Method used to combine the two types of p-values. If set to 'fisher' it will use Fisher's method. If set to 'norminv' it will use the normal inversion method.">
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
39 <option value="fisher" selected="True">fisher</option>
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
40 <option value="norminv">norminv</option>
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
41 </param>
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
42 <param type="boolean" name="plot_perturbation" truevalue="True" falsevalue="False" checked="False" label="Plot perturbation" help="If set to Yes, plot the gene perturbation accumulation vs log2 fold change for every gene on each pathway. Default is No." />
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
43 <param type="text" name="pathwayId" value="" label="Pathway IDs -- default as NULL and analysis all pathway. " help="Special one or more pathway to analysis, input pathway ID at here. For example: 03018, 03320."/>
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
44 </section>
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
45
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
46 </inputs>
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
47
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
48 <outputs>
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
49 <data name="sigP_output" format="csv" label="SPIA_enrich_kegg" />
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
50 <data format="pdf" name="SPIA_Perturbation_Plots" label="SPIA_Perturbation_Plots">
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
51 <filter>adv['plot_perturbation'] == True</filter>
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
52 </data>
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
53 </outputs>
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
54
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
55 <tests>
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
56 <test>
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
57 <param name="input_data" value="SPIA_input.csv" ftype="csv" />
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
58 <output name="sigP_output" file="x.csv" ftype="csv" />
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
59 </test>
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
60 </tests>
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
61
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
62 <help><![CDATA[
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
63
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
64 .. class:: infomark
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
65
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
66 **What it does**
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
67
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
68 SPIA (Signaling pathway impact analysis) combines the evidence obtained from the
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
69 classical enrichment analysis with a novel type of evidence, which measures the actual
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
70 perturbation on a given pathway under a given condition.
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
71
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
72 A bootstap procedure is used to assess the significance of the observed total pathway perturbation.
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
73
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
74 Then we can calculate a global pathway significance P-value, which combines the enrichment and perturbation P-values.
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
75
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
76 SPIA tool analyzes KEGG signaling pathways.
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
77
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
78 -------
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
79
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
80 =========
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
81 **Input**
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
82 =========
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
83
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
84 Basic options
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
85 --------------
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
86
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
87 **Input data**
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
88
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
89 The input data is a csv file, which includes the columns `ENTREZ`, `logFC` and `adj.P.Val`.
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
90 This file contains all genes of your dataset.
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
91
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
92 ====== ========== ======= ========== ========= ==== ========
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
93 logFC AveExpr t P.Value adj.P.Val B ENTREZ
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
94 ====== ========== ======= ========== ========= ==== ========
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
95 5.96 6.23 23.9 1.79e-17 9.78e-13 25.4 3491
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
96 5.14 7.49 17.4 1.56e-14 2.84e-10 21.0 2353
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
97 4.15 7.04 16.5 5.15e-14 7.04e-10 20.1 1958
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
98 2.43 9.59 14.1 1.29e-12 1.41e- 8 17.7 1843
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
99 1.53 8.22 11.0 1.69e-10 1.15e- 6 13.6 3725
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
100 1.43 5.33 10.5 4.27e-10 2.42e- 6 12.8 23645
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
101 ====== ========== ======= ========== ========= ==== ========
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
102
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
103 **Organism**
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
104
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
105 A three letter word designating the organism of your data. Default is `hsa` (Human). See a full list of options at https://www.genome.jp/kegg/catalog/org_list.html.
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
106
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
107 ------
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
108
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
109 Advanced Options
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
110 -----------------
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
111
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
112 **P value threshold to select DEgenes**
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
113
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
114 Set a threshold value to define differentially expressed genes. Default is 0.05.
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
115
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
116 **Bootstrap iterations**
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
117
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
118 Number of bootstrap iterations used to compute the `pPERT` value. Should be larger than 100. A recommended value is 2000.
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
119
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
120 **Method to combine P values**
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
121
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
122 Method used to combine the two types of p-values. If set to 'fisher' it will use Fisher's method. If set to 'norminv' it will use the normal inversion method.
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
123
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
124 **Plot perturbation**
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
125
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
126 If set to `Yes`, plots the gene perturbation accumulation vs log2 fold change for every gene on each pathway. Default is `No`.
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
127
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
128 **Pathway IDs -- default as NULL and analysis all pathway.**
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
129
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
130 if you want special one or more pathway to analysis, Input pathway id at here. for example: `03018, 03320`.
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
131
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
132 ------
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
133
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
134 ==========
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
135 **Output**
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
136 ==========
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
137
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
138 **CSV file**
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
139
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
140 This file contains the ranked pathways and various statistics:
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
141 - **Name** is the pathway name;
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
142 - **ID** is the pathway ID;
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
143 - **pSize** is the number of genes on the pathway;
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
144 - **NDE** is the number of DE genes per pathway;
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
145 - **tA** is the observed total perturbation accumulation in the pathway;
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
146 - **pNDE** is the probability to observe at least NDE genes on the pathway using a hypergeometric model;
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
147 - **pPERT** is the probability to observe a total accumulation more extreme than tA only by chance;
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
148 - **pG** is the p-value obtained by combining pNDE and pPERT;
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
149 - **pGFdr** and **pGFWER** are the False Discovery Rate and Bonferroni adjusted global p-values;
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
150 - **Status** gives the direction in which the pathway is perturbed (activated or inhibited).
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
151 - **KEGGLINK** gives a web link to the KEGG website that displays the pathway image with the differentially expressed genes highlighted in red.
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
152
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
153 **PDF file**
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
154
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
155 If the plot argument is set to `Yes`, it will output the plots for the gene perturbation accumulation vs log2 fold change for every gene on each pathway.
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
156
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
157 ------
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
158
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
159 Please cite SPIA_ appropriately if you use them.
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
160
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
161 .. _SPIA: https://pubmed.ncbi.nlm.nih.gov/18990722/
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
162
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
163 ]]></help>
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
164
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
165 <citations>
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
166 <citation type="doi">10.1093/bioinformatics/btn577</citation>
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
167 </citations>
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
168
401181d40d7a Uploaded
mora-lab
parents:
diff changeset
169 </tool>