comparison pathifier.xml @ 0:fec313f5c889 draft

"planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/pathifier commit b94cfc7bf8df30aa8e9249b75ea31332ee2bada1"
author artbio
date Mon, 12 Apr 2021 09:55:24 +0000
parents
children 0960bd1161fa
comparison
equal deleted inserted replaced
-1:000000000000 0:fec313f5c889
1 <tool id="pathifier" name="Pathifier" version="1.0.1">
2 <description>: Quantify deregulation of pathways in cancer</description>
3 <requirements>
4 <requirement type="package" version="1.6.2=r35h6115d3f_0">r-optparse</requirement>
5 <requirement type="package" version="1.22.0=r351_0">bioconductor-pathifier</requirement>
6 <requirement type="package" version="1.0.12=r351h6115d3f_0">r-pheatmap</requirement>
7 <requirement type="package" version="0.3_41=r351h6115d3f_0">r-scatterplot3d</requirement>
8 <requirement type="package" version="0.4.7=r35h6115d3f_0">r-circlize</requirement>
9 </requirements>
10 <stdio>
11 <exit_code range="1:" level="fatal" description="Tool exception" />
12 </stdio>
13 <command detect_errors="exit_code"><![CDATA[
14 Rscript $__tool_directory__/pathifier.R
15 --exp '$input'
16 --sep '$input_sep'
17 --genes '$genes'
18
19 #if $reference.is_normal == "Yes":
20 --is_normal 'TRUE'
21 --normals '$reference.normals'
22 #end if
23
24 --max_stability '$max_stability'
25 --attempts '$attempts'
26 --min_std '$min_std'
27 --min_exp '$min_exp'
28
29 --heatmap_cluster_cells '$heatmap_cluster_cells'
30 --heatmap_cluster_pathways '$heatmap_cluster_pathways'
31 --heatmap_show_cell_labels '$heatmap_show_cell_labels'
32 --heatmap_show_pathway_labels '$heatmap_show_pathway_labels'
33
34 --pds '$pds'
35 --logfile '$logfile'
36 --plot '$plot'
37 --rdata '$rdatafile'
38
39 ]]></command>
40 <inputs>
41 <param name="input" type="data" format="txt,tabular" label="expression data"/>
42 <param name="input_sep" type="select" label="Input column separator">
43 <option value="tab" selected="true">Tabs</option>
44 <option value=",">Comma</option>
45 </param>
46 <param name="genes" type="data" format="txt" label="Gene sets Pathways"
47 help="Must be in gmt format (one pathway per line : Name, description, genes (one by column), tab separated)" />
48 <conditional name="reference">
49 <param name="is_normal" label="Do you have non cancer transcriptomes in your data set ?" type="boolean" truevalue="Yes" falsevalue="" checked="false"
50 help="If set the starting curve depends on the matrix of points with in a certain row order (first 'normal' then 'cancer' samples), otherwise the first principal component is used. See help for more informations"/>
51 <when value="Yes">
52 <param name="normals" type="data" format="tabular" label="Sample status"
53 help="A two-column data frame, first column contains data labels, second column the levels of sample status : 1 = Healthy, 0 = Tumor (no header)" />
54 </when>
55 <when value="">
56 </when>
57 </conditional>
58 <param name="max_stability" label="Throw away components leading to low stability of sampling noise" type="boolean" truevalue="TRUE"
59 falsevalue="FALSE" checked="true" />
60 <param name="attempts" type="integer" label="Number of runs to determine stability" value="100"/>
61 <param name="min_std" type="text" value="0.4" label="Minimum of standard deviation to filter out low variable genes"
62 help="Use 'data' to use the minimum standard deviation of your data" />
63 <param name="min_exp" type="text" value="4" label="Minimum of gene expression to filter out low variable genes"
64 help="Use 'data' to use the minimum expression of your data" />
65 <param name="heatmap_cluster_cells" label="Cluster samples on heatmap" type="boolean" truevalue="TRUE" falsevalue="FALSE" checked="true" />
66 <param name="heatmap_cluster_pathways" label="Cluster pathways on heatmap" type="boolean" truevalue="TRUE" falsevalue="FALSE" checked="true" />
67 <param name="heatmap_show_cell_labels" label="Show sample labels on heatmap" type="boolean" truevalue="TRUE" falsevalue="FALSE" checked="false" />
68 <param name="heatmap_show_pathway_labels" label="Cluster pathway labels on heatmap" type="boolean" truevalue="TRUE" falsevalue="FALSE" checked="true" />
69 <param label="Return log file of pathifier" name="log" type="select" >
70 <option value="no" selected="True">No</option>
71 <option value="yes">Yes</option>
72 </param>
73 <param label="Return Pathifier S4 object" name="rdata" type="select" >
74 <option value="no" selected="True">No</option>
75 <option value="yes">Yes</option>
76 </param>
77
78 </inputs>
79 <outputs>
80 <data name="pds" format="tabular" label="Pathifier Deregulation Score (PDS) of ${on_string}" />
81 <data name="logfile" format="txt" label="Pathifier log file of ${on_string}" >
82 <filter>log == 'yes'</filter>
83 </data>
84 <data name="plot" format="pdf" label="Pathifier vizualization of ${on_string}" />
85 <data name="rdatafile" format="rdata" label="Pathifier S4 object of ${on_string}" >
86 <filter>rds == 'yes'</filter>
87 </data>
88 </outputs>
89 <tests>
90 <test>
91 <param name="input" value="sheffer.tsv" ftype="tabular"/>
92 <param name="genes" value="kegg_pathways.gmt" ftype="txt" />
93 <param name="is_normal" value="True" />
94 <param name="normals" value="normals.tsv" ftype="tabular" />
95 <param name="log" value="yes" />
96 <param name="attempts" value="100" />
97 <output name="logfile" file="sheffer.kegg.log" ftype="txt" compare="sim_size" />
98 <output name="pds" file="sheffer.kegg.tsv" ftype="tabular"/>
99 <output name="plot" file="plot.pdf" ftype="pdf" compare="sim_size" />
100 </test>
101 <test>
102 <param name="input" value="sheffer_noref.tsv" ftype="tabular"/>
103 <param name="genes" value="kegg_pathways.gmt" ftype="txt" />
104 <param name="is_normal" value="" />
105 <param name="log" value="no" />
106 <param name="rdata" value="yes" />
107 <param name="attempts" value="50" />
108 <param name="min_exp" value="data" />
109 <param name="min_std" value="data" />
110 <output name="pds" file="sheffer.kegg_noref.tsv" ftype="tabular"/>
111 <output name="rdatafile" file="sheffer.kegg_noref.rdata" ftype="rdata" compare="sim_size" />
112 <output name="plot" file="plot_noref.pdf" ftype="pdf" compare="sim_size" />
113 </test>
114 </tests>
115 <help>
116
117 **What it does**
118
119 Pathifier is an algorithm that infers pathway deregulation scores for each (tumor) sample on the basis
120 of expression data. This score is determined, in a context-specific manner, for every particular dataset
121 and type of cancer that is being investigated. The algorithm transforms gene-level information into
122 pathway-level information, generating a compact and biologically relevant representation of each sample.
123
124 For each pathway analysed, the transcriptome datasets are plotted in the gene pathway space using a
125 Principal Component analysis (PCA) and a principal curve is regressed from these points. All transcriptomes
126 are projected on the nearest point of this curve. Pathifier finally computes a score which corresponds to
127 the distance (normalized to 1) of each point (transcriptome) to the curve origin.
128
129 **Inputs**
130
131 * a matrix of n columns of observations (generally RNAseq experiments) and k rows of variables (generally k genes).
132 * a Gene Matrix Transposed file (GMT format) where each row represents a gene set :
133 * first column : gene set name (pathway name)
134 * second : description of gene set
135 * third and + : list of genes that composed the gene set tab-separated
136 * (Optional) a two column table with no header, to described transcriptome status (Tumor or not) :
137 * first column : sample labels
138 * second : levels of sample status : 1 = Healthy, 0 = Tumor
139
140 **Outputs**
141
142 * Table of Pathway Deregulation Scores : one by pathway (column) and by transcriptome (row)
143 * Visualization of PDS (pdf) :
144 * Principal curve of different PDS
145 * Heatmap of PDS that allows (through clustering) to see pattern in pathway deregulation
146 * (Optional) Log file of Pathifier algorithm
147 * (Optional) Pathifier S4 object which contains all informations and results generated by Pathifier, for each pathway :
148 * `scores` : PDS scores
149 * `genesinpathway` : Gene identifiers in each pathway
150 * `newmeanstd`
151 * `origmeanstd`
152 * `pathwaysize` : Number of genes retained in pathway
153 * `curves` : Coordinates of transcriptomes projected on the principal curve
154 * `curves_order` : Order of transcriptomes along the principal curve
155 * `z` : z-scores matrix
156 * `compin`
157 * `xm`
158 * `xs`
159 * `center`
160 * `rot`
161 * `pctaken` : Number of principal component retained for pathifier analysis
162 * `samplings`
163 * `sucess` : List of pathway index that passed Pathfiier filters (more info in log file)
164 * `logfile` : Name of logfile
165
166 </help>
167 <citations>
168 <citation type="bibtex">@Manual{,
169 title = {{pathifier}: Quantify deregulation of pathways in cancer},
170 author = {Yotam Drier},
171 year = {2013-06-27},
172 note = {R package version 1.22.0},
173 url = {https://git.bioconductor.org/packages/pathifier},
174 }
175 </citation>
176 <citation type="bibtex">@article {Drier6388,
177 author = {Drier, Yotam and Sheffer, Michal and Domany, Eytan},
178 title = {Pathway-based personalized analysis of cancer},
179 volume = {110},
180 number = {16},
181 pages = {6388--6393},
182 year = {2013},
183 doi = {10.1073/pnas.1219651110},
184 publisher = {National Academy of Sciences},
185 issn = {0027-8424},
186 URL = {https://www.pnas.org/content/110/16/6388},
187 eprint = {https://www.pnas.org/content/110/16/6388.full.pdf},
188 journal = {Proceedings of the National Academy of Sciences}
189 }
190 </citation>
191 </citations>
192 </tool>