comparison mageck_gsea.xml @ 0:d95eae71878e draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/mageck commit 71cef018eec5ee7ff7f3853599c027e80e2637fe
author iuc
date Wed, 14 Feb 2018 06:41:59 -0500
parents
children b946929d31c4
comparison
equal deleted inserted replaced
-1:000000000000 0:d95eae71878e
1 <?xml version="1.0"?>
2 <tool id="mageck_gsea" name="MAGeCK GSEA" version="@VERSION@" >
3 <description>- a fast implementation of Gene Set Enrichment Analysis</description>
4 <macros>
5 <import>mageck_macros.xml</import> <!-- Shared macro file (not shown here); presumably supplies the "requirements" and "citations" macros expanded in this tool and the @VERSION@ token; confirm against that file. -->
6 </macros>
7 <expand macro="requirements" />
8 <version_command>mageckGSEA --version</version_command>
9 <command detect_errors="exit_code"><![CDATA[
10 ## Cheetah template that assembles the mageckGSEA call; job errors are detected from the exit code.
11 mageckGSEA
12 ## Always emitted: ranking file, GMT file and score column.
13 -r '$rank_file'
14 -g '$gmt_file'
15 -c $score_column
16 ## Pass -n only when a pathway name was entered.
17 #if str( $pathway_name ) != "":
18 -n '$pathway_name'
19 #end if
20 ## Advanced section: -e and -s are added when the matching boolean is true; -p is always emitted.
21 #if $adv.reverse_value:
22 -e
23 #end if
24 #if $adv.sort_byp:
25 -s
26 #end if
27 -p $adv.perm_time
28 -o output_file
29 ## The fixed name output_file is the one the outputs block picks up via from_work_dir.
30 ]]></command>
31 <inputs> <!-- Parameter names are referenced by the Cheetah command template. The integer options carry defaults and are not optional, so that -c and -p always receive a value. -->
32 <param name="rank_file" argument="--rank_file" type="data" format="tabular" label="Gene Ranking file" help="A gene ranking file such as that generated by mageck test. The first column of the rank file must contain gene identifiers, of the same type used in the GMT file" />
33 <param name="gmt_file" argument="--gmt_file" type="data" format="tabular" label="Pathway GMT file" help="The pathway file in GMT format. See Help below for more information" />
34 <param argument="--score_column" type="integer" value="0" label="Gene Ranking column number" help="The column number containing gene scores in the gene ranking file. If you just want to use the ranking of the gene (located at the 1st column), use 0. The column number starts from 0. Default: 0" />
35 <param argument="--pathway_name" type="text" value="" label="Name of the pathway to be tested" help=" If not found, will test all pathways" />
36 <section name="adv" title="Advanced Options"> <!-- Referenced in the command template with the adv. prefix. -->
37 <param argument="--reverse_value" type="boolean" truevalue="--reverse_value" falsevalue="" checked="false" optional="true" label="Reverse the order of the gene" help="Default: No" />
38 <param argument="--sort_byp" type="boolean" truevalue="--sort_byp" falsevalue="" checked="true" optional="true" label="Sort the pathways by p value" help="Default: Yes" />
39 <param argument="--perm_time" type="integer" min="0" value="1000" label="Number of permutation number" help="Default: 1000" />
40 </section>
41 </inputs>
42 <outputs> <!-- Single tabular dataset, collected from the file named output_file in the job working directory (the name passed to -o in the command). -->
43 <data name="output_file" format="tabular" from_work_dir="output_file" label="${tool.name} on ${on_string}: mageckGSEA Output" />
44 </outputs>
45 <tests> <!-- One test case: only the two input datasets are set, every other parameter keeps its default value, and the expected result is out.mageckGSEA.txt. -->
46 <test><!-- Ensure MAGeCK's demo1 test works -->
47 <param name="rank_file" ftype="tabular" value="out.test.gene_summary.txt" />
48 <param name="gmt_file" ftype="tabular" value="in.mageckQC.gmt" />
49 <output name="output_file" value="out.mageckGSEA.txt" />
50 </test>
51 </tests>
52 <help><![CDATA[
53 .. class:: infomark
54
55 **What it does**
56
57 mageckGSEA_ is a fast implementation of Gene Set Enrichment Analysis (GSEA). It's used by MAGeCK_ for quality controls and pathway enrichment tests.
58
59 .. _mageckGSEA: https://sourceforge.net/p/mageck/wiki/usage/#mageckgsea
60 .. _MAGeCK: http://liulab.dfci.harvard.edu/Mageck/
61
62 -----
63
64 **Inputs**
65
66 **Gene Ranking file**
67
68 mageckGSEA requires a gene ranking file as input. A gene ranking file can be produced using **mageck test**. An example of the gene ranking file is as follows:
69
70 ======= ======= ============= =============== =========== ============ ================= =========== ============= =============== =========== ============ ================= ===========
71 **id** **num** **neg|score** **neg|p-value** **neg|fdr** **neg|rank** **neg|goodsgrna** **neg|lfc** **pos|score** **pos|p-value** **pos|fdr** **pos|rank** **pos|goodsgrna** **pos|lfc**
72 ------- ------- ------------- --------------- ----------- ------------ ----------------- ----------- ------------- --------------- ----------- ------------ ----------------- -----------
73 ESPL1 12 6.4327e-10 7.558e-06 7.9e-05 1 -2.35 11 0.99725 0.99981 0.999992 615 0 -0.07
74 RPL18 12 6.4671e-10 7.558e-06 7.9e-05 2 -2.12 11 0.99799 0.99989 0.999992 620 0 -0.32
75 CDK1 12 2.6439e-09 7.558e-06 7.9e-05 3 -1.93 12 1.0 0.99999 0.999992 655 0 -0.12
76 ======= ======= ============= =============== =========== ============ ================= =========== ============= =============== =========== ============ ================= ===========
77
78
79 **Pathway file**
80
81 mageckGSEA also requires a pathway file in GMT format. The GMT (Gene Matrix Transposed) file format is a tab delimited file format that describes gene sets and is consistent with the `GMT file in Gene Set Enrichment Analysis (GSEA)`_. In the GMT format, each row represents a gene set, with the first column containing the gene set name, and the second column containing a description for the gene set, followed by the names or ids of the genes in the gene set. You can download different GMT pathway files directly from the `GSEA MSigDB database`_. An example of the GMT format is as follows:
82
83 ================= ============================================================= =======================
84 **Gene Set Name** **Description** **Genes**
85 ----------------- ------------------------------------------------------------- -----------------------
86 KEGG_RIBOSOME http://www.broadinstitute.org/gsea/msigdb/cards/KEGG_RIBOSOME RPL35 RPL23 RPL3...
87 ================= ============================================================= =======================
88
89 -----
90
91 **Outputs**
92
93 **mageckGSEA output file**
94
95 An example of the output file is as follows:
96
97 ============= ======== ====== ===== ================= ======= =========== ======== =======
98 **Pathway** **Size** **ES** **p** **p_permutation** **FDR** **Ranking** **Hits** **LFC**
99 ------------- -------- ------ ----- ----------------- ------- ----------- -------- -------
100 KEGG_RIBOSOME 88 1 0 0 0 1 0 0
101 ============= ======== ====== ===== ================= ======= =========== ======== =======
102
103 By default, pathways in the output are sorted by p value.
104
105 .. _`GMT file in Gene Set Enrichment Analysis (GSEA)`: http://software.broadinstitute.org/cancer/software/gsea/wiki/index.php/Data_formats#GMT:_Gene_Matrix_Transposed_file_format_.28.2A.gmt.29
106 .. _`GSEA MSigDB database`: http://software.broadinstitute.org/gsea/login.jsp
107
108 ]]></help>
109 <expand macro="citations" />
110 </tool>