annotate ensembl2symbol.xml @ 1:ec9ee8edb84d draft

Initial upload of 21.6.10 release.
author malex
date Fri, 18 Jun 2021 20:23:19 +0000
parents
children 2c218a253d56
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
1
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
1 <tool id="secimtools_ensembl2symbol" name="Map ENSEMBLIDs to Gene Symbols." version="@WRAPPER_VERSION@">
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
2 <description></description>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
3 <macros>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
4 <import>macros.xml</import>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
5 </macros>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
6 <expand macro="requirements" />
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
7 <stdio>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
8 <exit_code range="1" level="fatal" description="Repeated Unique IDs"/>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
9 </stdio>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
10 <command detect_errors="exit_code"><![CDATA[
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
11 ensembl2symbol.py
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
12 -s=$species
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
13 -ga=$geneAnnot
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
14 -id=$uniqId
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
15 -e=$ensemblId
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
16 -o=$output
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
17 ]]></command>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
18 <inputs>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
19 <param name="species" type="select" label="Select the species your ENSEMBLIDs are from" >
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
20 <option value="human">Homo sapiens</option>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
21 <option value="mouse">Mus musculus</option>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
22 <option value="rat">Rattus norvegicus</option>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
23 <option value="fruitfly">Drosophila melanogaster</option>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
24 </param>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
25 <param name="geneAnnot" type="data" format="tabular" label="Select the Dataset from your History containing the ENSEMBLIDs"/>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
26 <param name="uniqId" type="text" size="30" value="" label="Unique Gene FeatureID" help="Name of the column in your dataset containing unique FeatureIDs."/>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
27 <param name="ensemblId" type="text" size="30" value="" label="ENSEMBLID" help="Name of the column containing the ENSEMBLIDs to use for linking to gene symbols."/>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
28 </inputs>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
29 <outputs>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
30 <data format="tabular" name="output" label="${tool.name} on ${on_string}: ENSEMBL to GeneSymbol Annotation File"/>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
31 </outputs>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
32 <tests>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
33 <test>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
34 <param name="species" value="rat"/>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
35 <param name="geneAnnot" value="gene_annotation_file_01fhl.tsv"/>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
36 <param name="uniqId" value="UniqueID"/>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
37 <param name="ensemblId" value="GeneName"/>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
38 <param name="Output" value="ensembl2symbol_annotation_file_01fhl.tsv"/>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
39 </test>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
40 </tests>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
41 <help><![CDATA[
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
42
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
43 **Tool Description**
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
44
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
45 This tool takes a dataset containing unique FeatureIDs and ENSEMBLIDs and provides gene symbols. The link from the ENSEMBLIDs to gene symbols is made using Biomart. The tool adds the following columns to the input dataset: GeneSymbol, Score, Selected, and Tie. The GeneSymbol column contains the short identifiers (typically 3 letter abbreviations) of the gene name. The Score column contains a value that represents how well the ENSEMBLID matched the returned GeneSymbol using the PyPi package Gene 3.0.0 (https://www.ncbi.nlm.nih.gov/pubmed/23175613). The Selected column = 'Yes' when an ENSEMBLID uniquely matches a GeneSymbol or when that row has the highest Score value. The Selected column = 'No' in the absence of a unique match for rows lower than the maximum score. If there is a tie in the Score the alphabetically first value is selected and the Tie column has a value of Yes. We note that FeatureID may not be unique in the resulting output dataset.
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
46
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
47 --------------------------------------------------------------------------------
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
48
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
49 **INPUT**
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
50
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
51 **Dataset with unique FeatureIDs and ENSEMBLIDs**
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
52
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
53 +-------------+--------------+-----+
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
54 | FeatureID | ENSEMBLID | ... |
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
55 +=============+==============+=====+
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
56 | FeatureID_1 | ENS... | ... |
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
57 +-------------+--------------+-----+
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
58 | FeatureID_2 | ENS... | ... |
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
59 +-------------+--------------+-----+
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
60 | FeatureID_3 | ENS... | ... |
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
61 +-------------+--------------+-----+
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
62 | ... | ... | ... |
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
63 +-------------+--------------+-----+
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
64
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
65 **NOTE:** This file must contain at least two columns, a column with unique FeatureIDs and a column containing ENSEMBLIDs. Other columns may be present.
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
66
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
67 **Unique FeatureID**
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
68
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
69 Name of the column in your input dataset that has unique FeatureIDs.
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
70
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
71 **ENSEMBLID**
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
72
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
73 Name of the column containing the ENSEMBLIDs.
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
74
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
75 --------------------------------------------------------------------------------
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
76
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
77 **OUTPUT**
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
78
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
79 The user will get a single output file.
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
80
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
81 **Output Table**
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
82
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
83 +------------+------------+--------------+-------------+-----------+----------+
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
84 | FeatureID | ENSEMBLID | ... | GeneSymbol | Score | Selected |
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
85 +============+============+==============+=============+===========+==========+
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
86 | FeatureID_1 | ENS... | ... | one* | 13.550056 | Yes |
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
87 +------------+------------+--------------+-------------+-----------+----------+
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
88 | FeatureID_2 | ENS... | ... | two* | 12.984067 | Yes |
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
89 +------------+------------+--------------+-------------+-----------+----------+
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
90 | FeatureID_2 | ENS... | ... | three* | 11.995048 | No |
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
91 +------------+------------+--------------+-------------+-----------+----------+
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
92 | FeatureID_3 | ENS... | ... | four* | 12.549084 | Yes |
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
93 +------------+------------+--------------+-------------+-----------+----------+
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
94 | ... | ... | ... | ... | ... | ... |
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
95 +------------+------------+--------------+-------------+-----------+----------+
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
96
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
97 ]]>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
98 </help>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
99 <citations>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
100 <citation type="bibtex">@article{wu2014mygene,
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
101 title={MyGene. info: gene annotation query as a service},
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
102 author={Wu, Chunlei and Mark, Adam and Su, Andrew I},
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
103 journal={bioRxiv},
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
104 pages={009332},
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
105 year={2014},
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
106 publisher={Cold Spring Harbor Laboratory}
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
107 }</citation>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
108 <citation type="bibtex">@ARTICLE{Kirpich17secimtools,
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
109 author = {Alexander S. Kirpich, Miguel Ibarra, Oleksandr Moskalenko, Justin M. Fear, Joseph Gerken, Xinlei Mi, Ali Ashrafi, Alison M. Morse, Lauren M. McIntyre},
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
110 title = {SECIMTools: A suite of Metabolomics Data Analysis Tools},
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
111 journal = {BMC Bioinformatics},
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
112 year = {in press}
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
113 }</citation>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
114 <citation type="bibtex">
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
115 @article{garcia2010paintomics,
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
116 title={Paintomics: a web based tool for the joint visualization of transcriptomics and metabolomics data},
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
117 author={Garc{\'\i}a-Alcalde, Fernando and Garc{\'\i}a-L{\'o}pez, Federico and Dopazo, Joaqu{\'\i}n and Conesa, Ana},
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
118 journal={Bioinformatics},
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
119 volume={27},
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
120 number={1},
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
121 pages={137--139},
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
122 year={2010},
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
123 publisher={Oxford University Press}
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
124 }</citation>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
125 </citations>
ec9ee8edb84d Initial upload of 21.6.10 release.
malex
parents:
diff changeset
126 </tool>