annotate term_mapper.xml @ 9:89264646e458

improvements release
author pieter.lukasse@wur.nl
date Sat, 28 Mar 2015 14:28:45 +0100
parents 97e10319d86f
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
7
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
1 <tool name="TermMapperTool" id="TermMapperTool1" version="0.0.2">
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
2 <description>use cross-reference lookup tables to annotate results</description>
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
3 <!--
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
4 For remote debugging, start your listener on port 8000 and use the following as command interpreter:
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
5 java -jar -Xdebug -Xrunjdwp:transport=dt_socket,address=D0100564.wurnet.nl:8000
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
6 -->
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
7 <!-- similar to "join two datasets" tool http://galaxy.wur.nl/galaxy_production/root?tool_id=join1
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
8 but this one probably has more powerful features, such as supporting multiple ';'-separated codes in key fields
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
9 and the feature in termColName(s) supporting direct hierarchy-like annotation -->
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
10 <command interpreter="java -jar ">
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
11 TermMapperTool.jar
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
12 -inputFileName $inputFileName
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
13 -inputIdColumnName "$inputIdColumnName"
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
14 #if $inputIdCol.inputIdHasPrefix == True
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
15 -inputIdPrefix "$inputIdCol.inputIdPrefix"
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
16 #end if
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
17
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
18 -mappingFileName $mappingFileName
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
19 -mappingFileIdColName "$mappingFileIdColName"
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
20
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
21 #if $mappingIdCol.mappingIdHasPrefix == True
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
22 -mappingIdPrefix "$mappingIdCol.mappingIdPrefix"
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
23 #end if
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
24
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
25 -mappingFileTermColName "$mappingFileTermColName"
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
26
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
27 -outputFileName $outputFileName
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
28
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
29 #if $genObservations.genObservationsFile == True
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
30 -outputObservationsFileName $outputObservationsFileName
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
31 -quantifColumn "$genObservations.quantifColumn"
9
89264646e458 improvements release
pieter.lukasse@wur.nl
parents: 8
diff changeset
32 -multipleMappingSolution $genObservations.multipleMappingSolution
89264646e458 improvements release
pieter.lukasse@wur.nl
parents: 8
diff changeset
33 -filterZeros $genObservations.filterZeros
7
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
34 #end if
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
35
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
36 -mappedTermsColName $mappedTermsColName
8
97e10319d86f supporting column indexes
pieter.lukasse@wur.nl
parents: 7
diff changeset
37 -numberOfHeaderLines $numberOfHeaderLines
9
89264646e458 improvements release
pieter.lukasse@wur.nl
parents: 8
diff changeset
38
89264646e458 improvements release
pieter.lukasse@wur.nl
parents: 8
diff changeset
39 -htmlReportFile $htmlReportFile
89264646e458 improvements release
pieter.lukasse@wur.nl
parents: 8
diff changeset
40 -htmlReportFilesPath $htmlReportFile.files_path
7
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
41
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
42 </command>
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
43
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
44 <inputs>
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
45
9
89264646e458 improvements release
pieter.lukasse@wur.nl
parents: 8
diff changeset
46 <param name="inputFileName" type="data" format="tabular,csv,txt" label="Target file (TSV/CSV)" />
7
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
47
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
48 <param name="inputIdColumnName" type="text" size="50" value="" label="ID column name"
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
49 help="Name of the column containing the identification codes (in the given input file)"/>
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
50
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
51 <conditional name="inputIdCol">
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
52 <param name="inputIdHasPrefix" type="boolean" truevalue="Yes" falsevalue="No" checked="false"
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
53 label="ID values have a prefix"/>
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
54 <when value="Yes">
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
55 <param name="inputIdPrefix" type="text" size="50" value="" label="Prefix in ID column"
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
56 help="Fill in if any prefix is found in the ID column values (e.g. in some
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
57 files the value is preceded by a fixed value like for example 'lipidmaps:LMFA00000007' instead of just 'LMFA00000007' - in this
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
58 example one would fill in 'lipidmaps:' as prefix)"/>
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
59 </when>
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
60 <when value="No">
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
61 </when>
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
62 </conditional>
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
63
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
64 <!-- =================== cross-reference part ============== -->
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
65 <param name="mappingFileName" type="data" format="tabular,csv" label="Lookup table (TSV/CSV)" help="Simple mapping file between the coding scheme used to another scheme"/>
8
97e10319d86f supporting column indexes
pieter.lukasse@wur.nl
parents: 7
diff changeset
66 <param name="numberOfHeaderLines" type="select" label="Number of header lines in mapping file"
97e10319d86f supporting column indexes
pieter.lukasse@wur.nl
parents: 7
diff changeset
67 help="If this is '0', use the column numbers starting from 1 as the 'names' in the parameters below.">
97e10319d86f supporting column indexes
pieter.lukasse@wur.nl
parents: 7
diff changeset
68 <option value="0" >0</option>
97e10319d86f supporting column indexes
pieter.lukasse@wur.nl
parents: 7
diff changeset
69 <option value="1" selected="true">1</option>
97e10319d86f supporting column indexes
pieter.lukasse@wur.nl
parents: 7
diff changeset
70 </param>
97e10319d86f supporting column indexes
pieter.lukasse@wur.nl
parents: 7
diff changeset
71
97e10319d86f supporting column indexes
pieter.lukasse@wur.nl
parents: 7
diff changeset
72
9
89264646e458 improvements release
pieter.lukasse@wur.nl
parents: 8
diff changeset
73 <param name="mappingFileIdColName" type="text" size="50" value="" label="ID column name or number (in lookup table)" help="Name (or number) of the ID column for the lookup"/>
7
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
74
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
75 <conditional name="mappingIdCol">
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
76 <param name="mappingIdHasPrefix" type="boolean" truevalue="Yes" falsevalue="No" checked="false"
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
77 label="ID values have a prefix"/>
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
78 <when value="Yes">
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
79 <param name="mappingIdPrefix" type="text" size="50" value="" label="Prefix in ID column"
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
80 help="Fill in if any prefix is found in the ID column values (e.g. in some
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
81 files the value is preceded by a fixed value like for example 'lipidmaps:LMFA00000007' instead of just 'LMFA00000007' - in this
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
82 example one would fill in 'lipidmaps:' as prefix)"/>
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
83 </when>
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
84 <when value="No">
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
85 </when>
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
86 </conditional>
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
87
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
88 <param name="mappingFileTermColName" type="text" size="50" value="" label="Term column name(s) or number(s)"
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
89 help="Name(s) or number(s) of the column(s) containing the term(s) in the lookup table (and which will be transferred to the target file based on ID match in 'ID column name').
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
90 For using multiple term column names, set the names separated by comma (,).
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
91 If multiple columns are specified, the algorithm will look for an annotation in the first one, if none
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
92 found it will try the second one, and so forth. "/>
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
93
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
94
9
89264646e458 improvements release
pieter.lukasse@wur.nl
parents: 8
diff changeset
95 <param name="mappedTermsColName" type="text" size="50" value="Mapped terms" label="Name to give to the new column"
7
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
96 help="Name to give to the new column that will be added to the target file. This new column is the one
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
97 that will contain the respectively mapped terms."/>
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
98
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
99 <conditional name="genObservations">
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
100 <param name="genObservationsFile" type="boolean" truevalue="Yes" falsevalue="No" checked="false"
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
101 label="Generate also observations file"/>
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
102 <when value="Yes">
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
103 <param name="quantifColumn" type="text" size="50" value=""
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
104 label="(Optional) Values column name"
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
105 help="Name of the column containing the quantification values (in the given input file)"/>
9
89264646e458 improvements release
pieter.lukasse@wur.nl
parents: 8
diff changeset
106 <param name="multipleMappingSolution" type="select"
89264646e458 improvements release
pieter.lukasse@wur.nl
parents: 8
diff changeset
107 label="(when using values column above) What to do when multiple items map to the same term"
89264646e458 improvements release
pieter.lukasse@wur.nl
parents: 8
diff changeset
108 help="When e.g. two Uniprot codes map to the same KEGG code, which quantification value to use">
89264646e458 improvements release
pieter.lukasse@wur.nl
parents: 8
diff changeset
109 <option value="not" selected="true">Do nothing, leave as is</option>
89264646e458 improvements release
pieter.lukasse@wur.nl
parents: 8
diff changeset
110 <option value="max" >Use max value</option>
89264646e458 improvements release
pieter.lukasse@wur.nl
parents: 8
diff changeset
111 <option value="min">Use min value</option>
89264646e458 improvements release
pieter.lukasse@wur.nl
parents: 8
diff changeset
112 <option value="avg">Use avg value</option>
89264646e458 improvements release
pieter.lukasse@wur.nl
parents: 8
diff changeset
113 </param>
89264646e458 improvements release
pieter.lukasse@wur.nl
parents: 8
diff changeset
114 <param name="filterZeros" type="boolean" checked="false"
89264646e458 improvements release
pieter.lukasse@wur.nl
parents: 8
diff changeset
115 label="Filter zeros"
89264646e458 improvements release
pieter.lukasse@wur.nl
parents: 8
diff changeset
116 help="Filter out the items that have quantification value = 0"/>
7
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
117 </when>
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
118 <when value="No">
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
119 </when>
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
120 </conditional>
9
89264646e458 improvements release
pieter.lukasse@wur.nl
parents: 8
diff changeset
121
8
97e10319d86f supporting column indexes
pieter.lukasse@wur.nl
parents: 7
diff changeset
122
7
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
123 </inputs>
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
124 <outputs>
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
125 #if isinstance( $inputFileName.datatype, $__app__.datatypes_registry.get_datatype_by_extension('tabular').__class__):
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
126 <data name="outputFileName" format="tabular" label="${tool.name} on ${on_string}: annotated file " ></data>
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
127 #else:
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
128 <data name="outputFileName" format="csv" label="${tool.name} on ${on_string}: annotated file " ></data>
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
129 #end if
9
89264646e458 improvements release
pieter.lukasse@wur.nl
parents: 8
diff changeset
130 #if $genObservations.genObservationsFile == True :
89264646e458 improvements release
pieter.lukasse@wur.nl
parents: 8
diff changeset
131 <data name="outputObservationsFileName" format="tabular" label="${tool.name} on ${on_string}: term observations file (TSV)"></data>
89264646e458 improvements release
pieter.lukasse@wur.nl
parents: 8
diff changeset
132 #end if
89264646e458 improvements release
pieter.lukasse@wur.nl
parents: 8
diff changeset
133 <data name="htmlReportFile" format="html" label="${tool.name} on ${on_string} - HTML report"/>
7
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
134 </outputs>
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
135 <tests>
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
136 <!-- find out how to use -->
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
137 <test>
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
138 </test>
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
139 </tests>
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
140 <help>
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
141
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
142 .. class:: infomark
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
143
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
144
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
145 This tool is responsible for annotating the given target file
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
146 with the terms given in a lookup table. This lookup table maps the items found in the target file
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
147 (e.g. protein identifications coded in common protein coding formats such as UniProt )
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
148 to their respective terms (e.g. GO terms). It enables users to use the cross-reference
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
149 information now available from different repositories (like uniprot and KEGG - see for example
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
150 http://www.uniprot.org/taxonomy/ or http://www.genome.jp/linkdb/ )
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
151 to map their data to other useful coding schemes or to ontologies and functional annotations.
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
152
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
153 .. class:: infomark
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
154
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
155 **NB:** Currently the tool will do "smart parsing" of hierarchy based fields in the target file ID column.
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
156 This means that if the column contains a ".", the trailing part of the ID after the "." is ignored if the full
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
157 ID does not get a match in the lookup table while the part before the "." does.
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
158
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
159 .. class:: infomark
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
160
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
161 Examples of usage:
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
162
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
163 annotate protein identifications with Gene Ontology[GO] terms
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
164
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
165 annotate metabolite CAS identifications with chebi codes
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
166
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
167 add KEGG gene codes to a file containing UNIPROT codes
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
168
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
169 add KEGG compound codes to a file containing chebi codes
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
170
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
171 etc
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
172
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
173 As an example for transcripts and proteins, users can check http://www.uniprot.org/taxonomy/ to
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
174 see if their organism has been mapped to GO terms by Uniprot. For example the link
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
175 http://www.uniprot.org/uniprot/?query=taxonomy:2850 will show the Uniprot repository and cross-references
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
176 for the taxonomy 2850.
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
177 When the organism being studied is not available, then other strategies
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
178 could be tried (like Blast2GO for example).
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
179
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
180 Despite the specific examples above, this tool is generic and can be used to map any
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
181 values to new terms according to a given lookup table.
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
182
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
183 .. class:: infomark
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
184
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
185 *Omics cross-reference resources on the web:*
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
186
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
187 LinkDB: http://www.genome.jp/linkdb/
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
188
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
189 *Ready to use metabolomics links:*
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
190
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
191 http://rest.genome.jp/link/compound/chebi
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
192
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
193 http://rest.genome.jp/link/compound/lipidmaps
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
194
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
195 http://rest.genome.jp/link/compound/lipidbank
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
196
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
197 http://rest.genome.jp/link/compound/hmdb
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
198
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
199
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
200 *Ready to use proteomics links:*
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
201
9
89264646e458 improvements release
pieter.lukasse@wur.nl
parents: 8
diff changeset
202 http://rest.genome.jp/link/uniprot/pti (Phaeodactylum Tricornutum)
89264646e458 improvements release
pieter.lukasse@wur.nl
parents: 8
diff changeset
203 http://rest.genome.jp/link/pti/uniprot
7
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
204
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
205 http://rest.genome.jp/link/uniprot/hsa (Homo Sapiens)
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
206
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
207 (for organism code list see: http://www.genome.jp/kegg/catalog/org_list.html )
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
208
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
209
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
210 Uniprot to GO
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
211
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
212 http://www.uniprot.org/taxonomy/
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
213
9
89264646e458 improvements release
pieter.lukasse@wur.nl
parents: 8
diff changeset
214 http://www.uniprot.org/uniprot/?sort=&amp;desc=&amp;query=proteome:UP000000759&amp;fil=&amp;format=tab&amp;force=yes&amp;columns=id,go-id (Phaeodactylum Tricornutum)
89264646e458 improvements release
pieter.lukasse@wur.nl
parents: 8
diff changeset
215
7
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
216
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
217 -----
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
218
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
219 **Output**
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
220
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
221 This tool will read in the given input file and for each line it will add a new column
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
222 containing the terms found for the ID in that line. So the output file is the same as the
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
223 input file + extra terms column (separated by ; ).
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
224
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
225 -----
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
226
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
227 **Link to ontology viewer**
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
228
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
229 A second summarized "terms observations" file can also be generated.
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
230 In case the terms are ontology terms, this file can be used for visualizing the results
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
231 in the ontology viewer "OntologyAndObservationsViewer".
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
232
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
233 </help>
ce9228263148 renamed to TermMapper
pieter.lukasse@wur.nl
parents:
diff changeset
234 </tool>