annotate unipept.xml @ 3:34758ab8aaa4 draft

Uploaded
author galaxyp
date Mon, 20 Feb 2017 10:32:03 -0500
parents 503ab8a39006
children 4953dcd7dd39
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
3
34758ab8aaa4 Uploaded
galaxyp
parents: 2
diff changeset
1 <tool id="unipept" name="Unipept" version="2.0.1">
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
2 <description>retrieve taxonomy for peptides</description>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
3 <macros>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
4 <xml name="equate_il">
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
5 <param name="equate_il" type="boolean" truevalue="-e" falsevalue="" checked="true" label="Equate isoleucine and leucine">
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
6 <help>isoleucine (I) and leucine (L) are equated when matching tryptic peptides to UniProt records</help>
3
34758ab8aaa4 Uploaded
galaxyp
parents: 2
diff changeset
7 </param>
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
8 </xml>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
9 <xml name="extra">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
10 <param name="extra" type="boolean" truevalue="-x" falsevalue="" checked="false" label="retrieve extra information">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
11 <yield/>
3
34758ab8aaa4 Uploaded
galaxyp
parents: 2
diff changeset
12 </param>
34758ab8aaa4 Uploaded
galaxyp
parents: 2
diff changeset
13 </xml>
34758ab8aaa4 Uploaded
galaxyp
parents: 2
diff changeset
14 <xml name="extra_true">
34758ab8aaa4 Uploaded
galaxyp
parents: 2
diff changeset
15 <param name="extra" type="boolean" truevalue="-x" falsevalue="" checked="true" label="retrieve extra information">
34758ab8aaa4 Uploaded
galaxyp
parents: 2
diff changeset
16 <yield/>
34758ab8aaa4 Uploaded
galaxyp
parents: 2
diff changeset
17 </param>
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
18 </xml>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
19 <xml name="names">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
20 <param name="names" type="boolean" truevalue="-n" falsevalue="" checked="true" label="names" >
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
21 <help>return the names in complete taxonomic lineage</help>
3
34758ab8aaa4 Uploaded
galaxyp
parents: 2
diff changeset
22 </param>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
23 <param name="allfields" type="boolean" truevalue="-A" falsevalue="" checked="false" label="allfields" >
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
24 <help>include fields for most specific taxonomic classification: taxon_rank,taxon_id,taxon_name before lineage</help>
3
34758ab8aaa4 Uploaded
galaxyp
parents: 2
diff changeset
25 </param>
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
26 </xml>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
27 </macros>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
28 <requirements>
3
34758ab8aaa4 Uploaded
galaxyp
parents: 2
diff changeset
29 <requirement type="package" version="2.7">python</requirement>
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
30 </requirements>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
31 <stdio>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
32 <exit_code range="1:" />
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
33 </stdio>
3
34758ab8aaa4 Uploaded
galaxyp
parents: 2
diff changeset
34 <command><![CDATA[
34758ab8aaa4 Uploaded
galaxyp
parents: 2
diff changeset
35 python '$__tool_directory__/unipept.py'
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
36 --api=$unipept.api
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
37 $unipept.equate_il $unipept.extra
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
38 #if $unipept.api != 'pept2prot':
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
39 $unipept.names $unipept.allfields
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
40 #end if
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
41 $strict
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
42 #if str($peptide_src.fmt) == 'proteomic':
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
43 #if $peptide_src.input.datatype.file_ext == 'fasta':
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
44 --fasta="$peptide_src.input"
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
45 #elif $peptide_src.input.datatype.file_ext == 'mzid':
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
46 --mzid="$peptide_src.input"
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
47 #elif $peptide_src.input.datatype.file_ext == 'pepxml':
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
48 --pepxml="$peptide_src.input"
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
49 #end if
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
50 #elif str($peptide_src.fmt) == 'tabular':
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
51 --tabular="$peptide_src.input_tsv"
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
52 #set $col = int(str($peptide_src.column)) - 1
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
53 --column=$col
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
54 #elif str($peptide_src.fmt) == 'fasta':
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
55 --fasta="$peptide_src.input_fasta"
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
56 #elif str($peptide_src.fmt) == 'mzid':
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
57 --mzid="$peptide_src.input_mzid"
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
58 #elif str($peptide_src.fmt) == 'pepxml':
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
59 --pepxml="$peptide_src.input_pepxml"
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
60 #end if
3
34758ab8aaa4 Uploaded
galaxyp
parents: 2
diff changeset
61 #if 'json' in str($outputs).split(',') and str($unipept.api) != 'pept2prot':
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
62 --json $output_json
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
63 #end if
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
64 #if 'tsv' in str($outputs).split(','):
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
65 --tsv $output_tsv
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
66 #end if
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
67 #if 'csv' in str($outputs).split(','):
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
68 --csv $output_csv
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
69 #end if
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
70 #if 'unmatched' in str($outputs).split(','):
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
71 --unmatched $output_unmatched
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
72 #end if
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
73 ]]></command>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
74 <inputs>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
75 <conditional name="unipept">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
76 <param name="api" type="select" label="Unipept application" >
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
77 <option value="pept2lca" selected="true">pept2lca: lowest common ancestor</option>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
78 <option value="pept2taxa">pept2taxa: organisms associated with the UniProt entries containing a given tryptic peptide</option>
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
79 <option value="pept2prot">pept2prot: UniProt entries containing a given tryptic peptide</option>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
80 </param>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
81 <when value="pept2lca">
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
82 <expand macro="equate_il" />
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
83 <expand macro="extra">
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
84 <help>Return the complete lineage of the taxonomic lowest common ancestor, and include ID fields.</help>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
85 </expand>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
86 <expand macro="names" />
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
87 </when>
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
88 <when value="pept2taxa">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
89 <expand macro="equate_il" />
3
34758ab8aaa4 Uploaded
galaxyp
parents: 2
diff changeset
90 <expand macro="extra_true">
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
91 <help>Return the complete lineage of each organism, and include ID fields.</help>
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
92 </expand>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
93 <expand macro="names" />
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
94 </when>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
95 <when value="pept2prot">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
96 <expand macro="equate_il" />
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
97 <expand macro="extra">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
98 <help>Return additional information fields: taxon_name, ec_references, go_references, refseq_ids, refseq_protein_ids, insdc_ids, insdc_protein_ids
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
99 WARNING: Huge performance penalty! Only use for a small number of peptides when the extra information is required.
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
100 </help>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
101 </expand>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
102 </when>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
103 </conditional>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
104 <conditional name="peptide_src">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
105 <param name="fmt" type="select" label="Peptides input format" >
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
106 <option value="proteomic">proteomics formats: mzid, pepxml, fasta</option>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
107 <option value="tabular">tabular</option>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
108 <option value="fasta">fasta</option>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
109 <option value="mzid">mzid</option>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
110 <option value="pepxml">pepxml</option>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
111 </param>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
112 <when value="proteomic">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
113 <param name="input" type="data" format="mzid,pepxml,fasta" label="Peptide Input" />
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
114 </when>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
115 <when value="tabular">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
116 <param name="input_tsv" type="data" format="tabular" label="Tabular Input Containing Peptide column" />
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
117 <param name="column" label="Select column with peptides" type="data_column" numerical="false" data_ref="input_tsv" />
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
118 </when>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
119 <when value="fasta">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
120 <param name="input_fasta" type="data" format="fasta" label="Peptide Fasta Input" />
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
121 </when>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
122 <when value="mzid">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
123 <param name="input_mzid" type="data" format="mzid" label="mzIdentML Input" />
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
124 </when>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
125 <when value="pepxml">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
126 <param name="input_pepxml" type="data" format="pepxml" label="pepXML Input" />
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
127 </when>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
128 </conditional>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
129 <param name="outputs" type="select" multiple="true" display="checkboxes" label="Choose outputs">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
130 <option value="tsv" selected="true">tabular</option>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
131 <option value="csv">Comma Separated Values (.csv)</option>
3
34758ab8aaa4 Uploaded
galaxyp
parents: 2
diff changeset
132 <option value="json">JSON Taxonomy Tree (ignored for pept2prot)</option>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
133 <option value="unmatched">Unmatched peptides</option>
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
134 </param>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
135 <param name="strict" type="boolean" truevalue="--strict" falsevalue="" checked="false" label="Exit with error on invalid peptides, otherwise ignore them"/>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
136 </inputs>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
137 <outputs>
3
34758ab8aaa4 Uploaded
galaxyp
parents: 2
diff changeset
138 <data name="output_json" format="d3_hierarchy" label="${tool.name} ${unipept.api} on ${on_string} json">
34758ab8aaa4 Uploaded
galaxyp
parents: 2
diff changeset
139 <filter>'json' in outputs and unipept['api'] != 'pept2prot'</filter>
34758ab8aaa4 Uploaded
galaxyp
parents: 2
diff changeset
140 <change_format>
34758ab8aaa4 Uploaded
galaxyp
parents: 2
diff changeset
141 <when input="api" value="pept2prot" format="json" />
34758ab8aaa4 Uploaded
galaxyp
parents: 2
diff changeset
142 </change_format>
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
143 </data>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
144 <data name="output_tsv" format="tabular" label="${tool.name} ${unipept.api} on ${on_string} tsv">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
145 <filter>'tsv' in outputs</filter>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
146 </data>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
147 <data name="output_csv" format="csv" label="${tool.name} ${unipept.api} on ${on_string} csv">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
148 <filter>'csv' in outputs</filter>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
149 </data>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
150 <data name="output_unmatched" format="tabular" label="${tool.name} ${unipept.api} on ${on_string} unmatched">
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
151 <filter>'unmatched' in outputs</filter>
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
152 </data>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
153 </outputs>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
154 <tests>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
155 <test>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
156 <param name="api" value="pept2lca"/>
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
157 <param name="fmt" value="tabular"/>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
158 <param name="input_tsv" value="tryptic.tsv"/>
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
159 <param name="column" value="2"/>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
160 <param name="extra" value="True"/>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
161 <param name="names" value="True"/>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
162 <param name="outputs" value="tsv,unmatched"/>
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
163 <output name="output_tsv">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
164 <assert_contents>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
165 <has_text text="Homininae" />
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
166 </assert_contents>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
167 </output>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
168 <output name="output_unmatched">
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
169 <assert_contents>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
170 <has_text text="QTAMAV" />
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
171 </assert_contents>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
172 </output>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
173 </test>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
174 <test>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
175 <param name="api" value="pept2lca"/>
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
176 <param name="fmt" value="fasta"/>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
177 <param name="input_fasta" value="peptide.fa"/>
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
178 <param name="equate_il" value="True"/>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
179 <param name="extra" value="True"/>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
180 <param name="names" value="True"/>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
181 <param name="outputs" value="json,tsv"/>
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
182 <output name="output_json">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
183 <assert_contents>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
184 <has_text text="VMDVNDHKPEFYNCSLPACTFTPEEAQVNFTGYVDEHASPHIPIDDLTMVVYDPDKGSNGTFLLSLGGPDAEAFSVSPERAAGSASVQVLVRVSALVDYERQTAMAV" />
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
185 </assert_contents>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
186 </output>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
187 <output name="output_tsv">
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
188 <assert_contents>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
189 <has_text text="9606" />
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
190 <has_text text="9598" />
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
191 </assert_contents>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
192 </output>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
193 </test>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
194 <test>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
195 <param name="api" value="pept2taxa"/>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
196 <param name="fmt" value="fasta"/>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
197 <param name="input_fasta" value="peptide.fa"/>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
198 <param name="equate_il" value="True"/>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
199 <param name="extra" value="False"/>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
200 <param name="names" value="False"/>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
201 <param name="outputs" value="tsv"/>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
202 <output name="output_tsv">
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
203 <assert_contents>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
204 <has_text text="sapiens" />
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
205 <has_text text="troglodytes" />
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
206 <has_text text="Gorilla" />
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
207 <has_text text="Macaca" />
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
208 </assert_contents>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
209 </output>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
210 </test>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
211 </tests>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
212 <help><![CDATA[
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
213 **Unipept**
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
214
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
215 Retrieve UniProt and taxonomic information for tryptic peptides.
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
216
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
217 Unipept API documentation - http://unipept.ugent.be/apidocs
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
218
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
219 **Input**
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
220
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
221 Input peptides can be retrieved from tabular, fasta, mzid, or pepxml datasets.
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
222
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
223 Processing details::
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
224
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
225 The input peptides are split into tryptic peptide fragments in order to match the Unipept records.
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
226 Only fragments that are complete tryptic peptides between 5 and 50 amino acids in length will be matched by Unipept.
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
227 The match to the most specific tryptic fragment is reported.
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
228
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
229
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
230 **Unipept APIs**
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
231
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
232 **pept2prot** - http://unipept.ugent.be/apidocs/pept2prot
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
233
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
234 Returns the list of UniProt entries containing a given tryptic peptide. This is the same information as provided on the Protein matches tab when performing a search with the Tryptic Peptide Analysis in the web interface.
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
235
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
236 By default, each object contains the following information fields extracted from the UniProt record::
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
237
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
238 peptide: the peptide that matched this record
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
239 uniprot_id: the UniProt accession number of the matching record
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
240 taxon_id: the NCBI taxon id of the organism associated with the matching record
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
241
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
242 When the extra parameter is set to true, objects contain the following additional fields extracted from the UniProt record::
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
243
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
244 taxon_name: the name of the organism associated with the matching UniProt record
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
245 ec_references: a space separated list of associated EC numbers
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
246 go_references: a space separated list of associated GO terms
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
247 refseq_ids: a space separated list of associated RefSeq accession numbers
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
248 refseq_protein_ids: a space separated list of associated RefSeq protein accession numbers
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
249 insdc_ids: a space separated list of associated insdc accession numbers
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
250 insdc_protein_ids: a space separated list of associated insdc protein accession numbers
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
251
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
252
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
253 **pept2taxa** - http://unipept.ugent.be/apidocs/pept2taxa
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
254
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
255 Returns the set of organisms associated with the UniProt entries containing a given tryptic peptide. This is the same information as provided on the Lineage table tab when performing a search with the Tryptic Peptide Analysis in the web interface.
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
256
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
257 By default, each object contains the following information fields extracted from the UniProt record and NCBI taxonomy::
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
258
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
259 peptide: the peptide that matched this record
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
260 taxon_id: the NCBI taxon id of the organism associated with the matching record
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
261 taxon_name: the name of the organism associated with the matching record
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
262 taxon_rank: the taxonomic rank of the organism associated with the matching record
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
263
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
264 When the extra parameter is set to true, objects contain additional information about the lineages of the organism extracted from the NCBI taxonomy. The taxon id of each rank in the lineage is specified using the following information fields::
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
265
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
266 superkingdom_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
267 kingdom_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
268 subkingdom_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
269 superphylum_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
270 phylum_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
271 subphylum_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
272 superclass_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
273 class_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
274 subclass_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
275 infraclass_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
276 superorder_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
277 order_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
278 suborder_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
279 infraorder_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
280 parvorder_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
281 superfamily_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
282 family_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
283 subfamily_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
284 tribe_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
285 subtribe_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
286 genus_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
287 subgenus_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
288 species_group_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
289 species_subgroup_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
290 species_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
291 subspecies_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
292 varietas_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
293 forma_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
294
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
295
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
296 **pept2lca** - http://unipept.ugent.be/apidocs/pept2lca
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
297
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
298 Returns the taxonomic lowest common ancestor for a given tryptic peptide. This is the same information as provided when performing a search with the Tryptic Peptide Analysis in the web interface.
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
299
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
300 By default, each object contains the following information fields extracted from the UniProt record and NCBI taxonomy::
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
301
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
302 peptide: the peptide that matched this record
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
303 taxon_id: the NCBI taxon id of the organism associated with the matching record
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
304 taxon_name: the name of the organism associated with the matching record
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
305 taxon_rank: the taxonomic rank of the organism associated with the matching record
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
306
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
307 When the extra parameter is set to true, objects contain additional information about the lineage of the taxonomic lowest common ancestor extracted from the NCBI taxonomy. The taxon id of each rank in the lineage is specified using the following information fields::
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
308
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
309 superkingdom_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
310 kingdom_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
311 subkingdom_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
312 superphylum_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
313 phylum_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
314 subphylum_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
315 superclass_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
316 class_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
317 subclass_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
318 infraclass_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
319 superorder_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
320 order_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
321 suborder_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
322 infraorder_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
323 parvorder_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
324 superfamily_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
325 family_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
326 subfamily_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
327 tribe_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
328 subtribe_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
329 genus_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
330 subgenus_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
331 species_group_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
332 species_subgroup_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
333 species_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
334 subspecies_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
335 varietas_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
336 forma_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
337
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
338
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
339 **Attributions**
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
340
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
341 The Unipept metaproteomics analysis pipeline
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
342 Bart Mesuere1,*, Griet Debyser2, Maarten Aerts3, Bart Devreese2, Peter Vandamme3 and Peter Dawyndt1
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
343 Article first published online: 11 FEB 2015
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
344 DOI: 10.1002/pmic.201400361
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
345 http://onlinelibrary.wiley.com/doi/10.1002/pmic.201400361/abstract
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
346
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
347 ]]></help>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
348 <citations>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
349 <citation type="doi">doi:10.1002/pmic.201400361</citation>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
350 </citations>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
351
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
352 </tool>