Mercurial > repos > mikel-egana-aranguren > sadi_docker_workflow
comparison Galaxy-Workflow-SADI-Docker_use_case.ga @ 1:47db0b303a50 default tip
Added annotations to workflow
author | Mikel Egana <mikel.egana.aranguren@gmail.com> |
---|---|
date | Mon, 07 Sep 2015 19:18:27 +0200 |
parents | |
children |
comparison
equal
deleted
inserted
replaced
0:22be3a551998 | 1:47db0b303a50 |
---|---|
1 { | |
2 "a_galaxy_workflow": "true", | |
3 "annotation": "The workflow answers the following question: Given a set of UniProt proteins, which ones are related to PubMed abstracts containing the term ``brain'', and what are their KEGG entries? The workflow starts from a simple list of UniProt identifiers, and retrieves different datasets from a regular SADI service (to obtain KEGG entries) and a set of 3 OpenLifeData2SADI services (to obtain PubMed abstracts). The results are then merged and queried to obtain the KEGG entries of proteins that are related to PubMed abstracts that contain the term ``brain''.", | |
4 "format-version": "0.1", | |
5 "name": "SADI-Docker use case", | |
6 "steps": { | |
7 "0": { | |
8 "annotation": "Convert white spaces to tabs, so that Galaxy recognises the list of UniProt IDs as a column", | |
9 "id": 0, | |
10 "input_connections": {}, | |
11 "inputs": [], | |
12 "label": null, | |
13 "name": "Convert", | |
14 "outputs": [ | |
15 { | |
16 "name": "out_file1", | |
17 "type": "tabular" | |
18 } | |
19 ], | |
20 "position": { | |
21 "left": 204.9895977973938, | |
22 "top": 202.90626764297485 | |
23 }, | |
24 "post_job_actions": {}, | |
25 "tool_errors": null, | |
26 "tool_id": "Convert characters1", | |
27 "tool_state": "{\"__page__\": 0, \"__rerun_remap_job_id__\": null, \"condense\": \"\\\"True\\\"\", \"strip\": \"\\\"True\\\"\", \"input\": \"null\", \"convert_from\": \"\\\"s\\\"\"}", | |
28 "tool_version": "1.0.0", | |
29 "type": "tool", | |
30 "user_outputs": [], | |
31 "uuid": "658762bb-9052-4dd2-bb6b-e77613a6dcfe" | |
32 }, | |
33 "1": { | |
34 "annotation": "Convert UniProt identifiers to URIs: Add a column with the first part of the URI", | |
35 "id": 1, | |
36 "input_connections": { | |
37 "input": { | |
38 "id": 0, | |
39 "output_name": "out_file1" | |
40 } | |
41 }, | |
42 "inputs": [], | |
43 "label": null, | |
44 "name": "Add column", | |
45 "outputs": [ | |
46 { | |
47 "name": "out_file1", | |
48 "type": "input" | |
49 } | |
50 ], | |
51 "position": { | |
52 "left": 199.9895977973938, | |
53 "top": 335.9097466468811 | |
54 }, | |
55 "post_job_actions": {}, | |
56 "tool_errors": null, | |
57 "tool_id": "addValue", | |
58 "tool_state": "{\"__page__\": 0, \"input\": \"null\", \"__rerun_remap_job_id__\": null, \"exp\": \"\\\"http://openlifedata.org/uniprot:\\\"\", \"iterate\": \"\\\"no\\\"\"}", | |
59 "tool_version": "1.0.0", | |
60 "type": "tool", | |
61 "user_outputs": [], | |
62 "uuid": "c2421757-1d5d-435c-ac9e-fb036ccd4448" | |
63 }, | |
64 "2": { | |
65 "annotation": "Convert UniProt identifiers to URIs", | |
66 "id": 2, | |
67 "input_connections": { | |
68 "input1": { | |
69 "id": 1, | |
70 "output_name": "out_file1" | |
71 } | |
72 }, | |
73 "inputs": [], | |
74 "label": null, | |
75 "name": "Merge Columns", | |
76 "outputs": [ | |
77 { | |
78 "name": "out_file1", | |
79 "type": "tabular" | |
80 } | |
81 ], | |
82 "position": { | |
83 "left": 201.96875429153442, | |
84 "top": 473.91322565078735 | |
85 }, | |
86 "post_job_actions": {}, | |
87 "tool_errors": null, | |
88 "tool_id": "mergeCols1", | |
89 "tool_state": "{\"__page__\": 0, \"input1\": \"null\", \"__rerun_remap_job_id__\": null, \"col2\": \"\\\"\\\"\", \"col1\": \"\\\"\\\"\", \"columns\": \"[]\"}", | |
90 "tool_version": "1.0.1", | |
91 "type": "tool", | |
92 "user_outputs": [], | |
93 "uuid": "63b4d2ff-0e1d-449d-aad5-a2ccd033d36a" | |
94 }, | |
95 "3": { | |
96 "annotation": "Obtain the UniProt URIs", | |
97 "id": 3, | |
98 "input_connections": { | |
99 "input": { | |
100 "id": 2, | |
101 "output_name": "out_file1" | |
102 } | |
103 }, | |
104 "inputs": [], | |
105 "label": null, | |
106 "name": "Cut", | |
107 "outputs": [ | |
108 { | |
109 "name": "out_file1", | |
110 "type": "tabular" | |
111 } | |
112 ], | |
113 "position": { | |
114 "left": 202.99307680130005, | |
115 "top": 592.906298160553 | |
116 }, | |
117 "post_job_actions": {}, | |
118 "tool_errors": null, | |
119 "tool_id": "Cut1", | |
120 "tool_state": "{\"columnList\": \"\\\"c3\\\"\", \"input\": \"null\", \"delimiter\": \"\\\"T\\\"\", \"__rerun_remap_job_id__\": null, \"__page__\": 0}", | |
121 "tool_version": "1.0.2", | |
122 "type": "tool", | |
123 "user_outputs": [], | |
124 "uuid": "f3912f69-b561-4dd5-91f0-1e492e19bb9c" | |
125 }, | |
126 "4": { | |
127 "annotation": "Add a column with the URI of the SADI service input OWL class", | |
128 "id": 4, | |
129 "input_connections": { | |
130 "input": { | |
131 "id": 3, | |
132 "output_name": "out_file1" | |
133 } | |
134 }, | |
135 "inputs": [], | |
136 "label": null, | |
137 "name": "Add column", | |
138 "outputs": [ | |
139 { | |
140 "name": "out_file1", | |
141 "type": "input" | |
142 } | |
143 ], | |
144 "position": { | |
145 "left": 448.9826703071594, | |
146 "top": 480.9097466468811 | |
147 }, | |
148 "post_job_actions": {}, | |
149 "tool_errors": null, | |
150 "tool_id": "addValue", | |
151 "tool_state": "{\"__page__\": 0, \"input\": \"null\", \"__rerun_remap_job_id__\": null, \"exp\": \"\\\"http://purl.oclc.org/SADI/LSRN/UniProt_Record\\\"\", \"iterate\": \"\\\"no\\\"\"}", | |
152 "tool_version": "1.0.0", | |
153 "type": "tool", | |
154 "user_outputs": [], | |
155 "uuid": "c01e5509-2a60-4ad4-848c-b31f9ccfc841" | |
156 }, | |
157 "5": { | |
158 "annotation": "Add a column with the URI of the SADI service input OWL class", | |
159 "id": 5, | |
160 "input_connections": { | |
161 "input": { | |
162 "id": 3, | |
163 "output_name": "out_file1" | |
164 } | |
165 }, | |
166 "inputs": [], | |
167 "label": null, | |
168 "name": "Add column", | |
169 "outputs": [ | |
170 { | |
171 "name": "out_file1", | |
172 "type": "input" | |
173 } | |
174 ], | |
175 "position": { | |
176 "left": 449.9896283149719, | |
177 "top": 636.9166741371155 | |
178 }, | |
179 "post_job_actions": {}, | |
180 "tool_errors": null, | |
181 "tool_id": "addValue", | |
182 "tool_state": "{\"__page__\": 0, \"input\": \"null\", \"__rerun_remap_job_id__\": null, \"exp\": \"\\\"http://openlifedata.org/uniprot_vocabulary:Resource\\\"\", \"iterate\": \"\\\"no\\\"\"}", | |
183 "tool_version": "1.0.0", | |
184 "type": "tool", | |
185 "user_outputs": [], | |
186 "uuid": "98b1f088-3de5-4dbd-a655-63a630517e1a" | |
187 }, | |
188 "6": { | |
189 "annotation": "Convert to RDF, adding the triple rdf:type input OWL class", | |
190 "id": 6, | |
191 "input_connections": { | |
192 "input_file": { | |
193 "id": 4, | |
194 "output_name": "out_file1" | |
195 } | |
196 }, | |
197 "inputs": [], | |
198 "label": null, | |
199 "name": "SADI - Tab-to-RDF", | |
200 "outputs": [ | |
201 { | |
202 "name": "output_file", | |
203 "type": "rdf" | |
204 } | |
205 ], | |
206 "position": { | |
207 "left": 449.9896283149719, | |
208 "top": 340.9097466468811 | |
209 }, | |
210 "post_job_actions": {}, | |
211 "tool_errors": null, | |
212 "tool_id": "SADI-Docker-tab2rdf", | |
213 "tool_state": "{\"__page__\": 0, \"triples\": \"[{\\\"__index__\\\": 0, \\\"o_col\\\": \\\"\\\", \\\"o_type\\\": \\\"False\\\", \\\"s_col\\\": \\\"\\\", \\\"p_val\\\": \\\"http://www.w3.org/1999/02/22-rdf-syntax-ns#type\\\"}]\", \"input_file\": \"null\", \"output_format\": \"\\\"ntriples\\\"\", \"namespace\": \"{\\\"choose_namespace\\\": \\\"none\\\", \\\"__current_case__\\\": 1}\", \"__rerun_remap_job_id__\": null}", | |
214 "tool_version": "0.1", | |
215 "type": "tool", | |
216 "user_outputs": [], | |
217 "uuid": "a05b8d4f-1b5f-4930-bd77-dfb5163b4556" | |
218 }, | |
219 "7": { | |
220 "annotation": "Convert to RDF, adding the triple rdf:type input OWL class", | |
221 "id": 7, | |
222 "input_connections": { | |
223 "input_file": { | |
224 "id": 5, | |
225 "output_name": "out_file1" | |
226 } | |
227 }, | |
228 "inputs": [], | |
229 "label": null, | |
230 "name": "SADI - Tab-to-RDF", | |
231 "outputs": [ | |
232 { | |
233 "name": "output_file", | |
234 "type": "rdf" | |
235 } | |
236 ], | |
237 "position": { | |
238 "left": 447.9757122993469, | |
239 "top": 766.9166741371155 | |
240 }, | |
241 "post_job_actions": {}, | |
242 "tool_errors": null, | |
243 "tool_id": "SADI-Docker-tab2rdf", | |
244 "tool_state": "{\"__page__\": 0, \"triples\": \"[{\\\"__index__\\\": 0, \\\"o_col\\\": \\\"\\\", \\\"o_type\\\": \\\"False\\\", \\\"s_col\\\": \\\"\\\", \\\"p_val\\\": \\\"http://www.w3.org/1999/02/22-rdf-syntax-ns#type\\\"}]\", \"input_file\": \"null\", \"output_format\": \"\\\"ntriples\\\"\", \"namespace\": \"{\\\"choose_namespace\\\": \\\"none\\\", \\\"__current_case__\\\": 1}\", \"__rerun_remap_job_id__\": null}", | |
245 "tool_version": "0.1", | |
246 "type": "tool", | |
247 "user_outputs": [], | |
248 "uuid": "217c654d-5353-4d93-a6de-c5c5bb205e64" | |
249 }, | |
250 "8": { | |
251 "annotation": "Convert to RDF/XML syntax", | |
252 "id": 8, | |
253 "input_connections": { | |
254 "input_file": { | |
255 "id": 6, | |
256 "output_name": "output_file" | |
257 } | |
258 }, | |
259 "inputs": [], | |
260 "label": null, | |
261 "name": "SADI - RDF Format (Rapper)", | |
262 "outputs": [ | |
263 { | |
264 "name": "output_file", | |
265 "type": "rdf" | |
266 } | |
267 ], | |
268 "position": { | |
269 "left": 438.9826703071594, | |
270 "top": 200.90973138809204 | |
271 }, | |
272 "post_job_actions": {}, | |
273 "tool_errors": null, | |
274 "tool_id": "SADI-Docker-rapper", | |
275 "tool_state": "{\"__page__\": 0, \"output_format\": \"\\\"rdfxml\\\"\", \"__rerun_remap_job_id__\": null, \"input_format\": \"\\\"ntriples\\\"\", \"input_file\": \"null\"}", | |
276 "tool_version": "0.1", | |
277 "type": "tool", | |
278 "user_outputs": [], | |
279 "uuid": "b5e1600e-a4ef-4ed6-a839-46bd1bcc59b3" | |
280 }, | |
281 "9": { | |
282 "annotation": "Convert to RDF/XML syntax", | |
283 "id": 9, | |
284 "input_connections": { | |
285 "input_file": { | |
286 "id": 7, | |
287 "output_name": "output_file" | |
288 } | |
289 }, | |
290 "inputs": [], | |
291 "label": null, | |
292 "name": "SADI - RDF Format (Rapper)", | |
293 "outputs": [ | |
294 { | |
295 "name": "output_file", | |
296 "type": "rdf" | |
297 } | |
298 ], | |
299 "position": { | |
300 "left": 446.98611879348755, | |
301 "top": 913.9132561683655 | |
302 }, | |
303 "post_job_actions": {}, | |
304 "tool_errors": null, | |
305 "tool_id": "SADI-Docker-rapper", | |
306 "tool_state": "{\"__page__\": 0, \"output_format\": \"\\\"rdfxml\\\"\", \"__rerun_remap_job_id__\": null, \"input_format\": \"\\\"ntriples\\\"\", \"input_file\": \"null\"}", | |
307 "tool_version": "0.1", | |
308 "type": "tool", | |
309 "user_outputs": [], | |
310 "uuid": "995db5b3-4e12-48c8-bda0-f961861f008c" | |
311 }, | |
312 "10": { | |
313 "annotation": "Execute SADI service to obtain KEGG entries", | |
314 "id": 10, | |
315 "input_connections": { | |
316 "input": { | |
317 "id": 8, | |
318 "output_name": "output_file" | |
319 } | |
320 }, | |
321 "inputs": [], | |
322 "label": null, | |
323 "name": "SADI client", | |
324 "outputs": [ | |
325 { | |
326 "name": "output", | |
327 "type": "rdf" | |
328 } | |
329 ], | |
330 "position": { | |
331 "left": 775.9965863227844, | |
332 "top": 202.90626764297485 | |
333 }, | |
334 "post_job_actions": {}, | |
335 "tool_errors": null, | |
336 "tool_id": "SADI-Docker-sadi_client", | |
337 "tool_state": "{\"url\": \"\\\"http://sadiframework.org/services/getKEGGIDFromUniProt\\\"\", \"input\": \"null\", \"__rerun_remap_job_id__\": null, \"__page__\": 0}", | |
338 "tool_version": "0.1", | |
339 "type": "tool", | |
340 "user_outputs": [], | |
341 "uuid": "01c2bbe7-a5e1-4bad-8c93-b01c6d0a5c8f" | |
342 }, | |
343 "11": { | |
344 "annotation": "Execute SADI service to obtain HGNC entries", | |
345 "id": 11, | |
346 "input_connections": { | |
347 "input": { | |
348 "id": 9, | |
349 "output_name": "output_file" | |
350 } | |
351 }, | |
352 "inputs": [], | |
353 "label": null, | |
354 "name": "SADI client", | |
355 "outputs": [ | |
356 { | |
357 "name": "output", | |
358 "type": "rdf" | |
359 } | |
360 ], | |
361 "position": { | |
362 "left": 788.9826703071594, | |
363 "top": 579.9201531410217 | |
364 }, | |
365 "post_job_actions": {}, | |
366 "tool_errors": null, | |
367 "tool_id": "SADI-Docker-sadi_client", | |
368 "tool_state": "{\"url\": \"\\\"http://biordf.org/cgi-bin/SADI/OpenLifeData2SADI/SADI/hgnc/uniprot_vocabulary_Resource_hgnc_vocabulary_x-uniprot-inverse_hgnc_vocabulary_Resource\\\"\", \"input\": \"null\", \"__rerun_remap_job_id__\": null, \"__page__\": 0}", | |
369 "tool_version": "0.1", | |
370 "type": "tool", | |
371 "user_outputs": [], | |
372 "uuid": "ccdd413c-36be-48c3-96fc-4f233208a6b8" | |
373 }, | |
374 "12": { | |
375 "annotation": "Execute SADI service to obtain OMIM entries", | |
376 "id": 12, | |
377 "input_connections": { | |
378 "input": { | |
379 "id": 11, | |
380 "output_name": "output" | |
381 } | |
382 }, | |
383 "inputs": [], | |
384 "label": null, | |
385 "name": "SADI client", | |
386 "outputs": [ | |
387 { | |
388 "name": "output", | |
389 "type": "rdf" | |
390 } | |
391 ], | |
392 "position": { | |
393 "left": 793.9826703071594, | |
394 "top": 753.9132561683655 | |
395 }, | |
396 "post_job_actions": {}, | |
397 "tool_errors": null, | |
398 "tool_id": "SADI-Docker-sadi_client", | |
399 "tool_state": "{\"url\": \"\\\"http://biordf.org/cgi-bin/SADI/OpenLifeData2SADI/SADI/hgnc/hgnc_vocabulary_Resource_hgnc_vocabulary_x-omim_omim_vocabulary_Gene\\\"\", \"input\": \"null\", \"__rerun_remap_job_id__\": null, \"__page__\": 0}", | |
400 "tool_version": "0.1", | |
401 "type": "tool", | |
402 "user_outputs": [], | |
403 "uuid": "b7af50a8-a92a-44d9-bf1e-ca90cb69905d" | |
404 }, | |
405 "13": { | |
406 "annotation": "Execute SADI service to obtain PubMed entries", | |
407 "id": 13, | |
408 "input_connections": { | |
409 "input": { | |
410 "id": 12, | |
411 "output_name": "output" | |
412 } | |
413 }, | |
414 "inputs": [], | |
415 "label": null, | |
416 "name": "SADI client", | |
417 "outputs": [ | |
418 { | |
419 "name": "output", | |
420 "type": "rdf" | |
421 } | |
422 ], | |
423 "position": { | |
424 "left": 799.9896283149719, | |
425 "top": 914.9201531410217 | |
426 }, | |
427 "post_job_actions": {}, | |
428 "tool_errors": null, | |
429 "tool_id": "SADI-Docker-sadi_client", | |
430 "tool_state": "{\"url\": \"\\\"http://biordf.org/cgi-bin/SADI/OpenLifeData2SADI/SADI/omim/omim_vocabulary_Gene_omim_vocabulary_article_pubmed_vocabulary_PubMedRecord\\\"\", \"input\": \"null\", \"__rerun_remap_job_id__\": null, \"__page__\": 0}", | |
431 "tool_version": "0.1", | |
432 "type": "tool", | |
433 "user_outputs": [], | |
434 "uuid": "3dcb6fc4-4021-4ea6-8e88-31c71d68699d" | |
435 }, | |
436 "14": { | |
437 "annotation": "Merge all the inputs and outputs into a single RDF graph: SADI only decorates inputs with new triples, so we can keep track of the whole process via URIs", | |
438 "id": 14, | |
439 "input_connections": { | |
440 "input_files_0|input_file": { | |
441 "id": 13, | |
442 "output_name": "output" | |
443 }, | |
444 "input_files_1|input_file": { | |
445 "id": 12, | |
446 "output_name": "output" | |
447 }, | |
448 "input_files_2|input_file": { | |
449 "id": 11, | |
450 "output_name": "output" | |
451 }, | |
452 "input_files_3|input_file": { | |
453 "id": 10, | |
454 "output_name": "output" | |
455 }, | |
456 "input_files_4|input_file": { | |
457 "id": 9, | |
458 "output_name": "output_file" | |
459 }, | |
460 "input_files_5|input_file": { | |
461 "id": 8, | |
462 "output_name": "output_file" | |
463 } | |
464 }, | |
465 "inputs": [], | |
466 "label": null, | |
467 "name": "SADI - Merge RDF Graphs", | |
468 "outputs": [ | |
469 { | |
470 "name": "output_file", | |
471 "type": "rdf" | |
472 } | |
473 ], | |
474 "position": { | |
475 "left": 1125.9965252876282, | |
476 "top": 318.91319513320923 | |
477 }, | |
478 "post_job_actions": {}, | |
479 "tool_errors": null, | |
480 "tool_id": "SADI-Docker-mergeRDFgraphs", | |
481 "tool_state": "{\"__page__\": 0, \"__rerun_remap_job_id__\": null, \"input_files\": \"[{\\\"__index__\\\": 0, \\\"input_file\\\": null}, {\\\"__index__\\\": 1, \\\"input_file\\\": null}, {\\\"__index__\\\": 2, \\\"input_file\\\": null}, {\\\"__index__\\\": 3, \\\"input_file\\\": null}, {\\\"__index__\\\": 4, \\\"input_file\\\": null}, {\\\"__index__\\\": 5, \\\"input_file\\\": null}]\"}", | |
482 "tool_version": "0.1", | |
483 "type": "tool", | |
484 "user_outputs": [], | |
485 "uuid": "7c24dd55-3032-4329-9fa3-734c963d8ed2" | |
486 }, | |
487 "15": { | |
488 "annotation": "Query the merged RDF graph with the actual question", | |
489 "id": 15, | |
490 "input_connections": { | |
491 "ontology": { | |
492 "id": 14, | |
493 "output_name": "output_file" | |
494 } | |
495 }, | |
496 "inputs": [], | |
497 "label": null, | |
498 "name": "SADI - Execute an SPARQL query against an RDF file", | |
499 "outputs": [ | |
500 { | |
501 "name": "output", | |
502 "type": "html" | |
503 } | |
504 ], | |
505 "position": { | |
506 "left": 1439.993106842041, | |
507 "top": 461.92015266418457 | |
508 }, | |
509 "post_job_actions": {}, | |
510 "tool_errors": null, | |
511 "tool_id": "SADI-Docker-SPARQLGalaxy", | |
512 "tool_state": "{\"out_format\": \"\\\"html\\\"\", \"__page__\": 0, \"pasted_query\": \"\\\"PREFIX rdf: <http://www.w3.org/1999/02/22-rdf-syntax-ns#> \\\\nPREFIX rdfs: <http://www.w3.org/2000/01/rdf-schema#>\\\\nPREFIX sadi: <http://sadiframework.org/ontologies/predicates.owl#>\\\\nPREFIX lsrn: <http://purl.oclc.org/SADI/LSRN/>\\\\n\\\\nSELECT ?protein ?label ?KEGG\\\\nWHERE { \\\\n?protein rdf:type lsrn:UniProt_Record . \\\\n?protein sadi:isEncodedBy ?KEGG . \\\\n?protein ?prot2hgnc ?hgnc . \\\\n?hgnc ?hgnc2omim ?omim . \\\\n?omim ?omim2pubmed ?pubmed . \\\\n?pubmed rdfs:label ?label . \\\\nFILTER (regex (?label, 'brain'))\\\\n}\\\"\", \"ontology\": \"null\", \"__rerun_remap_job_id__\": null}", | |
513 "tool_version": "0.1", | |
514 "type": "tool", | |
515 "user_outputs": [], | |
516 "uuid": "9a453f8c-370e-4ab7-8e45-73cbba721db9" | |
517 } | |
518 }, | |
519 "uuid": "8796e5be-1c91-4f91-9946-02a09a79401d" | |
520 } |