Mercurial > repos > galaxyp > dbbuilder
comparison tools/dbbuilder.xml @ 4:b39347891609 draft
Uploaded
author | galaxyp |
---|---|
date | Fri, 26 Sep 2014 14:31:06 -0400 |
parents | |
children |
comparison
equal
deleted
inserted
replaced
3:a38cd98a6b41 | 4:b39347891609 |
---|---|
1 <tool id="dbbuilder" version="0.2.0" name="Protein Database Downloader"> | |
2 <description> | |
3 </description> | |
4 <requirements> | |
5 <requirement type="binary">wget</requirement> | |
6 </requirements> | |
7 <stdio> | |
8 <exit_code range="1:" level="fatal" description="Error downloading database." /> | |
9 <regex match="ERROR" level="fatal" source="stderr" description="Error downloading database." /> | |
10 </stdio> | |
11 <!-- TODO: escape quotes. --> | |
12 <!-- Add NCBI and maxquant contaminants. --> | |
13 <!-- http://maxquant.org/contaminants.zip --> | |
14 <!-- ftp://ftp.ncbi.nih.gov/refseq/H_sapiens/mRNA_Prot/human.protein.faa.gz--> | |
15 <command> | |
16 #if $source.from == "uniprot" | |
17 #set $url = "http://www.uniprot.org/uniprot/?query=taxonomy%3a%22" + str($source.taxon) + "%22" + str($source.set) + str($source.reviewed) + "&force=yes&format=fasta" + str($source.include_isoform) | |
18 #set $type = "direct" | |
19 #elif $source.from == "cRAP" | |
20 #set $url = "ftp://ftp.thegpm.org/fasta/cRAP/crap.fasta" | |
21 #set $type = "direct" | |
22 #elif $source.from == "url" | |
23 #set $url = $source.url | |
24 #set $type = "direct" | |
25 #end if | |
26 #if $type =="direct" | |
27 wget -nv '$url' -O '${output_database}' | |
28 #end if | |
29 </command> | |
30 <inputs> | |
31 <conditional name="source"> | |
32 <param name="from" type="select" label="Download from" help="select database source. cRAP acts as a database for common MS contaminants. UniProtKB is a corss species collection of functional protein databases"> | |
33 <option value="uniprot">UniProtKB</option> | |
34 <option value="cRAP">cRAP (contaminants)</option> | |
35 <option value="url">Custom URL</option> | |
36 </param> | |
37 <when value="uniprot"> | |
38 <param name="taxon" type="select" format="text" help="select species for protein database"> | |
39 <label>Taxonomy</label> | |
40 <options from_file="uniprot_taxons.loc"> | |
41 <column name="name" index="0" /> | |
42 <column name="value" index="1" /> | |
43 </options> | |
44 </param> | |
45 <param name="reviewed" type="select" help="UniProtKB/TrEMBL (unreviewed)is a large, automatically annotated database- may contain redundant sequences, but there is a higher chance peptides will be identified. UniProtKB/Swiss-Prot (reviewed) is a smaller, manually annotated database- less of a chance peptides will be identified but less sequence redundancy"> | |
46 <option value="+">UniProtKB</option> | |
47 <option value="+reviewed%3Ayes">UniProtKB/Swiss-Prot (reviewed only)</option> | |
48 <option value="+reviewed%3Ano">UniProtKB/TrEMBL (unreviewed only)</option> | |
49 <sanitizer> | |
50 <valid> | |
51 <add value="%"/> | |
52 </valid> | |
53 </sanitizer> | |
54 </param> | |
55 <param name="set" type="select" label="Proteome Set"> | |
56 <option value="+">Any</option> | |
57 <option value="+keyword%3a1185" selected="true">Reference Proteome Set</option> | |
58 <option value="+keyword%3a181">Complete Proteome Set</option> | |
59 <sanitizer> | |
60 <valid> | |
61 <add value="%"/> | |
62 </valid> | |
63 </sanitizer> | |
64 </param> | |
65 <param name="include_isoform" type="boolean" truevalue="&include=yes" falsevalue="" label="Include isoform data" help="several different forms of a given protein are incorporated into database" /> | |
66 </when> | |
67 <when value="cRAP" /> | |
68 <when value="url"> | |
69 <param name="url" value="" type="text" label="URL (http, ftp)"> | |
70 <sanitizer> | |
71 <valid> | |
72 <add value="%"/> | |
73 </valid> | |
74 </sanitizer> | |
75 </param> | |
76 </when> | |
77 </conditional> | |
78 </inputs> | |
79 <outputs> | |
80 <data format="fasta" name="output_database" label="Protein Database" /> | |
81 </outputs> | |
82 <help> | |
83 **Output** | |
84 | |
85 Creates a FASTA file of specified protein sequences for comparison with experimental MS/MS data in search algorithm. | |
86 | |
87 **External Links** | |
88 | |
89 _Galaxy-P 101 shows usage Protein Database Downloader tool in the creation of a workflow | |
90 .. _Galaxy-P 101: http://msi-galaxy-p.readthedocs.org/en/latest/sections/galaxyp_101.html | |
91 _UniProtKB provides additional information about the UniProt Knowledgebase | |
92 .. _UniProtKB: http://www.uniprot.org/help/uniprotkb | |
93 </help> | |
94 </tool> | |
95 |