Mercurial > repos > iuc > proteinortho_grab_proteins
comparison proteinortho_grab_proteins.xml @ 0:d348c3a151d9 draft
"planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
author | iuc |
---|---|
date | Tue, 18 Feb 2020 17:57:53 -0500 |
parents | |
children | fa2d1e652ec1 |
comparison
equal
deleted
inserted
replaced
-1:000000000000 | 0:d348c3a151d9 |
---|---|
1 <tool id="proteinortho_grab_proteins" name="Proteinortho grab proteins" version="@TOOL_VERSION@+galaxy@WRAPPER_VERSION@"> | |
2 <description>finds genes/proteins in a given fasta file</description> | |
3 <macros> | |
4 <import>proteinortho_macros.xml</import> | |
5 </macros> | |
6 <expand macro="requirements"/> | |
7 <expand macro="version_command"/> | |
8 <command detect_errors="exit_code"><![CDATA[ | |
9 ## the following ln-action is necessary, since the file names are used by proteinortho (output contains filenames => species names) | |
10 #import re | |
11 #for $f in $input_files# | |
12 ln -sf '$f' '${re.sub('[^\w\-_.]', '_', f.element_identifier)}' && | |
13 #end for# | |
14 #if $query.querytype == "file": | |
15 ln -sf '$query.queryfile' 'query' && | |
16 #end if | |
17 mkdir output && cd output && | |
18 proteinortho_grab_proteins.pl | |
19 --tofiles | |
20 #if $regex: | |
21 $regex | |
22 #end if | |
23 #if $source: | |
24 $source | |
25 #end if | |
26 #if $query.querytype == "string": | |
27 '$query.querystring' | |
28 #else: | |
29 ../query | |
30 #end if | |
31 #for $f in $input_files# | |
32 ../${re.sub('[^\w\-_.]', '_', f.element_identifier)} | |
33 #end for# | |
34 ]]></command> | |
35 <inputs> | |
36 <param name="input_files" type="data" format="fasta" multiple="true" min="1" label="Select the input fasta files"/> | |
37 <conditional name="query"> | |
38 <param name="querytype" type="select" label="Query type"> | |
39 <option value="string" selected="true">String</option> | |
40 <option value="file">orthology-groups output file</option> | |
41 </param> | |
42 <when value="string"> | |
43 <param name="querystring" type="text" label="A string of the protein/gene name/identifier that you want to search"> | |
44 <sanitizer invalid_char=""> | |
45 <valid initial="string.letters,string.digits"> | |
46 <add value="!"/> | |
47 <add value="="/> | |
48 <add value="-"/> | |
49 <add value="."/> | |
50 <add value="*"/> | |
51 <add value="?"/> | |
52 <add value="+"/> | |
53 <add value="\\"/> | |
54 <add value="_"/> | |
55 <add value="|"/> | |
56 <add value="["/> <!-- left square bracket, e.g subselecting from vec[1] --> | |
57 <add value="]"/> <!-- right square bracket --> | |
58 <add value="("/> <!-- left parenthesis --> | |
59 <add value=")"/> <!-- right parenthesis --> | |
60 </valid> | |
61 </sanitizer> | |
62 </param> | |
63 </when> | |
64 <when value="file"> | |
65 <param name="queryfile" type="data" format="tabular" label="A orthology-groups file" help="For each group a fasta file is generated containing all proteins/genes of that group."/> | |
66 </when> | |
67 </conditional> | |
68 <param argument="--regex" type="boolean" checked="false" truevalue="-E" falsevalue="" label="Enable regular expressions (perl)" help="If not: the string is escaped (e.g. | -> \|) [-E]"/> | |
69 <param argument="--source" type="boolean" checked="false" truevalue="-source" falsevalue="" label="Add the filename to the gene/protein-name [--source]"/> | |
70 </inputs> | |
71 <outputs> | |
72 <collection name="listproteinorthograbproteins" type="list" label="${tool.name} on ${on_string}: list of fasta"> | |
73 <discover_datasets pattern="__designation__" format="fasta" directory="output" visible="false"/> | |
74 </collection> | |
75 </outputs> | |
76 <tests> | |
77 <test> | |
78 <param name="input_files" value="L.fasta,C.fasta,C2.fasta,E.fasta,M.fasta"/> | |
79 <param name="querytype" value="string"/> | |
80 <param name="querystring" value="E_1"/> | |
81 <output_collection name="listproteinorthograbproteins" count="1"/> | |
82 </test> | |
83 <test> | |
84 <param name="input_files" value="L.fasta,C.fasta,C2.fasta,E.fasta,M.fasta"/> | |
85 <param name="querytype" value="string"/> | |
86 <param name="regex" value="true"/> | |
87 <param name="source" value="true"/> | |
88 <param name="querystring" value="M..2"/> | |
89 <output_collection name="listproteinorthograbproteins" count="1"/> | |
90 </test> | |
91 <test> | |
92 <param name="input_files" value="L.fasta,C.fasta,C2.fasta,E.fasta,M.fasta"/> | |
93 <param name="querytype" value="file"/> | |
94 <param name="queryfile" value="result.proteinortho.tsv"/> | |
95 <output_collection name="listproteinorthograbproteins" count="34"/> | |
96 </test> | |
97 </tests> | |
98 <help><![CDATA[proteinortho grab proteins | |
99 | |
100 **What it does** | |
101 | |
102 proteinortho_grab_proteins : find gene(s)/protein(s) in a given fasta file and retrieve their sequence(s). You can also use a orthology-groups file, then all sequences for each group (one line of the file) is outputted. This can result in many files! | |
103 | |
104 **Other Proteinortho-Tools for downstream analysis** | |
105 | |
106 * `proteinortho summary` : Summaries the orthology-pairs/RBH files to determine how the species are connected to each other. | |
107 | |
108 More information can be found on github https://gitlab.com/paulklemm_PHD/proteinortho | |
109 ]]> | |
110 </help> | |
111 <expand macro="citations"/> | |
112 </tool> |