annotate proteinortho.xml @ 0:4850f0d15f01 draft

"planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
author iuc
date Tue, 18 Feb 2020 17:57:28 -0500
parents
children 26abc7846e6f
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
1 <tool id="proteinortho" name="Proteinortho" version="@TOOL_VERSION@+galaxy@WRAPPER_VERSION@">
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
2 <description>detects orthologous proteins/genes within different species</description>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
3 <macros>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
4 <import>proteinortho_macros.xml</import>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
5 </macros>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
6 <expand macro="requirements"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
7 <expand macro="version_command"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
8 <command detect_errors="exit_code"><![CDATA[
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
9 ## the following ln-action is necessary, since the file names are used by proteinortho (output contains filenames => species names)
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
10 #import re
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
11 #for $f in $input_files#
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
12 ln -sf '$f' '${re.sub('[^\w\-_.]', '_', f.element_identifier)}' &&
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
13 #end for
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
14 #if $synteny.synteny_options == "specified":
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
15 #for $f in $synteny.input_files_syn#
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
16 ln -sf '$f' '${re.sub('[^\w\-_.]', '_', f.element_identifier)}' &&
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
17 #end for#
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
18 #end if
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
19 proteinortho
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
20 --project=result
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
21 --cpus="\${GALAXY_SLOTS:-4}"
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
22 --ram="\${GALAXY_MEMORY_MB:-16000}"
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
23 #if $more_options.selfblast:
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
24 $more_options.selfblast
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
25 #end if
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
26 #if $more_options.singles:
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
27 $more_options.singles
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
28 #end if
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
29 --p=$p
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
30 --e=$evalue --conn=$conn
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
31 #if $more_options.cov:
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
32 --cov=$more_options.cov
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
33 #end if
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
34 #if $more_options.sim:
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
35 --sim=`LC_NUMERIC=C awk "BEGIN {printf \"%.2f\",$more_options.sim/100}"`
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
36 #end if
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
37 #if $more_options.identity:
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
38 --identity=$more_options.identity
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
39 #end if
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
40 #if $more_options.isoform != "no":
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
41 --isoform=$more_options.isoform
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
42 #end if
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
43 #if $synteny.synteny_options == "specified":
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
44 --synteny
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
45 --dups=$synteny.dups
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
46 --cs=$synteny.cs
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
47 --alpha=$synteny.alpha
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
48 #end if
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
49 #for $f in $input_files#
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
50 ${re.sub('[^\w\-_.]', '_', f.element_identifier)}
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
51 #end for#
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
52 #if $synteny.synteny_options == "specified":
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
53 #for $f in $synteny.input_files_syn#
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
54 ${re.sub('[^\w\-_.]', '_', f.element_identifier)}
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
55 #end for#
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
56 #end if
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
57 2> >(sed -E "s/.\[([0-9]{1,2}(;[0-9]{1,2})?)?[mGK]//g" 1>&2)
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
58 #if $synteny.synteny_options == "specified":
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
59 &&
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
60 mv result.poff-graph result.proteinortho-graph &&
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
61 mv result.poff.tsv result.proteinortho.tsv &&
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
62 mv result.poff.html result.proteinortho.html ;
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
63 #end if
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
64 ]]></command>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
65 <inputs>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
66 <param name="input_files" format="fasta" type="data" multiple="true" min="2" label="Select the input fasta files (at least 2)" help="The input fasta files. At least 2 are needed!"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
67 <param argument="--p" type="select" label="Similarity comparison algorithm" help="In the first step of proteinortho an all-versus-all reciprocal best hit graph is built from the input files (using this algorithm).">
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
68 <option value="diamond" selected="true">diamond (aminoacid sequences)</option>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
69 <option value="autoblast">auto detect NCBI-BLAST (protein and nucleotide sequences)</option>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
70 <option value="blastp">NCBI-BLASTP+ (protein sequences)</option>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
71 <option value="blastn">NCBI-BLASTN+ (nucleotide sequences)</option>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
72 <option value="lastp">Last (aminoacid sequences)</option>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
73 <option value="lastn">Last (nucleotide sequences)</option>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
74 <option value="blatp">BLAT (aminoacid sequences)</option>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
75 <option value="blatn">BLAT (nucleotide sequences)</option>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
76 </param>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
77 <param argument="--evalue" type="float" value="0.001" min="0" label="E-value threshold of the blast algorithm" help="This is the main parameter for the generation of the reciprocal best hit graph. Larger values result in more false positives (connections between proteins)."/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
78 <param argument="--conn" type="float" value="0.1" min="0." max="10." label="Minimal algebraic connectivity" help="This is the main parameter for the clustering step. With larger values more splits are done, resulting in more and smaller clusters."/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
79 <section name="more_options" title="Additional Options" expanded="False">
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
80 <param argument="--cov" type="integer" value="50" min="0" max="100" label="Minimal coverage of best blast alignments in %"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
81 <param argument="--sim" type="integer" value="95" min="0" max="100" label="Minimal sequence similarity in %"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
82 <param argument="--identity" type="integer" value="25" min="0" max="100" label="Minimal percent identity of best blast hits in %"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
83 <param argument="--selfblast" type="boolean" checked="false" truevalue="--selfblast" falsevalue="" label="Apply selfblast, detects paralogs without orthologs "/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
84 <param argument="--singles" type="boolean" checked="false" truevalue="--singles" falsevalue="" label="Report singleton genes without any hit "/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
85 <param argument="--isoform" type="select" label="Use isoform information" help="The reciprocal best hit graph is built using isoform information (isoforms are treated as equivalent). For ncbi : simply add the additional files to the input (file names need to match). For uniprot : the isoforms need to contain the word isoform and the corresponding identifier. For trinity simply use the trinity output format.">
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
86 <option value="no" selected="true">Don't use isoform information</option>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
87 <option value="ncbi">ncbi style (..._additional.fasta)</option>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
88 <option value="uniprot">uniprot style (...isoform of...)</option>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
89 <option value="trinity">trinity style (...i4)</option>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
90 </param>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
91 </section>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
92 <conditional name="synteny">
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
93 <param name="synteny_options" type="select" label="Activate synteny feature (POFF)" help="To enhance the prediction accuracy, the relative order of genes (synteny) can be used as additional feature for the discrimination of orthologs. For more details see doi:10.1371/journal.pone.0105015.">
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
94 <option value="no" selected="true">no</option>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
95 <option value="specified">yes</option>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
96 </param>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
97 <when value="no"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
98 <when value="specified">
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
99 <param argument="--dups" type="integer" value="0" min="0" max="100" label="Number of reiterations for adjacencies heuristic, to determine duplicated regions"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
100 <param argument="--cs" type="integer" value="3" min="0" max="100" label="Size of a maximum common substring (MCS) for adjacency matches"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
101 <param argument="--alpha" type="float" value="0.5" min="0." max="1." label="Weight of adjacencies vs. sequence similarity"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
102 <param name="input_files_syn" type="data" format="gff" multiple="true" min="2" label="Select the GFF3 files matching the input fasta files" help="The GFF3 files need matching names with the input fasta files. If you provide mybacteria123.faa or mybacteria123.fasta ... then you need to provide mybacteria123.gff here accordingly. The attributes column (#9) must contain the attribute Name=GENE IDENTIFIER where GENE IDENTIFIER corresponds to the respective (protein) identifier in the FASTA input. For example see https://gitlab.com/paulklemm_PHD/proteinortho/-/blob/master/test/C.gff"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
103 </when>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
104 </conditional>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
105 </inputs>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
106 <outputs>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
107 <data name="blastgraph" format="tabular" label="${tool.name} on ${on_string}: RBH graph" from_work_dir="result.blast-graph"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
108 <data name="proteinortho" format="tabular" label="${tool.name} on ${on_string}: orthology-groups" from_work_dir="result.proteinortho.tsv"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
109 <data name="proteinorthograph" format="tabular" label="${tool.name} on ${on_string}: orthology-pairs" from_work_dir="result.proteinortho-graph"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
110 </outputs>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
111 <tests>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
112 <test expect_num_outputs="3"> <!-- test normal -->
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
113 <param name="input_files" value="L.fasta,C.fasta,C2.fasta,E.fasta,M.fasta"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
114 <output name="proteinortho">
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
115 <assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
116 <has_text text="# Species&#009;Genes&#009;Alg.-Conn."/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
117 <has_text text="2&#009;5&#009;0.16"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
118 <has_text text="M_640,M_642,M_649"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
119 </assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
120 </output>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
121 <output name="blastgraph">
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
122 <assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
123 <has_text text="L_10&#009;E_10&#009;"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
124 </assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
125 </output>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
126 <output name="proteinorthograph">
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
127 <assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
128 <has_text text="L_11&#009;E_11&#009;"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
129 </assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
130 </output>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
131 </test>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
132 <test expect_num_outputs="3"> <!-- various parameter -->
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
133 <param name="input_files" value="L.fasta,C.fasta,C2.fasta,E.fasta,M.fasta"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
134 <param name="evalue" value="1"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
135 <param name="conn" value="1"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
136 <param name="cov" value="42"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
137 <param name="sim" value="42"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
138 <param name="identity" value="42"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
139 <param name="selfblast" value="true"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
140 <param name="singles" value="true"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
141 <output name="proteinortho">
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
142 <assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
143 <has_text text="# Species&#009;Genes&#009;Alg.-Conn."/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
144 <has_text text="1&#009;1&#009;0"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
145 <has_text text="&#009;C_177&#009;"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
146 </assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
147 </output>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
148 <output name="blastgraph">
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
149 <assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
150 <has_text text="C_1&#009;C_1&#009;"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
151 </assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
152 </output>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
153 <output name="proteinorthograph">
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
154 <assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
155 <has_text text="C_12&#009;C_21&#009;"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
156 </assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
157 </output>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
158 </test>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
159 <test expect_num_outputs="3"> <!-- synteny -->
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
160 <param name="input_files" value="L.fasta,C.fasta,C2.fasta,E.fasta,M.fasta"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
161 <param name="input_files_syn" value="L.gff,C.gff,C2.gff,E.gff,M.gff"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
162 <param name="synteny_options" value="specified"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
163 <output name="proteinortho">
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
164 <assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
165 <has_text text="# Species&#009;Genes&#009;Alg.-Conn."/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
166 <has_text text="4&#009;5&#009;0.144"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
167 <has_text text="E_313,E_315"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
168 </assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
169 </output>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
170 <output name="proteinorthograph">
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
171 <assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
172 <has_text text="M_313&#009;L_313&#009;"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
173 </assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
174 </output>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
175 </test>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
176 <test expect_num_outputs="3"> <!-- blast -->
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
177 <param name="input_files" value="L.fasta,C.fasta,C2.fasta,E.fasta,M.fasta"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
178 <param name="--p" value="blastp"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
179 <output name="proteinortho">
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
180 <assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
181 <has_text text="# Species&#009;Genes&#009;Alg.-Conn."/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
182 <has_text text="2&#009;5&#009;0.16"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
183 <has_text text="M_640,M_642,M_649"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
184 </assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
185 </output>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
186 <output name="blastgraph">
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
187 <assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
188 <has_text text="M_3&#009;L_3&#009;"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
189 </assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
190 </output>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
191 <output name="proteinorthograph">
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
192 <assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
193 <has_text text="M_317&#009;L_317&#009;"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
194 </assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
195 </output>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
196 </test>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
197 <test expect_num_outputs="3"> <!-- auto blast -->
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
198 <param name="input_files" value="L.fasta,C.fasta,C2.fasta,E.fasta,M.fasta"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
199 <param name="--p" value="autoblast"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
200 <output name="proteinortho">
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
201 <assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
202 <has_text text="# Species&#009;Genes&#009;Alg.-Conn."/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
203 <has_text text="2&#009;5&#009;0.16"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
204 <has_text text="M_640,M_642,M_649"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
205 </assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
206 </output>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
207 <output name="blastgraph">
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
208 <assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
209 <has_text text="M_3&#009;L_3&#009;"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
210 </assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
211 </output>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
212 <output name="proteinorthograph">
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
213 <assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
214 <has_text text="M_317&#009;L_317&#009;"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
215 </assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
216 </output>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
217 </test>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
218 <test expect_num_outputs="3"> <!-- last -->
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
219 <param name="input_files" value="L.fasta,C.fasta,C2.fasta,E.fasta,M.fasta"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
220 <param name="--p" value="lastp"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
221 <output name="proteinortho">
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
222 <assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
223 <has_text text="# Species&#009;Genes&#009;Alg.-Conn."/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
224 <has_text text="2&#009;5&#009;0.16"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
225 <has_text text="M_640,M_642,M_649"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
226 </assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
227 </output>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
228 <output name="blastgraph">
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
229 <assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
230 <has_text text="M_636&#009;E_317&#009;"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
231 </assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
232 </output>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
233 <output name="proteinorthograph">
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
234 <assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
235 <has_text text="E_11&#009;C_11&#009;"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
236 </assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
237 </output>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
238 </test>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
239 <test expect_num_outputs="3"> <!-- blat -->
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
240 <param name="input_files" value="L.fasta,C.fasta,C2.fasta,E.fasta,M.fasta"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
241 <param name="--p" value="blatp"/> <!-- select the BLAT backend so this test matches its "blat" label instead of duplicating the blastp test -->
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
242 <output name="proteinortho">
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
243 <assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
244 <has_text text="# Species&#009;Genes&#009;Alg.-Conn."/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
245 <has_text text="2&#009;5&#009;0.16"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
246 <has_text text="M_640,M_642,M_649"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
247 </assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
248 </output>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
249 <output name="blastgraph">
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
250 <assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
251 <has_text text="E_10&#009;C_10&#009;"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
252 </assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
253 </output>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
254 <output name="proteinorthograph">
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
255 <assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
256 <has_text text="E_10&#009;C_10&#009;"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
257 </assert_contents>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
258 </output>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
259 </test>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
260 </tests>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
261 <help><![CDATA[Proteinortho with POFF - An orthology detection tool
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
262
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
263 **What it does**
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
264
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
265 Proteinortho is a tool to detect orthologous proteins/genes within different species (at least 2).
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
266
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
267 | It compares similarities of given gene/protein sequences and clusters them to find significant groups.
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
268 | The algorithm was designed to handle large-scale data and can be applied to hundreds of species at once.
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
269 | Details can be found in (doi:10.1186/1471-2105-12-124).
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
270 | To enhance the prediction accuracy, the relative order of genes (synteny) can be used as an additional feature for the discrimination of orthologs. The corresponding extension, namely PoFF (details see doi:10.1371/journal.pone.0105015), is already built into Proteinortho.
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
271
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
272 ----
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
273
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
274 **Proteinortho in a nutshell**
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
275
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
276 ----
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
277
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
278 * **(i) Build adaptive reciprocal best hit graph (RBH)**
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
279
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
280 | Using the blast algorithm (diamond, blast, blat, ...) all input sequences are compared against each other.
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
281 | If two proteins find each other with respect to multiple criteria like minimal evalue, similarity compared to the best hit, ... then an edge is drawn between the two proteins.
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
282 | The result of this step is written to RBH
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
283
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
284 * **(ii) Cluster the RBH**
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
285
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
286 | Using two clustering algorithms, edges are removed that weakly connect two connected components to reduce false positive hits.
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
287 | The resulting connected components are written to orthology-groups / -PAIRS
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
288
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
289 ----
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
290
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
291 **Proteinortho output files**
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
292
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
293 ----
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
294
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
295 * **RBH**
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
296
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
297 | The result of the (i) step, the reciprocal best hit graph.
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
298 | First a comment line announces 2 species (# ecoli.faa human.faa), then each line corresponds to a reciprocal best hit between 2 proteins/genes of the announced species. The output format is shown below.
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
299 | *seqidA*,*seqidB* = the 2 ids/names of the proteins involved
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
300 | *evalue_ab* = evalue with seqidA as query and seqidB as part of the database
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
301 | *bitscore_ab* = bitscore with seqidA as query ...
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
302 | *evalue_ba* = evalue with seqidB as query ...
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
303 | ...
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
304
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
305 .. csv-table::
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
306
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
307 seqidA,seqidB,evalue_ab,bitscore_ab,evalue_ba,bitscore_ba
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
308
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
309 ----
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
310
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
311 * **orthology-groups**
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
312
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
313 | The result of the (ii) step, the clustered reciprocal best hit graph or the orthology groups.
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
314 | Every line corresponds to an orthology group of proteins/genes.
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
315 | The first 3 columns characterize general properties of that group: the number of species, the number of proteins/genes, and the algebraic connectivity. The higher the algebraic connectivity, the more edges there are and the better connected the group is in general.
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
316 | Then a column for each species follows, containing the proteins of that species. If a species contributes more than one protein to a group of orthologs, then they are ordered by connectivity.
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
317
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
318 .. csv-table::
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
319
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
320 Species,Genes,Alg.-Conn.
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
321
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
322 ----
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
323
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
324 * **orthology-pairs**
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
325
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
326 | The same as orthology-groups but every edge is printed one-by-one here. The output is formatted the same as the RBH graph:
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
327
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
328 .. csv-table::
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
329
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
330 seqidA,seqidB,evalue_ab,bitscore_ab,evalue_ba,bitscore_ba
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
331
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
332 ----
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
333
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
334 **Proteinortho-Tools for downstream analysis**
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
335
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
336 * `proteinortho grab proteins` : find gene(s)/protein(s) in a given fasta file and retrieve their sequence(s). You can also use an orthology-groups file.
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
337 * `proteinortho summary` : Summarizes the orthology-pairs/RBH files to determine how the species are connected to each other.
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
338
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
339 More information can be found on GitLab: https://gitlab.com/paulklemm_PHD/proteinortho
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
340 ]]>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
341 </help>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
342 <expand macro="citations"/>
4850f0d15f01 "planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
iuc
parents:
diff changeset
343 </tool>