Mercurial > repos > petr-novak > dante
comparison dante.xml @ 10:d0431a839606 draft
Uploaded
author | petr-novak |
---|---|
date | Wed, 14 Aug 2019 11:24:15 -0400 |
parents | 6dcecbe81d78 |
children | 3151a72a6671 |
comparison
equal
deleted
inserted
replaced
9:ed4d9ede9cb4 | 10:d0431a839606 |
---|---|
2 <description> Tool for annotation of transposable elements based on the similarity to conserved protein domains database. </description> | 2 <description> Tool for annotation of transposable elements based on the similarity to conserved protein domains database. </description> |
3 <requirements> | 3 <requirements> |
4 <requirement type="package">last</requirement> | 4 <requirement type="package">last</requirement> |
5 <requirement type="package">numpy</requirement> | 5 <requirement type="package">numpy</requirement> |
6 <requirement type="package" version="1.0">rexdb</requirement> | 6 <requirement type="package" version="1.0">rexdb</requirement> |
7 <requirement type="set_environment">REXDB</requirement> | |
7 </requirements> | 8 </requirements> |
8 <stdio> | 9 <stdio> |
9 <regex match="Traceback" source="stderr" level="fatal" description="Unknown error" /> | 10 <regex match="Traceback" source="stderr" level="fatal" description="Unknown error" /> |
10 <regex match="error" source="stderr" level="fatal" description="Unknown error" /> | 11 <regex match="error" source="stderr" level="fatal" description="Unknown error" /> |
11 </stdio> | 12 </stdio> |
12 <command> | 13 <command> |
13 python3 ${__tool_directory__}/dante.py --query ${input} --domain_gff ${DomGff} | 14 python3 ${__tool_directory__}/dante.py --query ${input} --domain_gff ${DomGff} |
14 --protein_database \${REXDB}/${db_type}_pdb | 15 --protein_database \${REXDB}/${db_type}_pdb |
15 --classification \${REXDB}/${db_type}_class | 16 --classification \${REXDB}/${db_type}_class |
17 --scoring_matrix ${scoring_matrix} | |
18 && | |
19 | |
20 python3 ${__tool_directory__}/dante_gff_output_filtering.py --dom_gff ${DomGff} | |
21 --domains_prot_seq domains_filtered.fasta --domains_filtered domains_filtered.gff | |
22 --output_dir . | |
23 --selected_dom All --th_identity 0.35 | |
24 --th_similarity 0.45 --th_length 0.9 | |
25 --interruptions 1 --max_len_proportion 1.1 | |
26 --element_type '' && | |
27 | |
28 python3 ${__tool_directory__}/fasta2database.py domains_filtered.fasta domains_filtered.db | |
29 domains_filtered.class && | |
30 | |
31 lastdb -p domains_filtered.db domains_filtered.db && | |
32 | |
33 python3 ${__tool_directory__}/dante.py --query ${input} --domain_gff ${DomGff2} | |
34 --protein_database domains_filtered.db | |
35 --classification domains_filtered.class | |
36 --scoring_matrix BL80 | |
37 | |
16 </command> | 38 </command> |
17 <inputs> | 39 <inputs> |
18 <param format="fasta" type="data" name="input" label="Choose your input sequence" help="Input DNA must be in proper fasta format, multi-fasta containing more sequences is allowed" /> | 40 <param format="fasta" type="data" name="input" |
41 label="Choose your input sequence" help="Input DNA must be in proper fasta format, multi-fasta containing more sequences is allowed" /> | |
19 | 42 |
20 <param name="db_type" type="select" label="Select taxon and protein domain database version (REXdb)" help=""> | 43 <param name="db_type" type="select" label="Select taxon and protein domain database version (REXdb)" help=""> |
21 <options from_file="rexdb_versions.loc"> | 44 <options from_file="rexdb_versions.loc"> |
22 <column name="name" index="0"/> | 45 <column name="name" index="0"/> |
23 <column name="value" index="1"/> | 46 <column name="value" index="1"/> |
24 </options> | 47 </options> |
25 </param> | 48 </param> |
49 | |
50 <param name="scoring_matrix" type="select" label="Select scoring matrix"> | |
51 <option value="BL80" selected="true" >BLOSUM80</option> | |
52 <option value="BL62">BLOSUM62</option> | |
53 <option value="MIQS">MIQS</option> | |
54 </param> | |
26 </inputs> | 55 </inputs> |
27 | 56 |
28 <outputs> | 57 <outputs> |
29 <data format="gff3" name="DomGff" label="Unfiltered GFF3 file of ALL protein domains from dataset ${input.hid}" /> | 58 <data format="gff3" name="DomGff" label="protein domains detected in ${input.hid} - 1st pass (unfiltered)" /> |
59 <data format="gff3" name="DomGff2" label="protein domains detected in ${input.hid} - 2nd pass (unfiltered)" /> | |
30 </outputs> | 60 </outputs> |
31 <help> | 61 <help> |
32 | 62 |
33 THIS IS A PRIMARY OUTPUT THAT SHOULD UNDERGO FURTHER QUALITY FILTERING TO GET RID OFF POTENTIAL FALSE POSITIVE DOMAINS | 63 THIS IS A PRIMARY OUTPUT THAT SHOULD UNDERGO FURTHER QUALITY FILTERING TO GET RID OFF POTENTIAL FALSE POSITIVE DOMAINS |
34 | 64 |