Mercurial > repos > cpt > cpt_putative_isp
annotate generate-putative-isp.xml @ 5:0f6659efd912 draft
planemo upload commit d213efcbada7995b34f93ed64202e551fa4fcf07
author | cpt |
---|---|
date | Wed, 18 Sep 2024 04:44:36 +0000 |
parents | bc16792ecfd2 |
children | 7a0ed74e9ff8 |
rev | line source |
---|---|
1
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
1 <tool id="edu.tamu.cpt2.spanin.generate-putative-isp" name="ISP candidates" version="1.0"> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
2 <description>constructs a putative list of potential i-spanin from an input genomic FASTA</description> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
3 <macros> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
4 <import>macros.xml</import> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
5 </macros> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
6 <expand macro="requirements"> |
4
bc16792ecfd2
planemo upload commit ad5355b899dc8f8300c206522e2a65d49809fb73
cpt
parents:
3
diff
changeset
|
7 <requirement type="package" version="2019.06.08">regex</requirement> |
5
0f6659efd912
planemo upload commit d213efcbada7995b34f93ed64202e551fa4fcf07
cpt
parents:
4
diff
changeset
|
8 <requirement type="package" version="1.77">biopython</requirement> |
1
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
9 </expand> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
10 <command detect_errors="aggressive"><![CDATA[ |
5
0f6659efd912
planemo upload commit d213efcbada7995b34f93ed64202e551fa4fcf07
cpt
parents:
4
diff
changeset
|
11 python '$__tool_directory__/generate-putative-isp.py' |
0f6659efd912
planemo upload commit d213efcbada7995b34f93ed64202e551fa4fcf07
cpt
parents:
4
diff
changeset
|
12 '$fasta_file' |
0f6659efd912
planemo upload commit d213efcbada7995b34f93ed64202e551fa4fcf07
cpt
parents:
4
diff
changeset
|
13 --strand '$strand' |
0f6659efd912
planemo upload commit d213efcbada7995b34f93ed64202e551fa4fcf07
cpt
parents:
4
diff
changeset
|
14 --switch '$switch' |
0f6659efd912
planemo upload commit d213efcbada7995b34f93ed64202e551fa4fcf07
cpt
parents:
4
diff
changeset
|
15 --isp_on '$isp_on' |
0f6659efd912
planemo upload commit d213efcbada7995b34f93ed64202e551fa4fcf07
cpt
parents:
4
diff
changeset
|
16 --isp_op '$isp_op' |
0f6659efd912
planemo upload commit d213efcbada7995b34f93ed64202e551fa4fcf07
cpt
parents:
4
diff
changeset
|
17 --isp_ob '$isp_ob' |
0f6659efd912
planemo upload commit d213efcbada7995b34f93ed64202e551fa4fcf07
cpt
parents:
4
diff
changeset
|
18 --isp_og '$isp_og' |
0f6659efd912
planemo upload commit d213efcbada7995b34f93ed64202e551fa4fcf07
cpt
parents:
4
diff
changeset
|
19 --isp_min_len '$isp_min_len' |
0f6659efd912
planemo upload commit d213efcbada7995b34f93ed64202e551fa4fcf07
cpt
parents:
4
diff
changeset
|
20 --isp_min_dist '$isp_min_dist' |
0f6659efd912
planemo upload commit d213efcbada7995b34f93ed64202e551fa4fcf07
cpt
parents:
4
diff
changeset
|
21 --isp_max_dist '$isp_max_dist' |
0f6659efd912
planemo upload commit d213efcbada7995b34f93ed64202e551fa4fcf07
cpt
parents:
4
diff
changeset
|
22 --min_tmd_size '$min_tmd_size' |
0f6659efd912
planemo upload commit d213efcbada7995b34f93ed64202e551fa4fcf07
cpt
parents:
4
diff
changeset
|
23 --max_tmd_size '$max_tmd_size' |
0f6659efd912
planemo upload commit d213efcbada7995b34f93ed64202e551fa4fcf07
cpt
parents:
4
diff
changeset
|
24 --putative_isp '$putative_isp' |
0f6659efd912
planemo upload commit d213efcbada7995b34f93ed64202e551fa4fcf07
cpt
parents:
4
diff
changeset
|
25 --summary_isp_txt '$summary_isp' |
0f6659efd912
planemo upload commit d213efcbada7995b34f93ed64202e551fa4fcf07
cpt
parents:
4
diff
changeset
|
26 --putative_isp_gff '$putative_isp_gff' |
0f6659efd912
planemo upload commit d213efcbada7995b34f93ed64202e551fa4fcf07
cpt
parents:
4
diff
changeset
|
27 --isp_max '$isp_max' |
0f6659efd912
planemo upload commit d213efcbada7995b34f93ed64202e551fa4fcf07
cpt
parents:
4
diff
changeset
|
28 --peri_min '$peri_min' |
0f6659efd912
planemo upload commit d213efcbada7995b34f93ed64202e551fa4fcf07
cpt
parents:
4
diff
changeset
|
29 --peri_max '$peri_max' |
0f6659efd912
planemo upload commit d213efcbada7995b34f93ed64202e551fa4fcf07
cpt
parents:
4
diff
changeset
|
30 ]]></command> |
1
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
31 <inputs> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
32 <param type="select" label="Strand Choice" name="strand"> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
33 <option value="both">both</option> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
34 <option value="forward">+</option> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
35 <option value="reverse">-</option> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
36 </param> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
37 <param label="Single Genome FASTA" name="fasta_file" type="data" format="fasta"/> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
38 <param label="i-spanin minimal length" name="isp_min_len" type="integer" value="60"/> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
39 <param label="i-spanin maximum length" name="isp_max" type="integer" value="230"/> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
40 <param label="Range Selection; default is all; for a specific range to check for a spanin input integers separated by a colon (eg. 1000:2000)" type="text" name="switch" value="all"/> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
41 <param label="TMD minimal distance from start codon" name="isp_min_dist" type="integer" value="10"/> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
42 <param label="TMD maximum distance from start codon" name="isp_max_dist" type="integer" value="35" help="Searches for a TMD between TMDmin and TMDmax ie [TMDmin,TMDmax]"/> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
43 <param label="TMD minimal size" name="min_tmd_size" type="integer" value="10"/> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
44 <param label="TMD maximum size" name="max_tmd_size" type="integer" value="25"/> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
45 <param label="Periplasmic minimal residue amount" name="peri_min" type="integer" value="16"/> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
46 <param label="Periplasmic maximum residue amount" name="peri_max" type="integer" value="206"/> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
47 </inputs> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
48 <outputs> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
49 <data format="fasta" name="isp_on" label="NucSequences.fa" hidden="true"/> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
50 <data format="fasta" name="isp_op" label="ProtSequences.fa" hidden="true"/> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
51 <data format="bed" name="isp_ob" label="BED_Output.bed" hidden="true"/> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
52 <data format="gff3" name="isp_og" label="GFF_Output.gff" hidden="true"/> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
53 <data format="fasta" name="putative_isp" label="putative_isp.fa"/> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
54 <data format="txt" name="summary_isp" label="summary_isp.txt"/> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
55 <data format="gff3" name="putative_isp_gff" label="putative_isp.gff3"/> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
56 </outputs> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
57 <help><![CDATA[ |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
58 |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
59 **What it does** |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
60 Searches a genome for candidate i-spanins (ISPs), a phage protein involved in outer membrane disruption during Gram-negative bacterial host cell lysis. |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
61 |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
62 **METHODOLOGY** |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
63 |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
64 Locates ALL potential start sequences, based on TTG / ATG / GTG (M / L / V). This list is pared down to those within the user-set min/max lengths. That filtered list generates a set of files with the ORFs in FASTA (nt and aa), BED, and GFF3 file formats. |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
65 |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
66 With the protein FASTA, the tool next reads in each potential sequence and determines if it has a putative transmembrane domain (TMD) with the following criteria: |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
67 |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
68 1. Presence of snorkeling Lysine residues surrounded by hydrophobic residues described for TMD below, within the range the user specifies. |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
69 2. A putative transmembrane domain, or TMD, defined as a repeated hydrophobic region within the sequence ([FIWLVMYCATGSP]), of length and position within the range the user inputs. |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
70 3. Length of expected periplasmic region. User defines minimum and maximum thresholds for required number of residues after TMD. |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
71 |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
72 **INPUT** --> Genomic FASTA |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
73 *NOTE: This tool only takes a SINGLE genomic fasta. It does not work with multiFASTAs.* |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
74 |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
75 **OUTPUT** --> putative_isp.fa (FASTA) file, putative_isp.gff3, and basic summary statistics as summary_isp.txt. |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
76 |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
77 Protein sequences which passed the above filters are returned as the candidate ISPs. |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
78 |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
79 ]]></help> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
80 <expand macro="citations-crr"/> |
4e02e6e9e77d
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
81 </tool> |