annotate extract_GFF_Features.xml @ 0:696e702ebf74 draft

"planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
author petr-novak
date Mon, 09 May 2022 08:26:30 +0000
parents
children 639c0edb7e64
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
1 <tool id="Extract_features1" name="Extract features" version="1.0.0">
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
2 <description>from GFF data</description>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
3 <!-- Runs the bundled script from the tool directory; every substituted value is single-quoted so paths or selected values containing whitespace reach the script as one argument each. --> <command>python '$__tool_directory__/extract_GFF_Features.py' '$input1' '$out_file1' '${column_choice.col}' '${column_choice.feature}'</command>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
4 <inputs>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
5 <param format="gff" name="input1" type="data" label="Select GFF data"/>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
6 <conditional name="column_choice">
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
7 <param name="col" type="select" label="From">
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
8 <option value="0" selected="true">Column 1 / Sequence name</option>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
9 <option value="1">Column 2 / Source</option>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
10 <option value="2">Column 3 / Feature</option>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
11 <option value="6">Column 7 / Strand</option>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
12 <option value="7">Column 8 / Frame</option>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
13 </param>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
14 <when value="0">
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
15 <param name="feature" type="select" multiple="true" label="Extract features" help="Multi-select list - hold the appropriate key while clicking to select multiple columns">
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
16 <options from_dataset="input1">
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
17 <column name="name" index="0"/>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
18 <column name="value" index="0"/>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
19 <filter type="unique_value" name="unique" column="0"/>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
20 </options>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
21 </param>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
22 </when>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
23 <when value="1">
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
24 <param name="feature" type="select" multiple="true" label="Extract features" help="Multi-select list - hold the appropriate key while clicking to select multiple columns">
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
25 <options from_dataset="input1">
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
26 <column name="name" index="1"/>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
27 <column name="value" index="1"/>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
28 <filter type="unique_value" name="unique" column="1"/>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
29 </options>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
30 </param>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
31 </when>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
32 <when value="2">
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
33 <param name="feature" type="select" multiple="true" label="Extract features" help="Multi-select list - hold the appropriate key while clicking to select multiple columns">
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
34 <options from_dataset="input1">
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
35 <column name="name" index="2"/>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
36 <column name="value" index="2"/>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
37 <filter type="unique_value" name="unique" column="2"/>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
38 </options>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
39 </param>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
40 </when>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
41 <when value="6">
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
42 <param name="feature" type="select" multiple="true" label="Extract features" help="Multi-select list - hold the appropriate key while clicking to select multiple columns">
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
43 <options from_dataset="input1">
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
44 <column name="name" index="6"/>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
45 <column name="value" index="6"/>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
46 <filter type="unique_value" name="unique" column="6"/>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
47 </options>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
48 </param>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
49 </when>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
50 <when value="7">
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
51 <param name="feature" type="select" multiple="true" label="Extract features" help="Multi-select list - hold the appropriate key while clicking to select multiple columns">
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
52 <options from_dataset="input1">
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
53 <column name="name" index="7"/>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
54 <column name="value" index="7"/>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
55 <filter type="unique_value" name="unique" column="7"/>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
56 </options>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
57 </param>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
58 </when>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
59 </conditional>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
60 </inputs>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
61 <outputs>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
62 <!-- The output takes its datatype from input1 through format_source, replacing the legacy format="input" value. --> <data format_source="input1" name="out_file1" metadata_source="input1"/>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
63 </outputs>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
64 <tests>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
65 <test>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
66 <param name="input1" value="5.gff"/>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
67 <param name="col" value="0" />
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
68 <param name="feature" value="chr5,chr6,chr7,chr8" />
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
69 <output name="out_file1" file="Extract_features1_out.gff"/>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
70 </test>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
71 </tests>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
72 <help>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
73
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
74 **What it does**
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
75
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
76 This tool extracts selected features from GFF data.
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
77
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
78 -----
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
79
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
80 **Example**
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
81
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
82 Selecting **promoter** from the following GFF data::
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
83
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
84 chr22 GeneA enhancer 10000000 10001000 500 + . TGA
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
85 chr22 GeneA promoter 10010000 10010100 900 + . TGA
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
86 chr22 GeneB promoter 10020000 10025000 400 - . TGB
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
87 chr22 GeneB CCDS2220 10030000 10065000 800 - . TGB
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
88
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
89 will produce the following output::
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
90
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
91 chr22 GeneA promoter 10010000 10010100 900 + . TGA
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
92 chr22 GeneB promoter 10020000 10025000 400 - . TGB
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
93
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
94 ----
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
95
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
96 .. class:: infomark
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
97
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
98 **About formats**
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
99
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
100 **GFF format** General Feature Format is a format for describing genes and other features associated with DNA, RNA and Protein sequences. GFF lines have nine tab-separated fields::
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
101
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
102 1. seqname - Must be a chromosome or scaffold.
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
103 2. source - The program that generated this feature.
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
104 3. feature - The name of this type of feature. Some examples of standard feature types are "CDS", "start_codon", "stop_codon", and "exon".
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
105 4. start - The starting position of the feature in the sequence. The first base is numbered 1.
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
106 5. end - The ending position of the feature (inclusive).
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
107 6. score - A score between 0 and 1000. If there is no score value, enter ".".
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
108 7. strand - Valid entries include '+', '-', or '.' (for don't know/care).
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
109 8. frame - If the feature is a coding exon, frame should be a number between 0-2 that represents the reading frame of the first base. If the feature is not a coding exon, the value should be '.'.
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
110 9. group - All lines with the same group are linked together into a single item.
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
111
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
112
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
113 </help>
696e702ebf74 "planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
petr-novak
parents:
diff changeset
114 </tool>