Mercurial > repos > petr-novak > various_galaxy_tools
comparison extract_GFF_Features.xml @ 0:696e702ebf74 draft
"planemo upload commit 0f6eca49bafc3c946189d793161a7f81d595e1a1-dirty"
author | petr-novak |
---|---|
date | Mon, 09 May 2022 08:26:30 +0000 |
parents | |
children | 639c0edb7e64 |
comparison
equal
deleted
inserted
replaced
-1:000000000000 | 0:696e702ebf74 |
---|---|
1 <tool id="Extract_features1" name="Extract features" version="1.0.0"> | |
2 <description>from GFF data</description> | |
3 <command interpreter="python">extract_GFF_Features.py $input1 $out_file1 ${column_choice.col} ${column_choice.feature}</command> | |
4 <inputs> | |
5 <param format="gff" name="input1" type="data" label="Select GFF data"/> | |
6 <conditional name="column_choice"> | |
7 <param name="col" type="select" label="From"> | |
8 <option value="0" selected="true">Column 1 / Sequence name</option> | |
9 <option value="1">Column 2 / Source</option> | |
10 <option value="2">Column 3 / Feature</option> | |
11 <option value="6">Column 7 / Strand</option> | |
12 <option value="7">Column 8 / Frame</option> | |
13 </param> | |
14 <when value="0"> | |
15 <param name="feature" type="select" multiple="true" label="Extract features" help="Multi-select list - hold the appropriate key while clicking to select multiple columns"> | |
16 <options from_dataset="input1"> | |
17 <column name="name" index="0"/> | |
18 <column name="value" index="0"/> | |
19 <filter type="unique_value" name="unique" column="0"/> | |
20 </options> | |
21 </param> | |
22 </when> | |
23 <when value="1"> | |
24 <param name="feature" type="select" multiple="true" label="Extract features" help="Multi-select list - hold the appropriate key while clicking to select multiple columns"> | |
25 <options from_dataset="input1"> | |
26 <column name="name" index="1"/> | |
27 <column name="value" index="1"/> | |
28 <filter type="unique_value" name="unique" column="1"/> | |
29 </options> | |
30 </param> | |
31 </when> | |
32 <when value="2"> | |
33 <param name="feature" type="select" multiple="true" label="Extract features" help="Multi-select list - hold the appropriate key while clicking to select multiple columns"> | |
34 <options from_dataset="input1"> | |
35 <column name="name" index="2"/> | |
36 <column name="value" index="2"/> | |
37 <filter type="unique_value" name="unique" column="2"/> | |
38 </options> | |
39 </param> | |
40 </when> | |
41 <when value="6"> | |
42 <param name="feature" type="select" multiple="true" label="Extract features" help="Multi-select list - hold the appropriate key while clicking to select multiple columns"> | |
43 <options from_dataset="input1"> | |
44 <column name="name" index="6"/> | |
45 <column name="value" index="6"/> | |
46 <filter type="unique_value" name="unique" column="6"/> | |
47 </options> | |
48 </param> | |
49 </when> | |
50 <when value="7"> | |
51 <param name="feature" type="select" multiple="true" label="Extract features" help="Multi-select list - hold the appropriate key while clicking to select multiple columns"> | |
52 <options from_dataset="input1"> | |
53 <column name="name" index="7"/> | |
54 <column name="value" index="7"/> | |
55 <filter type="unique_value" name="unique" column="7"/> | |
56 </options> | |
57 </param> | |
58 </when> | |
59 </conditional> | |
60 </inputs> | |
61 <outputs> | |
62 <data format="input" name="out_file1" metadata_source="input1"/> | |
63 </outputs> | |
64 <tests> | |
65 <test> | |
66 <param name="input1" value="5.gff"/> | |
67 <param name="col" value="0" /> | |
68 <param name="feature" value="chr5,chr6,chr7,chr8" /> | |
69 <output name="out_file1" file="Extract_features1_out.gff"/> | |
70 </test> | |
71 </tests> | |
72 <help> | |
73 | |
74 **What it does** | |
75 | |
76 This tool extracts selected features from GFF data. | |
77 | |
78 ----- | |
79 | |
80 **Example** | |
81 | |
82 Selecting **promoter** from the following GFF data:: | |
83 | |
84 chr22 GeneA enhancer 10000000 10001000 500 + . TGA | |
85 chr22 GeneA promoter 10010000 10010100 900 + . TGA | |
86 chr22 GeneB promoter 10020000 10025000 400 - . TGB | |
87 chr22 GeneB CCDS2220 10030000 10065000 800 - . TGB | |
88 | |
89 will produce the following output:: | |
90 | |
91 chr22 GeneA promoter 10010000 10010100 900 + . TGA | |
92 chr22 GeneB promoter 10020000 10025000 400 - . TGB | |
93 | |
94 ---- | |
95 | |
96 .. class:: infomark | |
97 | |
98 **About formats** | |
99 | |
100 **GFF format** General Feature Format is a format for describing genes and other features associated with DNA, RNA and Protein sequences. GFF lines have nine tab-separated fields:: | |
101 | |
102 1. seqname - Must be a chromosome or scaffold. | |
103 2. source - The program that generated this feature. | |
104 3. feature - The name of this type of feature. Some examples of standard feature types are "CDS", "start_codon", "stop_codon", and "exon". | |
105 4. start - The starting position of the feature in the sequence. The first base is numbered 1. | |
106 5. end - The ending position of the feature (inclusive). | |
107 6. score - A score between 0 and 1000. If there is no score value, enter ".". | |
108 7. strand - Valid entries include '+', '-', or '.' (for don't know/care). | |
109 8. frame - If the feature is a coding exon, frame should be a number between 0-2 that represents the reading frame of the first base. If the feature is not a coding exon, the value should be '.'. | |
110 9. group - All lines with the same group are linked together into a single item. | |
111 | |
112 | |
113 </help> | |
114 </tool> |