0
|
1 <?xml version="1.0"?>
|
|
2 <tool id="edu.tamu.cpt.genbank.GBKtoFiveCol" name="Genbank to Five Column Format" version="1.0">
|
|
3 <description></description>
|
|
4 <macros>
|
|
5 <import>macros.xml</import>
|
|
6 <import>cpt-macros.xml</import>
|
|
7 </macros>
|
|
8 <expand macro="requirements"/>
|
|
9 <command detect_errors="aggressive"><![CDATA[
|
|
10 python $__tool_directory__/gbk_to_five_col.py
|
|
11 "$file"
|
|
12
|
|
13 > "$output"
|
|
14
|
|
15 ]]></command>
|
|
16 <inputs>
|
|
17 <param label="GenBank file" name="file" type="data" format="genbank" />
|
|
18 </inputs>
|
|
19 <outputs>
|
|
20 <data format="tabular" name="output">
|
|
21 </data>
|
|
22 </outputs>
|
|
23 <tests>
|
|
24 <test>
|
|
25 <param name="file" value="complex_feature_locs.gbk" />
|
|
26 <output name="output" value="gbkto5col.tsv" />
|
|
27 </test>
|
|
28 </tests>
|
|
29 <help>
|
|
30 Genbank Format to Five Column Format
|
|
31 ====================================
|
|
32
|
|
33 Output format is:
|
|
34
|
|
35 >Feature ID
|
|
36 Line 1
|
|
37 - Column 1: Start location (first nucleotide) of a feature
|
|
38 - Column 2: Stop location (last nucleotide) of a feature
|
|
39 - Column 3: Feature name (for example, 'CDS' or 'mRNA' or 'rRNA' or 'gene' or 'exon')
|
|
40
|
|
41 Line2:
|
|
42 - Column 4: Qualifier name (for example, 'product' or 'number' or 'gene' or 'note')
|
|
43 - Column 5: Qualifier value
|
|
44
|
|
45 Example Output::
|
|
46
|
|
47 >Feature contig00077
|
|
48 0 22956 source
|
|
49 mol_type genomic DNA
|
|
50 organism AU1189
|
|
51 11652 11326 CDS
|
|
52 11327 11158
|
|
53 note tapemeasure frameshift chaperone
|
|
54 product P2 E' tapemeasure frameshift chaperone
|
|
55 gene gp14
|
|
56 translation MNPIQSDAAAPDLQADAAAIATPAQDDPATHTLDTPLVRGTQTITSITLRKPKSGELRGVSLSDLVSLDVVALSKVLPRISSPMLTEADVASIDPADLVQLGGIFAGFFDAEGREIPTGLPDRVEDPMADIATVFGWTPPVMDAFSLAELMDWRERARVRAGAQ
|
|
57 11900 11599 CDS
|
|
58 11600 11408
|
|
59 11910 11904 RBS
|
|
60
|
|
61 </help>
|
|
62 <expand macro="citations" />
|
|
63 </tool>
|