comparison test-data/human_augustus_utr-on.gff @ 3:f5075dee9d6b draft

planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/augustus commit cf04d83d615ff09c4458982282d422fbef7d83ac
author iuc
date Fri, 22 May 2015 04:55:25 -0400
parents af307d3285c5
children 4de31938431b
comparison
equal deleted inserted replaced
2:a77a4e9921e0 3:f5075dee9d6b
1 ##gff-version 3 1 ##gff-version 3
2 # This output was generated with AUGUSTUS (version 2.7). 2 # This output was generated with AUGUSTUS (version 3.1.0).
3 # AUGUSTUS is a gene prediction tool for eukaryotes written by Mario Stanke (mario.stanke@uni-greifswald.de) 3 # AUGUSTUS is a gene prediction tool written by Mario Stanke (mario.stanke@uni-greifswald.de),
4 # and Oliver Keller (keller@cs.uni-goettingen.de). 4 # Oliver Keller, Stefanie König and Lizzy Gerischer.
5 # Please cite: Mario Stanke, Mark Diekhans, Robert Baertsch, David Haussler (2008), 5 # Please cite: Mario Stanke, Mark Diekhans, Robert Baertsch, David Haussler (2008),
6 # Using native and syntenically mapped cDNA alignments to improve de novo gene finding 6 # Using native and syntenically mapped cDNA alignments to improve de novo gene finding
7 # Bioinformatics 24: 637-644, doi 10.1093/bioinformatics/btn013 7 # Bioinformatics 24: 637-644, doi 10.1093/bioinformatics/btn013
8 # No extrinsic information on sequences given. 8 # No extrinsic information on sequences given.
9 # Initialising the parameters ... 9 # Initialising the parameters using config directory /home/bag/projects/code/galaxy/tool_deps/augustus/3.1/iuc/package_augustus_3_1/820bf3789c44/config/ ...
10 # human version. Using species specific transition matrix: /home/bag/Downloads/augustus.2.7/config/species/human/human_trans_shadow_partial_utr.pbl 10 # human version. Using default transition matrix.
11 # Looks like ./examples/example.fa is in fasta format. 11 # Looks like /tmp/tmpboMLLQ/job_working_directory/000/4/task_0/dataset_5.dat is in fasta format.
12 # We have hints for 0 sequences and for 0 of the sequences in the input set. 12 # We have hints for 0 sequences and for 0 of the sequences in the input set.
13 # 13 #
14 # ----- prediction on sequence number 1 (length = 9453, name = HS04636) ----- 14 # ----- prediction on sequence number 1 (length = 9453, name = HS04636) -----
15 # 15 #
16 # Predicted genes for sequence number 1 on both strands 16 # Predicted genes for sequence number 1 on both strands
17 # start gene g1 17 # start gene HS04636.g1
18 HS04636 AUGUSTUS gene 836 8857 1 + . ID=g1 18 HS04636 AUGUSTUS gene 836 8857 1 + . ID=HS04636.g1
19 HS04636 AUGUSTUS transcript 836 8857 . + . ID=g1.t1;Parent=g1 19 HS04636 AUGUSTUS transcript 836 8857 . + . ID=HS04636.g1.t1;Parent=HS04636.g1
20 HS04636 AUGUSTUS transcription_start_site 836 836 . + . Parent=g1.t1 20 HS04636 AUGUSTUS transcription_start_site 836 836 . + . Parent=HS04636.g1.t1
21 HS04636 AUGUSTUS exon 836 1017 . + . Parent=g1.t1 21 HS04636 AUGUSTUS exon 836 1017 . + . Parent=HS04636.g1.t1
22 HS04636 AUGUSTUS start_codon 966 968 . + 0 Parent=g1.t1 22 HS04636 AUGUSTUS start_codon 966 968 . + 0 Parent=HS04636.g1.t1
23 HS04636 AUGUSTUS CDS 966 1017 . + 0 ID=g1.t1.cds;Parent=g1.t1 23 HS04636 AUGUSTUS CDS 966 1017 . + 0 ID=HS04636.g1.t1.cds;Parent=HS04636.g1.t1
24 HS04636 AUGUSTUS CDS 1818 1934 . + 2 ID=g1.t1.cds;Parent=g1.t1 24 HS04636 AUGUSTUS CDS 1818 1934 . + 2 ID=HS04636.g1.t1.cds;Parent=HS04636.g1.t1
25 HS04636 AUGUSTUS exon 1818 1934 . + . Parent=g1.t1 25 HS04636 AUGUSTUS exon 1818 1934 . + . Parent=HS04636.g1.t1
26 HS04636 AUGUSTUS CDS 2055 2198 . + 2 ID=g1.t1.cds;Parent=g1.t1 26 HS04636 AUGUSTUS CDS 2055 2198 . + 2 ID=HS04636.g1.t1.cds;Parent=HS04636.g1.t1
27 HS04636 AUGUSTUS exon 2055 2198 . + . Parent=g1.t1 27 HS04636 AUGUSTUS exon 2055 2198 . + . Parent=HS04636.g1.t1
28 HS04636 AUGUSTUS CDS 2852 2995 . + 2 ID=g1.t1.cds;Parent=g1.t1 28 HS04636 AUGUSTUS CDS 2852 2995 . + 2 ID=HS04636.g1.t1.cds;Parent=HS04636.g1.t1
29 HS04636 AUGUSTUS exon 2852 2995 . + . Parent=g1.t1 29 HS04636 AUGUSTUS exon 2852 2995 . + . Parent=HS04636.g1.t1
30 HS04636 AUGUSTUS CDS 3426 3607 . + 2 ID=g1.t1.cds;Parent=g1.t1 30 HS04636 AUGUSTUS CDS 3426 3607 . + 2 ID=HS04636.g1.t1.cds;Parent=HS04636.g1.t1
31 HS04636 AUGUSTUS exon 3426 3607 . + . Parent=g1.t1 31 HS04636 AUGUSTUS exon 3426 3607 . + . Parent=HS04636.g1.t1
32 HS04636 AUGUSTUS CDS 4340 4423 . + 0 ID=g1.t1.cds;Parent=g1.t1 32 HS04636 AUGUSTUS CDS 4340 4423 . + 0 ID=HS04636.g1.t1.cds;Parent=HS04636.g1.t1
33 HS04636 AUGUSTUS exon 4340 4423 . + . Parent=g1.t1 33 HS04636 AUGUSTUS exon 4340 4423 . + . Parent=HS04636.g1.t1
34 HS04636 AUGUSTUS CDS 4543 4789 . + 0 ID=g1.t1.cds;Parent=g1.t1 34 HS04636 AUGUSTUS CDS 4543 4789 . + 0 ID=HS04636.g1.t1.cds;Parent=HS04636.g1.t1
35 HS04636 AUGUSTUS exon 4543 4789 . + . Parent=g1.t1 35 HS04636 AUGUSTUS exon 4543 4789 . + . Parent=HS04636.g1.t1
36 HS04636 AUGUSTUS CDS 5072 5358 . + 2 ID=g1.t1.cds;Parent=g1.t1 36 HS04636 AUGUSTUS CDS 5072 5358 . + 2 ID=HS04636.g1.t1.cds;Parent=HS04636.g1.t1
37 HS04636 AUGUSTUS exon 5072 5358 . + . Parent=g1.t1 37 HS04636 AUGUSTUS exon 5072 5358 . + . Parent=HS04636.g1.t1
38 HS04636 AUGUSTUS CDS 5860 6007 . + 0 ID=g1.t1.cds;Parent=g1.t1 38 HS04636 AUGUSTUS CDS 5860 6007 . + 0 ID=HS04636.g1.t1.cds;Parent=HS04636.g1.t1
39 HS04636 AUGUSTUS exon 5860 6007 . + . Parent=g1.t1 39 HS04636 AUGUSTUS exon 5860 6007 . + . Parent=HS04636.g1.t1
40 HS04636 AUGUSTUS CDS 6494 6903 . + 2 ID=g1.t1.cds;Parent=g1.t1 40 HS04636 AUGUSTUS CDS 6494 6903 . + 2 ID=HS04636.g1.t1.cds;Parent=HS04636.g1.t1
41 HS04636 AUGUSTUS exon 6494 8857 . + . Parent=g1.t1 41 HS04636 AUGUSTUS exon 6494 8857 . + . Parent=HS04636.g1.t1
42 HS04636 AUGUSTUS stop_codon 6901 6903 . + 0 Parent=g1.t1 42 HS04636 AUGUSTUS transcription_end_site 8857 8857 . + . Parent=HS04636.g1.t1
43 HS04636 AUGUSTUS transcription_end_site 8857 8857 . + . Parent=g1.t1 43 # coding sequence = [atgctcgcccgcgccctgctgctgtgcgcggtcctggcgctcagccatacagcaaatccttgctgttcccacccatgtc
44 # aaaaccgaggtgtatgtatgagtgtgggatttgaccagtataagtgcgattgtacccggacaggattctatggagaaaactgctcaacaccggaattt
45 # ttgacaagaataaaattatttctgaaacccactccaaacacagtgcactacatacttacccacttcaagggattttggaacgttgtgaataacattcc
46 # cttccttcgaaatgcaattatgagttatgtcttgacatccagatcacatttgattgacagtccaccaacttacaatgctgactatggctacaaaagct
47 # gggaagccttctctaacctctcctattatactagagcccttcctcctgtgcctgatgattgcccgactcccttgggtgtcaaaggtaaaaagcagctt
48 # cctgattcaaatgagattgtggaaaaattgcttctaagaagaaagttcatccctgatccccagggctcaaacatgatgtttgcattctttgcccagca
49 # cttcacgcatcagtttttcaagacagatcataagcgagggccagctttcaccaacgggctgggccatggggtggacttaaatcatatttacggtgaaa
50 # ctctggctagacagcgtaaactgcgccttttcaaggatggaaaaatgaaatatcagataattgatggagagatgtatcctcccacagtcaaagatact
51 # caggcagagatgatctaccctcctcaagtccctgagcatctacggtttgctgtggggcaggaggtctttggtctggtgcctggtctgatgatgtatgc
52 # cacaatctggctgcgggaacacaacagagtatgcgatgtgcttaaacaggagcatcctgaatggggtgatgagcagttgttccagacaagcaggctaa
53 # tactgataggagagactattaagattgtgattgaagattatgtgcaacacttgagtggctatcacttcaaactgaaatttgacccagaactacttttc
54 # aacaaacaattccagtaccaaaatcgtattgctgctgaatttaacaccctctatcactggcatccccttctgcctgacacctttcaaattcatgacca
55 # gaaatacaactatcaacagtttatctacaacaactctatattgctggaacatggaattacccagtttgttgaatcattcaccaggcaaattgctggca
56 # gggttgctggtggtaggaatgttccacccgcagtacagaaagtatcacaggcttccattgaccagagcaggcagatgaaataccagtcttttaatgag
57 # taccgcaaacgctttatgctgaagccctatgaatcatttgaagaacttacaggagaaaaggaaatgtctgcagagttggaagcactctatggtgacat
58 # cgatgctgtggagctgtatcctgcccttctggtagaaaagcctcggccagatgccatctttggtgaaaccatggtagaagttggagcaccattctcct
59 # tgaaaggacttatgggtaatgttatatgttctcctgcctactggaagccaagcacttttggtggagaagtgggttttcaaatcatcaacactgcctca
60 # attcagtctctcatctgcaataacgtgaagggctgtccctttacttcattcagtgttccagatccagagctcattaaaacagtcaccatcaatgcaag
61 # ttcttcccgctccggactagatgatatcaatcccacagtactactaaaagaacgttcgactgaactgtag]
44 # protein sequence = [MLARALLLCAVLALSHTANPCCSHPCQNRGVCMSVGFDQYKCDCTRTGFYGENCSTPEFLTRIKLFLKPTPNTVHYIL 62 # protein sequence = [MLARALLLCAVLALSHTANPCCSHPCQNRGVCMSVGFDQYKCDCTRTGFYGENCSTPEFLTRIKLFLKPTPNTVHYIL
45 # THFKGFWNVVNNIPFLRNAIMSYVLTSRSHLIDSPPTYNADYGYKSWEAFSNLSYYTRALPPVPDDCPTPLGVKGKKQLPDSNEIVEKLLLRRKFIPD 63 # THFKGFWNVVNNIPFLRNAIMSYVLTSRSHLIDSPPTYNADYGYKSWEAFSNLSYYTRALPPVPDDCPTPLGVKGKKQLPDSNEIVEKLLLRRKFIPD
46 # PQGSNMMFAFFAQHFTHQFFKTDHKRGPAFTNGLGHGVDLNHIYGETLARQRKLRLFKDGKMKYQIIDGEMYPPTVKDTQAEMIYPPQVPEHLRFAVG 64 # PQGSNMMFAFFAQHFTHQFFKTDHKRGPAFTNGLGHGVDLNHIYGETLARQRKLRLFKDGKMKYQIIDGEMYPPTVKDTQAEMIYPPQVPEHLRFAVG
47 # QEVFGLVPGLMMYATIWLREHNRVCDVLKQEHPEWGDEQLFQTSRLILIGETIKIVIEDYVQHLSGYHFKLKFDPELLFNKQFQYQNRIAAEFNTLYH 65 # QEVFGLVPGLMMYATIWLREHNRVCDVLKQEHPEWGDEQLFQTSRLILIGETIKIVIEDYVQHLSGYHFKLKFDPELLFNKQFQYQNRIAAEFNTLYH
48 # WHPLLPDTFQIHDQKYNYQQFIYNNSILLEHGITQFVESFTRQIAGRVAGGRNVPPAVQKVSQASIDQSRQMKYQSFNEYRKRFMLKPYESFEELTGE 66 # WHPLLPDTFQIHDQKYNYQQFIYNNSILLEHGITQFVESFTRQIAGRVAGGRNVPPAVQKVSQASIDQSRQMKYQSFNEYRKRFMLKPYESFEELTGE
49 # KEMSAELEALYGDIDAVELYPALLVEKPRPDAIFGETMVEVGAPFSLKGLMGNVICSPAYWKPSTFGGEVGFQIINTASIQSLICNNVKGCPFTSFSV 67 # KEMSAELEALYGDIDAVELYPALLVEKPRPDAIFGETMVEVGAPFSLKGLMGNVICSPAYWKPSTFGGEVGFQIINTASIQSLICNNVKGCPFTSFSV
50 # PDPELIKTVTINASSSRSGLDDINPTVLLKERSTEL] 68 # PDPELIKTVTINASSSRSGLDDINPTVLLKERSTEL]
51 # end gene g1 69 # end gene HS04636.g1
52 ### 70 ###
53 # 71 #
54 # ----- prediction on sequence number 2 (length = 2344, name = HS08198) ----- 72 # ----- prediction on sequence number 2 (length = 2344, name = HS08198) -----
55 # 73 #
56 # Predicted genes for sequence number 2 on both strands 74 # Predicted genes for sequence number 2 on both strands
57 # start gene g2 75 # start gene HS08198.g2
58 HS08198 AUGUSTUS gene 86 2344 1 + . ID=g2 76 HS08198 AUGUSTUS gene 86 2105 1 + . ID=HS08198.g2
59 HS08198 AUGUSTUS transcript 86 2344 . + . ID=g2.t1;Parent=g2 77 HS08198 AUGUSTUS transcript 86 2105 . + . ID=HS08198.g2.t1;Parent=HS08198.g2
60 HS08198 AUGUSTUS transcription_start_site 86 86 . + . Parent=g2.t1 78 HS08198 AUGUSTUS transcription_start_site 86 86 . + . Parent=HS08198.g2.t1
61 HS08198 AUGUSTUS exon 86 582 . + . Parent=g2.t1 79 HS08198 AUGUSTUS exon 86 582 . + . Parent=HS08198.g2.t1
62 HS08198 AUGUSTUS start_codon 445 447 . + 0 Parent=g2.t1 80 HS08198 AUGUSTUS start_codon 445 447 . + 0 Parent=HS08198.g2.t1
63 HS08198 AUGUSTUS CDS 445 582 . + 0 ID=g2.t1.cds;Parent=g2.t1 81 HS08198 AUGUSTUS CDS 445 582 . + 0 ID=HS08198.g2.t1.cds;Parent=HS08198.g2.t1
64 HS08198 AUGUSTUS CDS 812 894 . + 0 ID=g2.t1.cds;Parent=g2.t1 82 HS08198 AUGUSTUS CDS 812 894 . + 0 ID=HS08198.g2.t1.cds;Parent=HS08198.g2.t1
65 HS08198 AUGUSTUS exon 812 894 . + . Parent=g2.t1 83 HS08198 AUGUSTUS exon 812 894 . + . Parent=HS08198.g2.t1
66 HS08198 AUGUSTUS CDS 1053 1123 . + 1 ID=g2.t1.cds;Parent=g2.t1 84 HS08198 AUGUSTUS CDS 1053 1123 . + 1 ID=HS08198.g2.t1.cds;Parent=HS08198.g2.t1
67 HS08198 AUGUSTUS exon 1053 1123 . + . Parent=g2.t1 85 HS08198 AUGUSTUS exon 1053 1123 . + . Parent=HS08198.g2.t1
68 HS08198 AUGUSTUS CDS 1208 1315 . + 2 ID=g2.t1.cds;Parent=g2.t1 86 HS08198 AUGUSTUS CDS 1208 1315 . + 2 ID=HS08198.g2.t1.cds;Parent=HS08198.g2.t1
69 HS08198 AUGUSTUS exon 1208 1315 . + . Parent=g2.t1 87 HS08198 AUGUSTUS exon 1208 1315 . + . Parent=HS08198.g2.t1
70 HS08198 AUGUSTUS CDS 1587 1688 . + 2 ID=g2.t1.cds;Parent=g2.t1 88 HS08198 AUGUSTUS CDS 1587 1688 . + 2 ID=HS08198.g2.t1.cds;Parent=HS08198.g2.t1
71 HS08198 AUGUSTUS exon 1587 1688 . + . Parent=g2.t1 89 HS08198 AUGUSTUS exon 1587 1688 . + . Parent=HS08198.g2.t1
90 HS08198 AUGUSTUS CDS 1772 1848 . + 2 ID=HS08198.g2.t1.cds;Parent=HS08198.g2.t1
91 HS08198 AUGUSTUS exon 1772 2105 . + . Parent=HS08198.g2.t1
92 HS08198 AUGUSTUS transcription_end_site 2105 2105 . + . Parent=HS08198.g2.t1
93 # coding sequence = [atgctgccccctgggactgcgaccctcttgactctgctcctggcagctggctcgctgggccagaagcctcagaggccac
94 # gccggcccgcatcccccatcagcaccatccagcccaaggccaattttgatgcgcagcaggagcagggccaccgggccgaggccaccacactgcatgtg
95 # gctccccagggcacagccatggctgtcagtaccttccgaaagctggatgggatctgctggcaggtgcgccagctctatggagacacaggggtcctcgg
96 # ccgcttcctgcttcaagcccgaggcgcccgaggggctgtgcacgtggttgtcgctgagaccgactaccagagtttcgctgtcctgtacctggagcggg
97 # cggggcagctgtcagtgaagctctacgcccgctcgctccctgtgagcgactcggtcctgagtgggtttgagcagcgggtccaggaggcccacctgact
98 # gaggaccagatcttctacttccccaagtacggcttctgcgaggctgcagaccagttccacgtcctggacggtgagtgcacagcgggggcaagcatggc
99 # ggcgtggtga]
72 # protein sequence = [MLPPGTATLLTLLLAAGSLGQKPQRPRRPASPISTIQPKANFDAQQEQGHRAEATTLHVAPQGTAMAVSTFRKLDGIC 100 # protein sequence = [MLPPGTATLLTLLLAAGSLGQKPQRPRRPASPISTIQPKANFDAQQEQGHRAEATTLHVAPQGTAMAVSTFRKLDGIC
73 # WQVRQLYGDTGVLGRFLLQARGARGAVHVVVAETDYQSFAVLYLERAGQLSVKLYARSLPVSDSVLSGFEQRVQEAHLTEDQIFYFPKY] 101 # WQVRQLYGDTGVLGRFLLQARGARGAVHVVVAETDYQSFAVLYLERAGQLSVKLYARSLPVSDSVLSGFEQRVQEAHLTEDQIFYFPKYGFCEAADQF
74 # end gene g2 102 # HVLDGECTAGASMAAW]
103 # end gene HS08198.g2
75 ### 104 ###
76 # command line: 105 # command line:
77 # ./bin/augustus --species=human --UTR=on --gff3=on ./examples/example.fa 106 # augustus --strand=both --noInFrameStop=false --gff3=on --uniqueGeneId=true --protein=on --codingseq=on --introns=off --stop=off --stop=off --cds=on --singlestrand=false /tmp/tmpboMLLQ/job_working_directory/000/4/task_0/dataset_5.dat --UTR=on --genemodel=complete --species=human