Mercurial > repos > bgruening > augustus
diff test-data/arabidopsis_augustus_utr-off_singlestrand-on_mea-on.gtf @ 0:af307d3285c5 draft
Uploaded
author | bgruening |
---|---|
date | Sat, 06 Jul 2013 10:07:41 -0400 |
parents | |
children |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/arabidopsis_augustus_utr-off_singlestrand-on_mea-on.gtf Sat Jul 06 10:07:41 2013 -0400 @@ -0,0 +1,85 @@ +# This output was generated with AUGUSTUS (version 2.7). +# AUGUSTUS is a gene prediction tool for eukaryotes written by Mario Stanke (mario.stanke@uni-greifswald.de) +# and Oliver Keller (keller@cs.uni-goettingen.de). +# Please cite: Mario Stanke, Mark Diekhans, Robert Baertsch, David Haussler (2008), +# Using native and syntenically mapped cDNA alignments to improve de novo gene finding +# Bioinformatics 24: 637-644, doi 10.1093/bioinformatics/btn013 +# No extrinsic information on sequences given. +# arabidopsis version. Using default transition matrix. +# We have hints for 0 sequences and for 0 of the sequences in the input set. +# +# ----- prediction on sequence number 1 (length = 2066, name = arabidopsis) ----- +# +# Constraints/Hints: +# (none) +# Predicted genes for sequence number 1 on both strands +# start gene g1 +arabidopsis AUGUSTUS gene 775 1851 0 + . g1 +arabidopsis AUGUSTUS transcript 775 1851 . + . g1.t1 +arabidopsis AUGUSTUS start_codon 775 777 . + 0 transcript_id "g1.t1"; gene_id "g1"; +arabidopsis AUGUSTUS CDS 775 1851 0.99 + 0 transcript_id "g1.t1"; gene_id "g1"; +arabidopsis AUGUSTUS stop_codon 1849 1851 . + 0 transcript_id "g1.t1"; gene_id "g1"; +# protein sequence = [MDLSLAPTTTTSSDQEQDRDQELTSNIGASSSSGPSGNNNNLPMMMIPPPEKEHMFDKVVTPSDVGKLNRLVIPKQHA +# ERYFPLDSSNNQNGTLLNFQDRNGKMWRFRYSYWNSSQSYVMTKGWSRFVKEKKLDAGDIVSFQRGIGDESERSKLYIDWRHRPDMSLVQAHQFGNFG +# FNFNFPTTSQYSNRFHPLPEYNSVPIHRGLNIGNHQRSYYNTQRQEFVGYGYGNLAGRCYYTGSPLDHRNIVGSEPLVIDSVPVVPGRLTPVMLPPLP +# PPPSTAGKRLRLFGVNMECGNDYNQQEESWLVPRGEIGASSSSSSALRLNLSTDHDDDNDDGDDGDDDQFAKKGKSSLSLNFNP] +# end gene g1 +### +# start gene g2 +arabidopsis AUGUSTUS gene 841 1661 . - . g2 +arabidopsis AUGUSTUS transcript 841 1661 . - . g2.t1 +arabidopsis AUGUSTUS stop_codon 841 843 . - 0 transcript_id "g2.t1"; gene_id "g2"; +arabidopsis AUGUSTUS intron 1024 1101 0.75 - . transcript_id "g2.t1"; gene_id "g2"; +arabidopsis AUGUSTUS intron 1193 1325 0.03 - . transcript_id "g2.t1"; gene_id "g2"; +arabidopsis AUGUSTUS intron 1416 1512 0.85 - . transcript_id "g2.t1"; gene_id "g2"; +arabidopsis AUGUSTUS CDS 841 1023 0.87 - 0 transcript_id "g2.t1"; gene_id "g2"; +arabidopsis AUGUSTUS CDS 1102 1192 0.78 - 1 transcript_id "g2.t1"; gene_id "g2"; +arabidopsis AUGUSTUS CDS 1326 1415 0.05 - 1 transcript_id "g2.t1"; gene_id "g2"; +arabidopsis AUGUSTUS CDS 1513 1661 0.35 - 0 transcript_id "g2.t1"; gene_id "g2"; +# protein sequence = [SLPHSIFTPKSLSLFPAVEGGGGSGGNITGVNLPGTTGTESITNGSDPTMNVGDFRCLSPGESGRSYILAMDEICWNI +# EKDNVSCIELFLFDETAPSFGHNVALARVPIRREIPLSVLFRDHESVEFSDVAWCYHFVEHVFFLRRWNHHHRKVVVVSAGTGAAACSDVGG] +# end gene g2 +### +# +# ----- prediction on sequence number 2 (length = 1802, name = arabidopsis2) ----- +# +# Constraints/Hints: +# (none) +# Predicted genes for sequence number 2 on both strands +# start gene g3 +arabidopsis2 AUGUSTUS gene 97 1600 . - . g3 +arabidopsis2 AUGUSTUS transcript 97 1600 . - . g3.t1 +arabidopsis2 AUGUSTUS stop_codon 97 99 . - 0 transcript_id "g3.t1"; gene_id "g3"; +arabidopsis2 AUGUSTUS intron 349 521 0.73 - . transcript_id "g3.t1"; gene_id "g3"; +arabidopsis2 AUGUSTUS intron 1210 1333 0.36 - . transcript_id "g3.t1"; gene_id "g3"; +arabidopsis2 AUGUSTUS intron 1452 1560 0.54 - . transcript_id "g3.t1"; gene_id "g3"; +arabidopsis2 AUGUSTUS CDS 97 348 0.73 - 0 transcript_id "g3.t1"; gene_id "g3"; +arabidopsis2 AUGUSTUS CDS 522 1209 0.6 - 1 transcript_id "g3.t1"; gene_id "g3"; +arabidopsis2 AUGUSTUS CDS 1334 1451 0.44 - 2 transcript_id "g3.t1"; gene_id "g3"; +arabidopsis2 AUGUSTUS CDS 1561 1600 0.42 - 0 transcript_id "g3.t1"; gene_id "g3"; +arabidopsis2 AUGUSTUS start_codon 1598 1600 . - 0 transcript_id "g3.t1"; gene_id "g3"; +# protein sequence = [MVKLVFSDLSCAFASANSTASSTNSSIFFSIDFSSASFASLFSIKYFFNAAIGITELIGISQGVSSESISLTFNQGWT +# FSSSSSSDSFFSDFPDLQDIHTVNMNTRHPKCRTFLPNLGVRSGSQVRHPNGPQVILDNKDNRQFIESSHVETLEELSVVTSSISEKGDSDIITILFQ +# DFPPVLGAKGSTSGDRNAFTNKSKATKHVVFFGEHVHGSTLASAASSNLAEELAHNSTSRDTFAEGMDMVTVGTNDRVRLGKELDKASRNSLLAIVQV +# NKTKHLASAGIIGGLLLLDNFLDRDDGRSTGGVGVIESAKGEGTGGSEERRRRSQSDREQETILMGSMQRNRGSELSGSESRRHCYQWKPQ] +# end gene g3 +### +# start gene g4 +arabidopsis2 AUGUSTUS gene 121 1582 0 + . g4 +arabidopsis2 AUGUSTUS transcript 121 1582 . + . g4.t1 +arabidopsis2 AUGUSTUS start_codon 121 123 . + 0 transcript_id "g4.t1"; gene_id "g4"; +arabidopsis2 AUGUSTUS intron 352 434 0.97 + . transcript_id "g4.t1"; gene_id "g4"; +arabidopsis2 AUGUSTUS intron 1213 1304 1 + . transcript_id "g4.t1"; gene_id "g4"; +arabidopsis2 AUGUSTUS CDS 121 351 0.72 + 0 transcript_id "g4.t1"; gene_id "g4"; +arabidopsis2 AUGUSTUS CDS 435 1212 0.97 + 0 transcript_id "g4.t1"; gene_id "g4"; +arabidopsis2 AUGUSTUS CDS 1305 1582 1 + 2 transcript_id "g4.t1"; gene_id "g4"; +arabidopsis2 AUGUSTUS stop_codon 1580 1582 . + 0 transcript_id "g4.t1"; gene_id "g4"; +# protein sequence = [MATAFAPTKLTATVPLHGSHENRLLLPIRLAPPSSFLGSTRSLSLRRLNHSNATRRSPVVSVQEVVKEKQSTNNTSLL +# ITKEEGLELYEDMILGRSFEDMCAQMYYRGKMFGFVHLYNGQEAVSTGFIKLLTKSDSVVSTYRDHVHALSKGVSARAVMSELFGKVTGCCRGQGGSM +# HMFSKEHNMLGGFAFIGEGIPVATGAAFSSKYRREVLKQDCDDVTVAFFGDGTCNNGQFFECLNMAALYKLPIIFVVENNLWAIGMSHLRATSDPEIW +# KKGPAFGMPGVHVDGMDVLKVREVAKEAVTRARRGEGPTLVECETYRFRGHSLADPDELRDAAEKAKYAARDPIAALKKYLIENKLAKEAELKSIEKK +# IDELVEEAVEFADASPQPGRSQLLENVFADPKGFGIGPDGRYRCEDPKFTEGTAQV] +# end gene g4 +### +# command line: +# ./bin/augustus --species=arabidopsis --UTR=off --singlestrand=true --mea=1 /home/bag/projects/github/galaxytools/augustus/test-data/arabidopsis_augustus.fa