# HG changeset patch
# User earlhaminst
# Date 1524668433 14400
# Node ID 56bbdbfe3eaa2390ea285cd85daa0a16c29c45c3
# Parent  b3ba0c84667c5bd18099954272c18a82d010eeca
planemo upload for repository https://github.com/TGAC/earlham-galaxytools/tree/master/tools/gstf_preparation commit fa875eea77a9471acada2b7b8882a0467994c960
diff -r b3ba0c84667c -r 56bbdbfe3eaa gstf_preparation.py
--- a/gstf_preparation.py	Mon Apr 16 14:05:09 2018 -0400
+++ b/gstf_preparation.py	Wed Apr 25 11:00:33 2018 -0400
@@ -6,7 +6,7 @@
 import sqlite3
 import sys
 
-version = "0.3.0"
+version = "0.4.0"
 gene_count = 0
 
 Sequence = collections.namedtuple('Sequence', ['header', 'sequence'])
@@ -41,6 +41,10 @@
     cur.execute('''CREATE TABLE gene (
         gene_id VARCHAR PRIMARY KEY NOT NULL,
         gene_symbol VARCHAR,
+        seq_region_name VARCHAR NOT NULL,
+        seq_region_start INTEGER NOT NULL,
+        seq_region_end INTEGER NOT NULL,
+        seq_region_strand INTEGER NOT NULL,
         species VARCHAR NOT NULL,
         gene_json VARCHAR NOT NULL)''')
     cur.execute('CREATE INDEX gene_symbol_index ON gene (gene_symbol)')
@@ -52,7 +56,7 @@
         gene_id VARCHAR NOT NULL REFERENCES gene(gene_id))''')
 
     cur.execute('''CREATE VIEW transcript_species AS
-        SELECT transcript_id, species
+        SELECT transcript_id, species, seq_region_name
         FROM transcript JOIN gene
         ON transcript.gene_id = gene.gene_id''')
 
@@ -225,8 +229,8 @@
             # This can happen when loading a JSON file from Ensembl
             continue
         gene_id = gene['id']
-        cur.execute('INSERT INTO gene (gene_id, gene_symbol, species, gene_json) VALUES (?, ?, ?, ?)',
-                    (gene_id, gene.get('display_name', None), gene['species'], json.dumps(gene)))
+        cur.execute('INSERT INTO gene (gene_id, gene_symbol, seq_region_name, seq_region_start, seq_region_end, seq_region_strand, species, gene_json) VALUES (?, ?, ?, ?, ?, ?, ?, ?)',
+                    (gene_id, gene.get('display_name', None), gene['seq_region_name'], gene['start'], gene['end'], gene['strand'], gene['species'], json.dumps(gene)))
 
         if "Transcript" in gene:
             for transcript in gene["Transcript"]:
@@ -241,15 +245,15 @@
     conn.commit()
 
 
-def fetch_species_for_transcript(conn, transcript_id):
+def fetch_species_and_seq_region_for_transcript(conn, transcript_id):
     cur = conn.cursor()
 
-    cur.execute('SELECT species FROM transcript_species WHERE transcript_id=?',
+    cur.execute('SELECT species, seq_region_name FROM transcript_species WHERE transcript_id=?',
                 (transcript_id, ))
     results = cur.fetchone()
     if not results:
-        return None
-    return results[0]
+        return None, None  # not found: keep the 2-item shape so callers can still unpack the result
+    return results  # (species, seq_region_name) row from the transcript_species view
 
 
 def fetch_gene_id_for_transcript(conn, transcript_id):
@@ -280,8 +284,11 @@
     parser.add_option('--fasta', action='append', default=[], help='Path of the input FASTA files')
     parser.add_option('-l', action='store_true', default=False, dest='longestCDS', help='Keep only the longest CDS per gene')
     parser.add_option('--headers', action='store_true', default=False, help='Change the header line of the FASTA sequences to the >TranscriptId_species format')
+    parser.add_option('--regions', default="", help='Comma-separated list of region IDs for which FASTA sequences should be filtered')
     parser.add_option('-o', '--output', help='Path of the output SQLite file')
     parser.add_option('--of', help='Path of the output FASTA file')
+    parser.add_option('--ff', help='Path of the filtered sequences output FASTA file')
+
     options, args = parser.parse_args()
     if args:
         raise Exception('Use options to provide inputs')
@@ -368,14 +375,15 @@
         # first one to appear in the FASTA file is selected
         selected_transcript_ids = [max(transcript_id_lengths, key=lambda _: _[1])[0] for transcript_id_lengths in gene_transcripts_dict.values()]
 
-    with open(options.of, 'w') as output_fasta_file:
+    regions = [_.strip().lower() for _ in options.regions.split(",")]
+    with open(options.of, 'w') as output_fasta_file, open(options.ff, 'w') as filtered_fasta_file:
         for fasta_arg in options.fasta:
             for entry in FASTAReader_gen(fasta_arg):
                 transcript_id = remove_id_version(entry.header[1:].lstrip().split(' ')[0])
                 if options.longestCDS and transcript_id not in selected_transcript_ids:
                     continue
 
-                species_for_transcript = fetch_species_for_transcript(conn, transcript_id)
+                species_for_transcript, seq_region_for_transcript = fetch_species_and_seq_region_for_transcript(conn, transcript_id)
                 if not species_for_transcript:
                     print("Transcript '%s' in file '%s' not found in the gene feature information" % (transcript_id, fasta_arg), file=sys.stderr)
                     continue
@@ -387,7 +395,10 @@
                 else:
                     header = entry.header
 
-                output_fasta_file.write("%s\n%s\n" % (header, entry.sequence))
+                if seq_region_for_transcript.lower() in regions:
+                    filtered_fasta_file.write("%s\n%s\n" % (header, entry.sequence))
+                else:
+                    output_fasta_file.write("%s\n%s\n" % (header, entry.sequence))
 
     conn.close()
 
diff -r b3ba0c84667c -r 56bbdbfe3eaa gstf_preparation.xml
--- a/gstf_preparation.xml	Mon Apr 16 14:05:09 2018 -0400
+++ b/gstf_preparation.xml	Wed Apr 25 11:00:33 2018 -0400
@@ -20,8 +20,12 @@
 #if $longestCDS
     -l
 #end if
+#if $regions
+    --regions '$regions'
+#end if
 -o '$output_db'
 --of '$output_fasta'
+--ff '$filtered_fasta'
 ]]>
     
 
@@ -36,11 +40,13 @@
         
         
         
+        
     
 
     
          
          
+         
     
 
     
@@ -53,6 +59,7 @@
 
             
             
+            
         
         
             
@@ -63,6 +70,7 @@
 
             
             
+            
         
         
             
@@ -73,6 +81,7 @@
 
             
             
+            
         
         
             
@@ -80,8 +89,20 @@
             
             
 
-            
-            
+            
+            
+            
+        
+        
+            
+            
+            
+            
+            
+
+            
+            
+            
         
     
     
diff -r b3ba0c84667c -r 56bbdbfe3eaa schema/gstf.mwb
Binary file schema/gstf.mwb has changed
diff -r b3ba0c84667c -r 56bbdbfe3eaa schema/gstf.png
Binary file schema/gstf.png has changed
diff -r b3ba0c84667c -r 56bbdbfe3eaa schema/gstf.svg
--- a/schema/gstf.svg	Mon Apr 16 14:05:09 2018 -0400
+++ b/schema/gstf.svg	Wed Apr 25 11:00:33 2018 -0400
@@ -9,7 +9,7 @@
 
 
 
-
+
 
 
 
@@ -18,16 +18,16 @@
 
 
 
-
+
 
 
-
+
 
 
 
 
 
-
+
 
 
 
@@ -48,7 +48,7 @@
 
 
 
-
+
 
 
 
@@ -69,13 +69,13 @@
 
 
 
-
+
 
 
-
+
 
 
-
+
 
 
 
@@ -84,10 +84,10 @@
 
 
 
-
+
 
 
-
+
 
 
 
@@ -96,7 +96,7 @@
 
 
 
-
+
 
 
 
@@ -111,67 +111,73 @@
 
 
 
-
+
 
 
-
+
 
 
-
+
 
 
-
+
 
 
-
+
 
 
 
 
 
-
+
 
 
-
+
 
 
-
+
 
 
-
+
 
 
-
+
 
 
-
+
 
 
-
+
 
 
+
+
+
+
+
+
+
+
+
+
+
+
 
 
-
+
 
 
-
-
-
-
+
 
 
-
-
-
-
+
 
 
-
+
 
 
-
-
+
+
 
 
 
@@ -186,7 +192,7 @@
 
 
 
-
+
 
 
 
@@ -195,30 +201,30 @@
 
 
 
-
-
-
-
-
-
+
+
+
+
+
+
 
-
-
-
-
-
-
-
-
-
+
+
+
+
+
+
+
+
+
 
   
   
   
   
 
-
-
+
+
 
   
   
@@ -241,7 +247,7 @@
   
   
 
-
+
 
   
   
@@ -268,278 +274,392 @@
   
   
 
-
+
 
   
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
 
-
+
+
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+
+
+
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+
+
 
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
 
-
-
-  
-  
-  
-  
-  
-  
-  
+
+
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
 
-
+
 
-  
-  
-  
-  
-  
-  
-  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+
+
+
+  
+  
+  
+  
+  
+  
+  
+
+
+
+  
+  
+  
+  
+  
+  
+  
 
 
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
 
-
-
-
-
+
+
+
+
 
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
 
-
-
+
+
 
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
 
-
+
 
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
 
-
+
 
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
 
-
+
 
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
 
-
+
 
-  
-  
-  
-  
-  
-  
-  
+  
+  
+  
+  
+  
+  
+  
 
-
+
 
-  
-  
-  
-  
-  
-  
-  
+  
+  
+  
+  
+  
+  
+  
 
 
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
 
 
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
-  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
+  
 
-
+
 
 
-
+
 
   
   
@@ -547,11 +667,11 @@
   
 
 
-
+
 
-  
+  
   
-  
+  
   
   
   
@@ -565,7 +685,7 @@
   
   
   
-  
+  
   
   
 
@@ -582,7 +702,7 @@
 
 
 
-
+
 
   
   
diff -r b3ba0c84667c -r 56bbdbfe3eaa test-data/test1.ns.fasta
diff -r b3ba0c84667c -r 56bbdbfe3eaa test-data/test1.sqlite
Binary file test-data/test1.sqlite has changed
diff -r b3ba0c84667c -r 56bbdbfe3eaa test-data/test2.sqlite
Binary file test-data/test2.sqlite has changed
diff -r b3ba0c84667c -r 56bbdbfe3eaa test-data/test4.fasta
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/test4.fasta	Wed Apr 25 11:00:33 2018 -0400
@@ -0,0 +1,1265 @@
+>ENST00000338702_homosapiens
+ATGGAGAATCAAGAGAAGGCGAGTATCGCGGGCCACATGTTCGACGTAGTCGTGATCGGA
+GGTGGCATTTCAGGACTATCTGCTGCCAAACTCTTGACTGAATATGGCGTTAGTGTTTTG
+GTTTTAGAAGCTCGGGACAGGGTTGGAGGAAGAACATATACTATAAGGAATGAGCATGTT
+GATTACGTAGATGTTGGTGGAGCTTATGTGGGACCAACCCAAAACAGAATCTTACGCTTG
+TCTAAGGAGCTGGGCATAGAGACTTACAAAGTGAATGTCAGTGAGCGTCTCGTTCAATAT
+GTCAAGGGGAAAACATATCCATTTCGGGGCGCCTTTCCACCAGTATGGAATCCCATTGCA
+TATTTGGATTACAATAATCTGTGGAGGACAATAGATAACATGGGGAAGGAGATTCCAACT
+GATGCACCCTGGGAGGCTCAACATGCTGACAAATGGGACAAAATGACCATGAAAGAGCTC
+ATTGACAAAATCTGCTGGACAAAGACTGCTAGGCGGTTTGCTTATCTTTTTGTGAATATC
+AATGTGACCTCTGAGCCTCACGAAGTGTCTGCCCTGTGGTTCTTGTGGTATGTGAAGCAG
+TGCGGGGGCACCACTCGGATATTCTCTGTCACCAATGGTGGCCAGGAACGGAAGTTTGTA
+GGTGGATCTGGTCAAGTGAGCGAACGGATAATGGACCTCCTCGGAGACCAAGTGAAGCTG
+AACCATCCTGTCACTCACGTTGACCAGTCAAGTGACAACATCATCATAGAGACGCTGAAC
+CATGAACATTATGAGTGCAAATACGTAATTAATGCGATCCCTCCGACCTTGACTGCCAAG
+ATTCACTTCAGACCAGAGCTTCCAGCAGAGAGAAACCAGTTAATTCAGCGGCTTCCAATG
+GGAGCTGTCATTAAGTGCATGATGTATTACAAGGAGGCCTTCTGGAAGAAGAAGGATTAC
+TGTGGCTGCATGATCATTGAAGATGAAGATGCTCCAATTTCAATAACCTTGGATGACACC
+AAGCCAGATGGGTCACTGCCTGCCATCATGGGCTTCATTCTTGCCCGGAAAGCTGATCGA
+CTTGCTAAGCTACATAAGGAAATAAGGAAGAAGAAAATCTGTGAGCTCTATGCCAAAGTG
+CTGGGATCCCAAGAAGCTTTACATCCAGTGCATTATGAAGAGAAGAACTGGTGTGAGGAG
+CAGTACTCTGGGGGCTGCTACACGGCCTACTTCCCTCCTGGGATCATGACTCAATATGGA
+AGGGTGATTCGTCAACCCGTGGGCAGGATTTTCTTTGCGGGCACAGAGACTGCCACAAAG
+TGGAGCGGCTACATGGAAGGGGCAGTTGAGGCTGGAGAACGAGCAGCTAGGGAGGTCTTA
+AATGGTCTCGGGAAGGTGACCGAGAAAGATATCTGGGTACAAGAACCTGAATCAAAGGAC
+GTTCCAGCGGTAGAAATCACCCACACCTTCTGGGAAAGGAACCTGCCCTCTGTTTCTGGC
+CTGCTGAAGATCATTGGATTTTCCACATCAGTAACTGCCCTGGGGTTTGTGCTGTACAAA
+TACAAGCTCCTGCCACGGTCTTGA
+>ENST00000542639_homosapiens
+ATGGGGAAGGAGATTCCAACTGATGCACCCTGGGAGGCTCAACATGCTGACAAATGGGAC
+AAAATGACCATGAAAGAGCTCATTGACAAAATCTGCTGGACAAAGACTGCTAGGCGGTTT
+GCTTATCTTTTTGTGAATATCAATGTGACCTCTGAGCCTCACGAAGTGTCTGCCCTGTGG
+TTCTTGTGGTATGTGAAGCAGTGCGGGGGCACCACTCGGATATTCTCTGTCACCAATGGT
+GGCCAGGAACGGAAGTTTGTAGGTGGATCTGGTCAAGTGAGCGAACGGATAATGGACCTC
+CTCGGAGACCAAGTGAAGCTGAACCATCCTGTCACTCACGTTGACCAGTCAAGTGACAAC
+ATCATCATAGAGACGCTGAACCATGAACATTATGAGTGCAAATACGTAATTAATGCGATC
+CCTCCGACCTTGACTGCCAAGATTCACTTCAGACCAGAGCTTCCAGCAGAGAGAAACCAG
+TTAATTCAGCGGCTTCCAATGGGAGCTGTCATTAAGTGCATGATGTATTACAAGGAGGCC
+TTCTGGAAGAAGAAGGATTACTGTGGCTGCATGATCATTGAAGATGAAGATGCTCCAATT
+TCAATAACCTTGGATGACACCAAGCCAGATGGGTCACTGCCTGCCATCATGGGCTTCATT
+CTTGCCCGGAAAGCTGATCGACTTGCTAAGCTACATAAGGAAATAAGGAAGAAGAAAATC
+TGTGAGCTCTATGCCAAAGTGCTGGGATCCCAAGAAGCTTTACATCCAGTGCATTATGAA
+GAGAAGAACTGGTGTGAGGAGCAGTACTCTGGGGGCTGCTACACGGCCTACTTCCCTCCT
+GGGATCATGACTCAATATGGAAGGGTGATTCGTCAACCCGTGGGCAGGATTTTCTTTGCG
+GGCACAGAGACTGCCACAAAGTGGAGCGGCTACATGGAAGGGGCAGTTGAGGCTGGAGAA
+CGAGCAGCTAGGGAGGTCTTAAATGGTCTCGGGAAGGTGACCGAGAAAGATATCTGGGTA
+CAAGAACCTGAATCAAAGGACGTTCCAGCGGTAGAAATCACCCACACCTTCTGGGAAAGG
+AACCTGCCCTCTGTTTCTGGCCTGCTGAAGATCATTGGATTTTCCACATCAGTAACTGCC
+CTGGGGTTTGTGCTGTACAAATACAAGCTCCTGCCACGGTCTTGA
+>ENSPTRT00000040520_pantroglodytes
+ATGGAGAATCAAGAGAAGGCGAGTATCGCGGGCCACATGTTCGACGTAGTCGTGATCGGA
+GGTGGCATTTCAGGACTATCTGCTGCCAAACTCTTGACTGAATATGGCGTTAGTGTTTTA
+GTTTTAGAAGCTCGGGACAGGGTTGGAGGAAGAACATATACTATAAGGAATGAGCATGTT
+GATTACGTAGATGTTGGTGGAGCTTATGTGGGACCAACCCAAAACAGAATCTTACGCTTG
+TCTAAGGAGCTGGGCATAGAGACTTACAAAGTGAATGTCAGTGAGCGTCTCGTTCAATAT
+GTCAAGGGGAAAACATATCCATTTCGGGGCGCCTTTCCACCAGTATGGAATCCCATTGCA
+TATTTGGATTACAATAATCTGTGGCGGACAATAGATAACATGGGGAAGGAGATTCCAAAT
+GATGCACCCTGGGAGGCTCAACATGCTGACGAATGGGACAAAATGACCATGAAAGAGCTC
+ATTGACAAAATCTGCTGGACAAAGACTGCTAGGCGGTTTGCTTATCTTTTTGTGAATATC
+AATGTGACCTCTGAGCCTCACGAAGTGTCTGCCCTGTGGTTCTTGTGGTATGTGAAGCAG
+TGCGGGGGCACCACTCGGATATTCTCTGTCACCAATGGCGGCCAGGAACGGAAGTTTGTA
+GGTGGATCTGGTCAAGTGAGCGAACGGATAATGGACCTCCTTGGAGACCAAGTGAAGCTG
+AACCATCCTGTCACTCATGTTGACCAGTCAAGTGACAACATCATCATAGAGACACTGAAC
+CATGAACATTATGAGTGCAAATACGTAATTAATGCGATCCCTCCGACCTTGACTGCCAAG
+ATTCACTTCAGACCAGAGCTTCCAGCAGAGAGAAACCAGTTAATTCAGCGTCTTCCAATG
+GGAGCTATCATTAAGTGCATGATGTATTACAAGGAGGCCTTCTGGAAGAAGAAGGATTAC
+TGTGGCTGCATGATCATTGAAGATGAAGATGCCCCAATTTCAATAACCTTGGATGACACC
+AAGCCAGATGGGTCACTGCCTGCCATCATGGGCTTCATTCTTGCCCGGAAAGCTGATCGA
+CTTGCTAAGCTACATAAGGAAATAAGGAAGAAGAAAATCTGTGAGCTCTATGCCAAAGTG
+CTGGGATCCCAAGAAGCTTTACATCCAGTGCATTATGAAGAGAAGAACTGGTGTGAGGAG
+CAGTACTCTGGGGGCTGCTACACGGCCTACTTCCCTCCTGGGATCATGACTCAATATGGA
+AGGGTGATTCGTCAACCCGTGGGCAGGATTTTCTTTGCGGGCACAGAGACTGCCACAAAG
+TGGAGCGGCTACATGGAAGGGGCAGTTGAGGCTGGAGAACGAGCAGCTAGGGAGGTCTTA
+AATGGTCTCGGGAAGGTGACCGAGAAAGACATCTGGGTACAAGAACCTGAATCAAAGGAC
+GTTCCAGCGGTAGAAATCACGCACACCTTCTGGGAAAGGAACCTGCCCTCTGTTTCTGGC
+CTGCTGAAGATCATTGGATTTTCCACATCAGTAACTACCCTGGGGTTTGTGCTGTACAAA
+TACAAGCTCCTGCCACGGTCTTGA
+>ENSSSCT00000013404_susscrofa
+ATGGAGCGTCAGGAGAAGGCGAACAACGCGGGCCACATGGTCGACGTAGTCGTGATAGGA
+GGCGGCATCTCAGGATTATCTGCTGCCAAACTCTTAAATGAATATGGAATTAATGTTTTG
+GTTTTAGAAGCCCGGGACAGAGTTGGAGGAAGAACATACACAGTGAGGAACGAAAATGTT
+GATTACGTGGACGTTGGTGGGGCTTATGTCGGACCGACCCAGAATAGGATCTTAAGGTTA
+TCTAAGGAACTGGGTTTAGAAACTTACAAAGTGAATGTAAATGAGTGTCTCGTTCAGTAT
+GTCAAGGGGAAATCTTATCCATTTCGGGGTGCCTTCCCTCCAGTCTGGAATCCCATTGCC
+TATCTGGATTACAACAACCTGTGGCGGACAATGGATGACATGGGAAAGAAGATTCCAGCT
+GATGCACCATGGGAGTCTCCGCATGCAGAGGAATGGGATAAGATGACCATGAAAGATCTC
+ATCGATAAAATCTGTTGGACAAAGACTGCTAAACGGTTTGCATCTCTCTTTGTAAATATC
+AATGTGACCTCCGAACCCCACGAAGTGTCTGCCCTGTGGTTTTTGTGGTATGTGAAGCAG
+TGTGGAGGCACCACCCGGATATTCTCTGTTACCAACGGGGGCCAGGAACGGAAGTTTGTA
+GGCGGATCTGGTCAAGTAAGCGAACGGATAATGCACCTCCTCGGGGACAGAGTGAAGCTG
+AGGTGTCCTGTCACCTATGTTGACCAGTCAGGTGACAACATCATCGTAGAGACATTGAAT
+CATGAACTTTATGAGTGCCAATACGTAATTAGTGCCATCCCTCCAACTCTGACTGCCAAG
+ATACACTTCAGACCGGAGCTTCCGTCAGAAAGAAACCAGTTAATTCAGCGTCTTCCGATG
+GGGGCTATCATTAAGTGCATGATGTATTACAAGGAGGCCTTTTGGAAGAAGAAGAATTAC
+TGTGGCTGTATGATCATCGAAGATGAGGAAGCTCCGATTTCAATAACTCTAGATGACACC
+AAGCCAGATGGATCGCTGCCCGCCATCATGGGCTTCATCCTTGCTCGAAAAGCTGACCGC
+CTTGCTAAGGTTCATAAAGAAATAAGAAAGCGGAAAATCTGTGAGCTCTACGCCAAAGTG
+CTAGGATCTCAAGAAGCTTTACATCCCGTGCACTATGAAGAGAAGAACTGGTGTGAGGAG
+CAGTACTCGGGGGGCTGCTACACTGCCTACTTCCCCCCTGGGATCATGACTCAGTATGGA
+AGGGTGATCCGCCAGCCCGTAGGCAGGATATTCTTTGCTGGCACCGAGACTGCCACACAA
+TGGAGCGGTTACATGGAAGGAGCAGTAGAAGCCGGCGAACGGGCGGCTAGAGAGATCTTG
+AATGCTTTGGGGAAGGTGTCAAAGAAAGACATATGGCTTCGAGAACCTGAATCAGAGGAT
+GTTCCAGCTTTTGAGATCACCCGCACCTTCTGGGAGAGAAACCTGCCTTCCGTGACCGGG
+CTGCTTAAGATCATCGGATTTTCCACCTCGGTAACTGCCCTGTGGCTTGCCGTGTACAAA
+TTCAGGCTGCTGACCCGATCCTGA
+>ENSSSCT00000035258_susscrofa
+TCGCTGCCCGCCATCATGGGCTTCATCCTTGCTCGAAAAGCTGACCGCCTTGCTAAGGTT
+CATAAAGAAATAAGAAAGCGGAAAATCTGTGAGCTCTACGCCAAAGTGCTAGGATCTCAA
+GAAGCTTTACATCCCGTGCACTATGAAGAGAAGAACTGGTGTGAGGAGCAGTACTCGGGG
+GGCTGCTACACTGCCTACTTCCCCCCTGGGATCATGACTCAGTATGGAAGGGTGATCCGC
+CAGCCCGTAGGCAGGATATTCTTTGCTGGCACCGAGACTGCCACACAATGGAGCGGTTAC
+ATGGAAGGAGCAGTAGAAGCCGGCGAACGGGCGGCTAGAGAGGATGTTCCAGCTTTTGAG
+ATCACCCGCACCTTCTGGGAGAGAAACCTGCCTTCCGTGACCGGGCTGCTTAAGATCATC
+GGATTTTCCA
+>ENSSSCT00000032764_susscrofa
+ATGGATGACATGGGAAAGAAGATTCCAGCTGATGCACCATGGGAGTCTCCGCATGCAGAG
+GAATGGGATAAGATGACCATGAAAGATCTCATCGATAAAATCTGTTGGACAAAGACTGCT
+AAACGGTTTGCATCTCTCTTTGTAAATATCAATGTGACCTCCGAACCCCACGAAGTGTCT
+GCCCTGTGGTTTTTGTGGTATGTGAAGCAGTGTGGAGGCACCACCCGGATATTCTCTGTT
+ACCAACGGGGGCCAGGAACGGAAGTTTGTAGGCGGATCTGGTCAAGTAAGCGAACGGATA
+ATGCACCTCCTCGGGGACAGAGTGAAGCTGAGGTGTCCTGTCACCTATGTTGACCAGTCA
+GGTGACAACATCATCGTAGAGACATTGAATCATGAACTTTATGAGTGCCAATACGTAATT
+AGTGCCATCCCTCCAACTCT
+>ENSCAFT00000022939_canisfamiliaris
+ATGGCGAGTAGAGAGAAGACGAGTATCGAGGGCCACATGTTTGACGTAGTCGTGATAGGA
+GGCGGCATCTCAGGATTGTCTGCTGCCAAACTCTTAGCCGAACATGAAGTTGATGTCTTA
+GTTTTAGAAGCACGAGATAGAGTTGGAGGAAGAACATACACCGTGAGGAATGAACATGTC
+GATTACGTAGATGTTGGTGGGGCTTATGTAGGACCAACTCAGAACAGAATCTTACGACTA
+TCTAAGGAGCTGGGTCTAGAGACTTACAAAGTGAACGTAAATGAGCGTCTTGTACAGTAT
+GTCAAGGGGAAAACTTACCCATTCCGAGGAGCCTTTCCTCCGGTATGGAATCCTATCGCA
+TATTTGGATTACAACAACCTGTGGCGGACAATGGATAACATGGGGAAGGAGATTCCAGCA
+GATGCACCATGGGAGGCCCCACATGCCGAGGAATGGGACAAGATGACTATGAAGGATCTT
+ATCGATAAAATCTGCTGGACAAAGACTGCTAGGAGGTTTGCATCCCTCTTTGTGAATATC
+AATGTGACCTCTGAGCCCCACGAGGTGTCTGCGCTCTGGTTCCTGTGGTATGTGAAGCAG
+TGCGGAGGTACCACTCGGATATTCTCGGTGACCAATGGAGGCCAGGAACGGAAGTTTGTG
+GGAGGATCCGGTCAAGTGAGTGAACGGATAATGGAGCGCCTTGGGGACAGAGTCAAGCTG
+AAGCGCCCTGTCACCTATGTTGACCAGTCAGATGACAACATCATCATAGAGACACTGAAT
+CATGAACTTTATGAGTGCAAATACGTGATTAGTGCCATCCCTCCAACTTTGACTGCCAAG
+ATCCACTTCAGACCAGAGCTTCCATCAGAGAGAAATCAGTTAATTCAGCGTCTTCCAATG
+GGAGCTATCATCAAGTGTATGATGTATTACAAGGAGGCCTTTTGGAAGAAGAAGGATTAC
+TGTGGCTGTATGATCATTGAAGACGAGGAAGCTCCAATTTCAATAACCCTGGATGACACC
+AAGCCAGATGGATCACTGCCCGCTATCATGGGCTTCATACTTGCCAGAAAAGCTGACCGA
+CTTGCCAAGCTCCATAAAGAAATAAGGAAGAGGAAAATCTGTGAGCTCTATGCCAAAGTG
+CTAGGATCCCAAGAAGCTTTACAACCCGTACACTATGAAGAGAAGAACTGGTGCGAGGAG
+CAGTACTCCGGGGGCTGCTATACCGCCTACTTCCCCCCTGGGATCATGACTCACTACGGA
+AGGGTGATCCGCCAGCCATTTGGCAGGATTTACTTTGCTGGCACTGAGACGGCAACACAC
+TGGAGCGGTTATATGGAAGGAGCTGTAGAGGCTGGGGAACGGACAGCTAGAGAGGTCTTA
+AATGCTCTCGGGAGGGTGGCAGAGAAAGACCTGAAGACCCAGGAACCTGAATCAAAGGAT
+GTTCCAGCTATGGAAATCACCCACACCTTCTGGGAGAGGAACCTGCCATCGGTGACAGGC
+CTGCTGAAGCTCATTGGATTTACCACATCAGTAACTGCCCTGTGGATTGTGGCGTACAAA
+TTCAGGCTGCTGAGACGATCCTGA
+>ENSMUST00000026013_musmusculus
+ATGACGGATCTGGAGAAGCCCAGTATCACAGGCCACATGTTCGACGTAGTCGTGATTGGA
+GGCGGCATCTCAGGATTGGCTGCTGCCAAACTATTGTCAGAATACAAAATTAATGTCTTG
+GTTCTGGAAGCCCGGGATAGAGTTGGAGGAAGAACATATACTGTGAGGAATGAGCATGTT
+AAATGGGTAGATGTTGGTGGAGCTTATGTGGGACCAACCCAGAACAGAATCTTACGCTTG
+TCTAAGGAGCTAGGCATAGAGACCTATAAAGTGAATGTCAATGAGCGTCTAGTTCAATAT
+GTCAAGGGGAAAACTTACCCATTCCGTGGTGCATTTCCACCTGTGTGGAACCCCTTGGCA
+TATTTGGATTACAACAACCTGTGGAGGACAATGGATGATATGGGAAAAGAGATCCCTGTT
+GATGCACCATGGCAAGCAAGACATGCTGAGGAATGGGACAAGATAACCATGAAAGATCTC
+ATTGATAAAATCTGTTGGACAAAAACTGCTCGAGAATTTGCTTATCTTTTTGTGAACATT
+AATGTGACTTCTGAGCCTCATGAGGTATCTGCCCTGTGGTTCTTGTGGTATGTGAGGCAG
+TGTGGAGGTACCTCTCGGATATTCTCAGTCACCAATGGCGGCCAGGAACGGAAATTTGTA
+GGTGGCTCTGGCCAAATAAGTGAACAGATAATGGTCCTCCTTGGGGATAAAGTGAAGCTG
+AGCTCTCCTGTTACTTATATTGACCAAACAGATGACAACATCATTATAGAAACACTGAAT
+CATGAGCACTATGAGTGCAAATATGTAATTAGTGCCATCCCACCGGTTTTGACTGCCAAG
+ATCCACTTTAAACCAGAGCTTCCACCTGAGAGAAACCAATTAATTCAGCGTCTTCCAATG
+GGGGCTGTCATCAAGTGCATGGTGTATTACAAGGAAGCCTTCTGGAAGAAAAAGGACTAT
+TGTGGCTGCATGATAATTGAAGATGAGGAGGCTCCAATTTCAATCACTCTGGATGACACT
+AAACCAGATGGGTCAATGCCTGCCATCATGGGCTTCATACTTGCCCGGAAAGCTGAACGA
+CTTGCTAAACTACATAAAGACATAAGGAAGAGGAAAATCTGTGAGCTGTATGCCAAAGTT
+CTGGGATCTCAAGAAGCTTTATCTCCCGTCCATTATGAAGAGAAGAACTGGTGTGAGGAG
+CAGTACTCCGGGGGCTGCTACACAGCCTACTTCCCTCCTGGTATCATGACTCTGTATGGA
+AGGGTGATTCGGCAGCCAGTAGGCAGGATTTACTTTGCAGGCACAGAGACAGCAACACAG
+TGGAGTGGCTACATGGAAGGTGCAGTTGAAGCTGGAGAACGAGCAGCTAGAGAGGTCTTG
+AATGCTCTAGGAAAAGTTGCCAAGAAGGATATATGGGTTCAAGAGCCTGAGTCCAAGGAT
+GTTCCAGCTCTTGAAATTACCCACACCTTCTTAGAGAGGAACCTGCCTTCCGTGCCTGGT
+CTGCTCAAGATCACTGGTTTTTCCACTTCTGTGGCTCTTCTCTGCTTTGTATTGTACAAG
+TTTAAACAGCCCCAGTCCTGA
+>ENSRNOT00000066674_rattusnorvegicus
+ATGACGGATCTGGAGAAGCCCAATCTCGCAGGCCACATGTTCGACGTAGTCGTGATTGGA
+GGCGGCATCTCAGGATTGGCTGCTGCCAAACTGTTGTCTGAATACAAAATTAATGTCTTG
+GTTTTGGAAGCCCGGGATAGAGTTGGAGGAAGAACATATACTGTGAGGAATGAGCATGTC
+AAATGGGTAGATGTTGGTGGAGCCTATGTGGGACCAACCCAGAACAGAATCTTACGCTTG
+TCTAAGGAGCTAGGCATAGAGACCTATAAAGTGAATGTCAATGAGCGTCTAGTTCAATAT
+GTCAAGGGGAAAACTTACCCATTCCGTGGTGCATTCCCACCTGTGTGGAACCCCTTGGCA
+TATTTGGATTACAACAACCTATGGAGAACAATGGATGAAATGGGAAAAGAGATCCCCGTT
+GATGCACCGTGGCAAGCAAGACACGCTCAGGAATGGGACAAGATGACCATGAAAGATCTC
+ATTGATAAAATCTGTTGGACAAAAACTGCTCGGGAATTTGCGTATCTTTTTGTGAACATT
+AATGTGACTTCTGAGCCTCATGAGGTATCTGCCCTGTGGTTCCTGTGGTATGTGAGGCAG
+TGTGGGGGCACTGCTCGGATATTCTCAGTTACCAATGGCGGCCAGGAACGGAAATTTGTA
+GGTGGATCTGGCCAAGTAAGTGAACAGATAATGGGTCTCCTTGGAGATAAAGTGAAGCTG
+AGCTCTCCTGTTACTTATATTGACCAAACAGATGACAACATCATTGTAGAAACACTGAAT
+CATGAACACTATGAGTGCAAATACGTAATTAGTGCCATCCCACCGATTTTGACTGCCAAG
+ATCCACTTTAAACCAGAGCTTCCACCTGAGAGAAACCAATTAATTCAGCGTCTTCCAATG
+GGGGCTGTTATCAAGTGCATGGTGTATTACAAGGAAGCCTTCTGGAAGAAAAAGGACTAT
+TGTGGCTGCATGATCATTGAAGATGAGGAGGCTCCAATCGCCATCACTCTGGATGACACT
+AAACCAGATGGGTCACTGCCTGCCATCATGGGCTTCATACTTGCCCGGAAAGCTGATCGA
+CTTGCTAAACTACATAAAGACATAAGGAAGAGGAAAATCTGTGAGCTGTATGCCAAAGTT
+CTGGGATCTCAAGAAGCATTATATCCAGTCCATTATGAAGAGAAGAACTGGTGTGAGGAG
+CAGTACTCCGGGGGCTGCTACACAGCCTACTTCCCTCCTGGTATCATGACCCAGTATGGA
+AGGGTGATTCGCCAGCCAGTAGGTAGGATTTACTTTGCAGGCACAGAGACAGCAACACAG
+TGGAGTGGCTACATGGAAGGAGCAGTTGAAGCTGGAGAACGAGCAGCTAGAGAGGTGTTG
+AATGCTCTAGGAAAAGTCGCGAAGAAGGATATATGGGTTGAAGAACCCGAGTCCAAGGAT
+GTTCCAGCCATTGAAATTACCCACACCTTCTTAGAGAGGAACCTGCCTTCCGTGCCTGGT
+CTGCTCAAGATCACTGGTGTTTCCACTTCTGTGGCTCTTCTCTGCTTTGTATTGTACAAG
+ATTAAGAAGCTCCCATGCTGA
+>ENSPTRT00000040521_pantroglodytes
+ATGAGCAACAAATGCGACGTGGTCGTGGTGGGGGGCGGCATCTCAGGTAAGGCAGCAGCC
+AAACTTCTGCATGACTCTGGACTGAATGTGGTTGTTCTGGAAGCCCGGGACCGTGTGGGA
+GGCAGGACTTACACTCTTAGGAACCAAAAGGTTAAATATGTGGACCTTGGAGGATCCTAT
+GTTGGACCAACCCAGAATCGTATCTTGAGATTAGCCAAGGAGCTAGGATTGGAGACCTAC
+AAAGTGAATGAGGTTGAGCGTCTGATCCACCATGTAAAGGGCAAATCATACCCCTTCAGG
+GGGCCGTTCCCACCTGTATGGAATCCAATTACCTACTTAGATCATAACAACTTTTGGAGG
+ACAATGGATGACATGGGGCGAGAGATTCCGAGTGATGCCCCATGGAAGGCTCCCCTTGCA
+GAAGAGTGGGACAACATGACAATGAAGGAGCTACTGGACAAGCTCTGCTGGACAGAATCT
+GCAAAGCAGCTTGCCACTCTCTTTGTGAACCTGTGTGTCACTGCAGAGACCCATGAGGTC
+TCTGCTCTCTGGTTCCTGTGGTATGTGAAGCAGTGTGGAGGCACAACAAGAATCATCTCG
+ACAACGAATGGAGGACAGGAGAGGAAATTTGTGGGCGGATCTGGTCAAGTGAGCGAGCGG
+ATAATGGACCTCCTTGGAGACCGAGTGAAGCTGGAGAGGCCTGTGATCTACATTGACCAG
+ACAAGAGAAAATGTCCTTGTGGAGACCCTAAACCATGAGATGTATGAGGCTAAATATGTG
+ATTAGTGCTATTCCTCCTACTCTGGGCATGAAGATTCACTTCAATCCCCCTCTGCCAATG
+ATGAGAAACCAGATGATCACTCGTGTGCCTTTGGGTTCAGTCATCAAGTGTATAGTTTAT
+TATAAAGAGCCTTTCTGGAGGAAAAAGGATTACTGTGGAACCATGATTATTGATGGAGAG
+GAAGCTCCAGTTGCCTACACGTTAGATGATACCAAACCTGAAGGCAACTATGCTGCCATA
+ATGGGATTTATCCTGGCCCACAAAGCCAGAAAACTGGCACGTCTTACCAAAGAGGAAAGG
+TTGAAGAAACTTTGTGAACTCTATGCCAAGGTTCTGGGTTCCCCAGAAGCTCTGGAGCCA
+GTGCATTATGAAGAAAAGAACTGGTGTGAGGAGCAGTACTCTGGGGGCTGCTACACAACT
+TACTTCCCCCCTGGGATCCTGACTCAATATGGAAGGGTTCTACGCCAGCCAGTGGACAGG
+ATTTACTTTGCAGGCACCGAGACTGCCACACACTGGAGCGGCTACATGGAGGGGGCTGTA
+GAGGCCGGGGAGAGAGCAGCCCGAGAGATCCTGCATGCCATGGGGAAGATTCCAGAGGAT
+GAAATCTGGCAGTCAGAACCAGAGTCTGTGGATGTCCCTGCACAGCCCATCACCACGACC
+TTTTTGGAGAGACATTTGCCCTCCGTGCCAGGCCTGCTCAGGCTGATTGGATTGACCACC
+ATCTTTTCAGCAACGGCTCTTGGCTTCCTGGCCCACAAAAGGGGGCTACTTGTGCGAGTC
+TAA
+>ENST00000378069_homosapiens
+ATGAGCAACAAATGCGACGTGGTCGTGGTGGGGGGCGGCATCTCAGGTATGGCAGCAGCC
+AAACTTCTGCATGACTCTGGACTGAATGTGGTTGTTCTGGAAGCCCGGGACCGTGTGGGA
+GGCAGGACTTACACTCTTAGGAACCAAAAGGTTAAATATGTGGACCTTGGAGGATCCTAT
+GTTGGACCAACCCAGAATCGTATCTTGAGATTAGCCAAGGAGCTAGGATTGGAGACCTAC
+AAAGTGAATGAGGTTGAGCGTCTGATCCACCATGTAAAGGGCAAATCATACCCCTTCAGG
+GGGCCATTCCCACCTGTATGGAATCCAATTACCTACTTAGATCATAACAACTTTTGGAGG
+ACAATGGATGACATGGGGCGAGAGATTCCGAGTGATGCCCCATGGAAGGCTCCCCTTGCA
+GAAGAGTGGGACAACATGACAATGAAGGAGCTACTGGACAAGCTCTGCTGGACTGAATCT
+GCAAAGCAGCTTGCCACTCTCTTTGTGAACCTGTGTGTCACTGCAGAGACCCATGAGGTC
+TCTGCTCTCTGGTTCCTGTGGTATGTGAAGCAGTGTGGAGGCACAACAAGAATCATCTCG
+ACAACAAATGGAGGACAGGAGAGGAAATTTGTGGGCGGATCTGGTCAAGTGAGTGAGCGG
+ATAATGGACCTCCTTGGAGACCGAGTGAAGCTGGAGAGGCCTGTGATCTACATTGACCAG
+ACAAGAGAAAATGTCCTTGTGGAGACCCTAAACCATGAGATGTATGAGGCTAAATATGTG
+ATTAGTGCTATTCCTCCTACTCTGGGCATGAAGATTCACTTCAATCCCCCTCTGCCAATG
+ATGAGAAACCAGATGATCACTCGTGTGCCTTTGGGTTCAGTCATCAAGTGTATAGTTTAT
+TATAAAGAGCCTTTCTGGAGGAAAAAGGATTACTGTGGAACCATGATTATTGATGGAGAA
+GAAGCTCCAGTTGCCTACACGTTGGATGATACCAAACCTGAAGGCAACTATGCTGCCATA
+ATGGGATTTATCCTGGCCCACAAAGCCAGAAAACTGGCACGTCTTACCAAAGAGGAAAGG
+TTGAAGAAACTTTGTGAACTCTATGCCAAGGTTCTGGGTTCCCTAGAAGCTCTGGAGCCA
+GTGCATTATGAAGAAAAGAACTGGTGTGAGGAGCAGTACTCTGGGGGCTGCTACACAACT
+TATTTCCCCCCTGGGATCCTGACTCAATATGGAAGGGTTCTACGCCAGCCAGTGGACAGG
+ATTTACTTTGCAGGCACCGAGACTGCCACACACTGGAGCGGCTACATGGAGGGGGCTGTA
+GAGGCCGGGGAGAGAGCAGCCCGAGAGATCCTGCATGCCATGGGGAAGATTCCAGAGGAT
+GAAATCTGGCAGTCAGAACCAGAGTCTGTGGATGTCCCTGCACAGCCCATCACCACCACC
+TTTTTGGAGAGACATTTGCCCTCCGTGCCAGGCCTGCTCAGGCTGATTGGATTGACCACC
+ATCTTTTCAGCAACGGCTCTTGGCTTCCTGGCCCACAAAAGGGGGCTACTTGTGAGAGTC
+TAA
+>ENSRNOT00000044009_rattusnorvegicus
+ATGAGCAACAAATGCGATGTGATCGTGGTGGGGGGCGGCATCTCAGGTATGGCAGCAGCC
+AAACTTTTGCATGACTGTGGCCTCAGTGTGGTGGTTCTGGAAGCACGAGACCGTGTGGGA
+GGCAGGACTTACACAATTAGGAATAAAAATGTTAAATATGTGGACCTTGGAGGATCTTAT
+GTTGGGCCGACCCAGAATCGTATCTTACGATTGGCCAAAGAGCTAGGATTGGAGACCTAT
+AAAGTGAATGAAGTTGAGCGGCTGATCCACTTTGTAAAGGGAAAATCATATGCCTTCAGG
+GGCCCATTCCCACCAGTGTGGAATCCAATCACTTACCTAGATTATAACAACCTCTGGAGA
+ACAATGGATGAGATGGGCCAAGAGATTCCCAGTGATGCTCCATGGAAGGCACCCCTTGCT
+GAAGAGTGGGACTACATGACAATGAAAGAGTTGCTAGATAAGATCTGCTGGACCAACTCT
+ACAAAGCAGATTGCCACACTCTTTGTGAACCTATGTGTAACTGCGGAGACCCATGAGGTT
+TCTGCACTGTGGTTCCTGTGGTATGTGAAGCAGTGTGGGGGTACAACCAGAATCATATCA
+ACAACCAATGGAGGACAGGAGAGGAAATTTATTGGTGGATCTGGTCAAGTGAGTGAGCGG
+ATAAAGGATATCCTTGGGGACAGAGTGAAGCTGGAGAGGCCGGTGATCCACATTGACCAG
+ACAGGAGAAAATGTTGTTGTGAAAACCCTAAACCATGAAATATATGAGGCTAAATATGTG
+ATTAGTGCCATCCCACCTGTTTTGGGCATGAAGATTCACCATAGTCCTCCTCTGCCCATT
+CTAAGAAACCAGCTGATTACTCGTGTGCCTTTGGGTTCAGTTATTAAGTGCATGGTTTAT
+TATAAAGAACCCTTCTGGAGGAAAAAGGATTTCTGTGGAACCATGGTTATTGAAGGAGAG
+GAAGCTCCAATTGCGTACACATTGGATGATACCAAGCCAGATGGCAGCTGTGCTGCTATA
+ATGGGATTTATCCTTGCTCACAAAGCTAGAAAACTGGTACGCCTTACTAAAGAAGAAAGA
+CTGAGGAAGCTCTGTGAGCTATACGCGAAAGTTCTGAACTCTCAAGAAGCTCTGCAGCCA
+GTCCATTATGAAGAGAAGAACTGGTGTGAGGAGCAGTACTCCGGGGGCTGCTACACAGCC
+TACTTCCCTCCTGGCATCTTGACCCAGTATGGAAGGGTTCTACGCCAGCCAGTGGGCAAG
+ATTTTCTTTGCAGGCACCGAGACAGCTTCACATTGGAGTGGCTACATGGAGGGGGCTGTA
+GAGGCTGGAGAGAGAGCTGCCAGAGAGATTCTTCATGCCATTGGGAAGATTCCAGAGGAT
+GAAATTTGGCAGCCAGAACCAGAATCTGTGGATGTCCCAGCAAGACCCATTACCAACACC
+TTCCTGGAGAGACACTTGCCTTCTGTACCAGGTCTACTAAAGCTGCTTGGATTGACCACC
+ATCTTGTCAGCAACAGCTCTTGGTTTCCTGGCCCACAAAAAGGGTCTGTTTGTACGTTTC
+TAA
+>ENSMUST00000040820_musmusculus
+ATGAGCAACAAAAGCGATGTGATCGTGGTGGGGGGCGGCATCTCAGGTATGGCGGCAGCC
+AAACTTCTGCATGATTGTGGCCTCAGTGTGGTGGTTCTGGAAGCACGGGACCGTGTAGGA
+GGCAGGACTTACACAATTAGGAATAAAAACGTTAAATATGTGGACCTTGGAGGATCTTAT
+GTTGGGCCAACCCAGAATCGTATCTTACGATTGGCCAAAGAGCTAGGATTGGAGACCTAT
+AAAGTTAATGAAGTTGAGCGGCTGATACACTTTGTAAAGGGAAAATCATATGCCTTCAGG
+GGCCCATTTCCACCAGTATGGAATCCTATCACCTACCTAGATAATAACAACCTCTGGAGG
+ACAATGGATGAGATGGGCCAAGAGATTCCCAGTGATGCTCCATGGAAAGCACCCCTTGCT
+GAAGAGTGGGACTACATGACAATGAAAGAATTGCTAGATAAGATCTGCTGGACCAAATCT
+ACAAAGCAGATTGCCACGCTCTTTGTGAACCTGTGTGTAACTGCAGAGACCCATGAGGTC
+TCTGCACTATGGTTCCTGTGGTATGTGAAGCAGTGTGGAGGTACAACCAGAATCATCTCA
+ACAACCAATGGAGGACAGGAGAGGAAATTTATTGGTGGATCTGGTCAAGTGAGTGAACGG
+ATAAAGGATATACTTGGGGACCGAGTGAAGCTGGAGAGGCCTGTGATCCACATTGACCAG
+ACAGGGGAAAATGTTATTGTGAAAACCCTAAACCATGAAATATATGAGGCTAAATATGTG
+ATTAGTGCCATTCCACCTGCTTTGGGCATGAAGATTCACTATAGTCCTCCTCTGCCCATG
+CTAAGAAACCAGCTGATCTCTCGTGTGCCTTTGGGTTCAGTTATTAAATGCATGGTTTAT
+TACAAAGAGCCCTTCTGGAGGAAAAAGGATTTCTGTGGAACCATGGTTATCGAAGGAGAG
+GAAGCTCCAATTGCATACACATTGGATGATACCAAACCAGATGGCACCTATGCTGCTATA
+ATGGGATTTATCCTTGCTCACAAAGCTAGAAAACTGGTACGTCTCACCAAAGAAGAAAGA
+CTGAGGAAACTTTGTGAGCTATATGCAAAAGTGCTGAACTCCCAAGAAGCTCTGCAGCCC
+GTCCATTATGAAGAGAAGAACTGGTGTGAGGAACAGTATTCTGGGGGCTGCTACACAACC
+TACTTCCCTCCCGGCATCTTGACCCAGTATGGAAGGGTTCTACGTCAGCCAGTGGGCAAG
+ATTTTCTTTGCAGGCACTGAAACAGCCTCACACTGGAGCGGCTACATGGAGGGGGCTGTG
+GAGGCTGGGGAGAGAGCAGCCAGAGAGATTCTTCATGCCATTGGGAAGATTCCAGAAGAT
+GAAATTTGGCAGCCAGAACCAGAATCTTTGGATGTCCCTGCACGACCCATTACCAGTACC
+TTCCTGGAGAGACACCTGCCTTCTGTACCAGGCCTGCTAAAGCTGTTTGGATTGACCACC
+ATCTTGTCAGCAACAGCTCTTGGTTTCCTGGCCCACAAAAGGGGCCTGTTTGTACATTTT
+TAA
+>ENSMUST00000168613_musmusculus
+ATGAGCAACAAAAGCGATGTGATCGTGGTGGGGGGCGGCATCTCAGGTATGGCGGCAGCC
+AAACTTCTGCATGATTGTGGCCTCAGTGTGGTGGTTCTGGAAGCACGGGACCGTGTAGGA
+GGCAGGACTTACACAATTAGGAATAAAAACGTTAAATATGTGGACCTTGGAGGATCTTAT
+GTTGGGCCAACCCAGAATCGTATCTTACGATTGGCCAAAGAGCTAGGATTGGAGACCTAT
+AAAGTTAATGAAGTTGAGCGGCTGATACACTTTGTAAAGGGAAAATCATATGCCTTCAGG
+GGCCCATTTCCACCAGTATGGAATCCTATCACCTACCTAGATAATAACAACCTCTGGAGG
+ACAATGGATGAGATGGGCCAAGAGATTCCCAGTGATGCTCCATGGAAAGCACCCCTTGCT
+GAAGAGTGGGACTACATGACAATGAAAGAATTGCTAGATAAGATCTGCTGGACCAAATCT
+ACAAAGCAGATTGCCACGCTCTTTGTGAACCTGTGTGTAACTGCAGAGACCCATGAGGTC
+TCTGCACTATGGTTCCTGTGGTATGTGAAGCAGTGTGGAGGTACAACCAGAATCATCTCA
+ACAACCAATGGAGGACAGGGGAAAATGTTATTGTGA
+>ENSMUST00000163344_musmusculus
+ATGAGCAACAAAAGCGATGTGATCGTGGTGGGGGGCGGCATCTCAGGTATGGCGGCAGCC
+AAACTTCTGCATGATTGTGGCCTCAGTGTGGTGGTTCTGGAAGCACGGGACCGTGTAGGA
+GGCAGGACTTACACAATTAGGAATAAAAACGTTAAATATGTGGACCTTGGAGGATCTTAT
+GTTGGGCCAACCCAGAATCGTATCTTACGATTGGCCAAAGAGCTAGGATTGGAGACCTAT
+AAAGTTAATGAAGTTGAGCGGCTGATACACTTTGTAAAGATCTACAAAGCAGATTGCCAC
+GCTCTTTGTGAACCTGTGTGTAACTGCAGAGACCCATGA
+>ENSMUST00000173143_musmusculus
+ATGAGCAACAAAAGCGATGTGATCGTGGTGGGGGGCGGCATCTCAGAAAAACCTGCTAAT
+TCTAGTCAGTTTACAAGCTCATTGTGGAGGAGAATTGAAAAACTGTGA
+>ENSSSCT00000033745_susscrofa
+ATGGCAGCGGCCAAACTTCTGCATGACTCTGGCCTGAGTGTGATTGTTCTGGAAGCCCGG
+GACCGCGTGGGAGGCAGGACTTACACCGTCAGGAACCAACAAGTTAAATATGTGGACCTT
+GGAGGATCTTATGTTGGGCCAACTCAGAATCGCATCTTAAGATTGTCCAAGGAGCTAGGA
+TTGGAGACCTACAAAGTGAATGAAGTGGAGCGTCTGATTCACTATGTAAAGGGCAAATCC
+TACCCCTTCAGGGGCCCATTACCACCTGTGAGGAATCCGATTACCTTCCTAGATCTTAAC
+AACCTTTGGAGGACGGTGGATGACATGGGACGAGAGATTCCCAGTGATGCCCCATGGAAG
+GCGCCCCTTGCAGAACAGTGGGACCAGATGACAATGAAGGAGCTGTTGGACAAGCTCTGC
+TGGACTGAATCTTCGAAGCAGCTGGCCACCCTTTTTGTGAACCTGTGTGTCACCGCGGAG
+ACCCATGAGGTCTCTGCTCTCTGGTTCCTGTGGTATGTGAAGCAGTGTGGAGGCACCACC
+AGGATCATCTCAACAACTAACGGAGGGCAGGAGAGGAAATTTGTGGGCGGATCTGGTCAA
+GTGACCGAGCGGATAAAGGACCTCCTTGGAGACCGAGTGAAGCTGGAGAGGCCTGTGGTC
+CACATTGACCAGACAGGAGAAAATGTCCTCGTGGAGACCCTAAACCACGAGGTGTACGAG
+GCTAAGTATGTGATTAGCGCCATTCCTCCTGTCCTGGGCATGAAGATTCATTTCAGTCCC
+CCTCTGCCAATGATGAGAAACCAGCTCATCACTCGTGTACCTCTGGGCTCTGTCATCAAG
+TGTATAGTTTATTACAAAGAGCCCTTCTGGAGGCATAAGGATTACTGTGGAAGCATGATT
+ATTGAAGGAGAGGAAGCTCCAATCGCCTACACGTTGGATGATTCCAAGCCTGATGGCAGC
+TGTGCCGCCATCATAGGATTTATCCTTGCCCACAAAGCCAGAAAACTGGCCCGTCTTACC
+AAAGAAGAAAGGCTGAAGAAACTTTGCGACCTCTATGCAAAAGTTCTGGGTTCAAAAGAA
+GCTTTGAACCCCGTGCACTATGAAGAGAAGAACTGGTGCGAGGAGCAGTACTCGGCGGGC
+TGCTACACGACCTACTTCCCCCCTGGGATCATGACTCAGTATGGAAGGGTTCTACGCCAG
+CCAGTCGGCAGGATTTATTTCGCCGGCACGGAGACTGCCACGCACTGGAGTGGCTACATG
+GAGGGGGCCGTGGAGGCCGGAGAGAGAGCGGCCCGAGAGATCCTGCATGCTATGGGAAAG
+ATCCCAGAAGATGAAATCTGGCAGTCTGAACCAGAGTCCGTGGATGTGCCTGCGAAGCCC
+ATTACCACGACCTTCTTGGAGAGACACTTGCCCTCGGTGCCCGGCCTGCTGAGGCTGATT
+GGATTGACCGCCATCTTTTCAGCCACTGCTCTCGGCTACCTGGCCCACAAAAGGGGGCTA
+CTCGTGCGGGTCTGA
+>ENSSSCT00000023183_susscrofa
+ATGGCAGCGGCCAAACTTCTGCATGACTCTGGCCTGAGTGTGATTGTTCTGGAAGCCCGG
+GACCGCGTGGGAGGCAGGACTTACACCGTCAGGAACCAACAAGTTAAATATGTGGACCTT
+GGAGGATCTTATGTTGGGCCAACTCAGAATCGCATCTTAAGATTGTCCAAGGAGCTAGGA
+TTGGAGACCTACAAAGTGAATGAAGTGGAGCGTCTGATTCACTATATCAAAGGCAAATCC
+TACCCCTTCAGGGGCCCATTACCACCTGTGAGGAATCCGATTACCTTCCTAGATCTTAAC
+AACCTTTGGAGGACGGTGGATGACATGGGACGAGAGATTCCCAGTGATGCCCCATGGAAG
+GCGCCCCTTGCAGAACAGTGGGACCAGATGACAATGAAGGAGCTGTTGGACAAGCTCTGC
+TGGACTGAATCTTCGAAGCAGCTGGCCACCCTTTTTGTGAACCTGTGTGTCACCGCGGAG
+ACCCATGAGGTCTCTGCTCTCTGGTTCCTGTGGTATGTGAAGCAGTGTGGAGGCACCACC
+AGGATCATCTCAACAACTAACGGAGGGCAGGAGAGGAAATTTGTGGGCGGATCTGGTCAA
+GTGACCGAGCGGATAAAGGACCTCCTTGGAGACCGAGTGAAGCTGGAGAGGCCTGTGGTC
+CACATTGACCAGACAGGAGAAAATGTCCTCGTGGAGACCCTAAACCACGAGGTGTACGAG
+GCTAAGTATGTGATTAGCGCCATTCCTCCTGTCCTGGGCATGAAGATTCATTTCAGTCCC
+CCTCTGCCAATGATGAGAAACCAGCTCATCACTCGTGTACCTCTGGGCTCTGTCATCAAG
+TGTATAGTTTATTACAAAGAGCCCTTCTGGAGGCATAAGGATTACTGTGGAAGCATGATT
+ATTGAAGGAGAGGAAGCTCCAATCGCCTACACGTTGGATGATTCCAAGCCTGATGGCAGC
+TGTGCCGCCATCATAGGATTTATCCTTGCCCACAAAGCCAGAAAACTGGCCCGTCTTACC
+AAAGAAGAAAGGCTGAAGAAACTTTGCGACCTCTATGCAAAAGTTCTGGGTTCAAAAGAA
+GCTTTGAACCCCGTGCACTATGAAGAGAAGAACTGGTGCGAGGAGCAGTACTCGGCGGGC
+TGCTACACGACCTACTTCCCCCCTGGGATCATGACTCAGTATGGAAGGGTTCTACGCCAG
+CCAGTCGGCAGGATTTATTTCGCCGGCACGGAGACTGCCACGCACTGGAGTGGCTACATG
+GAGGGGGCCGTGGAGGCCGGAGAGAGAGCGGCCCGAGAGATCCTGCATGCTATGGGAAAG
+ATCCCAGAAGATGAAATCTGGCAGTCTGAACCAGAGTCCGTGGATGTGCCTGCGAAGCCC
+ATTACCACGACCTTCTTGGAGAGACACTTGCCCTCGGTGCCCGGCCTGCTGAGGCTGATT
+GGATTGACCGCCATCTTTTCAGCCACTGCTCTCGGCTACCTGGCCCACAAAAGGGGGCTA
+CTCGTGCGGGTCTGA
+>ENSCAFT00000022963_canisfamiliaris
+ATGAGCGGCAAGTGCGACGTGGTCATGGTGGGGGGCGGCATCTCAGGCATGGCAGCAGCC
+AAACTTCTGCATGATTTTGGCCTGAACGTGGTTGTTCTGGAGGCCCGGGACCGAGTGGGA
+GGCAGGACTTACACCATCAGGAACCAAAAGGTTAAATATTTGGACCTTGGAGGATCTTAT
+GTTGGGCCAACTCAGAATTGTATCTTAAGGTTAGCCAAGGAGCTAGGATTGGAGACCTAC
+AAAGTGAATGAAGTAGAGCGTCTCATCCATCATGTAAAGGGCAAATCGTACCCCTTCAGG
+GGCCCCTTCCCACCTGTATGGAACCCAATTGCATACCTAGATCATAACAACCTCTGGAGG
+ACGATGGACGACATGGGGCGAGAGATTCCCAGTGATGCCCCATGGAAGGCACCTCTTGCG
+GAGGAGTGGGACCACATGACAATGAAGGAGCTTCTGGACAAGATCTGCTGGACAGAATCT
+GCCAAGCAACTTGCTACTCTCTTTGTGAATCTGTGTGTCACTGCAGAGACCCATGAGGTC
+TCTGCTCTCTGGTTCCTGTGGTATGTGAAGCAGTGTGGAGGCACGACCAGGATCATCTCA
+ACAACCAATGGAGGGCAGGAGAGAAAATTTGTGGGCGGATCTGGTCAAGTGAGTGAACGG
+ATAATGGACCTCCTTGGAGACCAAGTGAAGCTGGAGAGGCCTGTGACCCACATTGACCAG
+ACAGGAGAAAATGTCCTTGTGGAGACCCTAAACCATGAGGTGTATGAGGCTAAGTATGTG
+ATTAGTGCCATTCCTCCTACTCTGGGCATGAAGATTCATTTCAACCCCCCTCTGCCAATG
+ATGAGAAACCAGCTGATCACTCGTGTGCCTTTGGGCTCAGTCATCAAGTGCATAGTTTAT
+TATAAAGAGCCCTTCTGGAGGAAAAAGGATTACTGTGGAACCATGATTATCGAAGGAGAG
+GAAGCTCCAATTGCTTACACGTTGGATGATACCAAACCTGATGGCAACTATGCCGCCATA
+ATGGGATTTATCCTTGCCCACAAAGCCAGAAAACTGGCACGTCTTACCAAAGATGAAAGG
+ATGAAGAAACTTTGTGAGCTCTATGCAAAAGTCCTGGGTTCCCAAGAAGCTTTGCAGCCC
+GTACACTACGAAGAGAAGAACTGGTGCGAGGAGCAGTACTCCGGGGGCTGCTACACCACC
+TACTTTCCCCCTGGGATCATGACTCAATATGGAAGGGTTCTACGACAGCCTGTGGGCAGG
+ATTTATTTTGCAGGCACGGAGACTGCCACCCACTGGAGTGGCTACATGGAGGGCGCTGTG
+GAGGCTGGAGAGAGAGCGGCCCGAGAGATCCTGCATGCCATGGGGAAGATCCCAGAGGAT
+GAAATCTGGCAGTCAGAACCAGAATCAGTGGATGTCCCTGCGCAGCCCATCACCACGACC
+TTCTTGGAGAGACATTTGCCCTCTGTGCCAGGCCTGCTGAGGCTGATCGGATTGACCGCC
+ATCTTTTCTGCAACTGCTCTTGGCGTCCTGGCACACAAAAGGGGTCTGCTTGTGCGGGTC
+TAA
+>ENSPTRT00000034846_pantroglodytes
+ATGGACCCGGAATGCGCCCAGCTGCTCCCGGCTCTCTGTGCTGTTCTGGTAGATCCCAGG
+CAGCCGGTGGCAGATGACACCTGTTTGGAGAAGCTCCTGGACTGGTTTAAAACGGTCACT
+GAAGGAGAGTCCAGTGTCGTGCTGCTGCAGGAGCACCCCTGCCTGGTGGAGCTGCTGTCC
+CATGTGCTGAAAGTCCAGGACCTGAGTTCTGGGGTCCTCTCCTTCTCACTCCGCCTGGCA
+GGAACCTTCGCAGCCCAGGAAAACTGCTTCCAGTATCTTCAGCAGGGGGAGTTACTACCA
+GGGCTCTTTGGGGAGGCAGGACCCCTCGGCCGAGCAGCCTGGGCCGTCCCCACCGTGCGC
+AGCGGCTGGATCCAGGGCCTGCGCTCCCTGGCACAGCACCCCAGCGCCCTGCGCTTCCTG
+GCCGACCACGGTGCGGTCGACACCATCTTCTCCCTTCAGGGAGACTCCAGCCTGTTTGTG
+GCCTCGGCGGCCAGTCAGCTCCTGGTACACGTCCTGGCTTTGTCCATGCAAGGTGGAGCC
+GAGGGACAGCCCTGCCTGCCGGGGGGTGACTGGCCCGCGTGTGCCCAGAGGATCATGGAT
+CACGTTGAAGAGTCCTTGTGCTCCGCGGCCACCCCCAAGGTCACTCAGGCCCTGAACGTC
+CTGACCACAACCTTCGGGCGCTGCCAGAGCCCCTGGACGGAAGCCCTGTGGGTGCGGCTG
+AGTCCCCGCGTGGCGTGTCTGCTGGAGAGAGACCCCATCCCCGCCGCACACTCGTTCGTG
+GACCTGCTTCTCTGTGTGGCTCGTTCTCCCGTGTTCAGTTCTTCCGACGGCAGCCTGTGG
+GAGACAGTGGCGCGGGCTCTGAGCTGCCTGGGTCCCACCCACATGGGACCCCTGGCTTTG
+GGGATCCTGAAGCTCGAGCACTGTCCACAGGCACTGAGGACCCAGGCCTTCCAGGTCCTT
+CTCCAGCCCCTGGCCTGTGTCCTGAAGGCCACGGTTCAGGCCCCCGGACCCCCAGGCTTG
+CTGGACGGGACGGCAGACGATGCCACGACGGTGGACACACTCCTGGCCTCCAAGTCGTCC
+TGCGCGGGCCTCCTGTGCCGCACCCTGGCTCACCTGGAGGAGCTGCAGCCGCTGCCCCAG
+CGCCCTTCACCGTGGCCCCAGGCGTCTCTACTGGGGGCTACAGTGACTGTCCTGCGGCTC
+TGTGACGGCTCAGCTGCCCCTGCCTCCAGTGTGGGGGGCCACCTCTGTGGGACCCTGGCG
+GGCTGCGTCCGGGTCCAGCGAGCAGCCCTCGACTTCCTGGGGACACTGTCACAGGGGACA
+GGCCCCCAGGAGCTGGTGACGCAGGCGCTTGCTGTCCTCCTGGAGTGCCTCGAGAGCCCC
+GGCTCCAGCCCCACGGTTCTGAAGAAGGCCTTCCAGGCCACGCTCAGGTGGCTCCTGAGC
+TCACCCAAGACCCCCGGCTGCTCTGATCTCGGCCCCCTCATCCCGCAGTTCCTCAGAGAG
+CTGTTCCCTGTGCTGCAGAAACGCCTGTGCCACCCCTGCTGGGAGGTGAGGGACTCCGCC
+CTCGAGTTCCTGACCCAGCTGAGCAGGCACTGGGGAGGACAGGCCGACTTCAGATGCGCA
+CTCTTGGCTTCAGAGGTGCCTGAGCTGGCCCTGCAGCTCCTCCAGGACCCTGAGAGTTAT
+GTCCGAGCGAGCGCGGTGACCGCCATGGGGCAGCTGTCCAGCCAGGGCCTGCACGCCCCC
+ACCAGCCCTGAGCATGCAGAGGCCCGGCAGAGCCTGTTCCCGGAGCTCCTGCACATCCTC
+TCCGTAGACTCGGAGGGCTTCCCACGGCGGGCGGTCATGCAAGTCTTCACTGAGTGGCTG
+CGGGACGGCCACGCCGACGCGGCCCGGGACACGGAGCAGTTCGTGGCCACTGTGCTGCAG
+GTGGCGAGCCGGGACCTGGACTGGGAGGTCCGCGCCCAGGGCCTGGAGCTGGCCCTCGTG
+TTCCTGGGCCAGACTTTGGGGCCGCCGCGTACCCACTGCCCCTATGCCGTGGCCCTACCC
+GAGGTGGCCCCAGCCCAGCCACTCACCGAGGCACTGAGGGCTCTCTGCCACGTGGGGCTC
+TTTGACTTCGCCTTTTGTGCCTTGTTTGACTGCGACCGCCCTGTGGCGCAGAAGTCTTGT
+GACCTCCTTCTCTTCCTGAGGGACAAGATTGCTTCCTACAGCAGCCTGCGGGAGGCCAGG
+GGCGGCCCCAACACTGCCTCCGCAGAGGCCACCCTGCCGAGGTGGCGGGCGGGTGAGCAG
+GCCCAGCCCCCAGGGGACCAGGAGCCTGAGGCTGTGCTGGCCATGCTCAGGTCCCTAGAC
+CTGGAGGGCCTGCGGAGCACACTGGCCGAGAGCAGCGACCACGTGGAGAAGAGTCCCCAG
+TCCCTCCTGCAGGACATGCTGGCCACGGGAGGCTTCCTGCAGGGGGATGAGGCCGACTGC
+TACTGA
+>ENST00000340611_homosapiens
+ATGGACCCAGAATGCGCCCAGCTGCTCCCGGCTCTCTGTGCTGTTCTGGTAGATCCCAGG
+CAGCCGGTGGCAGATGACACCTGTTTGGAGAAGCTCCTGGACTGGTTTAAAACGGTCACT
+GAAGGAGAGTCCAGTGTCGTGCTGCTGCAGGAGCACCCCTGCCTGGTGGAGCTGCTGTCC
+CATGTGCTGAAAGTCCAGGACCTGAGTTCTGGGGTCCTCTCCTTCTCACTGCGCCTGGCA
+GGAACCTTCGCAGCCCAGGAAAACTGCTTCCAGTATCTTCAGCAGGGGGAGTTACTACCA
+GGGCTCTTTGGGGAGCCAGGACCCCTCGGCCGAGCAACCTGGGCCGTCCCCACCGTGCGC
+AGCGGCTGGATCCAGGGCCTGCGCTCCCTGGCACAGCACCCCAGCGCCCTGCGCTTCCTG
+GCCGACCATGGTGCGGTCGACACCATCTTCTCCCTGCAGGGAGACTCCAGCCTGTTTGTG
+GCCTCGGCGGCCAGTCAGCTCCTGGTGCACGTCCTGGCTTTGTCCATGCGAGGTGGAGCC
+GAGGGGCAGCCCTGCCTGCCGGGGGGTGACTGGCCCGCGTGTGCCCAGAAGATCATGGAT
+CACGTTGAAGAGTCCTTGTGCTCCGCGGCCACCCCCAAGGTCACTCAGGCCCTGAACGTC
+CTGACCACGACCTTCGGGCGCTGCCAGAGCCCCTGGACGGAAGCCCTGTGGGTGCGGCTG
+AGTCCCCGCGTGGCCTGTCTGCTGGAGAGAGACCCCATCCCCGCCGCACACTCGTTCGTG
+GACCTGCTTCTCTGTGTGGCTCGTTCTCCCGTGTTCAGTTCTTCCGACGGCAGCCTGTGG
+GAGACAGTGGCGCGGGCTCTGAGCTGCCTGGGTCCCACCCACATGGGACCCCTGGCTTTG
+GGGATCCTGAAGCTCGAGCACTGTCCACAGGCACTGAGGACCCAGGCCTTCCAGGTCCTT
+CTCCAGCCCCTGGCCTGTGTCCTGAAGGCCACGGTTCAGGCCCCCGGACCCCCAGGCTTG
+CTGGACGGGACGGCAGACGATGCCACGACGGTGGACACACTCCTGGCCTCCAAGTCGTCC
+TGCGCCGGCCTCCTGTGCCGCACCCTGGCTCACCTGGAGGAGCTGCAGCCGCTGCCCCAG
+CGCCCTTCACCGTGGCCCCAGGCGTCTCTACTGGGGGCTACAGTGACTGTCCTGCGGCTC
+TGTGACGGCTCGGCTGCCCCTGCCTCCAGTGTGGGGGGCCACCTCTGTGGGACCCTGGCG
+GGCTGCGTCCGGGTCCAGCGAGCAGCCCTCGACTTCCTGGGGACGCTGTCACAGGGGACA
+GGCCCCCAGGAGCTGGTGACGCAGGCGCTTGCTGTCCTCCTGGAGTGCCTCGAGAGCCCC
+GGCTCCAGCCCCACGGTTCTGAAGAAGGCCTTCCAGGCCACGCTCAGGTGGCTCCTGAGC
+TCACCCAAGACCCCCGGCTGCTCTGATCTCGGCCCCCTCATCCCGCAGTTCCTCAGAGAG
+CTGTTCCCTGTGCTGCAGAAACGCCTGTGCCACCCCTGCTGGGAGGTGAGGGACTCCGCC
+CTCGAGTTCCTGACCCAGCTGAGCAGGCACTGGGGAGGACAGGCTGACTTCAGATGCGCA
+CTCTTGGCTTCAGAGGTGCCTCAGCTGGCCCTGCAGCTCCTCCAGGACCCTGAGAGTTAT
+GTCCGAGCGAGTGCAGTGACCGCCATGGGGCAGCTGTCCAGCCAGGGCCTGCACGCCCCC
+ACCAGCCCTGAGCATGCAGAGGCCCGGCAGAGCCTGTTCCTGGAGCTCCTGCACATCCTC
+TCCGTAGACTCGGAGGGCTTCCCACGGCGGGCGGTCATGCAAGTCTTCACTGAGTGGCTG
+CGGGACGGCCACGCCGACGCGGCCCAGGACACGGAGCAGTTCGTGGCCACTGTGCTGCAG
+GCGGCGAGCCGAGACCTGGACTGGGAGGTCCGCGCCCAGGGCCTGGAGCTGGCCCTCGTG
+TTCCTGGGCCAGACTTTGGGGCCGCCGCGTACCCACTGCCCCTATGCCGTGGCCCTACCC
+GAGGTGGCCCCAGCCCAGCCACTCACCGAGGCACTGAGGGCTCTCTGCCACGTGGGGCTC
+TTTGACTTCGCCTTTTGTGCCTTGTTTGACTGCGACCGCCCTGTGGCGCAGAAGTCTTGT
+GACCTCCTTCTCTTCCTGAGGGACAAGATTGCTTCCTACAGCAGCCTGCGGGAGGCCAGG
+GGCAGCCCCAACACTGCCTCCGCAGAGGCCACCCTGCCGAGGTGGCGGGCGGGTGAGCAG
+GCCCAGCCCCCAGGGGACCAGGAGCCTGAGGCTGTGCTGGCCATGCTCAGGTCCCTAGAC
+CTGGAGGGCCTGCGGAGCACGCTGGCCGAGAGCAGCGACCACGTGGAAAAGAGTCCCCAG
+TCCCTCCTGCAGGACATGCTGGCCACGGGAGGCTTCCTGCAGGGGGACGAGGCCGACTGC
+TACTGA
+>ENST00000421712_homosapiens
+ATGGACCCAGAATGCGCCCAGCTGCTCCCGGCTCTCTGTGCTGTTCTGGTAGATCCCAGG
+CAGCCGGTGGCAGATGACACCTGTTTGGAGAAGCTCCTGGACTGGTTTAAAACGGTCACT
+GAAGGAGAGTCCAGTGTCGTGCTGCTGCAGGAGCACCCCTGCCTGGTGGAGCTGCTGTCC
+CATGTGCTGAAAGTCCAGGACCTGAGTTCTGGGGTCCTCTCCTTCTCACTGCGCCTGGCA
+GGAACCTTCGCAGCCCAGGAAAACTGCTTCCAGTATCTTCAGGTGCGGTCGACACCATCT
+TCTCCCTGCAGGGAGACTCCAGCCTGTTTGTGGCCTCGGCGGCCAGTCAGCTCCTGGTGC
+ACGTCCTGGCTTTGTCCATGCGAGGTGGAGCCGAGGGGCAGCCCTGCCTGCCGGGGGGTG
+ACTGGCCCGCGTGTGCCCAGAAGATCATGGATCACGTTGAAGAGTCCTTGTGCTCCGCGG
+CCACCCCCAAGGTCACTCAGGCCCTGA
+>ENSRNOT00000064726_rattusnorvegicus
+ATGGACGCAGAATGCTCCAGGCTCCTCCCGGCTCTCTGTGCTGTTTTGGCAGATCCTAGA
+CAGCTGGTGGCAGATGACACCTGCTTGGAGAAACTACTGGACTGGTTTAAAACAGTGACA
+GAGGCAGAGCCCAGCCTCCAACTACTGCAGGACCACCCCTGCCTAATGGAGCTCCTGTCC
+CATGTGCTGAAGCCACAGGATGTGAGCCCTAGGGTCCTCTCCTTTGCTCTGCGCCTCGTT
+GGGGTCTTTGCGGCCCAGGAGGACTGTTTCCAGTACCTTCAGCAGGGGGAGTTGTTGCTG
+GGGCTCTTTGGGGAGACAGGTGCCCTTAGCTGGGCAGCCTGGAGCATCCCCAGTGTGCGC
+AGCGGCTGGATCCAGGGCCTGTGCTCCCTGGCACACCACCCCAGTGCCCTGCACTTCCTG
+GCTGACAGTGGTGCTGTGGACACGATCTTCTCCTTGCAAGGAGACCCCAGCCTGTTTGTA
+GCCTCAGCAGCCAGCCAGCTCCTAGTACACATCCTGGCTCTGTCAATGCAAGGCGGAGCT
+CCAGGGTCCCCCGTCCCTGAAGCCGTTGCCTGGCCTGTCTGTGCCCAGAAGATCATGAAC
+CATGTAGAAGAGTCCTTGCATTCCAAAGCCACCCCACAGGTCACACAGGCCTTGAATGTC
+CTGACGACGACCTTCGGGCGCTGCCACAACCCCTGGACAGGGGTCCTCTGGGAGCGGCTA
+AGTCCCCCTGTTGCCCGCCTGTTTGAGAGAGACCCCATTCCTGCCACACACTCGCTCATG
+GACCTGCTTCTCAGTGTGGCCAGGTCTCCTGTGTTGAACTTTGCAGCCTGTGGCCTGTGG
+GAGATGCTGGCCCAGACTCTGAGCCGCCTGAGCCCCACCCAAGCTGGGCCTCTAGCTCTG
+GGGACCCTGAAACTTCAGCATTGTCCCCAGGAACTGAGGACCCAGGCCTTTAGAGTCCTC
+CTTCAGCCACTGGCCTGCATCCTGAAAGCTACCACTCAGGCCCCTGGACCTCCAGGCTTG
+CTGGACGGGACTGCGGGTAGCTTGCTGACTGTGGATGCACTCTTATCTTCAAAGTCGGCC
+TGTGTGGGGCTCCTCTGCCAGACTCTGGCGCACCTGGAGGAGCTGCAGATGCTGCCCCAG
+TGCCCCTCACCGTGGCCACAGGTGCCTCTGCTGCAAGCTGCTGTGACGATATTGCGTCTC
+TCTGACGGCTCGGCGGACCCCAGTTCCAGTGCAGGAGGCCGTCTCTGTGGGGCGCTGGGT
+GGCTGTGTTCGTGTCCAGCGAGCAGCCCTTGACTTCTTGGGGACGCTGTCTCTGGGGACA
+AGCCCCCTGGAATTGGTGCTGGAGGTATTTGCTGTCCTCCTGAAGACCCTGGAGAGCCCA
+GAGTCCAGCCCCATGGTCCTAAAGAAGGCCTTCCAGGCCACACTCAGATGGCTCCAGAGC
+CCACACAAGACCCCCAGCGGCTCTGATCTCAGCCCCGATGCCTTGCTGTTCCTCGGAGAG
+CTATTCCCCATACTACAGAAGCGCCTGTGCAGCCCGTGTTGGGAGGTGAGGGACTCAGCC
+CTGGAGTTCCTGACGCATCTGATCCGGGACTGGGGAGGGCAGGCTGACTTCAGAGAGGCA
+CTGCATTCTTCAGAAGTACCCACACTTGCCCGCCAGCTCCTCCAAGACCCTGAGAGTTAT
+GTCCGAGCAAGTGCAGTGGGTGCCGCTGGGCAGCTCTCCAGCCAGGGCCTTCAGGCCACT
+CCCGCCAACCAGCAGGGCCTACTCATGGACCTCATGCATATCCTGTCCACGGACTCAGAG
+GGCTTCCCTCGAAGAGCTGTGTTACGGGTCTTTACTGAATGGCTGAGGGATGGCCATGCT
+GATGTGGTTCGAGACACAGAGTGGTTCGTGGCCACTGTTCTCCAGGCAGTGAGCCGGGAT
+CTGGACTGGGAGGTCCGAGTGCAGGGCTTGGAGCTGGCACAGGTATTCCTCATCCAGGCA
+ATGGGGCAGCCTAGACTCCACTGTCCCTATACAGTAGGCCTGCCTGGGGCCACCTCTTCC
+CGCCCACACCTGGAATTCTTGCAGACTCTCTGCCGTCTGCCACTCTTTGAGTTTGCCTTT
+TGTGCCTTGCTTGACTGTGACCGCCCGGTGGCCCAAAAAGCCTGTGACCTGCTCCTCTTC
+TTGAGGGACAAGACAGTTTCCTGCAGTAACCCTCAGGAGGCCGGGGACAGCCCCAACTCA
+GCCTCAGTGGAGGCTGCCCTGCAGAGGTGGCGGGAAGGTGAGCAGGCTCAGCCCCTAGGG
+GACCTGGAGCCTGAAGCCATGCTGGCCATCCTCAGGTCCTTAGACCTGGAGGGCCTGCAG
+GGCAGGCTGGCCAAGAGCAGTGACCATGTGGAGAAGAGCCCACAGTCCCTGCTGCAGGAC
+ATGCTGGCCACGGTGGGCGTGTTGGAGGAGAATGAAGCTGACTGCTACTAA
+>ENSMUST00000041588_musmusculus
+ATGGACCCAGAATGCTCCAGGCTCCTCCCGGCTCTCTGTGCTGTTTTGGCAGATCCCAGA
+CAGCTGGTGGCAGATGACACCTGCTTGGAGAAACTGCTGGACTGGTTTAAAACAGTGACA
+GAGGCAGAGTCTAGCCTCCAACTACTACAGGACCATCCCTGCTTAATGGAGCTCCTGTCC
+CATGTGCTGAAGCCACAGGACGTGAGCCCTAGGGTCCTCTCCTTTGCTCTGCGCCTTGTT
+GGGGTCTTCGCAGCCCAGGAAGACTGTTTTGAGTACCTTCAGCAGGGAGAGTTGTTGCTG
+GGGCTCTTTGGGGAGTCAGGTGCCCCCGGCTGGGCAGCCTGGAGCATCCCAAGTGTGCGC
+AGCGGCTGGATCCAGGGTCTGTGCTACCTGGCACACCACCCTAGCGCCCTGCACTTCCTG
+GCTGACAGTGGTGCTGTGGACACGCTCTTCTCCTTGCAGGGAGACCCCAGCCTGTTCGTC
+GCCTCAGCAGCCAGCCAGCTCCTAGTACATATCCTGGCTCTGTCCATGCAAGGTGGAGCC
+CCAGGGTCCCCCGTCCCTGAAGCTGCTGCTTGGCCTATGTGTGCCCAGAAGATTGTGAAC
+CATGTGGATGAGTCCCTGCATGCCAAAGCCACCCCCCAGGTCACACAGGCCTTGAATGTC
+CTGACTACGACCTTCGGGCGCTGCCATAACCCCTGGACAGGGGTCCTCTGGGAGCGGCTA
+AGTCCCCCTGTTGCCCGCCTGTTTGAGAGAGACCCCATTCCAGCCGTGCACGCGCTCATG
+GACCTTCTTCTTAGTGTGGCCAGGTCGCCTGTGTTGAATTTTGCAGCCTGTGGCCTGTGG
+GAGATGCTGGCCCAGACTCTGAGCCGCCTGAGCCCCATACAAGCTGGGCCTCTAGCCCTG
+GGGACCCTGAAACTTCAGCACTGTCCCCAGGAATTGAGGACCCAGGCCTTTGGAGTCCTC
+CTACAGCCACTGGCCTGTATCCTGAAAGCTACCACTCAGGCCCCTGGACCTCCAGGCTTG
+CTGGATGGGACTGTGGGTAGCTTGCTGACTGTGGATATACTCTTGGCTTCAAAGTCAGCC
+TGTGTGGGACTCCTTTGCCAGACTCTGGCTCACCTGGAGGAGCTGCAGATGCTGCCCCAG
+TGCCCCTCACCCTGGCCACAGGTGCATCTGCTGCAAGCTGCTTTGACTATATTGCATCTC
+TGTGATGGCTCAGCGGACCCCAGCTCCAGTGCAGGAGGCCGTCTCTGTGGGACTCTGGGT
+GGCTGTGTTCGTGTCCAGCGAGCAGCCCTTGACTTCTTGGGGACCCTGTCTCAGGGGACA
+AGCCCCCTGGAGTTGGTTCTGGAGGTATTTGCTGTTCTCCTGAAGACCCTGGAGAGCCCA
+GAGTCCAGCCCCATGGTCCTAAAGAAGGCCTTCCAGGCCACACTCAGATGGCTCCAGAAC
+CCACACAAGACCCCCAGCAGCTCTGATCTCAGCTCCGACGCCCTGCTGTTTCTCGGAGAG
+CTGTTCCCCATACTACAGAAGCGCCTATGCAGCCCATGTTGGGAGGTGAGGGACTCTGCC
+CTGGAGTTCCTGACGCATCTGATCCGACACTGGGGAGGGCAGGCTGACTTCAGAGAGGCA
+CTGCGTTCCTCAGAAGTACCCACACTTGCCCTCCAGCTTCTCCAAGACCCAGAGAGTTAC
+GTCCGAGCAAGTGCCGTGGGTGCCGCTGGGCAGCTCTCCAGCCAGGGTCTGCAGGCCGCT
+CCCGCTAGCCCCGAGAACTCGCAGGCCCAACAGGGCCTACTCATGGACCTTATGCATATC
+CTGTCCACTGACTCAGAGGGCTTCCCTCGAAGGGCTGTGTTACGGGTCTTCACGGACTGG
+CTGAGGGATGGCCATGCTGACGTGGTTCGAGACACGGAGTGGTTCGTGGCCACTGTTCTC
+CAGGCAGTGAGCCGGGATCTGGACTGGGAGGTCCGAGTGCAGGGTTTGGAGCTGGCACGG
+GTGTTCCTCACCCAGGCACTGGGCCAGCCCAGCCTCCACTGTCCCTATACAGTGGGCCTG
+CCCAGGGCCTCCTCTCCCCGCCCACACCCGGAATTCTTGCAGACTCTCTGCCGTCTGCCG
+CTCTTTGAGTTTGCCTTTTGTGCCTTGCTTGACTGTGACCGACCGGTGGCCCAAAAGGCC
+TGTGACCTGCTCCTCTTCTTGAGGGACAAGACAGTTCCCTGCAGTAGCCCTCGGGAGGCA
+GGGGACAGCCCCAACTCAGCCTCAGTGGAGGCTGCCCTGCAGAGGTGGCGGGAAGGAGAG
+CAGGCCCAGCCCCTAGGGGACCTGGATCCTGAGGCCATGCTAGCCATCCTCAGGGCCTTA
+GACCTGGAGGGCCTGCAGGGCAGGCTGGCCAAGAGCAGCGACCATGTGGAGAAGAGCCCA
+CAGTCCCTGCTGCAGGACATGCTGGCCACGGTGGGTGTGTTGGAGGAGAACGAAGCTGAC
+TGCTACTAA
+>ENSMUST00000153440_musmusculus
+ATGGACCCAGAATGCTCCAGGCTCCTCCCGGCTCTCTGTGCTGTTTTGGCAGATCCCAGA
+CAGCTGGTGGCAGATGACACCTGCTTGGAGAAACTGCTGGACTGGTTTAAAACAGTGACA
+GAGGCAGAGTCTAGCCTCCAACTACTACAGGACCATCCCTGCTTAATGGAGCTCCTGTCC
+CATGTGCTGAAGCCACAGGACGTGAGCCCTAGGGTCCTCTCCTTTGCTCTGCGCCTTGTT
+GGGGTCTTCGCAGCCCAGGAAGACTGTTTTGAGTACCTTCAGCAGGGAGAGTTGTTGCTG
+GGGCTCTTTGGGGAGTCAGGTGCCCCCGGCTGGGCAGCCTGGAGCATCCCAAGTGTGCGC
+AGCGGCTGGATCCAGGGTCTGTGCTACCTGGCACACCACCCTAGCGCCCTGCACTTCCTG
+GCTGACAGTGGTGCTGTGGACACGCTCTTCTCCTTGCAGGGAGACCCCAGCCTGTTCGTC
+GCCTCAGCAGCCAGCCAGCTCCTAGTACATATCCTGGCTCTGTCCATGCAAGGTGGAGCC
+CCAGGGTCCCCCGTCCCTGAAGCTGCTGCTTGGCCTATGTGTGCCCAGAAGATTGTGAAC
+CATGTGGATGAGTCCCTGCATGCCAAAGCCACCCCCCAGGTCACACAGGCCTTGAATGTC
+CTGACTACGACCTTCGGGCGCTGCCATAACCCCTGGACAGGGGTCCTCTGGGAGCGGCTA
+AGTCCCCCTGTTGCCCGCCTGTTTGAGAGAGACCCCATTCCAGCCGTGCACGCGCTCATG
+GACCTTCTTCTTAGTGTGGCCAGGTCGCCTGTGTTGAATTTTGCAGCCTGTGGCCTGTGG
+GAGATGCTGGCCCAGACTCTGAGCCGCCTGAGCCCCATACAAGCTGGGCCTCTAGCCCTG
+GGGACCCTGAAACTTCAGCACTGGCTTGCTGGATGGGACTGTGGGTAG
+>ENSMUST00000110806_musmusculus
+ATGGACCCAGAATGCTCCAGGCTCCTCCCGGCTCTCTGTGCTGTTTTGGCAGATCCCAGA
+CAGCTGGTGGCAGATGACACCTGCTTGGAGAAACTGCTGGACTGGTTTAAAACAGTGACA
+GAGGCAGAGTCTAGCCTCCAACTACTACAGGACCATCCCTGCTTAATGGAGCTCCTGTCC
+CATGTGCTGAAGCCACAGGACGTGAGCCCTAGGGTCCTCTCCTTTGCTCTGCGCCTTGTT
+GGGGTCTTCGCAGCCCAGGAAGACTGTTTTGAGTACCTTCAGCAGGGAGAGTTGTTGCTG
+GGGCTCTTTGGGGAGTCAGGTGCCCCCGGCTGGGCAGCCTGGAGCATCCCAAGTGTGCGC
+AGCGGCTGGATCCAGGGTCTGTGCTACCTGGCACACCACCCTAGCGCCCTGCACTTCCTG
+GCTGACAGTGGTGCTGTGGACACGCTCTTCTCCTTGCAGGGAGACCCCAGCCTGTTCGTC
+GCCTCAGCAGCCAGCCAGCTCCTAGTACATATCCTGGCTCTGTCCATGCAAGGTGGAGCC
+CCAGGGTCCCCCGTCCCTGAAGCTGCTGCTTGGCCTATGTGTGCCCAGAAGATTGTGAAC
+CATGTGGATGAGTCCCTGCATGCCAAAGCCACCCCCCAGGTCACACAGGCCTTGAATGTC
+CTGACTACGACCTTCGGGCGCTGCCATAACCCCTGGACAGGGGTCCTCTGGGAGCGGCTA
+AGTCCCCCTGTTGCCCGCCTGTTTGAGAGAGACCCCATTCCAGCCGTGCACGCGCTCATG
+GACCTTCTTCTTAGTGTGGCCAGGTCGCCTGTGTTGAATTTTGCAGCCTGTGGCCTGTGG
+GAGATGCTGGCCCAGACTCTGAGCCGCCTGAGCCCCATACAAGCTGGGCCTCTAGCCCTG
+GGGACCCTGAAACTTCAGCACTGTCCCCAGGAATTGAGGACCCAGGCCTTTGGAGTCCTC
+CTACAGCCACTGGCCTGTATCCTGAAAGCTACCACTCAGGCCCCTGGACCTCCAGGCTTG
+CTGGATGGGACTGTGGGTAGCTTGCTGACTGTGGATATACTCTTGGCTTCAAAGTCAGCC
+TGTGTGGGACTCCTTTGCCAGACTCTGGCTCACCTGGAGGAGCTGCAGATGCTGCCCCAG
+TGCCCCTCACCCTGGCCACAGGTGCATCTGCTGCAAGCTGCTTTGACTATATTGCATCTC
+TGTGATGGCTCAGCGGACCCCAGCTCCAGTGCAGGAGGCCGTCTCTGTGGGACTCTGGGT
+GGCTGTGTTCGTGTCCAGCGAGCAGCCCTTGACTTCTTGGGGACCCTGTCTCAGGGGACA
+AGCCCCCTGGAGTTGGTTCTGGAGGTATTTGCTGTTCTCCTGAAGACCCTGGAGAGCCCA
+GAGTCCAGCCCCATGGTCCTAAAGAAGGCCTTCCAGGCCACACTCAGATGGCTCCAGAAC
+CCACACAAGACCCCCAGCAGCTCTGATCTCAGCTCCGACGCCCTGCTGTTTCTCGGAGAG
+CTGTTCCCCATACTACAGAAGCGCCTATGCAGCCCATGTTGGGAGGTGAGGGACTCTGCC
+CTGGAGTTCCTGACGCATCTGATCCGACACTGGGGAGGGCAGGCTGACTTCAGAGAGGCA
+CTGCGTTCCTCAGAAGTACCCACACTTGCCCTCCAGCTTCTCCAAGACCCAGAGAGTTAC
+GTCCGAGCAAGTGCCGTGGGTGCCGCTGGGCAGCTCTCCAGCCAGGGTCTGCAGGCCGCT
+CCCGCTAGCCCCGAGAACTCGCAGGCCCAACAGGTAGACACAGGGAGTTGGTGA
+>ENSMUST00000100505_musmusculus
+ATGGTGCATTTTGCACTCTCGGGCCTAATTCCCGTAGCGGAGGGATGCGGGGGCGGGATT
+AGAACCCCTAGGCTAACTCGCAGTCGCCGAGAGCGCACCTCTTACCCGGATTTGGGAGGA
+ACTGCCTGCCTGATCATGGACCCAGAATGCTCCAGGCTCCTCCCGGCTCTCTGTGCTGTT
+TTGGCAGATCCCAGACAGCTGGTGGCAGATGACACCTGCTTGGAGAAACTGCTGGACTGG
+TTTAAAACAGTGACAGAGGCAGAGTCTAGCCTCCAACTACTACAGGACCATCCCTGCTTA
+ATGGAGCTCCTGTCCCATGTGCTGAAGCCACAGGACGTGAGCCCTAGGGTCCTCTCCTTT
+GCTCTGCGCCTTGTTGGGGTCTTCGCAGCCCAGGAAGACTGTTTTGAGTACCTTCAGCAG
+GGAGAGTTGTTGCTGGGGCTCTTTGGGGAGTCAGGTGCCCCCGGCTGGGCAGCCTGGAGC
+ATCCCAAGTGTGCGCAGCGGCTGGATCCAGGGTCTGTGCTACCTGGCACACCACCCTAGC
+GCCCTGCACTTCCTGGCTGACAGTGGTGCTGTGGACACGCTCTTCTCCTTGCAGGGAGAC
+CCCAGCCTGTTCGTCGCCTCAGCAGCCAGCCAGCTCCTAGTACATATCCTGGCTCTGTCC
+ATGCAAGGTGGAGCCCCAGGGTCCCCCGTCCCTGAAGCTGCTGCTTGGCCTATGTGTGCC
+CAGAAGATTGTGAACCATGTGGATGAGTCCCTGCATGCCAAAGCCACCCCCCAGGTCACA
+CAGGCCTTGAATGTCCTGACTACGACCTTCGGGCGCTGCCATAACCCCTGGACAGGGGTC
+CTCTGGGAGCGGCTAAGTCCCCCTGTTGCCCGCCTGTTTGAGAGAGACCCCATTCCAGCC
+GTGCACGCGCTCATGGACCTTCTTCTTAGTGTGGCCAGGTCGCCTGTGTTGAATTTTGCA
+GCCTGTGGCCTGTGGGAGATGCTGGCCCAGACTCTGAGCCGCCTGAGCCCCATACAAGCT
+GGGCCTCTAGCCCTGGGGACCCTGAAACTTCAGCACTGTCCCCAGGAATTGAGGACCCAG
+GCCTTTGGAGTCCTCCTACAGCCACTGGCCTGTATCCTGAAAGCTACCACTCAGGCCCCT
+GGACCTCCAGGCTTGCTGGATGGGACTGTGGGTAGCTTGCTGACTGTGGATATACTCTTG
+GCTTCAAAGTCAGCCTGTGTGGGACTCCTTTGCCAGACTCTGGCTCACCTGGAGGAGCTG
+CAGATGCTGCCCCAGTGCCCCTCACCCTGGCCACAGGTGCATCTGCTGCAAGCTGCTTTG
+ACTATATTGCATCTCTGTGATGGCTCAGCGGACCCCAGCTCCAGTGCAGGAGGCCGTCTC
+TGTGGGACTCTGGGTGGCTGTGTTCGTGTCCAGCGAGCAGCCCTTGACTTCTTGGGGACC
+CTGTCTCAGGGGACAAGCCCCCTGGAGTTGGTTCTGGAGGTATTTGCTGTTCTCCTGAAG
+ACCCTGGAGAGCCCAGAGTCCAGCCCCATGGTCCTAAAGAAGGCCTTCCAGGCCACACTC
+AGATGGCTCCAGAACCCACACAAGACCCCCAGCAGCTCTGATCTCAGCTCCGACGCCCTG
+CTGTTTCTCGGAGAGCTGTTCCCCATACTACAGAAGCGCCTATGCAGCCCATGTTGGGAG
+GTGAGGGACTCTGCCCTGGAGTTCCTGACGCATCTGATCCGACACTGGGGAGGGCAGGCT
+GACTTCAGAGAGGCACTGCGTTCCTCAGAAGTACCCACACTTGCCCTCCAGCTTCTCCAA
+GACCCAGAGAGTTACGTCCGAGCAAGTGCCGTGGGTGCCGCTGGGCAGCTCTCCAGCCAG
+GGTCTGCAGGCCGCTCCCGCTAGCCCCGAGAACTCGCAGGCCCAACAGGGCCTACTCATG
+GACCTTATGCATATCCTGTCCACTGACTCAGAGGGCTTCCCTCGAAGGGCTGTGTTACGG
+GTCTTCACGGACTGGCTGAGGGATGGCCATGCTGACGTGGTTCGAGACACGGAGTGGTTC
+GTGGCCACTGTTCTCCAGGCAGTGAGCCGGGATCTGGACTGGGAGGTCCGAGTGCAGGGT
+TTGGAGCTGGCACGGGTGTTCCTCACCCAGGCACTGGGCCAGCCCAGCCTCCACTGTCCC
+TATACAGTGGGCCTGCCCAGGGCCTCCTCTCCCCGCCCACACCCGGAATTCTTGCAGACT
+CTCTGCCGTCTGCCGCTCTTTGAGTTTGCCTTTTGTGCCTTGCTTGACTGTGACCGACCG
+GTGGCCCAAAAGGCCTGTGACCTGCTCCTCTTCTTGAGGGACAAGACAGTTCCCTGCAGT
+AGCCCTCGGGAGGCAGGGGACAGCCCCAACTCAGCCTCAGTGGAGGCTGCCCTGCAGAGG
+TGGCGGGAAGGAGAGCAGGCCCAGCCCCTAGGGGACCTGGATCCTGAGGCCATGCTAGCC
+ATCCTCAGGGCCTTAGACCTGGAGGGCCTGCAGGGCAGGCTGGCCAAGAGCAGCGACCAT
+GTGGAGAAGAGCCCACAGTCCCTGCTGCAGGACATGCTGGCCACGGTGGGTGTGTTGGAG
+GAGAACGAAGCTGACTGCTACTAA
+>ENSCAFT00000025950_canisfamiliaris
+ATGGACCCAGAGTGCTCCCAGCTCCTCCCGGCCCTCTGTGCAGTTCTGGCAGACCCCAGG
+CAGCCCGTGGCAGATGACACCTGTTTGGAGAAGCTGCTGGATTGGTTTAAAACGATAACC
+AAAGCTGGGTCCAGTCTCCTGTTATTACAGGAGAACCCCTGTCTGGTGGAGCTGCTGTGT
+CACGTGCTGAAACCCCAGGACCTGAGTTCCAGAGTCCTCTCCTTCTCTCTCCGCCTCGCA
+GGGGTATTTGCAGCCCAGGAAGATTGCTTCCAGTATCTTCAGCAGGGGGAGTTGCTGCCC
+AGGCTCTTTGGGGAGCCAGGGCCCCTGGGAGGAGCTGCCTGGACTGCCCCCTCAGTGCGC
+AGTGGCTGGATCCAGGGCCTGCGCTCCCTGGCACAGCATCCTAGTGCCCTGCATTTCCTG
+GCTGACTGTGGTGCCGTTGACACCATCTTCTCCCTGCAGGGAGATTCCAGCCTGTTTGTG
+GCCTCGGCAGCTGGGCAGCTCCTGGTGCACATCCTGGGCTTGTCCATGCAAGGCCTAGCC
+GAGGGACACCCCAGCCTGCAGGCTGGTGATTGGCCAGTGTGTGCCCAGAAGATCGTGGGT
+CACATAGAAGAGTCCCTGCACTCCACAGCCGTCCCGCAGATCACACAGGCTCTAAACGTC
+CTGACTACCACGTTCGGGCACTGCCATGACCCTTGGACACAAGTTCTGTGGGTACGGCTG
+AGTCCCCTAGTAGGCAGTCTACTTGAGAAAGACCCTGTCCCAGCTGCACACTCGCTCGTG
+GACCTCCTCCTCAGTGTGGCCCGTTCTCCTGGGCTGAGCTCTTCTAGCTGCGGCCTGTGG
+GAGACTCTGGCTCAGACTCTGAACCATCTGAGCCCTACCCAAGCAGGGCCGCTGGCGTTA
+GGGATCCTGAAACTGCAGGACTGTCCACAGGTGCTAAGGGCCCAGGCCTTTGTCATTCTT
+CTCCAGCCTCTGGCCTGCGTCCTTAAAGCCACGGGTCAGGACCCCGGACCCTCAGGTGTG
+CTGGACAGTGCCACAGGTGACTCTCTGACAGTGGACGTGCTCCTCTCCTCCAAGGCGGCC
+TGTGTGGGTCTCCTGTGCCGGACTCTGGCCCACCTGGAGCTGCTGCAGCCGCTACCCCAG
+CGCCCCTGCCCCTGGCCTCAGGAGCCCCTGCTTGGGGCCGCGGTGACCCTGCTGCAGTTA
+TGCAGGGGCTCAGCAAGCCCTGCCTCTGACGTGGGGCGCCACCTCTGCGCGCTCCTGCTG
+GGCTGCGTGCGGGTGCAGCGAGCGGCCCTGGATTTCCTGGGGACGCTGTCTCAGGGGACA
+GGCCCCCAAGAGCTGGTGACGGAGGTGTTTGCTGTCCTTCTGGAATATCTCAGGAGCCCA
+GACTCCAGCCCCACGGTTCTGAAGAAAGCCTTCCAGGCCACATTCAGGTGGCTCCTGAGC
+TCACCCAAGACCCCCGGCTGCTGTGATCTAGAACCCCATGCCCTGCTGGTCCTGAGAGAG
+CTGCTTCCTGTGCTGCAGAAGCGTCTGTGCAGCCCCTGCTGGGAGGTGAGGGACTCCGGC
+CTCGAGTTCCTGACTCAGATGACCAGACACTGGGGAGGGCAGGCTGGCTTCAGACATGCA
+CTCCTCGCTTCGGAGGTGCCCAAGCTTACCGAGCAGCTCCTACGAGACCCTGAGAGTTAC
+GTCCGTGCCAGTGCAGTGACCGTCATGGGGCAGCTCTCCAGCCAGGGGCTGCATGTCACC
+CCTGTGAGCCCTGAGCATCCAGGGGGCCAGCAGAAGAGTCTGCTCGTGGAGCTTCTGCAT
+ATCCTCTCCACAGATTCAGAGGGATTCCCGCGGAGAGCCGTCATGCAGGTCTTCACCCAG
+TGGCTGAGGGACCACCATGCCGACGTGGCGGGGGACACGGAACAGTTTATGGCCAGGGTG
+CTCCAGGTCGCCAGCCAGGATCTGGACTGGGAGGTCCGGGCCCAGGGCCTGGAGCTGGCG
+CTGGTATTCCTGGAGCAGACGCTGGGCCAGTTCCACTCCCACTGTCCCTATGCTGTGACC
+CCACCCGTGGCGGCCCCAGCTGGCTCGCTGGCCCAGGCCCTGCAGCCACTATGCCGAGTG
+CGGCTCTTTGAGTTTGCCTTCCGTGCCTTGTTTGACTGTGACCGACCTGTGGCTCAGAAG
+TCCTGTGATCTCCTCCTCTTCCTGAGGGCCAAGACTGCTTCTTCCTCTGGTAGCCTGGAG
+GAGTCCAGGAGCGGCCCAGATGTGGCCTCTGTGGAGGCTGCCTTGCAGAGGTGGCAGGCA
+GGTGATCAGGGCCAGCCCCTGGGGGACCTGGAGCCCGAGGTCGTGCTGGCTGTGCTGAGG
+TCTGTGGACCTGGAAGGCCTTCGGGGTGCATTAGCCGAGGGCAGTGACCACATGGAGAAG
+AGCCCTCAGTCACTCCTGCAGGACATGCTGGCCACGGTGGGCGTCCTGGGAGAGAACGAG
+GCCGACTGCTACTGA
+>ENSSSCT00000008295_susscrofa
+ATGGACCCGGAGTGCTCCCGGCTCCTCCCGGCTCTCTGTGCCGTCCTGGCAGACCCCCGG
+CAGCCTGTGGCAGATGATACTTGCTTGGAGAAGCTGCTGGACTGGTTTAAAACAATAACT
+GAAGCAGGGTCCAGTCTCCTGGTGCTACAGGAAAATCCCTGCCTGGTGGAGCTGCTGTTC
+GACGTGCTGAAACCCCAGGACCTGAGTCCCAGAGTCCTCTCCTTCTCACTCCGCCTCGCA
+GGCATGTTCGCAGCCCAGGAAGACTGCTTCCAGTACCTTCAGCAGGGGGAGTTGCTGCCC
+AGGCTGTTTGGGGAGGCGGGCCCCCTGGGAGGAGCGGCCTGGACGGCCCCGACCGTGCGC
+AGCGGCTGGATCCAGGGCCTGCGCTCCCTGGCGCAGCACCCTCGCGCCCTGCCCTTCCTT
+GCCGACTGTGGTGCCGTTGACACCATCTTCTCCCTGCAGGGAGATTCCAGCCTGTTTGTG
+GCCTCGGCAGCCGGGCAGCTCCTGGTGCACATCCTGGACTTGGCGATGCGAGCCCCGCCC
+CGGGGACACCCCGGCCCGCAGGCGTGTGACGGGCCAGCGTGCGCCCAGAAGATCGTGTGT
+CACCTCGAAGACTCCCTGCGCGCCGCAGCCGCCCCGCAGCTCACGCAGGCCCTGAATGTC
+CTGACCACCACGTTCGGGCACTGCCACGGCCTTTGGACGCCGGGCCTTTGGGGGCGGCTG
+AGCCCTCTTGTGGGGCACCTGCTCGAGAAAGACCCCGTCCCAGCCTCGCACGCGCTCGTG
+GACCTCCTCCTCAGCGTGGCCCGGTCCCCTGTGCTGAGTTCTGAGAGTGGCCCGTGGGAG
+ACTTTGGCGCTGACTCTGAGCCGCTTGAGCCCGATGCAAGCAGGGCCTCTGGCTTTGGGG
+ATCCTGAAGCTGCAGGACTGCCCACAGGCCTTGAGGACCCAGGCCTCTGGCGTCCTCCTC
+CAGCCCCTGGCCTGTGTCCTGAAAGCTGCTGTGCAGGGCCCCGGACGCCCAGGTAGGCTG
+CTGGGGAAGGGGGGCAGGTGCAGGATGGCAGGACCGTGGGGGCCTGAGCGCATCCTTGGG
+GCCGGCGCAGGCTGTCATCCCAGGTGTGACTGCTGCTCCTGTTGCCACCCTGGAANCAGT
+GCCCTTGGCCTGGCCCAAGAGGCCCGCCTGAGGCTGTGTGACAATGCTGCGATCCCCCGC
+TCTGACCTGGGGGGCCAATTCTGTGGCCACCTGGTGGCCTGTGTCCGAGTCCAGCGAGCG
+GCCCTGGATTTCCTGGGGACGCTGTCTCAGAGGGCGGGCCCCCAAGAGCTGGTGACGCAG
+GTTTCTGCTGTCCTCCTGGAGTACCTTTCAGGCCCTGACTCCAGCCCCACGGTTCTGAAG
+AAGGCCTTCCAGGCCTCACTCGGGTGGCTCCTGAGCTCACCCAAGACCCCCGGCTGCTGC
+GATCTGGACCCCCACGCCCAGCAGTTCCTCAGAGAGCTGCTCCCTGTGCTGCAGAAGCGC
+CTGTGCAGCCCCTGCTGGGAGGTGAGGGACTCAGGCCTTGAGTTCCTGACCCAGATGGCC
+AGACACTGGGGAGGGCAGGCCGCCTTCAGACAGGTGCTCCTTGCTTCCGAGGTGCCCAGG
+CTCACCAGGCAGCTCCTGCAAGACCCCGAGAGTTACGTCCGCGCAAGCGCAGTGACCGCC
+ACAGGGCAGCTGTCTAGCTGGGGGCTGCATGCTGCCCCCGCCGGCCCTGAGCACCCAGGG
+GTCCAGCAGAAGAGCCTCCTGTCGGAGCTCCTGCACGTCCTCGCCACAGACTCGGAGGGC
+TTCCCCCGGAGGGCCGTCATGCAGGTCTTCACCGAGTGGCTGAGGGGCGGCCATGCTGAC
+GTGGCCGAGGACCCAGAGCAGTTTGTGGCCGGAGTGCTCCAGGCCGCGAGCAGGGACCTG
+GACTGGGAGGTCCGGGCCCAGGGCCTCGAGCTGGCGCTGGTGTTCCTGGAGCAGCTGCTG
+GGCCCGCCCGGCGTGCGCTGTCCCTACGCCGTGGCCCTGCCCAAGGCAGCCCCGCCTGGC
+ACGCTGGCCCAGGCCTTGCAGGCACTGTGCCGAGTGCAGCTCTTCGAGTTCGCCTTCCGT
+GCCTTGTTCGACTGCGACCGACCTGTGGCGCAGAAGTCCTGTGACCTCCTCCTCTTCCTG
+AAGGCCAAGGCCACTTCCTGCGGCACCCCCCAGGAGGAACGGGACAGCCCCGACGTGTCC
+TCCGTGGAGGCCACACTGCAGAAGTGGCAGGCAGGGGAGCACGGACACCCCCTGGGGGAC
+CTGGAGCCCGCGGCTGTTGTGGCCGTGCTCAGGTCCATGGACTTGGAAGGCCTTCAGGAC
+ACACTGGCCGAGAGCAGTGACCACGTGGAGAGGAGCCCCCAGTCGCTCCTGCAGGACATG
+CTGGCCACCGTGGGCGTCCTCGGGGAGAATGAGGCCGACTGCTACTGA
+>ENSPTRT00000019089_pantroglodytes
+ATAGGCACCGGGGGCCGGCGGGGGGCGGCGGCCGCGCCGCTGCTGGTGGCGGTGGCCGCG
+CTTCTACTGGGCGCCGCGGGCCACCTGTACCCCGGAGAGGTGTGTCCCGGCATGGATATC
+CGGAACAACCTCACTAGGTTGCATGAGCTGGAGAATTGCTCTGTCATCGAAGGACACTTG
+CAGATACTCTTGATGTTCAAAACGAGGCCCGAAGATTTCCGAGACCTCAGTTTCCCCAAA
+CTCATAATGATCACTGATTACTTGCTGCTCTTCCGGGTCTATGGGCTCGAGAGCCTGAAG
+GACCTGTTCCCCAACCTCACGGTCATCCGGGGGTCACGACTGTTCTTTAACTACGCGCTG
+GTCATCTTCGAGATGGTTCACCTCAAGGAACTCGGCCTCTACAACCTGATGAACATCACC
+CGGGGTTCTGTCCGCATCGAGAAGAACAATGAGCTCTGTTACTTGGCCACTATCGACTGG
+TCCCGTATCCTGGATTCCGTGGAGGATAATTACATCGTGTTGAACAAAGATGACAACGAG
+GAGTGTGGAGACATCTGTCCGGGTACCGCGAAGGGCAAGACCAACTGCCCCGCCACCGTC
+ATCAACGGGCAGTTTGTCGAACGATGTTGGACTCACAGTCACTGCCAGAAAGTTTGCCCG
+ACCATCTGTAAGTCACACGGCTGCACCGCCGAAGGCCTCTGTTGCCACAGCGAGTGCCTG
+GGCAACTGTTCTCAGCCCGACGACCCCACCAAGTGCGTGGCCTGCCGCAACTTCTACCTG
+GACGGCAGGTGTGTGGAGACCTGCCCGCCCCCGTACTACCACTTCCAGGACTGGCGCTGT
+GTGAACTTCAGCTTCTGCCAGGACCTGCACCACAAATGCAAGAACTCGCGGAGGCAGGGC
+TGCCACCAGTACGTCATTCACAACAACAAGTGCATCCCTGAGTGTCCCTCCGGGTACACG
+ATGAATTCCAGCAACTTGCTGTGCACCCCATGCCTGGGTCCCTGTCCCAAGGTGTGCCAC
+CTCCTAGAAGGCGAGAAGACCATCGACTCGGTGACGTCTGCCCAGGAGCTCCGAGGATGC
+ACCGTCATCAACGGGAGTCTGATCATCAACATTCGAGGAGGCAACAATCTGGCAGCTGAG
+CTAGAAGCCAACCTCGGCCTCATTGAAGAAATTTCAGGGTATCTAAAAATCCGCCGATCC
+TACGCTCTGGTGTCACTTTCCTTCTTCCGGAAGTTACGTCTGATTCGAGGAGAGACCTTG
+GAAATCGGGAACTACTCCTTCTATGCCTTGGACAACCAGAACCTAAGGCAGCTCTGGGAT
+TGGAGCAAACACAACCTCACCATCACTCAGGGGAAACTCTTCTTCCACTATAACCCCAAA
+CTCTGCTTGTCAGAAATCCACAAGATGGAAGAAGTTTCAGGAACCAAGGGGCGCCAGGAG
+AGAAACGACATTGCCCTGAAGACCAATGGGGACCAGGCATCCTGTGAAAATGAGTTACTT
+AAATTTTCTTACATTCGGACATCTTTTGACAAGATCTTGCTGAGATGGGAGCCGTACTGG
+CCCCCCGACTTCCGAGACCTCTTGGGGTTCATGCTGTTCTACAAAGAGGCCCCTTATCAA
+AATGTGACGGAGTTCGACGGGCAGGATGCATGTGGTTCCAACAGTTGGACGGTGGTAGAC
+ATTGACCCACCCCTGAGGTCCAACGACCCCAAATCACAGAACCACCCAGGGTGGCTGATG
+CGGGGTCTGAAGCCCTGGACCCAGTATGCCATCTTCGTGAAGACCCTGGTCACCTTTTCG
+GATGAACGCCGGACCTATGGGGCCAAGAGTGACATCATTTATGTCCAGACAGATGCCACC
+AACCCCTCCGTGCCCCTGGATCCAATCTCAGTGTCTAACTCATCATCCCAGATTATTTTG
+AAGTGGAAACCCCCCTCCGACCCCAATGGCAACATCACCCACTACCTGGTTTTCTGGGAG
+AGGCAGGCGGAAGACAGTGAGCTGTTCGAACTGGATTATTGCCTCAAATGGTGTGTGTGG
+TGTGTGTGTGTGGTTGTTTGTTTGTGGAGTGTGTGTGAGTATGAGGATTCGGCCGGCGAA
+TGCTGCTCCTGTCCAAAGACAGACTCTCAGATCCTGAAGGAGCTGGAGGAGTCCTCGTTT
+AGGAAGACGTTTGAGGATTACCTGCACAACGTGGTTTTCGTCCCCAGAAAAACCTCTTCA
+GGCACTGGTGCCGAGGACCCTAGGCCATCTCGGAAACGCAGGTCCCTTGGCGATGTTGGG
+AATGTGACGGTGGCCGTGCCCACGGTGGCAGCTTTCCCCAACACTTCCTCGACCAGCGTG
+CCCACGAGTCCGGAGGAGCACAGGCCTTTTGAGAAGGTGGTGAACAAGGAGTCGCTGGTC
+ATCTCCGGCTTGCGACACTTCACGGGCTATCGCATCGAGCTGCAGGCTTGCAACCAGGAC
+ACCCCTGAGGAACGGTGCAGTGTGGCAGCCTACGTCAGTGCCAGGACCATGCCTGAAGCC
+AAGGCTGATGACATTGTCGGCCCTGTGACGCATGAAATCTTTGAGAACAACGTTGTCCAC
+TTGATGTGGCAGGAGCCGAAGGAGCCCAATGGTCTGATCGTGCTGTATGAAGTGAGTTAT
+CGGCGATATGGTGATGAGGAGCTGCATCTCTGCGTCTCCCGCAAGCACTTCGCTCTGGAG
+CGGGGCTGCAGGCTGCGTGGGCTGTCACCGGGGAACTACAGCGTGCGAGTCCGGGCCACC
+TCCCTTGCGGGCAACGGCTCTTGGACGGAACCCACCTATTTCTACGTGACAGACTATTTA
+GATGTCCCGTCAAATATTGCAAAAATTATCATCGGCCCCCTCATCTTTGTCTTTCTCTTC
+AGTGTTGTGATTGGAAGTATTTATCTATTCCTGAGAAAGAGGCAGCCAGATGGGCCGCTG
+GGACCGCTTTACGCTTCTTCAAACCCTGAGTATCTCAGTGCCAGTGATGTGTTTCCATGC
+TCTGTGTACGTGCCGGACGAGTGGGAGGTGCCTCGAGAGAAGATCACCCTCCTTCGAGAG
+CTGGGGCAGGGCTCCTTCGGCATGGTGTATGAGGGCAATGCCAGGGACATCATCAAGGGT
+GAGGCAGAGACCCGCGTGGCGGTGAAGACGGTCAACGAGTCAGCCAGTCTCCGAGAGCGG
+ATTGAGTTCCTCAATGAGGCCTCGGTCATGAAGGGCTTCACCTGCCATCATGTGGTGCGC
+CTCCTGGGAGTGGTGTCCAAGGGCCAGCCCACACTGGTGGTGATGGAGCTGATGGCTCAC
+GGAGACCTGAAGAGCTACCTCCGTTCTCTGCGGCCAGAGGCTGAGAATAATCCCGGCCGC
+CCTCCCCCTACCCTTCAAGAGATGATTCAGATGGCGGCAGAGATTGCTGATGGGATGGCC
+TACCTGAACGCCAAGAAGTTTGTGCATCGGGACCTGGCAGCGAGAAACTGCATGGTCGCC
+CATGATTTTACTGTCAAAATTGGAGACTTTGGAATGACCAGAGACATCTATGAAACGGAT
+TACTACCGGAAAGGGGGCAAGGGTCTGCTCCCTGTACGGTGGATGGCGCCAGAGTCCCTG
+AAGGATGGGGTCTTCACCACTTCTTCTGACATGTGGTCCTTTGGCGTGGTCCTTTGGGAA
+ATCACCAGCTTGGCAGAACAGCCTTACCAAGGCCTGTCTAATGAACAGGTGTTGAAATTT
+GTCATGGATGGAGGGTATCTGGATCAACCCGACAACTGTCCAGAGAGAGTCACTGACCTC
+ATGCGCATGTGCTGGCAATTCAACCCCAAGATGAGGCCAACCTTCCTGGAGATTGTCAAC
+CTGCTCAAGGACGACCTGCACCCCAGCTTTCCGGAGGTGTCGTTCTTCCACAGCGAGGAG
+AACAAGGCTCCCGAGAGCGAGGAGCTGGAGATGGAGTTTGAGGACATGGAGAATGTGCCC
+CTGGACCGTTCCTCGCACTGTCAGAGGGAGGAGGCGGGGGGCCGGGATGGAGGGTCCTCA
+CTAGGTTTCAAGCGGAGCTACGAGGAACACATCCCTTACACACACATGAACGGAGGCAAG
+AAAAACGGGCGGATTCTGACCTTGCCTCGGTCCAATCCTTCCTAA
+>ENST00000341500_homosapiens
+ATGGCCACCGGGGGCCGGCGGGGGGCGGCGGCCGCGCCGCTGCTGGTGGCGGTGGCCGCG
+CTGCTACTGGGCGCCGCGGGCCACCTGTACCCCGGAGAGGTGTGTCCCGGCATGGATATC
+CGGAACAACCTCACTAGGTTGCATGAGCTGGAGAATTGCTCTGTCATCGAAGGACACTTG
+CAGATACTCTTGATGTTCAAAACGAGGCCCGAAGATTTCCGAGACCTCAGTTTCCCCAAA
+CTCATCATGATCACTGATTACTTGCTGCTCTTCCGGGTCTATGGGCTCGAGAGCCTGAAG
+GACCTGTTCCCCAACCTCACGGTCATCCGGGGATCACGACTGTTCTTTAACTACGCGCTG
+GTCATCTTCGAGATGGTTCACCTCAAGGAACTCGGCCTCTACAACCTGATGAACATCACC
+CGGGGTTCTGTCCGCATCGAGAAGAACAATGAGCTCTGTTACTTGGCCACTATCGACTGG
+TCCCGTATCCTGGATTCCGTGGAGGATAATTACATCGTGTTGAACAAAGATGACAACGAG
+GAGTGTGGAGACATCTGTCCGGGTACCGCGAAGGGCAAGACCAACTGCCCCGCCACCGTC
+ATCAACGGGCAGTTTGTCGAACGATGTTGGACTCATAGTCACTGCCAGAAAGTTTGCCCG
+ACCATCTGTAAGTCACACGGCTGCACCGCCGAAGGCCTCTGTTGCCACAGCGAGTGCCTG
+GGCAACTGTTCTCAGCCCGACGACCCCACCAAGTGCGTGGCCTGCCGCAACTTCTACCTG
+GACGGCAGGTGTGTGGAGACCTGCCCGCCCCCGTACTACCACTTCCAGGACTGGCGCTGT
+GTGAACTTCAGCTTCTGCCAGGACCTGCACCACAAATGCAAGAACTCGCGGAGGCAGGGC
+TGCCACCAGTACGTCATTCACAACAACAAGTGCATCCCTGAGTGTCCCTCCGGGTACACG
+ATGAATTCCAGCAACTTGCTGTGCACCCCATGCCTGGGTCCCTGTCCCAAGGTGTGCCAC
+CTCCTAGAAGGCGAGAAGACCATCGACTCGGTGACGTCTGCCCAGGAGCTCCGAGGATGC
+ACCGTCATCAACGGGAGTCTGATCATCAACATTCGAGGAGGCAACAATCTGGCAGCTGAG
+CTAGAAGCCAACCTCGGCCTCATTGAAGAAATTTCAGGGTATCTAAAAATCCGCCGATCC
+TACGCTCTGGTGTCACTTTCCTTCTTCCGGAAGTTACGTCTGATTCGAGGAGAGACCTTG
+GAAATTGGGAACTACTCCTTCTATGCCTTGGACAACCAGAACCTAAGGCAGCTCTGGGAC
+TGGAGCAAACACAACCTCACCATCACTCAGGGGAAACTCTTCTTCCACTATAACCCCAAA
+CTCTGCTTGTCAGAAATCCACAAGATGGAAGAAGTTTCAGGAACCAAGGGGCGCCAGGAG
+AGAAACGACATTGCCCTGAAGACCAATGGGGACCAGGCATCCTGTGAAAATGAGTTACTT
+AAATTTTCTTACATTCGGACATCTTTTGACAAGATCTTGCTGAGATGGGAGCCGTACTGG
+CCCCCCGACTTCCGAGACCTCTTGGGGTTCATGCTGTTCTACAAAGAGGCCCCTTATCAG
+AATGTGACGGAGTTCGACGGGCAGGATGCGTGTGGTTCCAACAGTTGGACGGTGGTAGAC
+ATTGACCCACCCCTGAGGTCCAACGACCCCAAATCACAGAACCACCCAGGGTGGCTGATG
+CGGGGTCTCAAGCCCTGGACCCAGTATGCCATCTTTGTGAAGACCCTGGTCACCTTTTCG
+GATGAACGCCGGACCTATGGGGCCAAGAGTGACATCATTTATGTCCAGACAGATGCCACC
+AACCCCTCTGTGCCCCTGGATCCAATCTCAGTGTCTAACTCATCATCCCAGATTATTCTG
+AAGTGGAAACCACCCTCCGACCCCAATGGCAACATCACCCACTACCTGGTTTTCTGGGAG
+AGGCAGGCGGAAGACAGTGAGCTGTTCGAGCTGGATTATTGCCTCAAAGGGCTGAAGCTG
+CCCTCGAGGACCTGGTCTCCACCATTCGAGTCTGAAGATTCTCAGAAGCACAACCAGAGT
+GAGTATGAGGATTCGGCCGGCGAATGCTGCTCCTGTCCAAAGACAGACTCTCAGATCCTG
+AAGGAGCTGGAGGAGTCCTCGTTTAGGAAGACGTTTGAGGATTACCTGCACAACGTGGTT
+TTCGTCCCCAGGCCATCTCGGAAACGCAGGTCCCTTGGCGATGTTGGGAATGTGACGGTG
+GCCGTGCCCACGGTGGCAGCTTTCCCCAACACTTCCTCGACCAGCGTGCCCACGAGTCCG
+GAGGAGCACAGGCCTTTTGAGAAGGTGGTGAACAAGGAGTCGCTGGTCATCTCCGGCTTG
+CGACACTTCACGGGCTATCGCATCGAGCTGCAGGCTTGCAACCAGGACACCCCTGAGGAA
+CGGTGCAGTGTGGCAGCCTACGTCAGTGCGAGGACCATGCCTGAAGCCAAGGCTGATGAC
+ATTGTTGGCCCTGTGACGCATGAAATCTTTGAGAACAACGTCGTCCACTTGATGTGGCAG
+GAGCCGAAGGAGCCCAATGGTCTGATCGTGCTGTATGAAGTGAGTTATCGGCGATATGGT
+GATGAGGAGCTGCATCTCTGCGTCTCCCGCAAGCACTTCGCTCTGGAACGGGGCTGCAGG
+CTGCGTGGGCTGTCACCGGGGAACTACAGCGTGCGAATCCGGGCCACCTCCCTTGCGGGC
+AACGGCTCTTGGACGGAACCCACCTATTTCTACGTGACAGACTATTTAGACGTCCCGTCA
+AATATTGCAAAAATTATCATCGGCCCCCTCATCTTTGTCTTTCTCTTCAGTGTTGTGATT
+GGAAGTATTTATCTATTCCTGAGAAAGAGGCAGCCAGATGGGCCGCTGGGACCGCTTTAC
+GCTTCTTCAAACCCTGAGTATCTCAGTGCCAGTGATGTGTTTCCATGCTCTGTGTACGTG
+CCGGACGAGTGGGAGGTGTCTCGAGAGAAGATCACCCTCCTTCGAGAGCTGGGGCAGGGC
+TCCTTCGGCATGGTGTATGAGGGCAATGCCAGGGACATCATCAAGGGTGAGGCAGAGACC
+CGCGTGGCGGTGAAGACGGTCAACGAGTCAGCCAGTCTCCGAGAGCGGATTGAGTTCCTC
+AATGAGGCCTCGGTCATGAAGGGCTTCACCTGCCATCACGTGGTGCGCCTCCTGGGAGTG
+GTGTCCAAGGGCCAGCCCACGCTGGTGGTGATGGAGCTGATGGCTCACGGAGACCTGAAG
+AGCTACCTCCGTTCTCTGCGGCCAGAGGCTGAGAATAATCCTGGCCGCCCTCCCCCTACC
+CTTCAAGAGATGATTCAGATGGCGGCAGAGATTGCTGACGGGATGGCCTACCTGAACGCC
+AAGAAGTTTGTGCATCGGGACCTGGCAGCGAGAAACTGCATGGTCGCCCATGATTTTACT
+GTCAAAATTGGAGACTTTGGAATGACCAGAGACATCTATGAAACGGATTACTACCGGAAA
+GGGGGCAAGGGTCTGCTCCCTGTACGGTGGATGGCACCGGAGTCCCTGAAGGATGGGGTC
+TTCACCACTTCTTCTGACATGTGGTCCTTTGGCGTGGTCCTTTGGGAAATCACCAGCTTG
+GCAGAACAGCCTTACCAAGGCCTGTCTAATGAACAGGTGTTGAAATTTGTCATGGATGGA
+GGGTATCTGGATCAACCCGACAACTGTCCAGAGAGAGTCACTGACCTCATGCGCATGTGC
+TGGCAATTCAACCCCAAGATGAGGCCAACCTTCCTGGAGATTGTCAACCTGCTCAAGGAC
+GACCTGCACCCCAGCTTTCCAGAGGTGTCGTTCTTCCACAGCGAGGAGAACAAGGCTCCC
+GAGAGTGAGGAGCTGGAGATGGAGTTTGAGGACATGGAGAATGTGCCCCTGGACCGTTCC
+TCGCACTGTCAGAGGGAGGAGGCGGGGGGCCGGGATGGAGGGTCCTCGCTGGGTTTCAAG
+CGGAGCTACGAGGAACACATCCCTTACACACACATGAACGGAGGCAAGAAAAACGGGCGG
+ATTCTGACCTTGCCTCGGTCCAATCCTTCCTAA
+>ENST00000302850_homosapiens
+ATGGCCACCGGGGGCCGGCGGGGGGCGGCGGCCGCGCCGCTGCTGGTGGCGGTGGCCGCG
+CTGCTACTGGGCGCCGCGGGCCACCTGTACCCCGGAGAGGTGTGTCCCGGCATGGATATC
+CGGAACAACCTCACTAGGTTGCATGAGCTGGAGAATTGCTCTGTCATCGAAGGACACTTG
+CAGATACTCTTGATGTTCAAAACGAGGCCCGAAGATTTCCGAGACCTCAGTTTCCCCAAA
+CTCATCATGATCACTGATTACTTGCTGCTCTTCCGGGTCTATGGGCTCGAGAGCCTGAAG
+GACCTGTTCCCCAACCTCACGGTCATCCGGGGATCACGACTGTTCTTTAACTACGCGCTG
+GTCATCTTCGAGATGGTTCACCTCAAGGAACTCGGCCTCTACAACCTGATGAACATCACC
+CGGGGTTCTGTCCGCATCGAGAAGAACAATGAGCTCTGTTACTTGGCCACTATCGACTGG
+TCCCGTATCCTGGATTCCGTGGAGGATAATTACATCGTGTTGAACAAAGATGACAACGAG
+GAGTGTGGAGACATCTGTCCGGGTACCGCGAAGGGCAAGACCAACTGCCCCGCCACCGTC
+ATCAACGGGCAGTTTGTCGAACGATGTTGGACTCATAGTCACTGCCAGAAAGTTTGCCCG
+ACCATCTGTAAGTCACACGGCTGCACCGCCGAAGGCCTCTGTTGCCACAGCGAGTGCCTG
+GGCAACTGTTCTCAGCCCGACGACCCCACCAAGTGCGTGGCCTGCCGCAACTTCTACCTG
+GACGGCAGGTGTGTGGAGACCTGCCCGCCCCCGTACTACCACTTCCAGGACTGGCGCTGT
+GTGAACTTCAGCTTCTGCCAGGACCTGCACCACAAATGCAAGAACTCGCGGAGGCAGGGC
+TGCCACCAGTACGTCATTCACAACAACAAGTGCATCCCTGAGTGTCCCTCCGGGTACACG
+ATGAATTCCAGCAACTTGCTGTGCACCCCATGCCTGGGTCCCTGTCCCAAGGTGTGCCAC
+CTCCTAGAAGGCGAGAAGACCATCGACTCGGTGACGTCTGCCCAGGAGCTCCGAGGATGC
+ACCGTCATCAACGGGAGTCTGATCATCAACATTCGAGGAGGCAACAATCTGGCAGCTGAG
+CTAGAAGCCAACCTCGGCCTCATTGAAGAAATTTCAGGGTATCTAAAAATCCGCCGATCC
+TACGCTCTGGTGTCACTTTCCTTCTTCCGGAAGTTACGTCTGATTCGAGGAGAGACCTTG
+GAAATTGGGAACTACTCCTTCTATGCCTTGGACAACCAGAACCTAAGGCAGCTCTGGGAC
+TGGAGCAAACACAACCTCACCATCACTCAGGGGAAACTCTTCTTCCACTATAACCCCAAA
+CTCTGCTTGTCAGAAATCCACAAGATGGAAGAAGTTTCAGGAACCAAGGGGCGCCAGGAG
+AGAAACGACATTGCCCTGAAGACCAATGGGGACCAGGCATCCTGTGAAAATGAGTTACTT
+AAATTTTCTTACATTCGGACATCTTTTGACAAGATCTTGCTGAGATGGGAGCCGTACTGG
+CCCCCCGACTTCCGAGACCTCTTGGGGTTCATGCTGTTCTACAAAGAGGCCCCTTATCAG
+AATGTGACGGAGTTCGACGGGCAGGATGCGTGTGGTTCCAACAGTTGGACGGTGGTAGAC
+ATTGACCCACCCCTGAGGTCCAACGACCCCAAATCACAGAACCACCCAGGGTGGCTGATG
+CGGGGTCTCAAGCCCTGGACCCAGTATGCCATCTTTGTGAAGACCCTGGTCACCTTTTCG
+GATGAACGCCGGACCTATGGGGCCAAGAGTGACATCATTTATGTCCAGACAGATGCCACC
+AACCCCTCTGTGCCCCTGGATCCAATCTCAGTGTCTAACTCATCATCCCAGATTATTCTG
+AAGTGGAAACCACCCTCCGACCCCAATGGCAACATCACCCACTACCTGGTTTTCTGGGAG
+AGGCAGGCGGAAGACAGTGAGCTGTTCGAGCTGGATTATTGCCTCAAAGGGCTGAAGCTG
+CCCTCGAGGACCTGGTCTCCACCATTCGAGTCTGAAGATTCTCAGAAGCACAACCAGAGT
+GAGTATGAGGATTCGGCCGGCGAATGCTGCTCCTGTCCAAAGACAGACTCTCAGATCCTG
+AAGGAGCTGGAGGAGTCCTCGTTTAGGAAGACGTTTGAGGATTACCTGCACAACGTGGTT
+TTCGTCCCCAGAAAAACCTCTTCAGGCACTGGTGCCGAGGACCCTAGGCCATCTCGGAAA
+CGCAGGTCCCTTGGCGATGTTGGGAATGTGACGGTGGCCGTGCCCACGGTGGCAGCTTTC
+CCCAACACTTCCTCGACCAGCGTGCCCACGAGTCCGGAGGAGCACAGGCCTTTTGAGAAG
+GTGGTGAACAAGGAGTCGCTGGTCATCTCCGGCTTGCGACACTTCACGGGCTATCGCATC
+GAGCTGCAGGCTTGCAACCAGGACACCCCTGAGGAACGGTGCAGTGTGGCAGCCTACGTC
+AGTGCGAGGACCATGCCTGAAGCCAAGGCTGATGACATTGTTGGCCCTGTGACGCATGAA
+ATCTTTGAGAACAACGTCGTCCACTTGATGTGGCAGGAGCCGAAGGAGCCCAATGGTCTG
+ATCGTGCTGTATGAAGTGAGTTATCGGCGATATGGTGATGAGGAGCTGCATCTCTGCGTC
+TCCCGCAAGCACTTCGCTCTGGAACGGGGCTGCAGGCTGCGTGGGCTGTCACCGGGGAAC
+TACAGCGTGCGAATCCGGGCCACCTCCCTTGCGGGCAACGGCTCTTGGACGGAACCCACC
+TATTTCTACGTGACAGACTATTTAGACGTCCCGTCAAATATTGCAAAAATTATCATCGGC
+CCCCTCATCTTTGTCTTTCTCTTCAGTGTTGTGATTGGAAGTATTTATCTATTCCTGAGA
+AAGAGGCAGCCAGATGGGCCGCTGGGACCGCTTTACGCTTCTTCAAACCCTGAGTATCTC
+AGTGCCAGTGATGTGTTTCCATGCTCTGTGTACGTGCCGGACGAGTGGGAGGTGTCTCGA
+GAGAAGATCACCCTCCTTCGAGAGCTGGGGCAGGGCTCCTTCGGCATGGTGTATGAGGGC
+AATGCCAGGGACATCATCAAGGGTGAGGCAGAGACCCGCGTGGCGGTGAAGACGGTCAAC
+GAGTCAGCCAGTCTCCGAGAGCGGATTGAGTTCCTCAATGAGGCCTCGGTCATGAAGGGC
+TTCACCTGCCATCACGTGGTGCGCCTCCTGGGAGTGGTGTCCAAGGGCCAGCCCACGCTG
+GTGGTGATGGAGCTGATGGCTCACGGAGACCTGAAGAGCTACCTCCGTTCTCTGCGGCCA
+GAGGCTGAGAATAATCCTGGCCGCCCTCCCCCTACCCTTCAAGAGATGATTCAGATGGCG
+GCAGAGATTGCTGACGGGATGGCCTACCTGAACGCCAAGAAGTTTGTGCATCGGGACCTG
+GCAGCGAGAAACTGCATGGTCGCCCATGATTTTACTGTCAAAATTGGAGACTTTGGAATG
+ACCAGAGACATCTATGAAACGGATTACTACCGGAAAGGGGGCAAGGGTCTGCTCCCTGTA
+CGGTGGATGGCACCGGAGTCCCTGAAGGATGGGGTCTTCACCACTTCTTCTGACATGTGG
+TCCTTTGGCGTGGTCCTTTGGGAAATCACCAGCTTGGCAGAACAGCCTTACCAAGGCCTG
+TCTAATGAACAGGTGTTGAAATTTGTCATGGATGGAGGGTATCTGGATCAACCCGACAAC
+TGTCCAGAGAGAGTCACTGACCTCATGCGCATGTGCTGGCAATTCAACCCCAAGATGAGG
+CCAACCTTCCTGGAGATTGTCAACCTGCTCAAGGACGACCTGCACCCCAGCTTTCCAGAG
+GTGTCGTTCTTCCACAGCGAGGAGAACAAGGCTCCCGAGAGTGAGGAGCTGGAGATGGAG
+TTTGAGGACATGGAGAATGTGCCCCTGGACCGTTCCTCGCACTGTCAGAGGGAGGAGGCG
+GGGGGCCGGGATGGAGGGTCCTCGCTGGGTTTCAAGCGGAGCTACGAGGAACACATCCCT
+TACACACACATGAACGGAGGCAAGAAAAACGGGCGGATTCTGACCTTGCCTCGGTCCAAT
+CCTTCCTAA
+>ENST00000600492_homosapiens
+TACAAAGAGGCCCCTTATCAGAATGTGACGGAGTTCGACGGGCAGGATGCGTGTGGTTCC
+AACAGTTGGACGGTGGTAGACATTGACCCACCCCTGAGGTCCAACGACCCCAAATCACAG
+AACCACCCAGGGTGGCTGATGCGGGGTCTCAAGCCCTGGACCCAGTATGCCATCTTTGTG
+AAGACCCTGGTCACCTTTTCGGATGAACGCCGGACCTATGGGGCCAAGAGTGACATCATT
+TATGTCCAGACAGATGCCACCAACCCCTCTGTGCCCCTGGATCCAATCTCAGTGTCTAAC
+TCATCATCCCAGATTATTCTGAAGTGGAAACCACCCTCCGACCCCAATGGCAACATCACC
+CACTACCTGGTTTTCTGGGAGAGGCAGGCGGAAGACAGTGAGCTGTTCGAGCTGGATTAT
+TGCCTCAAAGGGCGAGTCCAGTCATCAGCTCCGCTGTAA
+>ENSMUST00000208839_musmusculus
+NAGACAGATTACTATCGGAAAGGGGGCAAGGGACTGCTTCCTGTGAGGTGGATGTCACCT
+GAGTCCCTGAAGGATGGAGTCTTTACTGCTTCTTCTGATATGTGGTCCTTTGGGGTGGTC
+CTTTGGGAAATCACTAGCCTGGCTGAGCAACCTTATCAAGGCCTGTCTAATGAACAGGTG
+TTGAAGTTTGTCATGGATGGAGGCTATCTGGATCCCCCTGATAACTGTCCAGAGAGACTG
+AGATATGAGATAAAGACACACTGGCCACCCTGA
+>ENSMUST00000091291_musmusculus
+ATGGGCTTCGGGAGAGGATGTGAGACGACGGCTGTGCCATTGCTGGTGGCCGTGGCCGCG
+TTGCTGGTGGGCACAGCCGGCCACCTGTACCCTGGAGAGGTGTGCCCTGGTATGGACATC
+CGGAACAACCTGACCAGGCTACATGAGCTGGAGAACTGCTCAGTCATTGAGGGCCATCTG
+CAGATCCTCCTGATGTTCAAGACCAGACCCGAAGATTTCCGAGACCTCAGTTTCCCCAAA
+CTCATCATGATCACAGATTACCTGCTTCTCTTCCGTGTCTATGGTCTGGAAAGTCTGAAA
+GACCTCTTCCCAAATCTCACAGTCATCCGAGGCTCCCGTCTCTTCTTCAACTATGCCCTG
+GTTATCTTCGAGATGGTCCACCTGAAGGAGCTGGGGCTTTATAACCTCATGAACATCACC
+CGGGGCTCTGTCCGCATCGAGAAGAATAATGAGCTCTGCTACCTGGCCACTATCGACTGG
+TCCCGTATCCTGGATTCTGTGGAGGACAACTACATTGTACTGAACAAAGATGACAACGAG
+GAATGTGGGGATGTCTGTCCAGGCACCGCCAAGGGCAAGACCAACTGTCCTGCCACTGTC
+ATCAATGGGCAGTTTGTGGAACGGTGCTGGACACACAGTCATTGTCAGAAAGTTTGCCCA
+ACCATCTGTAAGTCACATGGCTGCACAGCTGAAGGCCTGTGCTGCCACAAAGAGTGCCTG
+GGCAACTGTTCGGAACCTGATGACCCCACCAAGTGTGTGGCCTGTCGCAACTTCTATCTG
+GATGGTCAGTGTGTGGAGACCTGCCCGCCACCCTACTATCACTTCCAGGACTGGCGCTGT
+GTGAACTTCAGCTTCTGCCAAGACCTTCACTTCAAATGCAGGAACTCTCGGAAGCCTGGC
+TGCCACCAATACGTCATTCACAACAATAAGTGCATCCCCGAGTGCCCGTCTGGCTATACC
+ATGAATTCCAGCAACTTGATGTGCACCCCATGTCTGGGACCCTGCCCTAAGGTCTGCCAA
+ATCCTCGAAGGTGAGAAGACCATTGATTCTGTGACATCTGCCCAGGAGCTCCGAGGCTGC
+ACTGTGATCAACGGTAGCCTGATCATCAACATCCGAGGGGGCAACAACCTGGCAGCTGAG
+CTGGAGGCTAACCTTGGCCTCATTGAAGAAATTTCGGGATTTCTAAAGATCCGCCGCTCC
+TATGCTCTGGTATCACTTTCTTTCTTCAGGAAGCTACATCTGATTCGAGGAGAGACCTTG
+GAAATTGGGAACTATTCTTTTTATGCCTTGGACAACCAGAACCTGAGGCAACTCTGGGAC
+TGGAGCAAACACAACCTCACCATCACTCAGGGCAAGCTCTTCTTCCATTACAACCCGAAA
+CTCTGCTTGTCTGAAATTCACAAGATGGAAGAAGTCTCCGGAACTAAGGGCCGTCAGGAG
+AGGAACGACATTGCCCTGAAGACCAATGGGGACCAGGCATCGTGTGAAAATGAATTGCTT
+AAATTTTCTTTCATTCGGACATCTTTTGACAAGATCCTGTTGAGGTGGGAACCCTACTGG
+CCCCCCGACTTCCGAGATCTCCTGGGATTCATGTTGTTCTACAAAGAGGCCCCTTATCAG
+AATGTGACAGAGTTTGATGGGCAGGATGCTTGTGGCTCCAACAGCTGGACTGTGGTGGAT
+ATTGACCCGCCCCAGAGGTCCAACGACCCCAAGTCTCAGACCCCAAGCCACCCTGGGTGG
+CTGATGCGGGGCCTCAAACCCTGGACCCAATACGCCATCTTTGTGAAGACCTTGGTTACC
+TTCTCTGATGAACGGCGGACCTATGGAGCCAAAAGTGATATCATCTATGTGCAAACAGAT
+GCCACTAATCCTTCTGTCCCCCTGGATCCCATATCAGTTTCTAATTCCTCATCTCAGATT
+ATCTTAAAGTGGAAGCCCCCCTCTGACCCCAATGGCAACATCACACACTACCTGGTGTAC
+TGGGAGAGGCAAGCAGAGGACAGCGAGCTGTTTGAGCTGGATTATTGTCTCAAAGGGCTG
+AAGCTCCCTTCACGGACCTGGTCCCCACCCTTTGAGTCTGATGATTCTCAGAAGCACAAT
+CAGAGTGAGTATGACGACTCGGCCAGTGAGTGCTGCTCATGCCCTAAGACTGACTCTCAG
+ATCCTGAAGGAGCTGGAGGAGTCTTCATTCAGGAAGACCTTCGAGGATTACCTGCACAAC
+GTGGTTTTTGTCCCCAGGCCATCCCGAAAGCGAAGATCCCTTGAAGAGGTGGGGAATGTG
+ACAGCCACCACACTCACACTTCCAGATTTCCCCAACGTCTCCTCTACCATTGTGCCCACA
+AGTCAGGAGGAGCACAGGCCATTTGAGAAAGTGGTGAACAAGGAGTCACTTGTCATCTCT
+GGCCTGAGACACTTCACTGGGTACCGCATTGAGCTGCAGGCATGCAATCAAGATTCCCCA
+GATGAGAGGTGCAGTGTGGCTGCCTACGTCAGTGCCCGGACCATGCCTGAAGCTAAGGCA
+GATGACATCGTTGGCCCTGTGACTCATGAAATCTTTGAGAACAATGTTGTACACTTAATG
+TGGCAAGAGCCAAAGGAACCTAATGGTCTGATTGTGCTATATGAAGTGAGCTATCGCCGA
+TATGGTGATGAGGAGCTGCACCTCTGTGTCTCCCGGAAGCATTTTGCCCTGGAGCGGGGC
+TGCAGGCTGCGAGGGCTCTCCCCAGGAAACTACAGTGTTCGAGTCCGGGCTACCTCTCTG
+GCAGGAAATGGCTCCTGGACAGAACCCACCTATTTTTATGTGACTGATTATTTAGATGTC
+CCATCAAATATTGCCAAAATTATCATTGGACCCCTCATCTTTGTCTTCCTCTTCAGTGTT
+GTGATTGGAAGTATTTATCTATTTCTGAGAAAGAGGCAGCCGGATGGGCCAATGGGACCA
+CTGTATGCATCTTCAAACCCTGAGTACCTCAGTGCCAGTGATGTGTTTCCATCTTCTGTG
+TACGTGCCGGACGAGTGGGAGGTGCCTCGAGAGAAGATCACCCTTCTTCGAGAGCTGGGG
+CAGGGATCCTTTGGTATGGTGTATGAAGGCAATGCCAAGGATATCATCAAGGGTGAGGCA
+GAGACCCGTGTTGCGGTTAAGACTGTCAATGAGTCAGCCAGTCTTCGAGAACGGATCGAG
+TTCCTCAATGAGGCATCAGTCATGAAGGGATTCACCTGCCATCATGTGGTCCGCCTTCTT
+GGGGTGGTATCCAAAGGACAGCCAACGCTGGTAGTGATGGAATTGATGGCTCATGGAGAC
+CTGAAAAGTCACCTCCGTTCTCTGAGGCCAGATGCTGAGAATAACCCAGGCCGCCCTCCC
+CCTACCTTGCAAGAAATGATTCAGATGACAGCAGAAATTGCTGATGGCATGGCATACTTG
+AACGCCAAGAAGTTTGTGCACCGGGACCTGGCAGCTCGAAACTGCATGGTTGCCCATGAT
+TTTACTGTCAAAATTGGAGACTTTGGAATGACAAGGGACATCTACGAGACAGATTACTAT
+CGGAAAGGGGGCAAGGGACTGCTTCCTGTGAGGTGGATGTCACCTGAGTCCCTGAAGGAT
+GGAGTCTTTACTGCTTCTTCTGATATGTGGTCCTTTGGGGTGGTCCTTTGGGAAATCACT
+AGCCTGGCTGAGCAACCTTATCAAGGCCTGTCTAATGAACAGGTGTTGAAGTTTGTCATG
+GATGGAGGCTATCTGGATCCCCCTGATAACTGTCCAGAGAGACTCACTGACCTGATGCGC
+ATGTGCTGGCAGTTCAACCCCAAGATGAGGCCAACCTTCCTGGAAATCGTCAACCTGCTC
+AAGGATGACCTCCACCCCAGCTTTCCAGAAGTTTCCTTCTTCTACAGCGAGGAGAACAAG
+GCTCCTGAGAGTGAGGAGCTGGAGATGGAGTTTGAAGACATGGAGAATGTCCCGTTGGAT
+CGTTCCTCTCACTGTCAGAGAGAAGAGGCTGGGGGCCGGGAGGGAGGGTCCTCACTGAGC
+ATCAAACGGACCTATGATGAACACATCCCCTATACCCACATGAATGGGGGCAAGAAGAAC
+GGACGTGTCCTTACCCTGCCAAGGTCAAACCCTTCCTAA
+>ENSMUST00000207100_musmusculus
+AGGTCCAACGACCCCAAGTCTCAGACCCCAAGCCACCCTGGGTGGCTGATGCGGGGCCTC
+AAACCCTGGACCCAATACGCCATCTTTGTGAAGACCTTGGTTACCTTCTCTGATGAACGG
+CGGACCTATGGAGCCAAAAGTGATATCATCTATGTGCAAACAGATGCCACTAATCCTTCT
+GTCCCCCTGGATCCCATATCAGTTTCTAATTCCTCATCTCAGATTATCTTAAAGTGGAAG
+CCCCCCTCTGACCCCAATGGCAACATCACACACTACCTGGTGTACTGGGAGAGGCAAGCA
+GAGGACAGCGAGCTGTTTGAGCTGGATTATTGTCTCAAAGGGCTGAAGCTCCCTTCACGG
+ACCTGGTCCCCACCCTTTGAGTCTGATGATTCTCAGAAGCACAATCAGAGTGAGTATGAC
+GACTCGGCCAGTGAGTGCTGCTCATGCCCTAAGACTGACTCTCAGATCCTGAAGGAGCTG
+GAGGAGTCTTCATTCAGGAAGACCTTCGAGGATTACCTGCACAACGTGGTTTTTGTCCCC
+AGAAAAACCTCTTCAGGCAATGGTGCCGAGGACAGTAGGCCATCCCGAAAGCGAAGATCC
+CTTGAAGAGGTGGGGAATGTGACAGCCACCACACTCACACTTCCAGATTTCCCCAACGTC
+TCCTCTACCATT
+>ENSRNOT00000041155_rattusnorvegicus
+ATGGGCTCCGGGAGAGGATGTGAGACGACGGCGGTGCCGTTGCTGATGGCCGTGGCCGCG
+TTGCTGGTGGGCACAGCCGGCCACCTGTACCCTGGAGAGGTGTGCCCGGGAATGGACATC
+CGGAACAACCTGACCAGGTTGCATGAGCTGGAGAACTGCTCGGTCATTGAGGGCCATCTG
+CAGATCCTCTTGATGTTCAAGACCAGACCCGAAGATTTCCGAGACCTCAGTTTCCCCAAA
+CTCATCATGATCACAGACTACCTGCTTCTTTTCCGTGTCTATGGCCTAGAAAGTCTAAAA
+GACCTCTTCCCAAACCTCACAGTCATCCGAGGCTCCCGTCTCTTCTTCAACTATGCCCTG
+GTCATCTTCGAGATGGTCCACCTGAAGGAGCTGGGTCTTTACAACCTCATGAACATCACC
+CGGGGCTCTGTCCGCATCGAGAAGAATAATGAACTCTGCTACCTGGCCACTATCGACTGG
+TCCCGCATCCTGGATTCCGTGGAGGACAACTACATTGTACTGAACAAAGATGACAATGAG
+GAATGTGGGGACGTCTGTCCAGGCACAGCCAAGGGCAAGACCAACTGCCCTGCCACCGTC
+ATCAATGGGCAGTTTGTGGAACGGTGCTGGACACACAGTCATTGTCAGAAAGTTTGCCCA
+ACCATCTGTAAGTCACATGGCTGCACAGCTGAAGGCCTGTGCTGTCACAAGGAGTGCCTG
+GGCAACTGTTCAGAACCCGATGACCCTACCAAGTGTGTGGCCTGTCGAAACTTCTACCTG
+GATGGTCAGTGTGTGGAGACCTGCCCACCACCCTACTATCACTTCCAGGATTGGCGCTGT
+GTAAACTTCAGCTTCTGCCAAGACCTTCACTACAAATGCAGGAACTCTCGGAAGCCTGGC
+TGTCACCAATACGTCATTCACAACAACAAGTGCATCCCCGAGTGCCCGTCTGGCTATACC
+ATGAATTCCAGCAACTTGATGTGCACCCCGTGTCTGGGACCCTGTCCTAAGGTCTGCCAA
+ATCCTCGAAGGCGAGAAGACCATTGATTCCGTGACATCTGCCCAGGAGCTCCGAGGCTGC
+ACTGTGATCAATGGCAGCCTGATTATCAACATCCGAGGGGGCAACAACCTGGCAGCTGAA
+CTAGAGGCTAACCTTGGCCTCATTGAAGAAATCTCAGGGTTCCTAAAGATCCGTCGCTCC
+TATGCTCTGGTGTCACTTTCTTTCTTCAGGAAGCTACATCTGATTCGAGGAGAGACCTTG
+GAAATTGGGAACTATTCTTTCTACGCCTTGGACAACCAGAACCTGAGGCAGCTGTGGGAC
+TGGAACAAGCACAACCTCACGATCACTCAGGGCAAGCTCTTCTTCCACTACAACCCCAAA
+CTCTGCCTGTCTGAGATCCACAAGATGGAGGAAGTGTCCGGAACCAAGGGCCGCCAGGAG
+AGGAACGACATTGCCCTGAAGACCAACGGGGACCAGGCATCCTGTGAAAATGAATTACTT
+AAATTCTCTTTCATCCGGACGTCTTTTGACAAGATCTTGCTGAGGTGGGAGCCCTACTGG
+CCCCCCGACTTCCGAGATCTCCTGGGATTCATGCTGTTCTACAAAGAGGCCCCTTATCAG
+AACGTGACAGAGTTTGACGGGCAGGATGCGTGTGGCTCCAACAGCTGGACTGTGGTGGAT
+ATTGACCCGCCCCAGAGGTCCAACGACCCTAAGTCTCAGACCCCAAGCCACCCTGGGTGG
+CTGATGCGGGGCCTCAAACCCTGGACCCAGTATGCCATCTTTGTCAAGACCTTGGTTACC
+TTCTCTGATGAACGCCGGACCTATGGAGCCAAAAGTGATATCATCTATGTGCAAACAGAT
+GCCACCAATCCTTCCGTTCCCCTGGATCCCATATCAGTTTCCAACTCCTCATCTCAGATT
+ATCTTAAAGTGGAAGCCCCCCTCGGACCCCAATGGCAACATCACACACTACCTGGTCTAC
+TGGGAGAGGCAGGCGGAGGACAGCGAGCTGTTCGAGTTGGATTATTGTCTCAAAGGGCTG
+AAGCTCCCCTCACGCACCTGGTCCCCACCTTTTGAGTCTGACGATTCTCAAAAGCACAAT
+CAGAGTGAGTATGACGACTCGGCCAGCGAGTGCTGCTCATGTCCTAAGACTGACTCTCAG
+ATCCTGAAGGAGCTGGAGGAGTCTTCATTCAGGAAGACCTTCGAGGATTACCTGCACAAC
+GTGGTTTTTGTTCCCAGAAAAACCTCTTCAGGCAATGGTGCTGAGGACACTAGGCCATCC
+CGAAAGCGAAGATCCCTTGAAGAGGTGGGCAATGTGACAGCCACTACACCCACACTTCCA
+GATTTTCCCAACATCTCCTCCACCATCGCGCCCACAAGCCACGAAGAGCACAGACCATTT
+GAGAAAGTAGTAAACAAGGAGTCACTTGTCATCTCTGGCCTGAGACACTTCACTGGGTAC
+CGCATTGAGCTGCAGGCATGCAATCAGGACTCCCCAGAAGAGAGGTGCAGCGTGGCTGCC
+TACGTCAGTGCCCGGACCATGCCTGAAGCTAAGGCAGATGACATCGTTGGCCCTGTGACC
+CATGAAATCTTTGAGAACAATGTTGTACACTTAATGTGGCAAGAGCCAAAGGAACCTAAT
+GGTCTGATTGTGCTATATGAAGTGAGCTATCGGCGATATGGTGATGAGGAGCTGCACCTC
+TGTGTCTCCCGGAAGCATTTTGCCCTGGAGCGGGGCTGCAGGCTTCGAGGGCTCTCTCCA
+GGAAACTACAGTGTTCGAGTCCGGGCTACCTCTCTGGCAGGAAATGGCTCCTGGACAGAA
+CCCACCTATTTTTATGTGACTGATTATTTAGATGTCCCATCAAATATTGCCAAAATTATC
+ATCGGGCCCCTCATCTTCGTCTTCCTCTTCAGTGTCGTGATCGGAAGTATTTATCTATTC
+TTGAGGAAGAGGCAGCCAGATGGGCCAATGGGACCACTGTACGCTTCTTCAAACCCAGAG
+TACCTCAGTGCCAGTGATGTCTTTCCATCTTCCGTATACGTTCCGGATGAGTGGGAGGTA
+CCTCGAGAGAAGATCACCCTCCTCCGAGAGCTGGGGCAGGGATCCTTCGGTATGGTGTAC
+GAAGGCAATGCCAAGGATATCATCAAGGGTGAGGTAGAGACCCGTGTTGCGGTGAAGACG
+GTCAATGAGTCAGCCAGTCTTCGAGAACGGATCGAGTTCCTCAATGAGGCATCAGTCATG
+AAGGGCTTCACCTGTCATCACGTGGTCCGCCTTCTTGGGGTGGTGTCCAAAGGCCAGCCC
+ACATTGGTAGTGATGGAACTGATGGCTCATGGAGACCTGAAAAGTCACCTCCGTTCTCTG
+CGGCCCGATGCTGAGAACAACCCAGGCCGTCCTCCCCCTACCTTGCAAGAAATGATTCAG
+ATGACAGCAGAAATTGCCGATGGCATGGCATACTTGAACGCCAAGAAGTTTGTGCACCGG
+GACCTGGCAGCTCGGAACTGCATGGTTGCCCATGATTTTACTGTCAAAATCGGAGACTTT
+GGAATGACGAGAGACATCTACGAGACAGATTACTATCGGAAAGGGGGCAAGGGGTTGCTG
+CCCGTGAGGTGGATGTCACCCGAGTCCCTGAAGGACGGAGTCTTCACTGCTTCTTCCGAC
+ATGTGGTCCTTTGGGGTGGTCCTTTGGGAAATCACCAGCCTGGCTGAGCAACCTTACCAA
+GGCCTGTCTAATGAACAGGTGTTGAAATTTGTCATGGATGGAGGCTATCTGGATCCCCCT
+GATAACTGTCCAGAGAGACTCACTGACCTGATGCGCATGTGCTGGCAGTTCAACCCCAAG
+ATGAGGCCGACCTTCCTGGAAATCGTCAACCTGCTCAAGGACGACCTCCACCCCAGCTTT
+CCGGAAGTTTCCTTCTTCTACAGCGAGGAGAACAAGGCTCCCGAGAGTGAAGAGCTGGAG
+ATGGAGTTCGAGGACATGGAGAATGTCCCCTTGGATCGTTCCTCTCACTGTCAGAGAGAA
+GAGGCTGGATGCCGGGAGGGAGGGTCCTCTCTGAGCATCAAACGGACCTATGATGAACAC
+ATCCCCTACACCCACATGAACGGGGGCAAGAAGAATGGGCGGGTCCTCACCCTGCCGAGG
+TCGAACCCTTCCTAA
+>ENSRNOT00000067448_rattusnorvegicus
+ATGGGCTCCGGGAGAGGATGTGAGACGACGGCGGTGCCGTTGCTGATGGCCGTGGCCGTT
+GCTGGTGGCACAGCCGGCCACCTGTACCCTGGAGAGGTGTGCCCGGGAATGGACATCCGG
+AACAACCTGACCAGGTTGCATGAGCTGGAGAACTGCTCGGTCATTGAGGGCCATCTGCAG
+ATCCTCTTGATGTTCAAGACCAGACCCGAAGATTTCCGAGACCTCAGTTTCCCCAAACTC
+ATCATGATCACAGACTACCTGCTTCTTTTCCGTGTCTATGGCCTAGAAAGTCTAAAAGAC
+CTCTTCCCAAACCTCACAGTCATCCGAGGCTCCCGTCTCTTCTTCAACTATGCCCTGGTC
+ATCTTCGAGATGGTCCACCTGAAGGAGCTGGGTCTTTACAACCTCATGAACATCACCCGG
+GGCTCTGTCCGCATCGAGAAGAATAATGAACTCTGCTACCTGGCCACTATCGACTGGTCC
+CGCATCCTGGATTCCGTGGAGGACAACTACATTGTACTGAACAAAGATGACAATGAGGAA
+TGTGGGGACGTCTGTCCAGGCACAGCCAAGGGCAAGACCAACTGCCCTGCCACCGTCATC
+AATGGGCAGTTTGTGGAACGGTGCTGGACACACAGTCATTGTCAGAAAGTTTGCCCAACC
+ATCTGTAAGTCACATGGCTGCACAGCTGAAGGCCTGTGCTGTCACAAGGAGTGCCTGGGC
+AACTGTTCAGAACCCGATGACCCTACCAAGTGTGTGGCCTGTCGAAACTTCTACCTGGAT
+GGTCAGTGTGTGGAGACCTGCCCACCACCCTACTATCACTTCCAGGATTGGCGCTGTGTA
+AACTTCAGCTTCTGCCAAGACCTTCACTACAAATGCAGGAACTCTCGGAAGCCTGGCTGT
+CACCAATACGTCATTCACAACAACAAGTGCATCCCCGAGTGCCCGTCTGGCTATACCATG
+AATTCCAGCAACTTGATGTGCACCCCGTGTCTGGGACCCTGTCCTAAGGTCTGCCAAATC
+CTCGAAGGCGAGAAGACCATTGATTCCGTGACATCTGCCCAGGAGCTCCGAGGCTGCACT
+GTGATCAATGGCAGCCTGATTATCAACATCCGAGGGGGCAACAACCTGGCAGCTGAACTA
+GAGGCTAACCTTGGCCTCATTGAAGAAATCTCAGGGTTCCTAAAGATCCGTCGCTCCTAT
+GCTCTGGTGTCACTTTCTTTCTTCAGGAAGCTACATCTGATTCGAGGAGAGACCTTGGAA
+ATTGGGAACTATTCTTTCTACGCCTTGGACAACCAGAACCTGAGGCAGCTGTGGGACTGG
+AACAAGCACAACCTCACGATCACTCAGGGCAAGCTCTTCTTCCACTACAACCCCAAACTC
+TGCCTGTCTGAGATCCACAAGATGGAGGAAGTGTCCGGAACCAAGGGCCGCCAGGAGAGG
+AACGACATTGCCCTGAAGACCAACGGGGACCAGGCATCCTGTGAAAATGAATTACTTAAA
+TTCTCTTTCATCCGGACGTCTTTTGACAAGATCTTGCTGAGGTGGGAGCCCTACTGGCCC
+CCCGACTTCCGAGATCTCCTGGGATTCATGCTGTTCTACAAAGAGGCCCCTTATCAGAAC
+GTGACAGAGTTTGACGGGCAGGATGCGTGTGGCTCCAACAGCTGGACTGTGGTGGATATT
+GACCCGCCCCAGAGGTCCAACGACCCTAAGTCTCAGACCCCAAGCCACCCTGGGTGGCTG
+ATGCGGGGCCTCAAACCCTGGACCCAGTATGCCATCTTTGTCAAGACCTTGGTTACCTTC
+TCTGATGAACGCCGGACCTATGGAGCCAAAAGTGATATCATCTATGTGCAAACAGATGCC
+ACCAATCCTTCCGTTCCCCTGGATCCCATATCAGTTTCCAACTCCTCATCTCAGATTATC
+TTAAAGTGGAAGCCCCCCTCGGACCCCAATGGCAACATCACACACTACCTGGTCTACTGG
+GAGAGGCAGGCGGAGGACAGCGAGCTGTTCGAGTTGGATTATTGTCTCAAAGGGCTGAAG
+CTCCCCTCACGCACCTGGTCCCCACCTTTTGAGTCTGACGATTCTCAAAAGCACAATCAG
+AGTGAGTATGACGACTCGGCCAGCGAGTGCTGCTCATGTCCTAAGACTGACTCTCAGATC
+CTGAAGGAGCTGGAGGAGTCTTCATTCAGGAAGACCTTCGAGGATTACCTGCACAACGTG
+GTTTTTGTTCCCAGAAAAACCTCTTCAGGCAATGGTGCTGAGGACACTAGGCCATCCCGA
+AAGCGAAGATCCCTTGAAGAGGTGGGCAATGTGACAGCCACTACACCCACACTTCCAGAT
+TTTCCCAACATCTCCTCCACCATCGCGCCCACAAGCCACGAAGAGCACAGACCATTTGAG
+AAAGTAGTAAACAAGGAGTCACTTGTCATCTCTGGCCTGAGACACTTCACTGGGTACCGC
+ATTGAGCTGCAGGCATGCAATCAGGACTCCCCAGAAGAGAGGTGCAGCGTGGCTGCCTAC
+GTCAGTGCCCGGACCATGCCTGAAGCTAAGGCAGATGACATCGTTGGCCCTGTGACCCAT
+GAAATCTTTGAGAACAATGTTGTACACTTAATGTGGCAAGAGCCAAAGGAACCTAATGGT
+CTGATTGTGCTATATGAAGTGAGCTATCGGCGATATGGTGATGAGGAGCTGCACCTCTGT
+GTCTCCCGGAAGCATTTTGCCCTGGAGCGGGGCTGCAGGCTTCGAGGGCTCTCTCCAGGA
+AACTACAGTGTTCGAGTCCGGGCTACCTCTCTGGCAGGAAATGGCTCCTGGACAGAACCC
+ACCTATTTTTATGTGACTGATTATTTAGATGTCCCATCAAATATTGCCAAAATTATCATC
+GGGCCCCTCATCTTCGTCTTCCTCTTCAGTGTCGTGATCGGAAGTATTTATCTATTCTTG
+AGGAAGAGGCAGCCAGATGGGCCAATGGGACCACTGTACGCTTCTTCAAACCCAGAGTAC
+CTCAGTGCCAGTGATGTCTTTCCATCTTCCGTATACGTTCCGGATGAGTGGGAGGTACCT
+CGAGAGAAGATCACCCTCCTCCGAGAGCTGGGGCAGGGATCCTTCGGTATGGTGTACGAA
+GGCAATGCCAAGGATATCATCAAGGGTGAGGTAGAGACCCGTGTTGCGGTGAAGACGGTC
+AATGAGTCAGCCAGTCTTCGAGAACGGATCGAGTTCCTCAATGAGGCATCAGTCATGAAG
+GGCTTCACCTGTCATCACGTGGTCCGCCTTCTTGGGGTGGTGTCCAAAGGCCAGCCCACA
+TTGGTAGTGATGGAACTGATGGCTCATGGAGACCTGAAAAGTCACCTCCGTTCTCTGCGG
+CCCGATGCTGAGAACAACCCAGGCCGTCCTCCCCCTACCTTGCAAGAAATGATTCAGATG
+ACAGCAGAAATTGCCGATGGCATGGCATACTTGAACGCCAAGAAGTTTGTGCACCGGGAC
+CTGGCAGCTCGGAACTGCATGGTTGCCCATGATTTTACTGTCAAAATCGGAGACTTTGGA
+ATGACGAGAGACATCTACGAGACAGATTACTATCGGAAAGGGGGCAAGGGGTTGCTGCCC
+GTGAGGTGGATGTCACCCGAGTCCCTGAAGGACGGAGTCTTCACTGCTTCTTCCGACATG
+TGGTCCTTTGGGGTGGTCCTTTGGGAAATCACCAGCCTGGCTGAGCAACCTTACCAAGGC
+CTGTCTAATGAACAGGTGTTGAAATTTGTCATGGATGGAGGCTATCTGGATCCCCCTGAT
+AACTGTCCAGAGAGACTCACTGACCTGATGCGCATGTGCTGGCAGTTCAACCCCAAGATG
+AGGCCGACCTTCCTGGAAATCGTCAACCTGCTCAAGGACGACCTCCACCCCAGCTTTCCG
+GAAGTTTCCTTCTTCTACAGCGAGGAGAACAAGGCTCCCGAGAGTGAAGAGCTGGAGATG
+GAGTTCGAGGACATGGAGAATGTCCCCTTGGATCGTTCCTCTCACTGTCAGAGAGAAGAG
+GCTGGATGCCGGGAGGGAGGGTCCTCTCTGAGCATCAAACGGACCTATGATGAACACATC
+CCCTACACCCACATGAACGGGGGCAAGAAGAATGGGCGGGTCCTCACCCTGCCGAGGTCG
+AACCCTTCCTAA
+>ENSSSCT00000014817_susscrofa
+GTGTGCCCAGGGATGGATATCCGGAATAACCTTACACGGCTGCACGAGTTGGCCAACTGC
+TCGGTCATCGAAGGACATTTGCAGATCCTGTTGATGTTCAAAACGCGGCCCGAGGATTTC
+CGAGACCTCAGTTTCCCCAAACTCATCATGATCACTGATTACTTGCTGCTCTTCCGGGTC
+TACGGGCTGGAGAGCCTGAAGGACCTGTTCCCCAACCTCACCGTCATCCGGGGCTCACGC
+CTCTTCTTTAACTATGCGCTGGTCATCTTTGAGATGGTTCACTTGAAGGAGCTTGGCCTC
+TACAATTTGATGAACATCACCAGGGGTGCTGTCCGCATCGAGAAGAACAATGAGCTCTGC
+TACCTGGCGACCATTGACTGGTCGCGCATCCTGGACTCTGTGGAGGATAATTACATTGTG
+CTGAACAAAGACGACAACGAGGAGTGTGGGGACATTTGCCCAGGCACTGCGAAGGGCAAG
+ACCAATTGCCCTGCCACCGTCATCAATGGGCAATTTGTCGAGCGGTGTTGGACGCACAGT
+CACTGCCAGAAAGTGTGCCCGACCATCTGTAAGTCGCACGGCTGCACTGCTGAGGGCCTC
+TGCTGTCACAGCGAGTGTTTGGGCAACTGCTCTGAGCCAGACGACCCCACCAAGTGCGTG
+GCCTGCCGCAACTTCTACCTGGACGGCAGATGCGTGGAGACCTGCCCGCCCCCCTACTAC
+CACTTCCAAGACTGGCGCTGCGTGAACTTCAGCTTCTGCCAGGACCTGCACAACAAATGC
+AAGAACTCAAGGAGGCAGGGCTGCCACCAGTACGTCATTCACAACAACAAGTGTATCCCT
+GAGTGCCCCTCAGGGTACACGATGAATTCCAGCAACTTGATGTGCACTCCGTGCCTAGGC
+CCCTGTCCCAAAGTGTGTCACCTCCTGGAAGGCGAGAAGACCATCGACTCAGTGACATCC
+GCCCAGGAGCTCCGAGGCTGCACCATTATCAACGGGAGCCTAATCATCAACATTCGAGGA
+GGCAACAACCTGGCAGCCGAACTAGAGGCCAACCTTGGACTCATTGAGGAGATTTCAGGG
+TACCTGAAAATCCGCCGATCCTATGCCCTCGTGTCACTTTCCTTCTTCCGGAAGTTGCGT
+CTGATCCGAGGGGAGACGTTGGAAATTGGGAACTATTCTTTCTATGCCTTGGACAACCAG
+AACCTAAGGCAACTGTGGGACTGGAGCAAACACAACCTCACCATCACTCAGGGGAAACTC
+TTCTTCCATTATAATCCCAAACTCTGCTTGTCGGAAATTCACAAGATGGAGGAAGTTTCT
+GGAACCAAGGGGCGCCAGGAGAGAAATGATATTGCCCTGAAGACCAATGGGGACCAGGCG
+TCCTGTGAAAATGAGTTACTTAAATTTTCTTACATTCGGACATCTTATGACAAGATCTTG
+CTGAAGTGGGAGCCGTATTGGCCCCCCGACTTCCGAGACCTCCTGGGGTTCATGCTCTTC
+TACAAAGAGGCCCCTTATCAGAACGTGACGGAGTTTGACGGGCAGGATGCGTGTGGCTCC
+AACAGCTGGACGGTGGTGGACATTGACCCGCCTACGAGGTCCAATGACCCCAAGTCCCAG
+AACCATCCTGGGTGGCTGATGCGTGGTCTCAAGCCCTGGACCCAGTATGCCATCTTTGTC
+AAGACTTTGGTCACCTTTTCTGATGAACGACGCACCTATGGAGCCAAGAGTGACATCATC
+TACGTCCAGACAGATGCCACAAGTAAGCATGTC
+
diff -r b3ba0c84667c -r 56bbdbfe3eaa test-data/test4.ns.fasta
diff -r b3ba0c84667c -r 56bbdbfe3eaa test-data/test4.sqlite
Binary file test-data/test4.sqlite has changed
diff -r b3ba0c84667c -r 56bbdbfe3eaa test-data/test5.ns.fasta
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/test5.ns.fasta	Wed Apr 25 11:00:33 2018 -0400
@@ -0,0 +1,423 @@
+>ENST00000338702_homosapiens
+ATGGAGAATCAAGAGAAGGCGAGTATCGCGGGCCACATGTTCGACGTAGTCGTGATCGGA
+GGTGGCATTTCAGGACTATCTGCTGCCAAACTCTTGACTGAATATGGCGTTAGTGTTTTG
+GTTTTAGAAGCTCGGGACAGGGTTGGAGGAAGAACATATACTATAAGGAATGAGCATGTT
+GATTACGTAGATGTTGGTGGAGCTTATGTGGGACCAACCCAAAACAGAATCTTACGCTTG
+TCTAAGGAGCTGGGCATAGAGACTTACAAAGTGAATGTCAGTGAGCGTCTCGTTCAATAT
+GTCAAGGGGAAAACATATCCATTTCGGGGCGCCTTTCCACCAGTATGGAATCCCATTGCA
+TATTTGGATTACAATAATCTGTGGAGGACAATAGATAACATGGGGAAGGAGATTCCAACT
+GATGCACCCTGGGAGGCTCAACATGCTGACAAATGGGACAAAATGACCATGAAAGAGCTC
+ATTGACAAAATCTGCTGGACAAAGACTGCTAGGCGGTTTGCTTATCTTTTTGTGAATATC
+AATGTGACCTCTGAGCCTCACGAAGTGTCTGCCCTGTGGTTCTTGTGGTATGTGAAGCAG
+TGCGGGGGCACCACTCGGATATTCTCTGTCACCAATGGTGGCCAGGAACGGAAGTTTGTA
+GGTGGATCTGGTCAAGTGAGCGAACGGATAATGGACCTCCTCGGAGACCAAGTGAAGCTG
+AACCATCCTGTCACTCACGTTGACCAGTCAAGTGACAACATCATCATAGAGACGCTGAAC
+CATGAACATTATGAGTGCAAATACGTAATTAATGCGATCCCTCCGACCTTGACTGCCAAG
+ATTCACTTCAGACCAGAGCTTCCAGCAGAGAGAAACCAGTTAATTCAGCGGCTTCCAATG
+GGAGCTGTCATTAAGTGCATGATGTATTACAAGGAGGCCTTCTGGAAGAAGAAGGATTAC
+TGTGGCTGCATGATCATTGAAGATGAAGATGCTCCAATTTCAATAACCTTGGATGACACC
+AAGCCAGATGGGTCACTGCCTGCCATCATGGGCTTCATTCTTGCCCGGAAAGCTGATCGA
+CTTGCTAAGCTACATAAGGAAATAAGGAAGAAGAAAATCTGTGAGCTCTATGCCAAAGTG
+CTGGGATCCCAAGAAGCTTTACATCCAGTGCATTATGAAGAGAAGAACTGGTGTGAGGAG
+CAGTACTCTGGGGGCTGCTACACGGCCTACTTCCCTCCTGGGATCATGACTCAATATGGA
+AGGGTGATTCGTCAACCCGTGGGCAGGATTTTCTTTGCGGGCACAGAGACTGCCACAAAG
+TGGAGCGGCTACATGGAAGGGGCAGTTGAGGCTGGAGAACGAGCAGCTAGGGAGGTCTTA
+AATGGTCTCGGGAAGGTGACCGAGAAAGATATCTGGGTACAAGAACCTGAATCAAAGGAC
+GTTCCAGCGGTAGAAATCACCCACACCTTCTGGGAAAGGAACCTGCCCTCTGTTTCTGGC
+CTGCTGAAGATCATTGGATTTTCCACATCAGTAACTGCCCTGGGGTTTGTGCTGTACAAA
+TACAAGCTCCTGCCACGGTCTTGA
+>ENST00000542639_homosapiens
+ATGGGGAAGGAGATTCCAACTGATGCACCCTGGGAGGCTCAACATGCTGACAAATGGGAC
+AAAATGACCATGAAAGAGCTCATTGACAAAATCTGCTGGACAAAGACTGCTAGGCGGTTT
+GCTTATCTTTTTGTGAATATCAATGTGACCTCTGAGCCTCACGAAGTGTCTGCCCTGTGG
+TTCTTGTGGTATGTGAAGCAGTGCGGGGGCACCACTCGGATATTCTCTGTCACCAATGGT
+GGCCAGGAACGGAAGTTTGTAGGTGGATCTGGTCAAGTGAGCGAACGGATAATGGACCTC
+CTCGGAGACCAAGTGAAGCTGAACCATCCTGTCACTCACGTTGACCAGTCAAGTGACAAC
+ATCATCATAGAGACGCTGAACCATGAACATTATGAGTGCAAATACGTAATTAATGCGATC
+CCTCCGACCTTGACTGCCAAGATTCACTTCAGACCAGAGCTTCCAGCAGAGAGAAACCAG
+TTAATTCAGCGGCTTCCAATGGGAGCTGTCATTAAGTGCATGATGTATTACAAGGAGGCC
+TTCTGGAAGAAGAAGGATTACTGTGGCTGCATGATCATTGAAGATGAAGATGCTCCAATT
+TCAATAACCTTGGATGACACCAAGCCAGATGGGTCACTGCCTGCCATCATGGGCTTCATT
+CTTGCCCGGAAAGCTGATCGACTTGCTAAGCTACATAAGGAAATAAGGAAGAAGAAAATC
+TGTGAGCTCTATGCCAAAGTGCTGGGATCCCAAGAAGCTTTACATCCAGTGCATTATGAA
+GAGAAGAACTGGTGTGAGGAGCAGTACTCTGGGGGCTGCTACACGGCCTACTTCCCTCCT
+GGGATCATGACTCAATATGGAAGGGTGATTCGTCAACCCGTGGGCAGGATTTTCTTTGCG
+GGCACAGAGACTGCCACAAAGTGGAGCGGCTACATGGAAGGGGCAGTTGAGGCTGGAGAA
+CGAGCAGCTAGGGAGGTCTTAAATGGTCTCGGGAAGGTGACCGAGAAAGATATCTGGGTA
+CAAGAACCTGAATCAAAGGACGTTCCAGCGGTAGAAATCACCCACACCTTCTGGGAAAGG
+AACCTGCCCTCTGTTTCTGGCCTGCTGAAGATCATTGGATTTTCCACATCAGTAACTGCC
+CTGGGGTTTGTGCTGTACAAATACAAGCTCCTGCCACGGTCTTGA
+>ENSPTRT00000040520_pantroglodytes
+ATGGAGAATCAAGAGAAGGCGAGTATCGCGGGCCACATGTTCGACGTAGTCGTGATCGGA
+GGTGGCATTTCAGGACTATCTGCTGCCAAACTCTTGACTGAATATGGCGTTAGTGTTTTA
+GTTTTAGAAGCTCGGGACAGGGTTGGAGGAAGAACATATACTATAAGGAATGAGCATGTT
+GATTACGTAGATGTTGGTGGAGCTTATGTGGGACCAACCCAAAACAGAATCTTACGCTTG
+TCTAAGGAGCTGGGCATAGAGACTTACAAAGTGAATGTCAGTGAGCGTCTCGTTCAATAT
+GTCAAGGGGAAAACATATCCATTTCGGGGCGCCTTTCCACCAGTATGGAATCCCATTGCA
+TATTTGGATTACAATAATCTGTGGCGGACAATAGATAACATGGGGAAGGAGATTCCAAAT
+GATGCACCCTGGGAGGCTCAACATGCTGACGAATGGGACAAAATGACCATGAAAGAGCTC
+ATTGACAAAATCTGCTGGACAAAGACTGCTAGGCGGTTTGCTTATCTTTTTGTGAATATC
+AATGTGACCTCTGAGCCTCACGAAGTGTCTGCCCTGTGGTTCTTGTGGTATGTGAAGCAG
+TGCGGGGGCACCACTCGGATATTCTCTGTCACCAATGGCGGCCAGGAACGGAAGTTTGTA
+GGTGGATCTGGTCAAGTGAGCGAACGGATAATGGACCTCCTTGGAGACCAAGTGAAGCTG
+AACCATCCTGTCACTCATGTTGACCAGTCAAGTGACAACATCATCATAGAGACACTGAAC
+CATGAACATTATGAGTGCAAATACGTAATTAATGCGATCCCTCCGACCTTGACTGCCAAG
+ATTCACTTCAGACCAGAGCTTCCAGCAGAGAGAAACCAGTTAATTCAGCGTCTTCCAATG
+GGAGCTATCATTAAGTGCATGATGTATTACAAGGAGGCCTTCTGGAAGAAGAAGGATTAC
+TGTGGCTGCATGATCATTGAAGATGAAGATGCCCCAATTTCAATAACCTTGGATGACACC
+AAGCCAGATGGGTCACTGCCTGCCATCATGGGCTTCATTCTTGCCCGGAAAGCTGATCGA
+CTTGCTAAGCTACATAAGGAAATAAGGAAGAAGAAAATCTGTGAGCTCTATGCCAAAGTG
+CTGGGATCCCAAGAAGCTTTACATCCAGTGCATTATGAAGAGAAGAACTGGTGTGAGGAG
+CAGTACTCTGGGGGCTGCTACACGGCCTACTTCCCTCCTGGGATCATGACTCAATATGGA
+AGGGTGATTCGTCAACCCGTGGGCAGGATTTTCTTTGCGGGCACAGAGACTGCCACAAAG
+TGGAGCGGCTACATGGAAGGGGCAGTTGAGGCTGGAGAACGAGCAGCTAGGGAGGTCTTA
+AATGGTCTCGGGAAGGTGACCGAGAAAGACATCTGGGTACAAGAACCTGAATCAAAGGAC
+GTTCCAGCGGTAGAAATCACGCACACCTTCTGGGAAAGGAACCTGCCCTCTGTTTCTGGC
+CTGCTGAAGATCATTGGATTTTCCACATCAGTAACTACCCTGGGGTTTGTGCTGTACAAA
+TACAAGCTCCTGCCACGGTCTTGA
+>ENSSSCT00000013404_susscrofa
+ATGGAGCGTCAGGAGAAGGCGAACAACGCGGGCCACATGGTCGACGTAGTCGTGATAGGA
+GGCGGCATCTCAGGATTATCTGCTGCCAAACTCTTAAATGAATATGGAATTAATGTTTTG
+GTTTTAGAAGCCCGGGACAGAGTTGGAGGAAGAACATACACAGTGAGGAACGAAAATGTT
+GATTACGTGGACGTTGGTGGGGCTTATGTCGGACCGACCCAGAATAGGATCTTAAGGTTA
+TCTAAGGAACTGGGTTTAGAAACTTACAAAGTGAATGTAAATGAGTGTCTCGTTCAGTAT
+GTCAAGGGGAAATCTTATCCATTTCGGGGTGCCTTCCCTCCAGTCTGGAATCCCATTGCC
+TATCTGGATTACAACAACCTGTGGCGGACAATGGATGACATGGGAAAGAAGATTCCAGCT
+GATGCACCATGGGAGTCTCCGCATGCAGAGGAATGGGATAAGATGACCATGAAAGATCTC
+ATCGATAAAATCTGTTGGACAAAGACTGCTAAACGGTTTGCATCTCTCTTTGTAAATATC
+AATGTGACCTCCGAACCCCACGAAGTGTCTGCCCTGTGGTTTTTGTGGTATGTGAAGCAG
+TGTGGAGGCACCACCCGGATATTCTCTGTTACCAACGGGGGCCAGGAACGGAAGTTTGTA
+GGCGGATCTGGTCAAGTAAGCGAACGGATAATGCACCTCCTCGGGGACAGAGTGAAGCTG
+AGGTGTCCTGTCACCTATGTTGACCAGTCAGGTGACAACATCATCGTAGAGACATTGAAT
+CATGAACTTTATGAGTGCCAATACGTAATTAGTGCCATCCCTCCAACTCTGACTGCCAAG
+ATACACTTCAGACCGGAGCTTCCGTCAGAAAGAAACCAGTTAATTCAGCGTCTTCCGATG
+GGGGCTATCATTAAGTGCATGATGTATTACAAGGAGGCCTTTTGGAAGAAGAAGAATTAC
+TGTGGCTGTATGATCATCGAAGATGAGGAAGCTCCGATTTCAATAACTCTAGATGACACC
+AAGCCAGATGGATCGCTGCCCGCCATCATGGGCTTCATCCTTGCTCGAAAAGCTGACCGC
+CTTGCTAAGGTTCATAAAGAAATAAGAAAGCGGAAAATCTGTGAGCTCTACGCCAAAGTG
+CTAGGATCTCAAGAAGCTTTACATCCCGTGCACTATGAAGAGAAGAACTGGTGTGAGGAG
+CAGTACTCGGGGGGCTGCTACACTGCCTACTTCCCCCCTGGGATCATGACTCAGTATGGA
+AGGGTGATCCGCCAGCCCGTAGGCAGGATATTCTTTGCTGGCACCGAGACTGCCACACAA
+TGGAGCGGTTACATGGAAGGAGCAGTAGAAGCCGGCGAACGGGCGGCTAGAGAGATCTTG
+AATGCTTTGGGGAAGGTGTCAAAGAAAGACATATGGCTTCGAGAACCTGAATCAGAGGAT
+GTTCCAGCTTTTGAGATCACCCGCACCTTCTGGGAGAGAAACCTGCCTTCCGTGACCGGG
+CTGCTTAAGATCATCGGATTTTCCACCTCGGTAACTGCCCTGTGGCTTGCCGTGTACAAA
+TTCAGGCTGCTGACCCGATCCTGA
+>ENSSSCT00000035258_susscrofa
+TCGCTGCCCGCCATCATGGGCTTCATCCTTGCTCGAAAAGCTGACCGCCTTGCTAAGGTT
+CATAAAGAAATAAGAAAGCGGAAAATCTGTGAGCTCTACGCCAAAGTGCTAGGATCTCAA
+GAAGCTTTACATCCCGTGCACTATGAAGAGAAGAACTGGTGTGAGGAGCAGTACTCGGGG
+GGCTGCTACACTGCCTACTTCCCCCCTGGGATCATGACTCAGTATGGAAGGGTGATCCGC
+CAGCCCGTAGGCAGGATATTCTTTGCTGGCACCGAGACTGCCACACAATGGAGCGGTTAC
+ATGGAAGGAGCAGTAGAAGCCGGCGAACGGGCGGCTAGAGAGGATGTTCCAGCTTTTGAG
+ATCACCCGCACCTTCTGGGAGAGAAACCTGCCTTCCGTGACCGGGCTGCTTAAGATCATC
+GGATTTTCCA
+>ENSSSCT00000032764_susscrofa
+ATGGATGACATGGGAAAGAAGATTCCAGCTGATGCACCATGGGAGTCTCCGCATGCAGAG
+GAATGGGATAAGATGACCATGAAAGATCTCATCGATAAAATCTGTTGGACAAAGACTGCT
+AAACGGTTTGCATCTCTCTTTGTAAATATCAATGTGACCTCCGAACCCCACGAAGTGTCT
+GCCCTGTGGTTTTTGTGGTATGTGAAGCAGTGTGGAGGCACCACCCGGATATTCTCTGTT
+ACCAACGGGGGCCAGGAACGGAAGTTTGTAGGCGGATCTGGTCAAGTAAGCGAACGGATA
+ATGCACCTCCTCGGGGACAGAGTGAAGCTGAGGTGTCCTGTCACCTATGTTGACCAGTCA
+GGTGACAACATCATCGTAGAGACATTGAATCATGAACTTTATGAGTGCCAATACGTAATT
+AGTGCCATCCCTCCAACTCT
+>ENSCAFT00000022939_canisfamiliaris
+ATGGCGAGTAGAGAGAAGACGAGTATCGAGGGCCACATGTTTGACGTAGTCGTGATAGGA
+GGCGGCATCTCAGGATTGTCTGCTGCCAAACTCTTAGCCGAACATGAAGTTGATGTCTTA
+GTTTTAGAAGCACGAGATAGAGTTGGAGGAAGAACATACACCGTGAGGAATGAACATGTC
+GATTACGTAGATGTTGGTGGGGCTTATGTAGGACCAACTCAGAACAGAATCTTACGACTA
+TCTAAGGAGCTGGGTCTAGAGACTTACAAAGTGAACGTAAATGAGCGTCTTGTACAGTAT
+GTCAAGGGGAAAACTTACCCATTCCGAGGAGCCTTTCCTCCGGTATGGAATCCTATCGCA
+TATTTGGATTACAACAACCTGTGGCGGACAATGGATAACATGGGGAAGGAGATTCCAGCA
+GATGCACCATGGGAGGCCCCACATGCCGAGGAATGGGACAAGATGACTATGAAGGATCTT
+ATCGATAAAATCTGCTGGACAAAGACTGCTAGGAGGTTTGCATCCCTCTTTGTGAATATC
+AATGTGACCTCTGAGCCCCACGAGGTGTCTGCGCTCTGGTTCCTGTGGTATGTGAAGCAG
+TGCGGAGGTACCACTCGGATATTCTCGGTGACCAATGGAGGCCAGGAACGGAAGTTTGTG
+GGAGGATCCGGTCAAGTGAGTGAACGGATAATGGAGCGCCTTGGGGACAGAGTCAAGCTG
+AAGCGCCCTGTCACCTATGTTGACCAGTCAGATGACAACATCATCATAGAGACACTGAAT
+CATGAACTTTATGAGTGCAAATACGTGATTAGTGCCATCCCTCCAACTTTGACTGCCAAG
+ATCCACTTCAGACCAGAGCTTCCATCAGAGAGAAATCAGTTAATTCAGCGTCTTCCAATG
+GGAGCTATCATCAAGTGTATGATGTATTACAAGGAGGCCTTTTGGAAGAAGAAGGATTAC
+TGTGGCTGTATGATCATTGAAGACGAGGAAGCTCCAATTTCAATAACCCTGGATGACACC
+AAGCCAGATGGATCACTGCCCGCTATCATGGGCTTCATACTTGCCAGAAAAGCTGACCGA
+CTTGCCAAGCTCCATAAAGAAATAAGGAAGAGGAAAATCTGTGAGCTCTATGCCAAAGTG
+CTAGGATCCCAAGAAGCTTTACAACCCGTACACTATGAAGAGAAGAACTGGTGCGAGGAG
+CAGTACTCCGGGGGCTGCTATACCGCCTACTTCCCCCCTGGGATCATGACTCACTACGGA
+AGGGTGATCCGCCAGCCATTTGGCAGGATTTACTTTGCTGGCACTGAGACGGCAACACAC
+TGGAGCGGTTATATGGAAGGAGCTGTAGAGGCTGGGGAACGGACAGCTAGAGAGGTCTTA
+AATGCTCTCGGGAGGGTGGCAGAGAAAGACCTGAAGACCCAGGAACCTGAATCAAAGGAT
+GTTCCAGCTATGGAAATCACCCACACCTTCTGGGAGAGGAACCTGCCATCGGTGACAGGC
+CTGCTGAAGCTCATTGGATTTACCACATCAGTAACTGCCCTGTGGATTGTGGCGTACAAA
+TTCAGGCTGCTGAGACGATCCTGA
+>ENSMUST00000026013_musmusculus
+ATGACGGATCTGGAGAAGCCCAGTATCACAGGCCACATGTTCGACGTAGTCGTGATTGGA
+GGCGGCATCTCAGGATTGGCTGCTGCCAAACTATTGTCAGAATACAAAATTAATGTCTTG
+GTTCTGGAAGCCCGGGATAGAGTTGGAGGAAGAACATATACTGTGAGGAATGAGCATGTT
+AAATGGGTAGATGTTGGTGGAGCTTATGTGGGACCAACCCAGAACAGAATCTTACGCTTG
+TCTAAGGAGCTAGGCATAGAGACCTATAAAGTGAATGTCAATGAGCGTCTAGTTCAATAT
+GTCAAGGGGAAAACTTACCCATTCCGTGGTGCATTTCCACCTGTGTGGAACCCCTTGGCA
+TATTTGGATTACAACAACCTGTGGAGGACAATGGATGATATGGGAAAAGAGATCCCTGTT
+GATGCACCATGGCAAGCAAGACATGCTGAGGAATGGGACAAGATAACCATGAAAGATCTC
+ATTGATAAAATCTGTTGGACAAAAACTGCTCGAGAATTTGCTTATCTTTTTGTGAACATT
+AATGTGACTTCTGAGCCTCATGAGGTATCTGCCCTGTGGTTCTTGTGGTATGTGAGGCAG
+TGTGGAGGTACCTCTCGGATATTCTCAGTCACCAATGGCGGCCAGGAACGGAAATTTGTA
+GGTGGCTCTGGCCAAATAAGTGAACAGATAATGGTCCTCCTTGGGGATAAAGTGAAGCTG
+AGCTCTCCTGTTACTTATATTGACCAAACAGATGACAACATCATTATAGAAACACTGAAT
+CATGAGCACTATGAGTGCAAATATGTAATTAGTGCCATCCCACCGGTTTTGACTGCCAAG
+ATCCACTTTAAACCAGAGCTTCCACCTGAGAGAAACCAATTAATTCAGCGTCTTCCAATG
+GGGGCTGTCATCAAGTGCATGGTGTATTACAAGGAAGCCTTCTGGAAGAAAAAGGACTAT
+TGTGGCTGCATGATAATTGAAGATGAGGAGGCTCCAATTTCAATCACTCTGGATGACACT
+AAACCAGATGGGTCAATGCCTGCCATCATGGGCTTCATACTTGCCCGGAAAGCTGAACGA
+CTTGCTAAACTACATAAAGACATAAGGAAGAGGAAAATCTGTGAGCTGTATGCCAAAGTT
+CTGGGATCTCAAGAAGCTTTATCTCCCGTCCATTATGAAGAGAAGAACTGGTGTGAGGAG
+CAGTACTCCGGGGGCTGCTACACAGCCTACTTCCCTCCTGGTATCATGACTCTGTATGGA
+AGGGTGATTCGGCAGCCAGTAGGCAGGATTTACTTTGCAGGCACAGAGACAGCAACACAG
+TGGAGTGGCTACATGGAAGGTGCAGTTGAAGCTGGAGAACGAGCAGCTAGAGAGGTCTTG
+AATGCTCTAGGAAAAGTTGCCAAGAAGGATATATGGGTTCAAGAGCCTGAGTCCAAGGAT
+GTTCCAGCTCTTGAAATTACCCACACCTTCTTAGAGAGGAACCTGCCTTCCGTGCCTGGT
+CTGCTCAAGATCACTGGTTTTTCCACTTCTGTGGCTCTTCTCTGCTTTGTATTGTACAAG
+TTTAAACAGCCCCAGTCCTGA
+>ENSRNOT00000066674_rattusnorvegicus
+ATGACGGATCTGGAGAAGCCCAATCTCGCAGGCCACATGTTCGACGTAGTCGTGATTGGA
+GGCGGCATCTCAGGATTGGCTGCTGCCAAACTGTTGTCTGAATACAAAATTAATGTCTTG
+GTTTTGGAAGCCCGGGATAGAGTTGGAGGAAGAACATATACTGTGAGGAATGAGCATGTC
+AAATGGGTAGATGTTGGTGGAGCCTATGTGGGACCAACCCAGAACAGAATCTTACGCTTG
+TCTAAGGAGCTAGGCATAGAGACCTATAAAGTGAATGTCAATGAGCGTCTAGTTCAATAT
+GTCAAGGGGAAAACTTACCCATTCCGTGGTGCATTCCCACCTGTGTGGAACCCCTTGGCA
+TATTTGGATTACAACAACCTATGGAGAACAATGGATGAAATGGGAAAAGAGATCCCCGTT
+GATGCACCGTGGCAAGCAAGACACGCTCAGGAATGGGACAAGATGACCATGAAAGATCTC
+ATTGATAAAATCTGTTGGACAAAAACTGCTCGGGAATTTGCGTATCTTTTTGTGAACATT
+AATGTGACTTCTGAGCCTCATGAGGTATCTGCCCTGTGGTTCCTGTGGTATGTGAGGCAG
+TGTGGGGGCACTGCTCGGATATTCTCAGTTACCAATGGCGGCCAGGAACGGAAATTTGTA
+GGTGGATCTGGCCAAGTAAGTGAACAGATAATGGGTCTCCTTGGAGATAAAGTGAAGCTG
+AGCTCTCCTGTTACTTATATTGACCAAACAGATGACAACATCATTGTAGAAACACTGAAT
+CATGAACACTATGAGTGCAAATACGTAATTAGTGCCATCCCACCGATTTTGACTGCCAAG
+ATCCACTTTAAACCAGAGCTTCCACCTGAGAGAAACCAATTAATTCAGCGTCTTCCAATG
+GGGGCTGTTATCAAGTGCATGGTGTATTACAAGGAAGCCTTCTGGAAGAAAAAGGACTAT
+TGTGGCTGCATGATCATTGAAGATGAGGAGGCTCCAATCGCCATCACTCTGGATGACACT
+AAACCAGATGGGTCACTGCCTGCCATCATGGGCTTCATACTTGCCCGGAAAGCTGATCGA
+CTTGCTAAACTACATAAAGACATAAGGAAGAGGAAAATCTGTGAGCTGTATGCCAAAGTT
+CTGGGATCTCAAGAAGCATTATATCCAGTCCATTATGAAGAGAAGAACTGGTGTGAGGAG
+CAGTACTCCGGGGGCTGCTACACAGCCTACTTCCCTCCTGGTATCATGACCCAGTATGGA
+AGGGTGATTCGCCAGCCAGTAGGTAGGATTTACTTTGCAGGCACAGAGACAGCAACACAG
+TGGAGTGGCTACATGGAAGGAGCAGTTGAAGCTGGAGAACGAGCAGCTAGAGAGGTGTTG
+AATGCTCTAGGAAAAGTCGCGAAGAAGGATATATGGGTTGAAGAACCCGAGTCCAAGGAT
+GTTCCAGCCATTGAAATTACCCACACCTTCTTAGAGAGGAACCTGCCTTCCGTGCCTGGT
+CTGCTCAAGATCACTGGTGTTTCCACTTCTGTGGCTCTTCTCTGCTTTGTATTGTACAAG
+ATTAAGAAGCTCCCATGCTGA
+>ENSPTRT00000040521_pantroglodytes
+ATGAGCAACAAATGCGACGTGGTCGTGGTGGGGGGCGGCATCTCAGGTAAGGCAGCAGCC
+AAACTTCTGCATGACTCTGGACTGAATGTGGTTGTTCTGGAAGCCCGGGACCGTGTGGGA
+GGCAGGACTTACACTCTTAGGAACCAAAAGGTTAAATATGTGGACCTTGGAGGATCCTAT
+GTTGGACCAACCCAGAATCGTATCTTGAGATTAGCCAAGGAGCTAGGATTGGAGACCTAC
+AAAGTGAATGAGGTTGAGCGTCTGATCCACCATGTAAAGGGCAAATCATACCCCTTCAGG
+GGGCCGTTCCCACCTGTATGGAATCCAATTACCTACTTAGATCATAACAACTTTTGGAGG
+ACAATGGATGACATGGGGCGAGAGATTCCGAGTGATGCCCCATGGAAGGCTCCCCTTGCA
+GAAGAGTGGGACAACATGACAATGAAGGAGCTACTGGACAAGCTCTGCTGGACAGAATCT
+GCAAAGCAGCTTGCCACTCTCTTTGTGAACCTGTGTGTCACTGCAGAGACCCATGAGGTC
+TCTGCTCTCTGGTTCCTGTGGTATGTGAAGCAGTGTGGAGGCACAACAAGAATCATCTCG
+ACAACGAATGGAGGACAGGAGAGGAAATTTGTGGGCGGATCTGGTCAAGTGAGCGAGCGG
+ATAATGGACCTCCTTGGAGACCGAGTGAAGCTGGAGAGGCCTGTGATCTACATTGACCAG
+ACAAGAGAAAATGTCCTTGTGGAGACCCTAAACCATGAGATGTATGAGGCTAAATATGTG
+ATTAGTGCTATTCCTCCTACTCTGGGCATGAAGATTCACTTCAATCCCCCTCTGCCAATG
+ATGAGAAACCAGATGATCACTCGTGTGCCTTTGGGTTCAGTCATCAAGTGTATAGTTTAT
+TATAAAGAGCCTTTCTGGAGGAAAAAGGATTACTGTGGAACCATGATTATTGATGGAGAG
+GAAGCTCCAGTTGCCTACACGTTAGATGATACCAAACCTGAAGGCAACTATGCTGCCATA
+ATGGGATTTATCCTGGCCCACAAAGCCAGAAAACTGGCACGTCTTACCAAAGAGGAAAGG
+TTGAAGAAACTTTGTGAACTCTATGCCAAGGTTCTGGGTTCCCCAGAAGCTCTGGAGCCA
+GTGCATTATGAAGAAAAGAACTGGTGTGAGGAGCAGTACTCTGGGGGCTGCTACACAACT
+TACTTCCCCCCTGGGATCCTGACTCAATATGGAAGGGTTCTACGCCAGCCAGTGGACAGG
+ATTTACTTTGCAGGCACCGAGACTGCCACACACTGGAGCGGCTACATGGAGGGGGCTGTA
+GAGGCCGGGGAGAGAGCAGCCCGAGAGATCCTGCATGCCATGGGGAAGATTCCAGAGGAT
+GAAATCTGGCAGTCAGAACCAGAGTCTGTGGATGTCCCTGCACAGCCCATCACCACGACC
+TTTTTGGAGAGACATTTGCCCTCCGTGCCAGGCCTGCTCAGGCTGATTGGATTGACCACC
+ATCTTTTCAGCAACGGCTCTTGGCTTCCTGGCCCACAAAAGGGGGCTACTTGTGCGAGTC
+TAA
+>ENST00000378069_homosapiens
+ATGAGCAACAAATGCGACGTGGTCGTGGTGGGGGGCGGCATCTCAGGTATGGCAGCAGCC
+AAACTTCTGCATGACTCTGGACTGAATGTGGTTGTTCTGGAAGCCCGGGACCGTGTGGGA
+GGCAGGACTTACACTCTTAGGAACCAAAAGGTTAAATATGTGGACCTTGGAGGATCCTAT
+GTTGGACCAACCCAGAATCGTATCTTGAGATTAGCCAAGGAGCTAGGATTGGAGACCTAC
+AAAGTGAATGAGGTTGAGCGTCTGATCCACCATGTAAAGGGCAAATCATACCCCTTCAGG
+GGGCCATTCCCACCTGTATGGAATCCAATTACCTACTTAGATCATAACAACTTTTGGAGG
+ACAATGGATGACATGGGGCGAGAGATTCCGAGTGATGCCCCATGGAAGGCTCCCCTTGCA
+GAAGAGTGGGACAACATGACAATGAAGGAGCTACTGGACAAGCTCTGCTGGACTGAATCT
+GCAAAGCAGCTTGCCACTCTCTTTGTGAACCTGTGTGTCACTGCAGAGACCCATGAGGTC
+TCTGCTCTCTGGTTCCTGTGGTATGTGAAGCAGTGTGGAGGCACAACAAGAATCATCTCG
+ACAACAAATGGAGGACAGGAGAGGAAATTTGTGGGCGGATCTGGTCAAGTGAGTGAGCGG
+ATAATGGACCTCCTTGGAGACCGAGTGAAGCTGGAGAGGCCTGTGATCTACATTGACCAG
+ACAAGAGAAAATGTCCTTGTGGAGACCCTAAACCATGAGATGTATGAGGCTAAATATGTG
+ATTAGTGCTATTCCTCCTACTCTGGGCATGAAGATTCACTTCAATCCCCCTCTGCCAATG
+ATGAGAAACCAGATGATCACTCGTGTGCCTTTGGGTTCAGTCATCAAGTGTATAGTTTAT
+TATAAAGAGCCTTTCTGGAGGAAAAAGGATTACTGTGGAACCATGATTATTGATGGAGAA
+GAAGCTCCAGTTGCCTACACGTTGGATGATACCAAACCTGAAGGCAACTATGCTGCCATA
+ATGGGATTTATCCTGGCCCACAAAGCCAGAAAACTGGCACGTCTTACCAAAGAGGAAAGG
+TTGAAGAAACTTTGTGAACTCTATGCCAAGGTTCTGGGTTCCCTAGAAGCTCTGGAGCCA
+GTGCATTATGAAGAAAAGAACTGGTGTGAGGAGCAGTACTCTGGGGGCTGCTACACAACT
+TATTTCCCCCCTGGGATCCTGACTCAATATGGAAGGGTTCTACGCCAGCCAGTGGACAGG
+ATTTACTTTGCAGGCACCGAGACTGCCACACACTGGAGCGGCTACATGGAGGGGGCTGTA
+GAGGCCGGGGAGAGAGCAGCCCGAGAGATCCTGCATGCCATGGGGAAGATTCCAGAGGAT
+GAAATCTGGCAGTCAGAACCAGAGTCTGTGGATGTCCCTGCACAGCCCATCACCACCACC
+TTTTTGGAGAGACATTTGCCCTCCGTGCCAGGCCTGCTCAGGCTGATTGGATTGACCACC
+ATCTTTTCAGCAACGGCTCTTGGCTTCCTGGCCCACAAAAGGGGGCTACTTGTGAGAGTC
+TAA
+>ENSRNOT00000044009_rattusnorvegicus
+ATGAGCAACAAATGCGATGTGATCGTGGTGGGGGGCGGCATCTCAGGTATGGCAGCAGCC
+AAACTTTTGCATGACTGTGGCCTCAGTGTGGTGGTTCTGGAAGCACGAGACCGTGTGGGA
+GGCAGGACTTACACAATTAGGAATAAAAATGTTAAATATGTGGACCTTGGAGGATCTTAT
+GTTGGGCCGACCCAGAATCGTATCTTACGATTGGCCAAAGAGCTAGGATTGGAGACCTAT
+AAAGTGAATGAAGTTGAGCGGCTGATCCACTTTGTAAAGGGAAAATCATATGCCTTCAGG
+GGCCCATTCCCACCAGTGTGGAATCCAATCACTTACCTAGATTATAACAACCTCTGGAGA
+ACAATGGATGAGATGGGCCAAGAGATTCCCAGTGATGCTCCATGGAAGGCACCCCTTGCT
+GAAGAGTGGGACTACATGACAATGAAAGAGTTGCTAGATAAGATCTGCTGGACCAACTCT
+ACAAAGCAGATTGCCACACTCTTTGTGAACCTATGTGTAACTGCGGAGACCCATGAGGTT
+TCTGCACTGTGGTTCCTGTGGTATGTGAAGCAGTGTGGGGGTACAACCAGAATCATATCA
+ACAACCAATGGAGGACAGGAGAGGAAATTTATTGGTGGATCTGGTCAAGTGAGTGAGCGG
+ATAAAGGATATCCTTGGGGACAGAGTGAAGCTGGAGAGGCCGGTGATCCACATTGACCAG
+ACAGGAGAAAATGTTGTTGTGAAAACCCTAAACCATGAAATATATGAGGCTAAATATGTG
+ATTAGTGCCATCCCACCTGTTTTGGGCATGAAGATTCACCATAGTCCTCCTCTGCCCATT
+CTAAGAAACCAGCTGATTACTCGTGTGCCTTTGGGTTCAGTTATTAAGTGCATGGTTTAT
+TATAAAGAACCCTTCTGGAGGAAAAAGGATTTCTGTGGAACCATGGTTATTGAAGGAGAG
+GAAGCTCCAATTGCGTACACATTGGATGATACCAAGCCAGATGGCAGCTGTGCTGCTATA
+ATGGGATTTATCCTTGCTCACAAAGCTAGAAAACTGGTACGCCTTACTAAAGAAGAAAGA
+CTGAGGAAGCTCTGTGAGCTATACGCGAAAGTTCTGAACTCTCAAGAAGCTCTGCAGCCA
+GTCCATTATGAAGAGAAGAACTGGTGTGAGGAGCAGTACTCCGGGGGCTGCTACACAGCC
+TACTTCCCTCCTGGCATCTTGACCCAGTATGGAAGGGTTCTACGCCAGCCAGTGGGCAAG
+ATTTTCTTTGCAGGCACCGAGACAGCTTCACATTGGAGTGGCTACATGGAGGGGGCTGTA
+GAGGCTGGAGAGAGAGCTGCCAGAGAGATTCTTCATGCCATTGGGAAGATTCCAGAGGAT
+GAAATTTGGCAGCCAGAACCAGAATCTGTGGATGTCCCAGCAAGACCCATTACCAACACC
+TTCCTGGAGAGACACTTGCCTTCTGTACCAGGTCTACTAAAGCTGCTTGGATTGACCACC
+ATCTTGTCAGCAACAGCTCTTGGTTTCCTGGCCCACAAAAAGGGTCTGTTTGTACGTTTC
+TAA
+>ENSMUST00000040820_musmusculus
+ATGAGCAACAAAAGCGATGTGATCGTGGTGGGGGGCGGCATCTCAGGTATGGCGGCAGCC
+AAACTTCTGCATGATTGTGGCCTCAGTGTGGTGGTTCTGGAAGCACGGGACCGTGTAGGA
+GGCAGGACTTACACAATTAGGAATAAAAACGTTAAATATGTGGACCTTGGAGGATCTTAT
+GTTGGGCCAACCCAGAATCGTATCTTACGATTGGCCAAAGAGCTAGGATTGGAGACCTAT
+AAAGTTAATGAAGTTGAGCGGCTGATACACTTTGTAAAGGGAAAATCATATGCCTTCAGG
+GGCCCATTTCCACCAGTATGGAATCCTATCACCTACCTAGATAATAACAACCTCTGGAGG
+ACAATGGATGAGATGGGCCAAGAGATTCCCAGTGATGCTCCATGGAAAGCACCCCTTGCT
+GAAGAGTGGGACTACATGACAATGAAAGAATTGCTAGATAAGATCTGCTGGACCAAATCT
+ACAAAGCAGATTGCCACGCTCTTTGTGAACCTGTGTGTAACTGCAGAGACCCATGAGGTC
+TCTGCACTATGGTTCCTGTGGTATGTGAAGCAGTGTGGAGGTACAACCAGAATCATCTCA
+ACAACCAATGGAGGACAGGAGAGGAAATTTATTGGTGGATCTGGTCAAGTGAGTGAACGG
+ATAAAGGATATACTTGGGGACCGAGTGAAGCTGGAGAGGCCTGTGATCCACATTGACCAG
+ACAGGGGAAAATGTTATTGTGAAAACCCTAAACCATGAAATATATGAGGCTAAATATGTG
+ATTAGTGCCATTCCACCTGCTTTGGGCATGAAGATTCACTATAGTCCTCCTCTGCCCATG
+CTAAGAAACCAGCTGATCTCTCGTGTGCCTTTGGGTTCAGTTATTAAATGCATGGTTTAT
+TACAAAGAGCCCTTCTGGAGGAAAAAGGATTTCTGTGGAACCATGGTTATCGAAGGAGAG
+GAAGCTCCAATTGCATACACATTGGATGATACCAAACCAGATGGCACCTATGCTGCTATA
+ATGGGATTTATCCTTGCTCACAAAGCTAGAAAACTGGTACGTCTCACCAAAGAAGAAAGA
+CTGAGGAAACTTTGTGAGCTATATGCAAAAGTGCTGAACTCCCAAGAAGCTCTGCAGCCC
+GTCCATTATGAAGAGAAGAACTGGTGTGAGGAACAGTATTCTGGGGGCTGCTACACAACC
+TACTTCCCTCCCGGCATCTTGACCCAGTATGGAAGGGTTCTACGTCAGCCAGTGGGCAAG
+ATTTTCTTTGCAGGCACTGAAACAGCCTCACACTGGAGCGGCTACATGGAGGGGGCTGTG
+GAGGCTGGGGAGAGAGCAGCCAGAGAGATTCTTCATGCCATTGGGAAGATTCCAGAAGAT
+GAAATTTGGCAGCCAGAACCAGAATCTTTGGATGTCCCTGCACGACCCATTACCAGTACC
+TTCCTGGAGAGACACCTGCCTTCTGTACCAGGCCTGCTAAAGCTGTTTGGATTGACCACC
+ATCTTGTCAGCAACAGCTCTTGGTTTCCTGGCCCACAAAAGGGGCCTGTTTGTACATTTT
+TAA
+>ENSMUST00000168613_musmusculus
+ATGAGCAACAAAAGCGATGTGATCGTGGTGGGGGGCGGCATCTCAGGTATGGCGGCAGCC
+AAACTTCTGCATGATTGTGGCCTCAGTGTGGTGGTTCTGGAAGCACGGGACCGTGTAGGA
+GGCAGGACTTACACAATTAGGAATAAAAACGTTAAATATGTGGACCTTGGAGGATCTTAT
+GTTGGGCCAACCCAGAATCGTATCTTACGATTGGCCAAAGAGCTAGGATTGGAGACCTAT
+AAAGTTAATGAAGTTGAGCGGCTGATACACTTTGTAAAGGGAAAATCATATGCCTTCAGG
+GGCCCATTTCCACCAGTATGGAATCCTATCACCTACCTAGATAATAACAACCTCTGGAGG
+ACAATGGATGAGATGGGCCAAGAGATTCCCAGTGATGCTCCATGGAAAGCACCCCTTGCT
+GAAGAGTGGGACTACATGACAATGAAAGAATTGCTAGATAAGATCTGCTGGACCAAATCT
+ACAAAGCAGATTGCCACGCTCTTTGTGAACCTGTGTGTAACTGCAGAGACCCATGAGGTC
+TCTGCACTATGGTTCCTGTGGTATGTGAAGCAGTGTGGAGGTACAACCAGAATCATCTCA
+ACAACCAATGGAGGACAGGGGAAAATGTTATTGTGA
+>ENSMUST00000163344_musmusculus
+ATGAGCAACAAAAGCGATGTGATCGTGGTGGGGGGCGGCATCTCAGGTATGGCGGCAGCC
+AAACTTCTGCATGATTGTGGCCTCAGTGTGGTGGTTCTGGAAGCACGGGACCGTGTAGGA
+GGCAGGACTTACACAATTAGGAATAAAAACGTTAAATATGTGGACCTTGGAGGATCTTAT
+GTTGGGCCAACCCAGAATCGTATCTTACGATTGGCCAAAGAGCTAGGATTGGAGACCTAT
+AAAGTTAATGAAGTTGAGCGGCTGATACACTTTGTAAAGATCTACAAAGCAGATTGCCAC
+GCTCTTTGTGAACCTGTGTGTAACTGCAGAGACCCATGA
+>ENSMUST00000173143_musmusculus
+ATGAGCAACAAAAGCGATGTGATCGTGGTGGGGGGCGGCATCTCAGAAAAACCTGCTAAT
+TCTAGTCAGTTTACAAGCTCATTGTGGAGGAGAATTGAAAAACTGTGA
+>ENSSSCT00000033745_susscrofa
+ATGGCAGCGGCCAAACTTCTGCATGACTCTGGCCTGAGTGTGATTGTTCTGGAAGCCCGG
+GACCGCGTGGGAGGCAGGACTTACACCGTCAGGAACCAACAAGTTAAATATGTGGACCTT
+GGAGGATCTTATGTTGGGCCAACTCAGAATCGCATCTTAAGATTGTCCAAGGAGCTAGGA
+TTGGAGACCTACAAAGTGAATGAAGTGGAGCGTCTGATTCACTATGTAAAGGGCAAATCC
+TACCCCTTCAGGGGCCCATTACCACCTGTGAGGAATCCGATTACCTTCCTAGATCTTAAC
+AACCTTTGGAGGACGGTGGATGACATGGGACGAGAGATTCCCAGTGATGCCCCATGGAAG
+GCGCCCCTTGCAGAACAGTGGGACCAGATGACAATGAAGGAGCTGTTGGACAAGCTCTGC
+TGGACTGAATCTTCGAAGCAGCTGGCCACCCTTTTTGTGAACCTGTGTGTCACCGCGGAG
+ACCCATGAGGTCTCTGCTCTCTGGTTCCTGTGGTATGTGAAGCAGTGTGGAGGCACCACC
+AGGATCATCTCAACAACTAACGGAGGGCAGGAGAGGAAATTTGTGGGCGGATCTGGTCAA
+GTGACCGAGCGGATAAAGGACCTCCTTGGAGACCGAGTGAAGCTGGAGAGGCCTGTGGTC
+CACATTGACCAGACAGGAGAAAATGTCCTCGTGGAGACCCTAAACCACGAGGTGTACGAG
+GCTAAGTATGTGATTAGCGCCATTCCTCCTGTCCTGGGCATGAAGATTCATTTCAGTCCC
+CCTCTGCCAATGATGAGAAACCAGCTCATCACTCGTGTACCTCTGGGCTCTGTCATCAAG
+TGTATAGTTTATTACAAAGAGCCCTTCTGGAGGCATAAGGATTACTGTGGAAGCATGATT
+ATTGAAGGAGAGGAAGCTCCAATCGCCTACACGTTGGATGATTCCAAGCCTGATGGCAGC
+TGTGCCGCCATCATAGGATTTATCCTTGCCCACAAAGCCAGAAAACTGGCCCGTCTTACC
+AAAGAAGAAAGGCTGAAGAAACTTTGCGACCTCTATGCAAAAGTTCTGGGTTCAAAAGAA
+GCTTTGAACCCCGTGCACTATGAAGAGAAGAACTGGTGCGAGGAGCAGTACTCGGCGGGC
+TGCTACACGACCTACTTCCCCCCTGGGATCATGACTCAGTATGGAAGGGTTCTACGCCAG
+CCAGTCGGCAGGATTTATTTCGCCGGCACGGAGACTGCCACGCACTGGAGTGGCTACATG
+GAGGGGGCCGTGGAGGCCGGAGAGAGAGCGGCCCGAGAGATCCTGCATGCTATGGGAAAG
+ATCCCAGAAGATGAAATCTGGCAGTCTGAACCAGAGTCCGTGGATGTGCCTGCGAAGCCC
+ATTACCACGACCTTCTTGGAGAGACACTTGCCCTCGGTGCCCGGCCTGCTGAGGCTGATT
+GGATTGACCGCCATCTTTTCAGCCACTGCTCTCGGCTACCTGGCCCACAAAAGGGGGCTA
+CTCGTGCGGGTCTGA
+>ENSSSCT00000023183_susscrofa
+ATGGCAGCGGCCAAACTTCTGCATGACTCTGGCCTGAGTGTGATTGTTCTGGAAGCCCGG
+GACCGCGTGGGAGGCAGGACTTACACCGTCAGGAACCAACAAGTTAAATATGTGGACCTT
+GGAGGATCTTATGTTGGGCCAACTCAGAATCGCATCTTAAGATTGTCCAAGGAGCTAGGA
+TTGGAGACCTACAAAGTGAATGAAGTGGAGCGTCTGATTCACTATATCAAAGGCAAATCC
+TACCCCTTCAGGGGCCCATTACCACCTGTGAGGAATCCGATTACCTTCCTAGATCTTAAC
+AACCTTTGGAGGACGGTGGATGACATGGGACGAGAGATTCCCAGTGATGCCCCATGGAAG
+GCGCCCCTTGCAGAACAGTGGGACCAGATGACAATGAAGGAGCTGTTGGACAAGCTCTGC
+TGGACTGAATCTTCGAAGCAGCTGGCCACCCTTTTTGTGAACCTGTGTGTCACCGCGGAG
+ACCCATGAGGTCTCTGCTCTCTGGTTCCTGTGGTATGTGAAGCAGTGTGGAGGCACCACC
+AGGATCATCTCAACAACTAACGGAGGGCAGGAGAGGAAATTTGTGGGCGGATCTGGTCAA
+GTGACCGAGCGGATAAAGGACCTCCTTGGAGACCGAGTGAAGCTGGAGAGGCCTGTGGTC
+CACATTGACCAGACAGGAGAAAATGTCCTCGTGGAGACCCTAAACCACGAGGTGTACGAG
+GCTAAGTATGTGATTAGCGCCATTCCTCCTGTCCTGGGCATGAAGATTCATTTCAGTCCC
+CCTCTGCCAATGATGAGAAACCAGCTCATCACTCGTGTACCTCTGGGCTCTGTCATCAAG
+TGTATAGTTTATTACAAAGAGCCCTTCTGGAGGCATAAGGATTACTGTGGAAGCATGATT
+ATTGAAGGAGAGGAAGCTCCAATCGCCTACACGTTGGATGATTCCAAGCCTGATGGCAGC
+TGTGCCGCCATCATAGGATTTATCCTTGCCCACAAAGCCAGAAAACTGGCCCGTCTTACC
+AAAGAAGAAAGGCTGAAGAAACTTTGCGACCTCTATGCAAAAGTTCTGGGTTCAAAAGAA
+GCTTTGAACCCCGTGCACTATGAAGAGAAGAACTGGTGCGAGGAGCAGTACTCGGCGGGC
+TGCTACACGACCTACTTCCCCCCTGGGATCATGACTCAGTATGGAAGGGTTCTACGCCAG
+CCAGTCGGCAGGATTTATTTCGCCGGCACGGAGACTGCCACGCACTGGAGTGGCTACATG
+GAGGGGGCCGTGGAGGCCGGAGAGAGAGCGGCCCGAGAGATCCTGCATGCTATGGGAAAG
+ATCCCAGAAGATGAAATCTGGCAGTCTGAACCAGAGTCCGTGGATGTGCCTGCGAAGCCC
+ATTACCACGACCTTCTTGGAGAGACACTTGCCCTCGGTGCCCGGCCTGCTGAGGCTGATT
+GGATTGACCGCCATCTTTTCAGCCACTGCTCTCGGCTACCTGGCCCACAAAAGGGGGCTA
+CTCGTGCGGGTCTGA
+>ENSCAFT00000022963_canisfamiliaris
+ATGAGCGGCAAGTGCGACGTGGTCATGGTGGGGGGCGGCATCTCAGGCATGGCAGCAGCC
+AAACTTCTGCATGATTTTGGCCTGAACGTGGTTGTTCTGGAGGCCCGGGACCGAGTGGGA
+GGCAGGACTTACACCATCAGGAACCAAAAGGTTAAATATTTGGACCTTGGAGGATCTTAT
+GTTGGGCCAACTCAGAATTGTATCTTAAGGTTAGCCAAGGAGCTAGGATTGGAGACCTAC
+AAAGTGAATGAAGTAGAGCGTCTCATCCATCATGTAAAGGGCAAATCGTACCCCTTCAGG
+GGCCCCTTCCCACCTGTATGGAACCCAATTGCATACCTAGATCATAACAACCTCTGGAGG
+ACGATGGACGACATGGGGCGAGAGATTCCCAGTGATGCCCCATGGAAGGCACCTCTTGCG
+GAGGAGTGGGACCACATGACAATGAAGGAGCTTCTGGACAAGATCTGCTGGACAGAATCT
+GCCAAGCAACTTGCTACTCTCTTTGTGAATCTGTGTGTCACTGCAGAGACCCATGAGGTC
+TCTGCTCTCTGGTTCCTGTGGTATGTGAAGCAGTGTGGAGGCACGACCAGGATCATCTCA
+ACAACCAATGGAGGGCAGGAGAGAAAATTTGTGGGCGGATCTGGTCAAGTGAGTGAACGG
+ATAATGGACCTCCTTGGAGACCAAGTGAAGCTGGAGAGGCCTGTGACCCACATTGACCAG
+ACAGGAGAAAATGTCCTTGTGGAGACCCTAAACCATGAGGTGTATGAGGCTAAGTATGTG
+ATTAGTGCCATTCCTCCTACTCTGGGCATGAAGATTCATTTCAACCCCCCTCTGCCAATG
+ATGAGAAACCAGCTGATCACTCGTGTGCCTTTGGGCTCAGTCATCAAGTGCATAGTTTAT
+TATAAAGAGCCCTTCTGGAGGAAAAAGGATTACTGTGGAACCATGATTATCGAAGGAGAG
+GAAGCTCCAATTGCTTACACGTTGGATGATACCAAACCTGATGGCAACTATGCCGCCATA
+ATGGGATTTATCCTTGCCCACAAAGCCAGAAAACTGGCACGTCTTACCAAAGATGAAAGG
+ATGAAGAAACTTTGTGAGCTCTATGCAAAAGTCCTGGGTTCCCAAGAAGCTTTGCAGCCC
+GTACACTACGAAGAGAAGAACTGGTGCGAGGAGCAGTACTCCGGGGGCTGCTACACCACC
+TACTTTCCCCCTGGGATCATGACTCAATATGGAAGGGTTCTACGACAGCCTGTGGGCAGG
+ATTTATTTTGCAGGCACGGAGACTGCCACCCACTGGAGTGGCTACATGGAGGGCGCTGTG
+GAGGCTGGAGAGAGAGCGGCCCGAGAGATCCTGCATGCCATGGGGAAGATCCCAGAGGAT
+GAAATCTGGCAGTCAGAACCAGAATCAGTGGATGTCCCTGCGCAGCCCATCACCACGACC
+TTCTTGGAGAGACATTTGCCCTCTGTGCCAGGCCTGCTGAGGCTGATCGGATTGACCGCC
+ATCTTTTCTGCAACTGCTCTTGGCGTCCTGGCACACAAAAGGGGTCTGCTTGTGCGGGTC
+TAA
diff -r b3ba0c84667c -r 56bbdbfe3eaa test-data/test5.sqlite
Binary file test-data/test5.sqlite has changed
diff -r b3ba0c84667c -r 56bbdbfe3eaa test-data/test5_filtered.fasta
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/test5_filtered.fasta	Wed Apr 25 11:00:33 2018 -0400
@@ -0,0 +1,842 @@
+>ENSPTRT00000034846_pantroglodytes
+ATGGACCCGGAATGCGCCCAGCTGCTCCCGGCTCTCTGTGCTGTTCTGGTAGATCCCAGG
+CAGCCGGTGGCAGATGACACCTGTTTGGAGAAGCTCCTGGACTGGTTTAAAACGGTCACT
+GAAGGAGAGTCCAGTGTCGTGCTGCTGCAGGAGCACCCCTGCCTGGTGGAGCTGCTGTCC
+CATGTGCTGAAAGTCCAGGACCTGAGTTCTGGGGTCCTCTCCTTCTCACTCCGCCTGGCA
+GGAACCTTCGCAGCCCAGGAAAACTGCTTCCAGTATCTTCAGCAGGGGGAGTTACTACCA
+GGGCTCTTTGGGGAGGCAGGACCCCTCGGCCGAGCAGCCTGGGCCGTCCCCACCGTGCGC
+AGCGGCTGGATCCAGGGCCTGCGCTCCCTGGCACAGCACCCCAGCGCCCTGCGCTTCCTG
+GCCGACCACGGTGCGGTCGACACCATCTTCTCCCTTCAGGGAGACTCCAGCCTGTTTGTG
+GCCTCGGCGGCCAGTCAGCTCCTGGTACACGTCCTGGCTTTGTCCATGCAAGGTGGAGCC
+GAGGGACAGCCCTGCCTGCCGGGGGGTGACTGGCCCGCGTGTGCCCAGAGGATCATGGAT
+CACGTTGAAGAGTCCTTGTGCTCCGCGGCCACCCCCAAGGTCACTCAGGCCCTGAACGTC
+CTGACCACAACCTTCGGGCGCTGCCAGAGCCCCTGGACGGAAGCCCTGTGGGTGCGGCTG
+AGTCCCCGCGTGGCGTGTCTGCTGGAGAGAGACCCCATCCCCGCCGCACACTCGTTCGTG
+GACCTGCTTCTCTGTGTGGCTCGTTCTCCCGTGTTCAGTTCTTCCGACGGCAGCCTGTGG
+GAGACAGTGGCGCGGGCTCTGAGCTGCCTGGGTCCCACCCACATGGGACCCCTGGCTTTG
+GGGATCCTGAAGCTCGAGCACTGTCCACAGGCACTGAGGACCCAGGCCTTCCAGGTCCTT
+CTCCAGCCCCTGGCCTGTGTCCTGAAGGCCACGGTTCAGGCCCCCGGACCCCCAGGCTTG
+CTGGACGGGACGGCAGACGATGCCACGACGGTGGACACACTCCTGGCCTCCAAGTCGTCC
+TGCGCGGGCCTCCTGTGCCGCACCCTGGCTCACCTGGAGGAGCTGCAGCCGCTGCCCCAG
+CGCCCTTCACCGTGGCCCCAGGCGTCTCTACTGGGGGCTACAGTGACTGTCCTGCGGCTC
+TGTGACGGCTCAGCTGCCCCTGCCTCCAGTGTGGGGGGCCACCTCTGTGGGACCCTGGCG
+GGCTGCGTCCGGGTCCAGCGAGCAGCCCTCGACTTCCTGGGGACACTGTCACAGGGGACA
+GGCCCCCAGGAGCTGGTGACGCAGGCGCTTGCTGTCCTCCTGGAGTGCCTCGAGAGCCCC
+GGCTCCAGCCCCACGGTTCTGAAGAAGGCCTTCCAGGCCACGCTCAGGTGGCTCCTGAGC
+TCACCCAAGACCCCCGGCTGCTCTGATCTCGGCCCCCTCATCCCGCAGTTCCTCAGAGAG
+CTGTTCCCTGTGCTGCAGAAACGCCTGTGCCACCCCTGCTGGGAGGTGAGGGACTCCGCC
+CTCGAGTTCCTGACCCAGCTGAGCAGGCACTGGGGAGGACAGGCCGACTTCAGATGCGCA
+CTCTTGGCTTCAGAGGTGCCTGAGCTGGCCCTGCAGCTCCTCCAGGACCCTGAGAGTTAT
+GTCCGAGCGAGCGCGGTGACCGCCATGGGGCAGCTGTCCAGCCAGGGCCTGCACGCCCCC
+ACCAGCCCTGAGCATGCAGAGGCCCGGCAGAGCCTGTTCCCGGAGCTCCTGCACATCCTC
+TCCGTAGACTCGGAGGGCTTCCCACGGCGGGCGGTCATGCAAGTCTTCACTGAGTGGCTG
+CGGGACGGCCACGCCGACGCGGCCCGGGACACGGAGCAGTTCGTGGCCACTGTGCTGCAG
+GTGGCGAGCCGGGACCTGGACTGGGAGGTCCGCGCCCAGGGCCTGGAGCTGGCCCTCGTG
+TTCCTGGGCCAGACTTTGGGGCCGCCGCGTACCCACTGCCCCTATGCCGTGGCCCTACCC
+GAGGTGGCCCCAGCCCAGCCACTCACCGAGGCACTGAGGGCTCTCTGCCACGTGGGGCTC
+TTTGACTTCGCCTTTTGTGCCTTGTTTGACTGCGACCGCCCTGTGGCGCAGAAGTCTTGT
+GACCTCCTTCTCTTCCTGAGGGACAAGATTGCTTCCTACAGCAGCCTGCGGGAGGCCAGG
+GGCGGCCCCAACACTGCCTCCGCAGAGGCCACCCTGCCGAGGTGGCGGGCGGGTGAGCAG
+GCCCAGCCCCCAGGGGACCAGGAGCCTGAGGCTGTGCTGGCCATGCTCAGGTCCCTAGAC
+CTGGAGGGCCTGCGGAGCACACTGGCCGAGAGCAGCGACCACGTGGAGAAGAGTCCCCAG
+TCCCTCCTGCAGGACATGCTGGCCACGGGAGGCTTCCTGCAGGGGGATGAGGCCGACTGC
+TACTGA
+>ENST00000340611_homosapiens
+ATGGACCCAGAATGCGCCCAGCTGCTCCCGGCTCTCTGTGCTGTTCTGGTAGATCCCAGG
+CAGCCGGTGGCAGATGACACCTGTTTGGAGAAGCTCCTGGACTGGTTTAAAACGGTCACT
+GAAGGAGAGTCCAGTGTCGTGCTGCTGCAGGAGCACCCCTGCCTGGTGGAGCTGCTGTCC
+CATGTGCTGAAAGTCCAGGACCTGAGTTCTGGGGTCCTCTCCTTCTCACTGCGCCTGGCA
+GGAACCTTCGCAGCCCAGGAAAACTGCTTCCAGTATCTTCAGCAGGGGGAGTTACTACCA
+GGGCTCTTTGGGGAGCCAGGACCCCTCGGCCGAGCAACCTGGGCCGTCCCCACCGTGCGC
+AGCGGCTGGATCCAGGGCCTGCGCTCCCTGGCACAGCACCCCAGCGCCCTGCGCTTCCTG
+GCCGACCATGGTGCGGTCGACACCATCTTCTCCCTGCAGGGAGACTCCAGCCTGTTTGTG
+GCCTCGGCGGCCAGTCAGCTCCTGGTGCACGTCCTGGCTTTGTCCATGCGAGGTGGAGCC
+GAGGGGCAGCCCTGCCTGCCGGGGGGTGACTGGCCCGCGTGTGCCCAGAAGATCATGGAT
+CACGTTGAAGAGTCCTTGTGCTCCGCGGCCACCCCCAAGGTCACTCAGGCCCTGAACGTC
+CTGACCACGACCTTCGGGCGCTGCCAGAGCCCCTGGACGGAAGCCCTGTGGGTGCGGCTG
+AGTCCCCGCGTGGCCTGTCTGCTGGAGAGAGACCCCATCCCCGCCGCACACTCGTTCGTG
+GACCTGCTTCTCTGTGTGGCTCGTTCTCCCGTGTTCAGTTCTTCCGACGGCAGCCTGTGG
+GAGACAGTGGCGCGGGCTCTGAGCTGCCTGGGTCCCACCCACATGGGACCCCTGGCTTTG
+GGGATCCTGAAGCTCGAGCACTGTCCACAGGCACTGAGGACCCAGGCCTTCCAGGTCCTT
+CTCCAGCCCCTGGCCTGTGTCCTGAAGGCCACGGTTCAGGCCCCCGGACCCCCAGGCTTG
+CTGGACGGGACGGCAGACGATGCCACGACGGTGGACACACTCCTGGCCTCCAAGTCGTCC
+TGCGCCGGCCTCCTGTGCCGCACCCTGGCTCACCTGGAGGAGCTGCAGCCGCTGCCCCAG
+CGCCCTTCACCGTGGCCCCAGGCGTCTCTACTGGGGGCTACAGTGACTGTCCTGCGGCTC
+TGTGACGGCTCGGCTGCCCCTGCCTCCAGTGTGGGGGGCCACCTCTGTGGGACCCTGGCG
+GGCTGCGTCCGGGTCCAGCGAGCAGCCCTCGACTTCCTGGGGACGCTGTCACAGGGGACA
+GGCCCCCAGGAGCTGGTGACGCAGGCGCTTGCTGTCCTCCTGGAGTGCCTCGAGAGCCCC
+GGCTCCAGCCCCACGGTTCTGAAGAAGGCCTTCCAGGCCACGCTCAGGTGGCTCCTGAGC
+TCACCCAAGACCCCCGGCTGCTCTGATCTCGGCCCCCTCATCCCGCAGTTCCTCAGAGAG
+CTGTTCCCTGTGCTGCAGAAACGCCTGTGCCACCCCTGCTGGGAGGTGAGGGACTCCGCC
+CTCGAGTTCCTGACCCAGCTGAGCAGGCACTGGGGAGGACAGGCTGACTTCAGATGCGCA
+CTCTTGGCTTCAGAGGTGCCTCAGCTGGCCCTGCAGCTCCTCCAGGACCCTGAGAGTTAT
+GTCCGAGCGAGTGCAGTGACCGCCATGGGGCAGCTGTCCAGCCAGGGCCTGCACGCCCCC
+ACCAGCCCTGAGCATGCAGAGGCCCGGCAGAGCCTGTTCCTGGAGCTCCTGCACATCCTC
+TCCGTAGACTCGGAGGGCTTCCCACGGCGGGCGGTCATGCAAGTCTTCACTGAGTGGCTG
+CGGGACGGCCACGCCGACGCGGCCCAGGACACGGAGCAGTTCGTGGCCACTGTGCTGCAG
+GCGGCGAGCCGAGACCTGGACTGGGAGGTCCGCGCCCAGGGCCTGGAGCTGGCCCTCGTG
+TTCCTGGGCCAGACTTTGGGGCCGCCGCGTACCCACTGCCCCTATGCCGTGGCCCTACCC
+GAGGTGGCCCCAGCCCAGCCACTCACCGAGGCACTGAGGGCTCTCTGCCACGTGGGGCTC
+TTTGACTTCGCCTTTTGTGCCTTGTTTGACTGCGACCGCCCTGTGGCGCAGAAGTCTTGT
+GACCTCCTTCTCTTCCTGAGGGACAAGATTGCTTCCTACAGCAGCCTGCGGGAGGCCAGG
+GGCAGCCCCAACACTGCCTCCGCAGAGGCCACCCTGCCGAGGTGGCGGGCGGGTGAGCAG
+GCCCAGCCCCCAGGGGACCAGGAGCCTGAGGCTGTGCTGGCCATGCTCAGGTCCCTAGAC
+CTGGAGGGCCTGCGGAGCACGCTGGCCGAGAGCAGCGACCACGTGGAAAAGAGTCCCCAG
+TCCCTCCTGCAGGACATGCTGGCCACGGGAGGCTTCCTGCAGGGGGACGAGGCCGACTGC
+TACTGA
+>ENST00000421712_homosapiens
+ATGGACCCAGAATGCGCCCAGCTGCTCCCGGCTCTCTGTGCTGTTCTGGTAGATCCCAGG
+CAGCCGGTGGCAGATGACACCTGTTTGGAGAAGCTCCTGGACTGGTTTAAAACGGTCACT
+GAAGGAGAGTCCAGTGTCGTGCTGCTGCAGGAGCACCCCTGCCTGGTGGAGCTGCTGTCC
+CATGTGCTGAAAGTCCAGGACCTGAGTTCTGGGGTCCTCTCCTTCTCACTGCGCCTGGCA
+GGAACCTTCGCAGCCCAGGAAAACTGCTTCCAGTATCTTCAGGTGCGGTCGACACCATCT
+TCTCCCTGCAGGGAGACTCCAGCCTGTTTGTGGCCTCGGCGGCCAGTCAGCTCCTGGTGC
+ACGTCCTGGCTTTGTCCATGCGAGGTGGAGCCGAGGGGCAGCCCTGCCTGCCGGGGGGTG
+ACTGGCCCGCGTGTGCCCAGAAGATCATGGATCACGTTGAAGAGTCCTTGTGCTCCGCGG
+CCACCCCCAAGGTCACTCAGGCCCTGA
+>ENSRNOT00000064726_rattusnorvegicus
+ATGGACGCAGAATGCTCCAGGCTCCTCCCGGCTCTCTGTGCTGTTTTGGCAGATCCTAGA
+CAGCTGGTGGCAGATGACACCTGCTTGGAGAAACTACTGGACTGGTTTAAAACAGTGACA
+GAGGCAGAGCCCAGCCTCCAACTACTGCAGGACCACCCCTGCCTAATGGAGCTCCTGTCC
+CATGTGCTGAAGCCACAGGATGTGAGCCCTAGGGTCCTCTCCTTTGCTCTGCGCCTCGTT
+GGGGTCTTTGCGGCCCAGGAGGACTGTTTCCAGTACCTTCAGCAGGGGGAGTTGTTGCTG
+GGGCTCTTTGGGGAGACAGGTGCCCTTAGCTGGGCAGCCTGGAGCATCCCCAGTGTGCGC
+AGCGGCTGGATCCAGGGCCTGTGCTCCCTGGCACACCACCCCAGTGCCCTGCACTTCCTG
+GCTGACAGTGGTGCTGTGGACACGATCTTCTCCTTGCAAGGAGACCCCAGCCTGTTTGTA
+GCCTCAGCAGCCAGCCAGCTCCTAGTACACATCCTGGCTCTGTCAATGCAAGGCGGAGCT
+CCAGGGTCCCCCGTCCCTGAAGCCGTTGCCTGGCCTGTCTGTGCCCAGAAGATCATGAAC
+CATGTAGAAGAGTCCTTGCATTCCAAAGCCACCCCACAGGTCACACAGGCCTTGAATGTC
+CTGACGACGACCTTCGGGCGCTGCCACAACCCCTGGACAGGGGTCCTCTGGGAGCGGCTA
+AGTCCCCCTGTTGCCCGCCTGTTTGAGAGAGACCCCATTCCTGCCACACACTCGCTCATG
+GACCTGCTTCTCAGTGTGGCCAGGTCTCCTGTGTTGAACTTTGCAGCCTGTGGCCTGTGG
+GAGATGCTGGCCCAGACTCTGAGCCGCCTGAGCCCCACCCAAGCTGGGCCTCTAGCTCTG
+GGGACCCTGAAACTTCAGCATTGTCCCCAGGAACTGAGGACCCAGGCCTTTAGAGTCCTC
+CTTCAGCCACTGGCCTGCATCCTGAAAGCTACCACTCAGGCCCCTGGACCTCCAGGCTTG
+CTGGACGGGACTGCGGGTAGCTTGCTGACTGTGGATGCACTCTTATCTTCAAAGTCGGCC
+TGTGTGGGGCTCCTCTGCCAGACTCTGGCGCACCTGGAGGAGCTGCAGATGCTGCCCCAG
+TGCCCCTCACCGTGGCCACAGGTGCCTCTGCTGCAAGCTGCTGTGACGATATTGCGTCTC
+TCTGACGGCTCGGCGGACCCCAGTTCCAGTGCAGGAGGCCGTCTCTGTGGGGCGCTGGGT
+GGCTGTGTTCGTGTCCAGCGAGCAGCCCTTGACTTCTTGGGGACGCTGTCTCTGGGGACA
+AGCCCCCTGGAATTGGTGCTGGAGGTATTTGCTGTCCTCCTGAAGACCCTGGAGAGCCCA
+GAGTCCAGCCCCATGGTCCTAAAGAAGGCCTTCCAGGCCACACTCAGATGGCTCCAGAGC
+CCACACAAGACCCCCAGCGGCTCTGATCTCAGCCCCGATGCCTTGCTGTTCCTCGGAGAG
+CTATTCCCCATACTACAGAAGCGCCTGTGCAGCCCGTGTTGGGAGGTGAGGGACTCAGCC
+CTGGAGTTCCTGACGCATCTGATCCGGGACTGGGGAGGGCAGGCTGACTTCAGAGAGGCA
+CTGCATTCTTCAGAAGTACCCACACTTGCCCGCCAGCTCCTCCAAGACCCTGAGAGTTAT
+GTCCGAGCAAGTGCAGTGGGTGCCGCTGGGCAGCTCTCCAGCCAGGGCCTTCAGGCCACT
+CCCGCCAACCAGCAGGGCCTACTCATGGACCTCATGCATATCCTGTCCACGGACTCAGAG
+GGCTTCCCTCGAAGAGCTGTGTTACGGGTCTTTACTGAATGGCTGAGGGATGGCCATGCT
+GATGTGGTTCGAGACACAGAGTGGTTCGTGGCCACTGTTCTCCAGGCAGTGAGCCGGGAT
+CTGGACTGGGAGGTCCGAGTGCAGGGCTTGGAGCTGGCACAGGTATTCCTCATCCAGGCA
+ATGGGGCAGCCTAGACTCCACTGTCCCTATACAGTAGGCCTGCCTGGGGCCACCTCTTCC
+CGCCCACACCTGGAATTCTTGCAGACTCTCTGCCGTCTGCCACTCTTTGAGTTTGCCTTT
+TGTGCCTTGCTTGACTGTGACCGCCCGGTGGCCCAAAAAGCCTGTGACCTGCTCCTCTTC
+TTGAGGGACAAGACAGTTTCCTGCAGTAACCCTCAGGAGGCCGGGGACAGCCCCAACTCA
+GCCTCAGTGGAGGCTGCCCTGCAGAGGTGGCGGGAAGGTGAGCAGGCTCAGCCCCTAGGG
+GACCTGGAGCCTGAAGCCATGCTGGCCATCCTCAGGTCCTTAGACCTGGAGGGCCTGCAG
+GGCAGGCTGGCCAAGAGCAGTGACCATGTGGAGAAGAGCCCACAGTCCCTGCTGCAGGAC
+ATGCTGGCCACGGTGGGCGTGTTGGAGGAGAATGAAGCTGACTGCTACTAA
+>ENSMUST00000041588_musmusculus
+ATGGACCCAGAATGCTCCAGGCTCCTCCCGGCTCTCTGTGCTGTTTTGGCAGATCCCAGA
+CAGCTGGTGGCAGATGACACCTGCTTGGAGAAACTGCTGGACTGGTTTAAAACAGTGACA
+GAGGCAGAGTCTAGCCTCCAACTACTACAGGACCATCCCTGCTTAATGGAGCTCCTGTCC
+CATGTGCTGAAGCCACAGGACGTGAGCCCTAGGGTCCTCTCCTTTGCTCTGCGCCTTGTT
+GGGGTCTTCGCAGCCCAGGAAGACTGTTTTGAGTACCTTCAGCAGGGAGAGTTGTTGCTG
+GGGCTCTTTGGGGAGTCAGGTGCCCCCGGCTGGGCAGCCTGGAGCATCCCAAGTGTGCGC
+AGCGGCTGGATCCAGGGTCTGTGCTACCTGGCACACCACCCTAGCGCCCTGCACTTCCTG
+GCTGACAGTGGTGCTGTGGACACGCTCTTCTCCTTGCAGGGAGACCCCAGCCTGTTCGTC
+GCCTCAGCAGCCAGCCAGCTCCTAGTACATATCCTGGCTCTGTCCATGCAAGGTGGAGCC
+CCAGGGTCCCCCGTCCCTGAAGCTGCTGCTTGGCCTATGTGTGCCCAGAAGATTGTGAAC
+CATGTGGATGAGTCCCTGCATGCCAAAGCCACCCCCCAGGTCACACAGGCCTTGAATGTC
+CTGACTACGACCTTCGGGCGCTGCCATAACCCCTGGACAGGGGTCCTCTGGGAGCGGCTA
+AGTCCCCCTGTTGCCCGCCTGTTTGAGAGAGACCCCATTCCAGCCGTGCACGCGCTCATG
+GACCTTCTTCTTAGTGTGGCCAGGTCGCCTGTGTTGAATTTTGCAGCCTGTGGCCTGTGG
+GAGATGCTGGCCCAGACTCTGAGCCGCCTGAGCCCCATACAAGCTGGGCCTCTAGCCCTG
+GGGACCCTGAAACTTCAGCACTGTCCCCAGGAATTGAGGACCCAGGCCTTTGGAGTCCTC
+CTACAGCCACTGGCCTGTATCCTGAAAGCTACCACTCAGGCCCCTGGACCTCCAGGCTTG
+CTGGATGGGACTGTGGGTAGCTTGCTGACTGTGGATATACTCTTGGCTTCAAAGTCAGCC
+TGTGTGGGACTCCTTTGCCAGACTCTGGCTCACCTGGAGGAGCTGCAGATGCTGCCCCAG
+TGCCCCTCACCCTGGCCACAGGTGCATCTGCTGCAAGCTGCTTTGACTATATTGCATCTC
+TGTGATGGCTCAGCGGACCCCAGCTCCAGTGCAGGAGGCCGTCTCTGTGGGACTCTGGGT
+GGCTGTGTTCGTGTCCAGCGAGCAGCCCTTGACTTCTTGGGGACCCTGTCTCAGGGGACA
+AGCCCCCTGGAGTTGGTTCTGGAGGTATTTGCTGTTCTCCTGAAGACCCTGGAGAGCCCA
+GAGTCCAGCCCCATGGTCCTAAAGAAGGCCTTCCAGGCCACACTCAGATGGCTCCAGAAC
+CCACACAAGACCCCCAGCAGCTCTGATCTCAGCTCCGACGCCCTGCTGTTTCTCGGAGAG
+CTGTTCCCCATACTACAGAAGCGCCTATGCAGCCCATGTTGGGAGGTGAGGGACTCTGCC
+CTGGAGTTCCTGACGCATCTGATCCGACACTGGGGAGGGCAGGCTGACTTCAGAGAGGCA
+CTGCGTTCCTCAGAAGTACCCACACTTGCCCTCCAGCTTCTCCAAGACCCAGAGAGTTAC
+GTCCGAGCAAGTGCCGTGGGTGCCGCTGGGCAGCTCTCCAGCCAGGGTCTGCAGGCCGCT
+CCCGCTAGCCCCGAGAACTCGCAGGCCCAACAGGGCCTACTCATGGACCTTATGCATATC
+CTGTCCACTGACTCAGAGGGCTTCCCTCGAAGGGCTGTGTTACGGGTCTTCACGGACTGG
+CTGAGGGATGGCCATGCTGACGTGGTTCGAGACACGGAGTGGTTCGTGGCCACTGTTCTC
+CAGGCAGTGAGCCGGGATCTGGACTGGGAGGTCCGAGTGCAGGGTTTGGAGCTGGCACGG
+GTGTTCCTCACCCAGGCACTGGGCCAGCCCAGCCTCCACTGTCCCTATACAGTGGGCCTG
+CCCAGGGCCTCCTCTCCCCGCCCACACCCGGAATTCTTGCAGACTCTCTGCCGTCTGCCG
+CTCTTTGAGTTTGCCTTTTGTGCCTTGCTTGACTGTGACCGACCGGTGGCCCAAAAGGCC
+TGTGACCTGCTCCTCTTCTTGAGGGACAAGACAGTTCCCTGCAGTAGCCCTCGGGAGGCA
+GGGGACAGCCCCAACTCAGCCTCAGTGGAGGCTGCCCTGCAGAGGTGGCGGGAAGGAGAG
+CAGGCCCAGCCCCTAGGGGACCTGGATCCTGAGGCCATGCTAGCCATCCTCAGGGCCTTA
+GACCTGGAGGGCCTGCAGGGCAGGCTGGCCAAGAGCAGCGACCATGTGGAGAAGAGCCCA
+CAGTCCCTGCTGCAGGACATGCTGGCCACGGTGGGTGTGTTGGAGGAGAACGAAGCTGAC
+TGCTACTAA
+>ENSMUST00000153440_musmusculus
+ATGGACCCAGAATGCTCCAGGCTCCTCCCGGCTCTCTGTGCTGTTTTGGCAGATCCCAGA
+CAGCTGGTGGCAGATGACACCTGCTTGGAGAAACTGCTGGACTGGTTTAAAACAGTGACA
+GAGGCAGAGTCTAGCCTCCAACTACTACAGGACCATCCCTGCTTAATGGAGCTCCTGTCC
+CATGTGCTGAAGCCACAGGACGTGAGCCCTAGGGTCCTCTCCTTTGCTCTGCGCCTTGTT
+GGGGTCTTCGCAGCCCAGGAAGACTGTTTTGAGTACCTTCAGCAGGGAGAGTTGTTGCTG
+GGGCTCTTTGGGGAGTCAGGTGCCCCCGGCTGGGCAGCCTGGAGCATCCCAAGTGTGCGC
+AGCGGCTGGATCCAGGGTCTGTGCTACCTGGCACACCACCCTAGCGCCCTGCACTTCCTG
+GCTGACAGTGGTGCTGTGGACACGCTCTTCTCCTTGCAGGGAGACCCCAGCCTGTTCGTC
+GCCTCAGCAGCCAGCCAGCTCCTAGTACATATCCTGGCTCTGTCCATGCAAGGTGGAGCC
+CCAGGGTCCCCCGTCCCTGAAGCTGCTGCTTGGCCTATGTGTGCCCAGAAGATTGTGAAC
+CATGTGGATGAGTCCCTGCATGCCAAAGCCACCCCCCAGGTCACACAGGCCTTGAATGTC
+CTGACTACGACCTTCGGGCGCTGCCATAACCCCTGGACAGGGGTCCTCTGGGAGCGGCTA
+AGTCCCCCTGTTGCCCGCCTGTTTGAGAGAGACCCCATTCCAGCCGTGCACGCGCTCATG
+GACCTTCTTCTTAGTGTGGCCAGGTCGCCTGTGTTGAATTTTGCAGCCTGTGGCCTGTGG
+GAGATGCTGGCCCAGACTCTGAGCCGCCTGAGCCCCATACAAGCTGGGCCTCTAGCCCTG
+GGGACCCTGAAACTTCAGCACTGGCTTGCTGGATGGGACTGTGGGTAG
+>ENSMUST00000110806_musmusculus
+ATGGACCCAGAATGCTCCAGGCTCCTCCCGGCTCTCTGTGCTGTTTTGGCAGATCCCAGA
+CAGCTGGTGGCAGATGACACCTGCTTGGAGAAACTGCTGGACTGGTTTAAAACAGTGACA
+GAGGCAGAGTCTAGCCTCCAACTACTACAGGACCATCCCTGCTTAATGGAGCTCCTGTCC
+CATGTGCTGAAGCCACAGGACGTGAGCCCTAGGGTCCTCTCCTTTGCTCTGCGCCTTGTT
+GGGGTCTTCGCAGCCCAGGAAGACTGTTTTGAGTACCTTCAGCAGGGAGAGTTGTTGCTG
+GGGCTCTTTGGGGAGTCAGGTGCCCCCGGCTGGGCAGCCTGGAGCATCCCAAGTGTGCGC
+AGCGGCTGGATCCAGGGTCTGTGCTACCTGGCACACCACCCTAGCGCCCTGCACTTCCTG
+GCTGACAGTGGTGCTGTGGACACGCTCTTCTCCTTGCAGGGAGACCCCAGCCTGTTCGTC
+GCCTCAGCAGCCAGCCAGCTCCTAGTACATATCCTGGCTCTGTCCATGCAAGGTGGAGCC
+CCAGGGTCCCCCGTCCCTGAAGCTGCTGCTTGGCCTATGTGTGCCCAGAAGATTGTGAAC
+CATGTGGATGAGTCCCTGCATGCCAAAGCCACCCCCCAGGTCACACAGGCCTTGAATGTC
+CTGACTACGACCTTCGGGCGCTGCCATAACCCCTGGACAGGGGTCCTCTGGGAGCGGCTA
+AGTCCCCCTGTTGCCCGCCTGTTTGAGAGAGACCCCATTCCAGCCGTGCACGCGCTCATG
+GACCTTCTTCTTAGTGTGGCCAGGTCGCCTGTGTTGAATTTTGCAGCCTGTGGCCTGTGG
+GAGATGCTGGCCCAGACTCTGAGCCGCCTGAGCCCCATACAAGCTGGGCCTCTAGCCCTG
+GGGACCCTGAAACTTCAGCACTGTCCCCAGGAATTGAGGACCCAGGCCTTTGGAGTCCTC
+CTACAGCCACTGGCCTGTATCCTGAAAGCTACCACTCAGGCCCCTGGACCTCCAGGCTTG
+CTGGATGGGACTGTGGGTAGCTTGCTGACTGTGGATATACTCTTGGCTTCAAAGTCAGCC
+TGTGTGGGACTCCTTTGCCAGACTCTGGCTCACCTGGAGGAGCTGCAGATGCTGCCCCAG
+TGCCCCTCACCCTGGCCACAGGTGCATCTGCTGCAAGCTGCTTTGACTATATTGCATCTC
+TGTGATGGCTCAGCGGACCCCAGCTCCAGTGCAGGAGGCCGTCTCTGTGGGACTCTGGGT
+GGCTGTGTTCGTGTCCAGCGAGCAGCCCTTGACTTCTTGGGGACCCTGTCTCAGGGGACA
+AGCCCCCTGGAGTTGGTTCTGGAGGTATTTGCTGTTCTCCTGAAGACCCTGGAGAGCCCA
+GAGTCCAGCCCCATGGTCCTAAAGAAGGCCTTCCAGGCCACACTCAGATGGCTCCAGAAC
+CCACACAAGACCCCCAGCAGCTCTGATCTCAGCTCCGACGCCCTGCTGTTTCTCGGAGAG
+CTGTTCCCCATACTACAGAAGCGCCTATGCAGCCCATGTTGGGAGGTGAGGGACTCTGCC
+CTGGAGTTCCTGACGCATCTGATCCGACACTGGGGAGGGCAGGCTGACTTCAGAGAGGCA
+CTGCGTTCCTCAGAAGTACCCACACTTGCCCTCCAGCTTCTCCAAGACCCAGAGAGTTAC
+GTCCGAGCAAGTGCCGTGGGTGCCGCTGGGCAGCTCTCCAGCCAGGGTCTGCAGGCCGCT
+CCCGCTAGCCCCGAGAACTCGCAGGCCCAACAGGTAGACACAGGGAGTTGGTGA
+>ENSMUST00000100505_musmusculus
+ATGGTGCATTTTGCACTCTCGGGCCTAATTCCCGTAGCGGAGGGATGCGGGGGCGGGATT
+AGAACCCCTAGGCTAACTCGCAGTCGCCGAGAGCGCACCTCTTACCCGGATTTGGGAGGA
+ACTGCCTGCCTGATCATGGACCCAGAATGCTCCAGGCTCCTCCCGGCTCTCTGTGCTGTT
+TTGGCAGATCCCAGACAGCTGGTGGCAGATGACACCTGCTTGGAGAAACTGCTGGACTGG
+TTTAAAACAGTGACAGAGGCAGAGTCTAGCCTCCAACTACTACAGGACCATCCCTGCTTA
+ATGGAGCTCCTGTCCCATGTGCTGAAGCCACAGGACGTGAGCCCTAGGGTCCTCTCCTTT
+GCTCTGCGCCTTGTTGGGGTCTTCGCAGCCCAGGAAGACTGTTTTGAGTACCTTCAGCAG
+GGAGAGTTGTTGCTGGGGCTCTTTGGGGAGTCAGGTGCCCCCGGCTGGGCAGCCTGGAGC
+ATCCCAAGTGTGCGCAGCGGCTGGATCCAGGGTCTGTGCTACCTGGCACACCACCCTAGC
+GCCCTGCACTTCCTGGCTGACAGTGGTGCTGTGGACACGCTCTTCTCCTTGCAGGGAGAC
+CCCAGCCTGTTCGTCGCCTCAGCAGCCAGCCAGCTCCTAGTACATATCCTGGCTCTGTCC
+ATGCAAGGTGGAGCCCCAGGGTCCCCCGTCCCTGAAGCTGCTGCTTGGCCTATGTGTGCC
+CAGAAGATTGTGAACCATGTGGATGAGTCCCTGCATGCCAAAGCCACCCCCCAGGTCACA
+CAGGCCTTGAATGTCCTGACTACGACCTTCGGGCGCTGCCATAACCCCTGGACAGGGGTC
+CTCTGGGAGCGGCTAAGTCCCCCTGTTGCCCGCCTGTTTGAGAGAGACCCCATTCCAGCC
+GTGCACGCGCTCATGGACCTTCTTCTTAGTGTGGCCAGGTCGCCTGTGTTGAATTTTGCA
+GCCTGTGGCCTGTGGGAGATGCTGGCCCAGACTCTGAGCCGCCTGAGCCCCATACAAGCT
+GGGCCTCTAGCCCTGGGGACCCTGAAACTTCAGCACTGTCCCCAGGAATTGAGGACCCAG
+GCCTTTGGAGTCCTCCTACAGCCACTGGCCTGTATCCTGAAAGCTACCACTCAGGCCCCT
+GGACCTCCAGGCTTGCTGGATGGGACTGTGGGTAGCTTGCTGACTGTGGATATACTCTTG
+GCTTCAAAGTCAGCCTGTGTGGGACTCCTTTGCCAGACTCTGGCTCACCTGGAGGAGCTG
+CAGATGCTGCCCCAGTGCCCCTCACCCTGGCCACAGGTGCATCTGCTGCAAGCTGCTTTG
+ACTATATTGCATCTCTGTGATGGCTCAGCGGACCCCAGCTCCAGTGCAGGAGGCCGTCTC
+TGTGGGACTCTGGGTGGCTGTGTTCGTGTCCAGCGAGCAGCCCTTGACTTCTTGGGGACC
+CTGTCTCAGGGGACAAGCCCCCTGGAGTTGGTTCTGGAGGTATTTGCTGTTCTCCTGAAG
+ACCCTGGAGAGCCCAGAGTCCAGCCCCATGGTCCTAAAGAAGGCCTTCCAGGCCACACTC
+AGATGGCTCCAGAACCCACACAAGACCCCCAGCAGCTCTGATCTCAGCTCCGACGCCCTG
+CTGTTTCTCGGAGAGCTGTTCCCCATACTACAGAAGCGCCTATGCAGCCCATGTTGGGAG
+GTGAGGGACTCTGCCCTGGAGTTCCTGACGCATCTGATCCGACACTGGGGAGGGCAGGCT
+GACTTCAGAGAGGCACTGCGTTCCTCAGAAGTACCCACACTTGCCCTCCAGCTTCTCCAA
+GACCCAGAGAGTTACGTCCGAGCAAGTGCCGTGGGTGCCGCTGGGCAGCTCTCCAGCCAG
+GGTCTGCAGGCCGCTCCCGCTAGCCCCGAGAACTCGCAGGCCCAACAGGGCCTACTCATG
+GACCTTATGCATATCCTGTCCACTGACTCAGAGGGCTTCCCTCGAAGGGCTGTGTTACGG
+GTCTTCACGGACTGGCTGAGGGATGGCCATGCTGACGTGGTTCGAGACACGGAGTGGTTC
+GTGGCCACTGTTCTCCAGGCAGTGAGCCGGGATCTGGACTGGGAGGTCCGAGTGCAGGGT
+TTGGAGCTGGCACGGGTGTTCCTCACCCAGGCACTGGGCCAGCCCAGCCTCCACTGTCCC
+TATACAGTGGGCCTGCCCAGGGCCTCCTCTCCCCGCCCACACCCGGAATTCTTGCAGACT
+CTCTGCCGTCTGCCGCTCTTTGAGTTTGCCTTTTGTGCCTTGCTTGACTGTGACCGACCG
+GTGGCCCAAAAGGCCTGTGACCTGCTCCTCTTCTTGAGGGACAAGACAGTTCCCTGCAGT
+AGCCCTCGGGAGGCAGGGGACAGCCCCAACTCAGCCTCAGTGGAGGCTGCCCTGCAGAGG
+TGGCGGGAAGGAGAGCAGGCCCAGCCCCTAGGGGACCTGGATCCTGAGGCCATGCTAGCC
+ATCCTCAGGGCCTTAGACCTGGAGGGCCTGCAGGGCAGGCTGGCCAAGAGCAGCGACCAT
+GTGGAGAAGAGCCCACAGTCCCTGCTGCAGGACATGCTGGCCACGGTGGGTGTGTTGGAG
+GAGAACGAAGCTGACTGCTACTAA
+>ENSCAFT00000025950_canisfamiliaris
+ATGGACCCAGAGTGCTCCCAGCTCCTCCCGGCCCTCTGTGCAGTTCTGGCAGACCCCAGG
+CAGCCCGTGGCAGATGACACCTGTTTGGAGAAGCTGCTGGATTGGTTTAAAACGATAACC
+AAAGCTGGGTCCAGTCTCCTGTTATTACAGGAGAACCCCTGTCTGGTGGAGCTGCTGTGT
+CACGTGCTGAAACCCCAGGACCTGAGTTCCAGAGTCCTCTCCTTCTCTCTCCGCCTCGCA
+GGGGTATTTGCAGCCCAGGAAGATTGCTTCCAGTATCTTCAGCAGGGGGAGTTGCTGCCC
+AGGCTCTTTGGGGAGCCAGGGCCCCTGGGAGGAGCTGCCTGGACTGCCCCCTCAGTGCGC
+AGTGGCTGGATCCAGGGCCTGCGCTCCCTGGCACAGCATCCTAGTGCCCTGCATTTCCTG
+GCTGACTGTGGTGCCGTTGACACCATCTTCTCCCTGCAGGGAGATTCCAGCCTGTTTGTG
+GCCTCGGCAGCTGGGCAGCTCCTGGTGCACATCCTGGGCTTGTCCATGCAAGGCCTAGCC
+GAGGGACACCCCAGCCTGCAGGCTGGTGATTGGCCAGTGTGTGCCCAGAAGATCGTGGGT
+CACATAGAAGAGTCCCTGCACTCCACAGCCGTCCCGCAGATCACACAGGCTCTAAACGTC
+CTGACTACCACGTTCGGGCACTGCCATGACCCTTGGACACAAGTTCTGTGGGTACGGCTG
+AGTCCCCTAGTAGGCAGTCTACTTGAGAAAGACCCTGTCCCAGCTGCACACTCGCTCGTG
+GACCTCCTCCTCAGTGTGGCCCGTTCTCCTGGGCTGAGCTCTTCTAGCTGCGGCCTGTGG
+GAGACTCTGGCTCAGACTCTGAACCATCTGAGCCCTACCCAAGCAGGGCCGCTGGCGTTA
+GGGATCCTGAAACTGCAGGACTGTCCACAGGTGCTAAGGGCCCAGGCCTTTGTCATTCTT
+CTCCAGCCTCTGGCCTGCGTCCTTAAAGCCACGGGTCAGGACCCCGGACCCTCAGGTGTG
+CTGGACAGTGCCACAGGTGACTCTCTGACAGTGGACGTGCTCCTCTCCTCCAAGGCGGCC
+TGTGTGGGTCTCCTGTGCCGGACTCTGGCCCACCTGGAGCTGCTGCAGCCGCTACCCCAG
+CGCCCCTGCCCCTGGCCTCAGGAGCCCCTGCTTGGGGCCGCGGTGACCCTGCTGCAGTTA
+TGCAGGGGCTCAGCAAGCCCTGCCTCTGACGTGGGGCGCCACCTCTGCGCGCTCCTGCTG
+GGCTGCGTGCGGGTGCAGCGAGCGGCCCTGGATTTCCTGGGGACGCTGTCTCAGGGGACA
+GGCCCCCAAGAGCTGGTGACGGAGGTGTTTGCTGTCCTTCTGGAATATCTCAGGAGCCCA
+GACTCCAGCCCCACGGTTCTGAAGAAAGCCTTCCAGGCCACATTCAGGTGGCTCCTGAGC
+TCACCCAAGACCCCCGGCTGCTGTGATCTAGAACCCCATGCCCTGCTGGTCCTGAGAGAG
+CTGCTTCCTGTGCTGCAGAAGCGTCTGTGCAGCCCCTGCTGGGAGGTGAGGGACTCCGGC
+CTCGAGTTCCTGACTCAGATGACCAGACACTGGGGAGGGCAGGCTGGCTTCAGACATGCA
+CTCCTCGCTTCGGAGGTGCCCAAGCTTACCGAGCAGCTCCTACGAGACCCTGAGAGTTAC
+GTCCGTGCCAGTGCAGTGACCGTCATGGGGCAGCTCTCCAGCCAGGGGCTGCATGTCACC
+CCTGTGAGCCCTGAGCATCCAGGGGGCCAGCAGAAGAGTCTGCTCGTGGAGCTTCTGCAT
+ATCCTCTCCACAGATTCAGAGGGATTCCCGCGGAGAGCCGTCATGCAGGTCTTCACCCAG
+TGGCTGAGGGACCACCATGCCGACGTGGCGGGGGACACGGAACAGTTTATGGCCAGGGTG
+CTCCAGGTCGCCAGCCAGGATCTGGACTGGGAGGTCCGGGCCCAGGGCCTGGAGCTGGCG
+CTGGTATTCCTGGAGCAGACGCTGGGCCAGTTCCACTCCCACTGTCCCTATGCTGTGACC
+CCACCCGTGGCGGCCCCAGCTGGCTCGCTGGCCCAGGCCCTGCAGCCACTATGCCGAGTG
+CGGCTCTTTGAGTTTGCCTTCCGTGCCTTGTTTGACTGTGACCGACCTGTGGCTCAGAAG
+TCCTGTGATCTCCTCCTCTTCCTGAGGGCCAAGACTGCTTCTTCCTCTGGTAGCCTGGAG
+GAGTCCAGGAGCGGCCCAGATGTGGCCTCTGTGGAGGCTGCCTTGCAGAGGTGGCAGGCA
+GGTGATCAGGGCCAGCCCCTGGGGGACCTGGAGCCCGAGGTCGTGCTGGCTGTGCTGAGG
+TCTGTGGACCTGGAAGGCCTTCGGGGTGCATTAGCCGAGGGCAGTGACCACATGGAGAAG
+AGCCCTCAGTCACTCCTGCAGGACATGCTGGCCACGGTGGGCGTCCTGGGAGAGAACGAG
+GCCGACTGCTACTGA
+>ENSSSCT00000008295_susscrofa
+ATGGACCCGGAGTGCTCCCGGCTCCTCCCGGCTCTCTGTGCCGTCCTGGCAGACCCCCGG
+CAGCCTGTGGCAGATGATACTTGCTTGGAGAAGCTGCTGGACTGGTTTAAAACAATAACT
+GAAGCAGGGTCCAGTCTCCTGGTGCTACAGGAAAATCCCTGCCTGGTGGAGCTGCTGTTC
+GACGTGCTGAAACCCCAGGACCTGAGTCCCAGAGTCCTCTCCTTCTCACTCCGCCTCGCA
+GGCATGTTCGCAGCCCAGGAAGACTGCTTCCAGTACCTTCAGCAGGGGGAGTTGCTGCCC
+AGGCTGTTTGGGGAGGCGGGCCCCCTGGGAGGAGCGGCCTGGACGGCCCCGACCGTGCGC
+AGCGGCTGGATCCAGGGCCTGCGCTCCCTGGCGCAGCACCCTCGCGCCCTGCCCTTCCTT
+GCCGACTGTGGTGCCGTTGACACCATCTTCTCCCTGCAGGGAGATTCCAGCCTGTTTGTG
+GCCTCGGCAGCCGGGCAGCTCCTGGTGCACATCCTGGACTTGGCGATGCGAGCCCCGCCC
+CGGGGACACCCCGGCCCGCAGGCGTGTGACGGGCCAGCGTGCGCCCAGAAGATCGTGTGT
+CACCTCGAAGACTCCCTGCGCGCCGCAGCCGCCCCGCAGCTCACGCAGGCCCTGAATGTC
+CTGACCACCACGTTCGGGCACTGCCACGGCCTTTGGACGCCGGGCCTTTGGGGGCGGCTG
+AGCCCTCTTGTGGGGCACCTGCTCGAGAAAGACCCCGTCCCAGCCTCGCACGCGCTCGTG
+GACCTCCTCCTCAGCGTGGCCCGGTCCCCTGTGCTGAGTTCTGAGAGTGGCCCGTGGGAG
+ACTTTGGCGCTGACTCTGAGCCGCTTGAGCCCGATGCAAGCAGGGCCTCTGGCTTTGGGG
+ATCCTGAAGCTGCAGGACTGCCCACAGGCCTTGAGGACCCAGGCCTCTGGCGTCCTCCTC
+CAGCCCCTGGCCTGTGTCCTGAAAGCTGCTGTGCAGGGCCCCGGACGCCCAGGTAGGCTG
+CTGGGGAAGGGGGGCAGGTGCAGGATGGCAGGACCGTGGGGGCCTGAGCGCATCCTTGGG
+GCCGGCGCAGGCTGTCATCCCAGGTGTGACTGCTGCTCCTGTTGCCACCCTGGAANCAGT
+GCCCTTGGCCTGGCCCAAGAGGCCCGCCTGAGGCTGTGTGACAATGCTGCGATCCCCCGC
+TCTGACCTGGGGGGCCAATTCTGTGGCCACCTGGTGGCCTGTGTCCGAGTCCAGCGAGCG
+GCCCTGGATTTCCTGGGGACGCTGTCTCAGAGGGCGGGCCCCCAAGAGCTGGTGACGCAG
+GTTTCTGCTGTCCTCCTGGAGTACCTTTCAGGCCCTGACTCCAGCCCCACGGTTCTGAAG
+AAGGCCTTCCAGGCCTCACTCGGGTGGCTCCTGAGCTCACCCAAGACCCCCGGCTGCTGC
+GATCTGGACCCCCACGCCCAGCAGTTCCTCAGAGAGCTGCTCCCTGTGCTGCAGAAGCGC
+CTGTGCAGCCCCTGCTGGGAGGTGAGGGACTCAGGCCTTGAGTTCCTGACCCAGATGGCC
+AGACACTGGGGAGGGCAGGCCGCCTTCAGACAGGTGCTCCTTGCTTCCGAGGTGCCCAGG
+CTCACCAGGCAGCTCCTGCAAGACCCCGAGAGTTACGTCCGCGCAAGCGCAGTGACCGCC
+ACAGGGCAGCTGTCTAGCTGGGGGCTGCATGCTGCCCCCGCCGGCCCTGAGCACCCAGGG
+GTCCAGCAGAAGAGCCTCCTGTCGGAGCTCCTGCACGTCCTCGCCACAGACTCGGAGGGC
+TTCCCCCGGAGGGCCGTCATGCAGGTCTTCACCGAGTGGCTGAGGGGCGGCCATGCTGAC
+GTGGCCGAGGACCCAGAGCAGTTTGTGGCCGGAGTGCTCCAGGCCGCGAGCAGGGACCTG
+GACTGGGAGGTCCGGGCCCAGGGCCTCGAGCTGGCGCTGGTGTTCCTGGAGCAGCTGCTG
+GGCCCGCCCGGCGTGCGCTGTCCCTACGCCGTGGCCCTGCCCAAGGCAGCCCCGCCTGGC
+ACGCTGGCCCAGGCCTTGCAGGCACTGTGCCGAGTGCAGCTCTTCGAGTTCGCCTTCCGT
+GCCTTGTTCGACTGCGACCGACCTGTGGCGCAGAAGTCCTGTGACCTCCTCCTCTTCCTG
+AAGGCCAAGGCCACTTCCTGCGGCACCCCCCAGGAGGAACGGGACAGCCCCGACGTGTCC
+TCCGTGGAGGCCACACTGCAGAAGTGGCAGGCAGGGGAGCACGGACACCCCCTGGGGGAC
+CTGGAGCCCGCGGCTGTTGTGGCCGTGCTCAGGTCCATGGACTTGGAAGGCCTTCAGGAC
+ACACTGGCCGAGAGCAGTGACCACGTGGAGAGGAGCCCCCAGTCGCTCCTGCAGGACATG
+CTGGCCACCGTGGGCGTCCTCGGGGAGAATGAGGCCGACTGCTACTGA
+>ENSPTRT00000019089_pantroglodytes
+ATAGGCACCGGGGGCCGGCGGGGGGCGGCGGCCGCGCCGCTGCTGGTGGCGGTGGCCGCG
+CTTCTACTGGGCGCCGCGGGCCACCTGTACCCCGGAGAGGTGTGTCCCGGCATGGATATC
+CGGAACAACCTCACTAGGTTGCATGAGCTGGAGAATTGCTCTGTCATCGAAGGACACTTG
+CAGATACTCTTGATGTTCAAAACGAGGCCCGAAGATTTCCGAGACCTCAGTTTCCCCAAA
+CTCATAATGATCACTGATTACTTGCTGCTCTTCCGGGTCTATGGGCTCGAGAGCCTGAAG
+GACCTGTTCCCCAACCTCACGGTCATCCGGGGGTCACGACTGTTCTTTAACTACGCGCTG
+GTCATCTTCGAGATGGTTCACCTCAAGGAACTCGGCCTCTACAACCTGATGAACATCACC
+CGGGGTTCTGTCCGCATCGAGAAGAACAATGAGCTCTGTTACTTGGCCACTATCGACTGG
+TCCCGTATCCTGGATTCCGTGGAGGATAATTACATCGTGTTGAACAAAGATGACAACGAG
+GAGTGTGGAGACATCTGTCCGGGTACCGCGAAGGGCAAGACCAACTGCCCCGCCACCGTC
+ATCAACGGGCAGTTTGTCGAACGATGTTGGACTCACAGTCACTGCCAGAAAGTTTGCCCG
+ACCATCTGTAAGTCACACGGCTGCACCGCCGAAGGCCTCTGTTGCCACAGCGAGTGCCTG
+GGCAACTGTTCTCAGCCCGACGACCCCACCAAGTGCGTGGCCTGCCGCAACTTCTACCTG
+GACGGCAGGTGTGTGGAGACCTGCCCGCCCCCGTACTACCACTTCCAGGACTGGCGCTGT
+GTGAACTTCAGCTTCTGCCAGGACCTGCACCACAAATGCAAGAACTCGCGGAGGCAGGGC
+TGCCACCAGTACGTCATTCACAACAACAAGTGCATCCCTGAGTGTCCCTCCGGGTACACG
+ATGAATTCCAGCAACTTGCTGTGCACCCCATGCCTGGGTCCCTGTCCCAAGGTGTGCCAC
+CTCCTAGAAGGCGAGAAGACCATCGACTCGGTGACGTCTGCCCAGGAGCTCCGAGGATGC
+ACCGTCATCAACGGGAGTCTGATCATCAACATTCGAGGAGGCAACAATCTGGCAGCTGAG
+CTAGAAGCCAACCTCGGCCTCATTGAAGAAATTTCAGGGTATCTAAAAATCCGCCGATCC
+TACGCTCTGGTGTCACTTTCCTTCTTCCGGAAGTTACGTCTGATTCGAGGAGAGACCTTG
+GAAATCGGGAACTACTCCTTCTATGCCTTGGACAACCAGAACCTAAGGCAGCTCTGGGAT
+TGGAGCAAACACAACCTCACCATCACTCAGGGGAAACTCTTCTTCCACTATAACCCCAAA
+CTCTGCTTGTCAGAAATCCACAAGATGGAAGAAGTTTCAGGAACCAAGGGGCGCCAGGAG
+AGAAACGACATTGCCCTGAAGACCAATGGGGACCAGGCATCCTGTGAAAATGAGTTACTT
+AAATTTTCTTACATTCGGACATCTTTTGACAAGATCTTGCTGAGATGGGAGCCGTACTGG
+CCCCCCGACTTCCGAGACCTCTTGGGGTTCATGCTGTTCTACAAAGAGGCCCCTTATCAA
+AATGTGACGGAGTTCGACGGGCAGGATGCATGTGGTTCCAACAGTTGGACGGTGGTAGAC
+ATTGACCCACCCCTGAGGTCCAACGACCCCAAATCACAGAACCACCCAGGGTGGCTGATG
+CGGGGTCTGAAGCCCTGGACCCAGTATGCCATCTTCGTGAAGACCCTGGTCACCTTTTCG
+GATGAACGCCGGACCTATGGGGCCAAGAGTGACATCATTTATGTCCAGACAGATGCCACC
+AACCCCTCCGTGCCCCTGGATCCAATCTCAGTGTCTAACTCATCATCCCAGATTATTTTG
+AAGTGGAAACCCCCCTCCGACCCCAATGGCAACATCACCCACTACCTGGTTTTCTGGGAG
+AGGCAGGCGGAAGACAGTGAGCTGTTCGAACTGGATTATTGCCTCAAATGGTGTGTGTGG
+TGTGTGTGTGTGGTTGTTTGTTTGTGGAGTGTGTGTGAGTATGAGGATTCGGCCGGCGAA
+TGCTGCTCCTGTCCAAAGACAGACTCTCAGATCCTGAAGGAGCTGGAGGAGTCCTCGTTT
+AGGAAGACGTTTGAGGATTACCTGCACAACGTGGTTTTCGTCCCCAGAAAAACCTCTTCA
+GGCACTGGTGCCGAGGACCCTAGGCCATCTCGGAAACGCAGGTCCCTTGGCGATGTTGGG
+AATGTGACGGTGGCCGTGCCCACGGTGGCAGCTTTCCCCAACACTTCCTCGACCAGCGTG
+CCCACGAGTCCGGAGGAGCACAGGCCTTTTGAGAAGGTGGTGAACAAGGAGTCGCTGGTC
+ATCTCCGGCTTGCGACACTTCACGGGCTATCGCATCGAGCTGCAGGCTTGCAACCAGGAC
+ACCCCTGAGGAACGGTGCAGTGTGGCAGCCTACGTCAGTGCCAGGACCATGCCTGAAGCC
+AAGGCTGATGACATTGTCGGCCCTGTGACGCATGAAATCTTTGAGAACAACGTTGTCCAC
+TTGATGTGGCAGGAGCCGAAGGAGCCCAATGGTCTGATCGTGCTGTATGAAGTGAGTTAT
+CGGCGATATGGTGATGAGGAGCTGCATCTCTGCGTCTCCCGCAAGCACTTCGCTCTGGAG
+CGGGGCTGCAGGCTGCGTGGGCTGTCACCGGGGAACTACAGCGTGCGAGTCCGGGCCACC
+TCCCTTGCGGGCAACGGCTCTTGGACGGAACCCACCTATTTCTACGTGACAGACTATTTA
+GATGTCCCGTCAAATATTGCAAAAATTATCATCGGCCCCCTCATCTTTGTCTTTCTCTTC
+AGTGTTGTGATTGGAAGTATTTATCTATTCCTGAGAAAGAGGCAGCCAGATGGGCCGCTG
+GGACCGCTTTACGCTTCTTCAAACCCTGAGTATCTCAGTGCCAGTGATGTGTTTCCATGC
+TCTGTGTACGTGCCGGACGAGTGGGAGGTGCCTCGAGAGAAGATCACCCTCCTTCGAGAG
+CTGGGGCAGGGCTCCTTCGGCATGGTGTATGAGGGCAATGCCAGGGACATCATCAAGGGT
+GAGGCAGAGACCCGCGTGGCGGTGAAGACGGTCAACGAGTCAGCCAGTCTCCGAGAGCGG
+ATTGAGTTCCTCAATGAGGCCTCGGTCATGAAGGGCTTCACCTGCCATCATGTGGTGCGC
+CTCCTGGGAGTGGTGTCCAAGGGCCAGCCCACACTGGTGGTGATGGAGCTGATGGCTCAC
+GGAGACCTGAAGAGCTACCTCCGTTCTCTGCGGCCAGAGGCTGAGAATAATCCCGGCCGC
+CCTCCCCCTACCCTTCAAGAGATGATTCAGATGGCGGCAGAGATTGCTGATGGGATGGCC
+TACCTGAACGCCAAGAAGTTTGTGCATCGGGACCTGGCAGCGAGAAACTGCATGGTCGCC
+CATGATTTTACTGTCAAAATTGGAGACTTTGGAATGACCAGAGACATCTATGAAACGGAT
+TACTACCGGAAAGGGGGCAAGGGTCTGCTCCCTGTACGGTGGATGGCGCCAGAGTCCCTG
+AAGGATGGGGTCTTCACCACTTCTTCTGACATGTGGTCCTTTGGCGTGGTCCTTTGGGAA
+ATCACCAGCTTGGCAGAACAGCCTTACCAAGGCCTGTCTAATGAACAGGTGTTGAAATTT
+GTCATGGATGGAGGGTATCTGGATCAACCCGACAACTGTCCAGAGAGAGTCACTGACCTC
+ATGCGCATGTGCTGGCAATTCAACCCCAAGATGAGGCCAACCTTCCTGGAGATTGTCAAC
+CTGCTCAAGGACGACCTGCACCCCAGCTTTCCGGAGGTGTCGTTCTTCCACAGCGAGGAG
+AACAAGGCTCCCGAGAGCGAGGAGCTGGAGATGGAGTTTGAGGACATGGAGAATGTGCCC
+CTGGACCGTTCCTCGCACTGTCAGAGGGAGGAGGCGGGGGGCCGGGATGGAGGGTCCTCA
+CTAGGTTTCAAGCGGAGCTACGAGGAACACATCCCTTACACACACATGAACGGAGGCAAG
+AAAAACGGGCGGATTCTGACCTTGCCTCGGTCCAATCCTTCCTAA
+>ENST00000341500_homosapiens
+ATGGCCACCGGGGGCCGGCGGGGGGCGGCGGCCGCGCCGCTGCTGGTGGCGGTGGCCGCG
+CTGCTACTGGGCGCCGCGGGCCACCTGTACCCCGGAGAGGTGTGTCCCGGCATGGATATC
+CGGAACAACCTCACTAGGTTGCATGAGCTGGAGAATTGCTCTGTCATCGAAGGACACTTG
+CAGATACTCTTGATGTTCAAAACGAGGCCCGAAGATTTCCGAGACCTCAGTTTCCCCAAA
+CTCATCATGATCACTGATTACTTGCTGCTCTTCCGGGTCTATGGGCTCGAGAGCCTGAAG
+GACCTGTTCCCCAACCTCACGGTCATCCGGGGATCACGACTGTTCTTTAACTACGCGCTG
+GTCATCTTCGAGATGGTTCACCTCAAGGAACTCGGCCTCTACAACCTGATGAACATCACC
+CGGGGTTCTGTCCGCATCGAGAAGAACAATGAGCTCTGTTACTTGGCCACTATCGACTGG
+TCCCGTATCCTGGATTCCGTGGAGGATAATTACATCGTGTTGAACAAAGATGACAACGAG
+GAGTGTGGAGACATCTGTCCGGGTACCGCGAAGGGCAAGACCAACTGCCCCGCCACCGTC
+ATCAACGGGCAGTTTGTCGAACGATGTTGGACTCATAGTCACTGCCAGAAAGTTTGCCCG
+ACCATCTGTAAGTCACACGGCTGCACCGCCGAAGGCCTCTGTTGCCACAGCGAGTGCCTG
+GGCAACTGTTCTCAGCCCGACGACCCCACCAAGTGCGTGGCCTGCCGCAACTTCTACCTG
+GACGGCAGGTGTGTGGAGACCTGCCCGCCCCCGTACTACCACTTCCAGGACTGGCGCTGT
+GTGAACTTCAGCTTCTGCCAGGACCTGCACCACAAATGCAAGAACTCGCGGAGGCAGGGC
+TGCCACCAGTACGTCATTCACAACAACAAGTGCATCCCTGAGTGTCCCTCCGGGTACACG
+ATGAATTCCAGCAACTTGCTGTGCACCCCATGCCTGGGTCCCTGTCCCAAGGTGTGCCAC
+CTCCTAGAAGGCGAGAAGACCATCGACTCGGTGACGTCTGCCCAGGAGCTCCGAGGATGC
+ACCGTCATCAACGGGAGTCTGATCATCAACATTCGAGGAGGCAACAATCTGGCAGCTGAG
+CTAGAAGCCAACCTCGGCCTCATTGAAGAAATTTCAGGGTATCTAAAAATCCGCCGATCC
+TACGCTCTGGTGTCACTTTCCTTCTTCCGGAAGTTACGTCTGATTCGAGGAGAGACCTTG
+GAAATTGGGAACTACTCCTTCTATGCCTTGGACAACCAGAACCTAAGGCAGCTCTGGGAC
+TGGAGCAAACACAACCTCACCATCACTCAGGGGAAACTCTTCTTCCACTATAACCCCAAA
+CTCTGCTTGTCAGAAATCCACAAGATGGAAGAAGTTTCAGGAACCAAGGGGCGCCAGGAG
+AGAAACGACATTGCCCTGAAGACCAATGGGGACCAGGCATCCTGTGAAAATGAGTTACTT
+AAATTTTCTTACATTCGGACATCTTTTGACAAGATCTTGCTGAGATGGGAGCCGTACTGG
+CCCCCCGACTTCCGAGACCTCTTGGGGTTCATGCTGTTCTACAAAGAGGCCCCTTATCAG
+AATGTGACGGAGTTCGACGGGCAGGATGCGTGTGGTTCCAACAGTTGGACGGTGGTAGAC
+ATTGACCCACCCCTGAGGTCCAACGACCCCAAATCACAGAACCACCCAGGGTGGCTGATG
+CGGGGTCTCAAGCCCTGGACCCAGTATGCCATCTTTGTGAAGACCCTGGTCACCTTTTCG
+GATGAACGCCGGACCTATGGGGCCAAGAGTGACATCATTTATGTCCAGACAGATGCCACC
+AACCCCTCTGTGCCCCTGGATCCAATCTCAGTGTCTAACTCATCATCCCAGATTATTCTG
+AAGTGGAAACCACCCTCCGACCCCAATGGCAACATCACCCACTACCTGGTTTTCTGGGAG
+AGGCAGGCGGAAGACAGTGAGCTGTTCGAGCTGGATTATTGCCTCAAAGGGCTGAAGCTG
+CCCTCGAGGACCTGGTCTCCACCATTCGAGTCTGAAGATTCTCAGAAGCACAACCAGAGT
+GAGTATGAGGATTCGGCCGGCGAATGCTGCTCCTGTCCAAAGACAGACTCTCAGATCCTG
+AAGGAGCTGGAGGAGTCCTCGTTTAGGAAGACGTTTGAGGATTACCTGCACAACGTGGTT
+TTCGTCCCCAGGCCATCTCGGAAACGCAGGTCCCTTGGCGATGTTGGGAATGTGACGGTG
+GCCGTGCCCACGGTGGCAGCTTTCCCCAACACTTCCTCGACCAGCGTGCCCACGAGTCCG
+GAGGAGCACAGGCCTTTTGAGAAGGTGGTGAACAAGGAGTCGCTGGTCATCTCCGGCTTG
+CGACACTTCACGGGCTATCGCATCGAGCTGCAGGCTTGCAACCAGGACACCCCTGAGGAA
+CGGTGCAGTGTGGCAGCCTACGTCAGTGCGAGGACCATGCCTGAAGCCAAGGCTGATGAC
+ATTGTTGGCCCTGTGACGCATGAAATCTTTGAGAACAACGTCGTCCACTTGATGTGGCAG
+GAGCCGAAGGAGCCCAATGGTCTGATCGTGCTGTATGAAGTGAGTTATCGGCGATATGGT
+GATGAGGAGCTGCATCTCTGCGTCTCCCGCAAGCACTTCGCTCTGGAACGGGGCTGCAGG
+CTGCGTGGGCTGTCACCGGGGAACTACAGCGTGCGAATCCGGGCCACCTCCCTTGCGGGC
+AACGGCTCTTGGACGGAACCCACCTATTTCTACGTGACAGACTATTTAGACGTCCCGTCA
+AATATTGCAAAAATTATCATCGGCCCCCTCATCTTTGTCTTTCTCTTCAGTGTTGTGATT
+GGAAGTATTTATCTATTCCTGAGAAAGAGGCAGCCAGATGGGCCGCTGGGACCGCTTTAC
+GCTTCTTCAAACCCTGAGTATCTCAGTGCCAGTGATGTGTTTCCATGCTCTGTGTACGTG
+CCGGACGAGTGGGAGGTGTCTCGAGAGAAGATCACCCTCCTTCGAGAGCTGGGGCAGGGC
+TCCTTCGGCATGGTGTATGAGGGCAATGCCAGGGACATCATCAAGGGTGAGGCAGAGACC
+CGCGTGGCGGTGAAGACGGTCAACGAGTCAGCCAGTCTCCGAGAGCGGATTGAGTTCCTC
+AATGAGGCCTCGGTCATGAAGGGCTTCACCTGCCATCACGTGGTGCGCCTCCTGGGAGTG
+GTGTCCAAGGGCCAGCCCACGCTGGTGGTGATGGAGCTGATGGCTCACGGAGACCTGAAG
+AGCTACCTCCGTTCTCTGCGGCCAGAGGCTGAGAATAATCCTGGCCGCCCTCCCCCTACC
+CTTCAAGAGATGATTCAGATGGCGGCAGAGATTGCTGACGGGATGGCCTACCTGAACGCC
+AAGAAGTTTGTGCATCGGGACCTGGCAGCGAGAAACTGCATGGTCGCCCATGATTTTACT
+GTCAAAATTGGAGACTTTGGAATGACCAGAGACATCTATGAAACGGATTACTACCGGAAA
+GGGGGCAAGGGTCTGCTCCCTGTACGGTGGATGGCACCGGAGTCCCTGAAGGATGGGGTC
+TTCACCACTTCTTCTGACATGTGGTCCTTTGGCGTGGTCCTTTGGGAAATCACCAGCTTG
+GCAGAACAGCCTTACCAAGGCCTGTCTAATGAACAGGTGTTGAAATTTGTCATGGATGGA
+GGGTATCTGGATCAACCCGACAACTGTCCAGAGAGAGTCACTGACCTCATGCGCATGTGC
+TGGCAATTCAACCCCAAGATGAGGCCAACCTTCCTGGAGATTGTCAACCTGCTCAAGGAC
+GACCTGCACCCCAGCTTTCCAGAGGTGTCGTTCTTCCACAGCGAGGAGAACAAGGCTCCC
+GAGAGTGAGGAGCTGGAGATGGAGTTTGAGGACATGGAGAATGTGCCCCTGGACCGTTCC
+TCGCACTGTCAGAGGGAGGAGGCGGGGGGCCGGGATGGAGGGTCCTCGCTGGGTTTCAAG
+CGGAGCTACGAGGAACACATCCCTTACACACACATGAACGGAGGCAAGAAAAACGGGCGG
+ATTCTGACCTTGCCTCGGTCCAATCCTTCCTAA
+>ENST00000302850_homosapiens
+ATGGCCACCGGGGGCCGGCGGGGGGCGGCGGCCGCGCCGCTGCTGGTGGCGGTGGCCGCG
+CTGCTACTGGGCGCCGCGGGCCACCTGTACCCCGGAGAGGTGTGTCCCGGCATGGATATC
+CGGAACAACCTCACTAGGTTGCATGAGCTGGAGAATTGCTCTGTCATCGAAGGACACTTG
+CAGATACTCTTGATGTTCAAAACGAGGCCCGAAGATTTCCGAGACCTCAGTTTCCCCAAA
+CTCATCATGATCACTGATTACTTGCTGCTCTTCCGGGTCTATGGGCTCGAGAGCCTGAAG
+GACCTGTTCCCCAACCTCACGGTCATCCGGGGATCACGACTGTTCTTTAACTACGCGCTG
+GTCATCTTCGAGATGGTTCACCTCAAGGAACTCGGCCTCTACAACCTGATGAACATCACC
+CGGGGTTCTGTCCGCATCGAGAAGAACAATGAGCTCTGTTACTTGGCCACTATCGACTGG
+TCCCGTATCCTGGATTCCGTGGAGGATAATTACATCGTGTTGAACAAAGATGACAACGAG
+GAGTGTGGAGACATCTGTCCGGGTACCGCGAAGGGCAAGACCAACTGCCCCGCCACCGTC
+ATCAACGGGCAGTTTGTCGAACGATGTTGGACTCATAGTCACTGCCAGAAAGTTTGCCCG
+ACCATCTGTAAGTCACACGGCTGCACCGCCGAAGGCCTCTGTTGCCACAGCGAGTGCCTG
+GGCAACTGTTCTCAGCCCGACGACCCCACCAAGTGCGTGGCCTGCCGCAACTTCTACCTG
+GACGGCAGGTGTGTGGAGACCTGCCCGCCCCCGTACTACCACTTCCAGGACTGGCGCTGT
+GTGAACTTCAGCTTCTGCCAGGACCTGCACCACAAATGCAAGAACTCGCGGAGGCAGGGC
+TGCCACCAGTACGTCATTCACAACAACAAGTGCATCCCTGAGTGTCCCTCCGGGTACACG
+ATGAATTCCAGCAACTTGCTGTGCACCCCATGCCTGGGTCCCTGTCCCAAGGTGTGCCAC
+CTCCTAGAAGGCGAGAAGACCATCGACTCGGTGACGTCTGCCCAGGAGCTCCGAGGATGC
+ACCGTCATCAACGGGAGTCTGATCATCAACATTCGAGGAGGCAACAATCTGGCAGCTGAG
+CTAGAAGCCAACCTCGGCCTCATTGAAGAAATTTCAGGGTATCTAAAAATCCGCCGATCC
+TACGCTCTGGTGTCACTTTCCTTCTTCCGGAAGTTACGTCTGATTCGAGGAGAGACCTTG
+GAAATTGGGAACTACTCCTTCTATGCCTTGGACAACCAGAACCTAAGGCAGCTCTGGGAC
+TGGAGCAAACACAACCTCACCATCACTCAGGGGAAACTCTTCTTCCACTATAACCCCAAA
+CTCTGCTTGTCAGAAATCCACAAGATGGAAGAAGTTTCAGGAACCAAGGGGCGCCAGGAG
+AGAAACGACATTGCCCTGAAGACCAATGGGGACCAGGCATCCTGTGAAAATGAGTTACTT
+AAATTTTCTTACATTCGGACATCTTTTGACAAGATCTTGCTGAGATGGGAGCCGTACTGG
+CCCCCCGACTTCCGAGACCTCTTGGGGTTCATGCTGTTCTACAAAGAGGCCCCTTATCAG
+AATGTGACGGAGTTCGACGGGCAGGATGCGTGTGGTTCCAACAGTTGGACGGTGGTAGAC
+ATTGACCCACCCCTGAGGTCCAACGACCCCAAATCACAGAACCACCCAGGGTGGCTGATG
+CGGGGTCTCAAGCCCTGGACCCAGTATGCCATCTTTGTGAAGACCCTGGTCACCTTTTCG
+GATGAACGCCGGACCTATGGGGCCAAGAGTGACATCATTTATGTCCAGACAGATGCCACC
+AACCCCTCTGTGCCCCTGGATCCAATCTCAGTGTCTAACTCATCATCCCAGATTATTCTG
+AAGTGGAAACCACCCTCCGACCCCAATGGCAACATCACCCACTACCTGGTTTTCTGGGAG
+AGGCAGGCGGAAGACAGTGAGCTGTTCGAGCTGGATTATTGCCTCAAAGGGCTGAAGCTG
+CCCTCGAGGACCTGGTCTCCACCATTCGAGTCTGAAGATTCTCAGAAGCACAACCAGAGT
+GAGTATGAGGATTCGGCCGGCGAATGCTGCTCCTGTCCAAAGACAGACTCTCAGATCCTG
+AAGGAGCTGGAGGAGTCCTCGTTTAGGAAGACGTTTGAGGATTACCTGCACAACGTGGTT
+TTCGTCCCCAGAAAAACCTCTTCAGGCACTGGTGCCGAGGACCCTAGGCCATCTCGGAAA
+CGCAGGTCCCTTGGCGATGTTGGGAATGTGACGGTGGCCGTGCCCACGGTGGCAGCTTTC
+CCCAACACTTCCTCGACCAGCGTGCCCACGAGTCCGGAGGAGCACAGGCCTTTTGAGAAG
+GTGGTGAACAAGGAGTCGCTGGTCATCTCCGGCTTGCGACACTTCACGGGCTATCGCATC
+GAGCTGCAGGCTTGCAACCAGGACACCCCTGAGGAACGGTGCAGTGTGGCAGCCTACGTC
+AGTGCGAGGACCATGCCTGAAGCCAAGGCTGATGACATTGTTGGCCCTGTGACGCATGAA
+ATCTTTGAGAACAACGTCGTCCACTTGATGTGGCAGGAGCCGAAGGAGCCCAATGGTCTG
+ATCGTGCTGTATGAAGTGAGTTATCGGCGATATGGTGATGAGGAGCTGCATCTCTGCGTC
+TCCCGCAAGCACTTCGCTCTGGAACGGGGCTGCAGGCTGCGTGGGCTGTCACCGGGGAAC
+TACAGCGTGCGAATCCGGGCCACCTCCCTTGCGGGCAACGGCTCTTGGACGGAACCCACC
+TATTTCTACGTGACAGACTATTTAGACGTCCCGTCAAATATTGCAAAAATTATCATCGGC
+CCCCTCATCTTTGTCTTTCTCTTCAGTGTTGTGATTGGAAGTATTTATCTATTCCTGAGA
+AAGAGGCAGCCAGATGGGCCGCTGGGACCGCTTTACGCTTCTTCAAACCCTGAGTATCTC
+AGTGCCAGTGATGTGTTTCCATGCTCTGTGTACGTGCCGGACGAGTGGGAGGTGTCTCGA
+GAGAAGATCACCCTCCTTCGAGAGCTGGGGCAGGGCTCCTTCGGCATGGTGTATGAGGGC
+AATGCCAGGGACATCATCAAGGGTGAGGCAGAGACCCGCGTGGCGGTGAAGACGGTCAAC
+GAGTCAGCCAGTCTCCGAGAGCGGATTGAGTTCCTCAATGAGGCCTCGGTCATGAAGGGC
+TTCACCTGCCATCACGTGGTGCGCCTCCTGGGAGTGGTGTCCAAGGGCCAGCCCACGCTG
+GTGGTGATGGAGCTGATGGCTCACGGAGACCTGAAGAGCTACCTCCGTTCTCTGCGGCCA
+GAGGCTGAGAATAATCCTGGCCGCCCTCCCCCTACCCTTCAAGAGATGATTCAGATGGCG
+GCAGAGATTGCTGACGGGATGGCCTACCTGAACGCCAAGAAGTTTGTGCATCGGGACCTG
+GCAGCGAGAAACTGCATGGTCGCCCATGATTTTACTGTCAAAATTGGAGACTTTGGAATG
+ACCAGAGACATCTATGAAACGGATTACTACCGGAAAGGGGGCAAGGGTCTGCTCCCTGTA
+CGGTGGATGGCACCGGAGTCCCTGAAGGATGGGGTCTTCACCACTTCTTCTGACATGTGG
+TCCTTTGGCGTGGTCCTTTGGGAAATCACCAGCTTGGCAGAACAGCCTTACCAAGGCCTG
+TCTAATGAACAGGTGTTGAAATTTGTCATGGATGGAGGGTATCTGGATCAACCCGACAAC
+TGTCCAGAGAGAGTCACTGACCTCATGCGCATGTGCTGGCAATTCAACCCCAAGATGAGG
+CCAACCTTCCTGGAGATTGTCAACCTGCTCAAGGACGACCTGCACCCCAGCTTTCCAGAG
+GTGTCGTTCTTCCACAGCGAGGAGAACAAGGCTCCCGAGAGTGAGGAGCTGGAGATGGAG
+TTTGAGGACATGGAGAATGTGCCCCTGGACCGTTCCTCGCACTGTCAGAGGGAGGAGGCG
+GGGGGCCGGGATGGAGGGTCCTCGCTGGGTTTCAAGCGGAGCTACGAGGAACACATCCCT
+TACACACACATGAACGGAGGCAAGAAAAACGGGCGGATTCTGACCTTGCCTCGGTCCAAT
+CCTTCCTAA
+>ENST00000600492_homosapiens
+TACAAAGAGGCCCCTTATCAGAATGTGACGGAGTTCGACGGGCAGGATGCGTGTGGTTCC
+AACAGTTGGACGGTGGTAGACATTGACCCACCCCTGAGGTCCAACGACCCCAAATCACAG
+AACCACCCAGGGTGGCTGATGCGGGGTCTCAAGCCCTGGACCCAGTATGCCATCTTTGTG
+AAGACCCTGGTCACCTTTTCGGATGAACGCCGGACCTATGGGGCCAAGAGTGACATCATT
+TATGTCCAGACAGATGCCACCAACCCCTCTGTGCCCCTGGATCCAATCTCAGTGTCTAAC
+TCATCATCCCAGATTATTCTGAAGTGGAAACCACCCTCCGACCCCAATGGCAACATCACC
+CACTACCTGGTTTTCTGGGAGAGGCAGGCGGAAGACAGTGAGCTGTTCGAGCTGGATTAT
+TGCCTCAAAGGGCGAGTCCAGTCATCAGCTCCGCTGTAA
+>ENSMUST00000208839_musmusculus
+NAGACAGATTACTATCGGAAAGGGGGCAAGGGACTGCTTCCTGTGAGGTGGATGTCACCT
+GAGTCCCTGAAGGATGGAGTCTTTACTGCTTCTTCTGATATGTGGTCCTTTGGGGTGGTC
+CTTTGGGAAATCACTAGCCTGGCTGAGCAACCTTATCAAGGCCTGTCTAATGAACAGGTG
+TTGAAGTTTGTCATGGATGGAGGCTATCTGGATCCCCCTGATAACTGTCCAGAGAGACTG
+AGATATGAGATAAAGACACACTGGCCACCCTGA
+>ENSMUST00000091291_musmusculus
+ATGGGCTTCGGGAGAGGATGTGAGACGACGGCTGTGCCATTGCTGGTGGCCGTGGCCGCG
+TTGCTGGTGGGCACAGCCGGCCACCTGTACCCTGGAGAGGTGTGCCCTGGTATGGACATC
+CGGAACAACCTGACCAGGCTACATGAGCTGGAGAACTGCTCAGTCATTGAGGGCCATCTG
+CAGATCCTCCTGATGTTCAAGACCAGACCCGAAGATTTCCGAGACCTCAGTTTCCCCAAA
+CTCATCATGATCACAGATTACCTGCTTCTCTTCCGTGTCTATGGTCTGGAAAGTCTGAAA
+GACCTCTTCCCAAATCTCACAGTCATCCGAGGCTCCCGTCTCTTCTTCAACTATGCCCTG
+GTTATCTTCGAGATGGTCCACCTGAAGGAGCTGGGGCTTTATAACCTCATGAACATCACC
+CGGGGCTCTGTCCGCATCGAGAAGAATAATGAGCTCTGCTACCTGGCCACTATCGACTGG
+TCCCGTATCCTGGATTCTGTGGAGGACAACTACATTGTACTGAACAAAGATGACAACGAG
+GAATGTGGGGATGTCTGTCCAGGCACCGCCAAGGGCAAGACCAACTGTCCTGCCACTGTC
+ATCAATGGGCAGTTTGTGGAACGGTGCTGGACACACAGTCATTGTCAGAAAGTTTGCCCA
+ACCATCTGTAAGTCACATGGCTGCACAGCTGAAGGCCTGTGCTGCCACAAAGAGTGCCTG
+GGCAACTGTTCGGAACCTGATGACCCCACCAAGTGTGTGGCCTGTCGCAACTTCTATCTG
+GATGGTCAGTGTGTGGAGACCTGCCCGCCACCCTACTATCACTTCCAGGACTGGCGCTGT
+GTGAACTTCAGCTTCTGCCAAGACCTTCACTTCAAATGCAGGAACTCTCGGAAGCCTGGC
+TGCCACCAATACGTCATTCACAACAATAAGTGCATCCCCGAGTGCCCGTCTGGCTATACC
+ATGAATTCCAGCAACTTGATGTGCACCCCATGTCTGGGACCCTGCCCTAAGGTCTGCCAA
+ATCCTCGAAGGTGAGAAGACCATTGATTCTGTGACATCTGCCCAGGAGCTCCGAGGCTGC
+ACTGTGATCAACGGTAGCCTGATCATCAACATCCGAGGGGGCAACAACCTGGCAGCTGAG
+CTGGAGGCTAACCTTGGCCTCATTGAAGAAATTTCGGGATTTCTAAAGATCCGCCGCTCC
+TATGCTCTGGTATCACTTTCTTTCTTCAGGAAGCTACATCTGATTCGAGGAGAGACCTTG
+GAAATTGGGAACTATTCTTTTTATGCCTTGGACAACCAGAACCTGAGGCAACTCTGGGAC
+TGGAGCAAACACAACCTCACCATCACTCAGGGCAAGCTCTTCTTCCATTACAACCCGAAA
+CTCTGCTTGTCTGAAATTCACAAGATGGAAGAAGTCTCCGGAACTAAGGGCCGTCAGGAG
+AGGAACGACATTGCCCTGAAGACCAATGGGGACCAGGCATCGTGTGAAAATGAATTGCTT
+AAATTTTCTTTCATTCGGACATCTTTTGACAAGATCCTGTTGAGGTGGGAACCCTACTGG
+CCCCCCGACTTCCGAGATCTCCTGGGATTCATGTTGTTCTACAAAGAGGCCCCTTATCAG
+AATGTGACAGAGTTTGATGGGCAGGATGCTTGTGGCTCCAACAGCTGGACTGTGGTGGAT
+ATTGACCCGCCCCAGAGGTCCAACGACCCCAAGTCTCAGACCCCAAGCCACCCTGGGTGG
+CTGATGCGGGGCCTCAAACCCTGGACCCAATACGCCATCTTTGTGAAGACCTTGGTTACC
+TTCTCTGATGAACGGCGGACCTATGGAGCCAAAAGTGATATCATCTATGTGCAAACAGAT
+GCCACTAATCCTTCTGTCCCCCTGGATCCCATATCAGTTTCTAATTCCTCATCTCAGATT
+ATCTTAAAGTGGAAGCCCCCCTCTGACCCCAATGGCAACATCACACACTACCTGGTGTAC
+TGGGAGAGGCAAGCAGAGGACAGCGAGCTGTTTGAGCTGGATTATTGTCTCAAAGGGCTG
+AAGCTCCCTTCACGGACCTGGTCCCCACCCTTTGAGTCTGATGATTCTCAGAAGCACAAT
+CAGAGTGAGTATGACGACTCGGCCAGTGAGTGCTGCTCATGCCCTAAGACTGACTCTCAG
+ATCCTGAAGGAGCTGGAGGAGTCTTCATTCAGGAAGACCTTCGAGGATTACCTGCACAAC
+GTGGTTTTTGTCCCCAGGCCATCCCGAAAGCGAAGATCCCTTGAAGAGGTGGGGAATGTG
+ACAGCCACCACACTCACACTTCCAGATTTCCCCAACGTCTCCTCTACCATTGTGCCCACA
+AGTCAGGAGGAGCACAGGCCATTTGAGAAAGTGGTGAACAAGGAGTCACTTGTCATCTCT
+GGCCTGAGACACTTCACTGGGTACCGCATTGAGCTGCAGGCATGCAATCAAGATTCCCCA
+GATGAGAGGTGCAGTGTGGCTGCCTACGTCAGTGCCCGGACCATGCCTGAAGCTAAGGCA
+GATGACATCGTTGGCCCTGTGACTCATGAAATCTTTGAGAACAATGTTGTACACTTAATG
+TGGCAAGAGCCAAAGGAACCTAATGGTCTGATTGTGCTATATGAAGTGAGCTATCGCCGA
+TATGGTGATGAGGAGCTGCACCTCTGTGTCTCCCGGAAGCATTTTGCCCTGGAGCGGGGC
+TGCAGGCTGCGAGGGCTCTCCCCAGGAAACTACAGTGTTCGAGTCCGGGCTACCTCTCTG
+GCAGGAAATGGCTCCTGGACAGAACCCACCTATTTTTATGTGACTGATTATTTAGATGTC
+CCATCAAATATTGCCAAAATTATCATTGGACCCCTCATCTTTGTCTTCCTCTTCAGTGTT
+GTGATTGGAAGTATTTATCTATTTCTGAGAAAGAGGCAGCCGGATGGGCCAATGGGACCA
+CTGTATGCATCTTCAAACCCTGAGTACCTCAGTGCCAGTGATGTGTTTCCATCTTCTGTG
+TACGTGCCGGACGAGTGGGAGGTGCCTCGAGAGAAGATCACCCTTCTTCGAGAGCTGGGG
+CAGGGATCCTTTGGTATGGTGTATGAAGGCAATGCCAAGGATATCATCAAGGGTGAGGCA
+GAGACCCGTGTTGCGGTTAAGACTGTCAATGAGTCAGCCAGTCTTCGAGAACGGATCGAG
+TTCCTCAATGAGGCATCAGTCATGAAGGGATTCACCTGCCATCATGTGGTCCGCCTTCTT
+GGGGTGGTATCCAAAGGACAGCCAACGCTGGTAGTGATGGAATTGATGGCTCATGGAGAC
+CTGAAAAGTCACCTCCGTTCTCTGAGGCCAGATGCTGAGAATAACCCAGGCCGCCCTCCC
+CCTACCTTGCAAGAAATGATTCAGATGACAGCAGAAATTGCTGATGGCATGGCATACTTG
+AACGCCAAGAAGTTTGTGCACCGGGACCTGGCAGCTCGAAACTGCATGGTTGCCCATGAT
+TTTACTGTCAAAATTGGAGACTTTGGAATGACAAGGGACATCTACGAGACAGATTACTAT
+CGGAAAGGGGGCAAGGGACTGCTTCCTGTGAGGTGGATGTCACCTGAGTCCCTGAAGGAT
+GGAGTCTTTACTGCTTCTTCTGATATGTGGTCCTTTGGGGTGGTCCTTTGGGAAATCACT
+AGCCTGGCTGAGCAACCTTATCAAGGCCTGTCTAATGAACAGGTGTTGAAGTTTGTCATG
+GATGGAGGCTATCTGGATCCCCCTGATAACTGTCCAGAGAGACTCACTGACCTGATGCGC
+ATGTGCTGGCAGTTCAACCCCAAGATGAGGCCAACCTTCCTGGAAATCGTCAACCTGCTC
+AAGGATGACCTCCACCCCAGCTTTCCAGAAGTTTCCTTCTTCTACAGCGAGGAGAACAAG
+GCTCCTGAGAGTGAGGAGCTGGAGATGGAGTTTGAAGACATGGAGAATGTCCCGTTGGAT
+CGTTCCTCTCACTGTCAGAGAGAAGAGGCTGGGGGCCGGGAGGGAGGGTCCTCACTGAGC
+ATCAAACGGACCTATGATGAACACATCCCCTATACCCACATGAATGGGGGCAAGAAGAAC
+GGACGTGTCCTTACCCTGCCAAGGTCAAACCCTTCCTAA
+>ENSMUST00000207100_musmusculus
+AGGTCCAACGACCCCAAGTCTCAGACCCCAAGCCACCCTGGGTGGCTGATGCGGGGCCTC
+AAACCCTGGACCCAATACGCCATCTTTGTGAAGACCTTGGTTACCTTCTCTGATGAACGG
+CGGACCTATGGAGCCAAAAGTGATATCATCTATGTGCAAACAGATGCCACTAATCCTTCT
+GTCCCCCTGGATCCCATATCAGTTTCTAATTCCTCATCTCAGATTATCTTAAAGTGGAAG
+CCCCCCTCTGACCCCAATGGCAACATCACACACTACCTGGTGTACTGGGAGAGGCAAGCA
+GAGGACAGCGAGCTGTTTGAGCTGGATTATTGTCTCAAAGGGCTGAAGCTCCCTTCACGG
+ACCTGGTCCCCACCCTTTGAGTCTGATGATTCTCAGAAGCACAATCAGAGTGAGTATGAC
+GACTCGGCCAGTGAGTGCTGCTCATGCCCTAAGACTGACTCTCAGATCCTGAAGGAGCTG
+GAGGAGTCTTCATTCAGGAAGACCTTCGAGGATTACCTGCACAACGTGGTTTTTGTCCCC
+AGAAAAACCTCTTCAGGCAATGGTGCCGAGGACAGTAGGCCATCCCGAAAGCGAAGATCC
+CTTGAAGAGGTGGGGAATGTGACAGCCACCACACTCACACTTCCAGATTTCCCCAACGTC
+TCCTCTACCATT
+>ENSRNOT00000041155_rattusnorvegicus
+ATGGGCTCCGGGAGAGGATGTGAGACGACGGCGGTGCCGTTGCTGATGGCCGTGGCCGCG
+TTGCTGGTGGGCACAGCCGGCCACCTGTACCCTGGAGAGGTGTGCCCGGGAATGGACATC
+CGGAACAACCTGACCAGGTTGCATGAGCTGGAGAACTGCTCGGTCATTGAGGGCCATCTG
+CAGATCCTCTTGATGTTCAAGACCAGACCCGAAGATTTCCGAGACCTCAGTTTCCCCAAA
+CTCATCATGATCACAGACTACCTGCTTCTTTTCCGTGTCTATGGCCTAGAAAGTCTAAAA
+GACCTCTTCCCAAACCTCACAGTCATCCGAGGCTCCCGTCTCTTCTTCAACTATGCCCTG
+GTCATCTTCGAGATGGTCCACCTGAAGGAGCTGGGTCTTTACAACCTCATGAACATCACC
+CGGGGCTCTGTCCGCATCGAGAAGAATAATGAACTCTGCTACCTGGCCACTATCGACTGG
+TCCCGCATCCTGGATTCCGTGGAGGACAACTACATTGTACTGAACAAAGATGACAATGAG
+GAATGTGGGGACGTCTGTCCAGGCACAGCCAAGGGCAAGACCAACTGCCCTGCCACCGTC
+ATCAATGGGCAGTTTGTGGAACGGTGCTGGACACACAGTCATTGTCAGAAAGTTTGCCCA
+ACCATCTGTAAGTCACATGGCTGCACAGCTGAAGGCCTGTGCTGTCACAAGGAGTGCCTG
+GGCAACTGTTCAGAACCCGATGACCCTACCAAGTGTGTGGCCTGTCGAAACTTCTACCTG
+GATGGTCAGTGTGTGGAGACCTGCCCACCACCCTACTATCACTTCCAGGATTGGCGCTGT
+GTAAACTTCAGCTTCTGCCAAGACCTTCACTACAAATGCAGGAACTCTCGGAAGCCTGGC
+TGTCACCAATACGTCATTCACAACAACAAGTGCATCCCCGAGTGCCCGTCTGGCTATACC
+ATGAATTCCAGCAACTTGATGTGCACCCCGTGTCTGGGACCCTGTCCTAAGGTCTGCCAA
+ATCCTCGAAGGCGAGAAGACCATTGATTCCGTGACATCTGCCCAGGAGCTCCGAGGCTGC
+ACTGTGATCAATGGCAGCCTGATTATCAACATCCGAGGGGGCAACAACCTGGCAGCTGAA
+CTAGAGGCTAACCTTGGCCTCATTGAAGAAATCTCAGGGTTCCTAAAGATCCGTCGCTCC
+TATGCTCTGGTGTCACTTTCTTTCTTCAGGAAGCTACATCTGATTCGAGGAGAGACCTTG
+GAAATTGGGAACTATTCTTTCTACGCCTTGGACAACCAGAACCTGAGGCAGCTGTGGGAC
+TGGAACAAGCACAACCTCACGATCACTCAGGGCAAGCTCTTCTTCCACTACAACCCCAAA
+CTCTGCCTGTCTGAGATCCACAAGATGGAGGAAGTGTCCGGAACCAAGGGCCGCCAGGAG
+AGGAACGACATTGCCCTGAAGACCAACGGGGACCAGGCATCCTGTGAAAATGAATTACTT
+AAATTCTCTTTCATCCGGACGTCTTTTGACAAGATCTTGCTGAGGTGGGAGCCCTACTGG
+CCCCCCGACTTCCGAGATCTCCTGGGATTCATGCTGTTCTACAAAGAGGCCCCTTATCAG
+AACGTGACAGAGTTTGACGGGCAGGATGCGTGTGGCTCCAACAGCTGGACTGTGGTGGAT
+ATTGACCCGCCCCAGAGGTCCAACGACCCTAAGTCTCAGACCCCAAGCCACCCTGGGTGG
+CTGATGCGGGGCCTCAAACCCTGGACCCAGTATGCCATCTTTGTCAAGACCTTGGTTACC
+TTCTCTGATGAACGCCGGACCTATGGAGCCAAAAGTGATATCATCTATGTGCAAACAGAT
+GCCACCAATCCTTCCGTTCCCCTGGATCCCATATCAGTTTCCAACTCCTCATCTCAGATT
+ATCTTAAAGTGGAAGCCCCCCTCGGACCCCAATGGCAACATCACACACTACCTGGTCTAC
+TGGGAGAGGCAGGCGGAGGACAGCGAGCTGTTCGAGTTGGATTATTGTCTCAAAGGGCTG
+AAGCTCCCCTCACGCACCTGGTCCCCACCTTTTGAGTCTGACGATTCTCAAAAGCACAAT
+CAGAGTGAGTATGACGACTCGGCCAGCGAGTGCTGCTCATGTCCTAAGACTGACTCTCAG
+ATCCTGAAGGAGCTGGAGGAGTCTTCATTCAGGAAGACCTTCGAGGATTACCTGCACAAC
+GTGGTTTTTGTTCCCAGAAAAACCTCTTCAGGCAATGGTGCTGAGGACACTAGGCCATCC
+CGAAAGCGAAGATCCCTTGAAGAGGTGGGCAATGTGACAGCCACTACACCCACACTTCCA
+GATTTTCCCAACATCTCCTCCACCATCGCGCCCACAAGCCACGAAGAGCACAGACCATTT
+GAGAAAGTAGTAAACAAGGAGTCACTTGTCATCTCTGGCCTGAGACACTTCACTGGGTAC
+CGCATTGAGCTGCAGGCATGCAATCAGGACTCCCCAGAAGAGAGGTGCAGCGTGGCTGCC
+TACGTCAGTGCCCGGACCATGCCTGAAGCTAAGGCAGATGACATCGTTGGCCCTGTGACC
+CATGAAATCTTTGAGAACAATGTTGTACACTTAATGTGGCAAGAGCCAAAGGAACCTAAT
+GGTCTGATTGTGCTATATGAAGTGAGCTATCGGCGATATGGTGATGAGGAGCTGCACCTC
+TGTGTCTCCCGGAAGCATTTTGCCCTGGAGCGGGGCTGCAGGCTTCGAGGGCTCTCTCCA
+GGAAACTACAGTGTTCGAGTCCGGGCTACCTCTCTGGCAGGAAATGGCTCCTGGACAGAA
+CCCACCTATTTTTATGTGACTGATTATTTAGATGTCCCATCAAATATTGCCAAAATTATC
+ATCGGGCCCCTCATCTTCGTCTTCCTCTTCAGTGTCGTGATCGGAAGTATTTATCTATTC
+TTGAGGAAGAGGCAGCCAGATGGGCCAATGGGACCACTGTACGCTTCTTCAAACCCAGAG
+TACCTCAGTGCCAGTGATGTCTTTCCATCTTCCGTATACGTTCCGGATGAGTGGGAGGTA
+CCTCGAGAGAAGATCACCCTCCTCCGAGAGCTGGGGCAGGGATCCTTCGGTATGGTGTAC
+GAAGGCAATGCCAAGGATATCATCAAGGGTGAGGTAGAGACCCGTGTTGCGGTGAAGACG
+GTCAATGAGTCAGCCAGTCTTCGAGAACGGATCGAGTTCCTCAATGAGGCATCAGTCATG
+AAGGGCTTCACCTGTCATCACGTGGTCCGCCTTCTTGGGGTGGTGTCCAAAGGCCAGCCC
+ACATTGGTAGTGATGGAACTGATGGCTCATGGAGACCTGAAAAGTCACCTCCGTTCTCTG
+CGGCCCGATGCTGAGAACAACCCAGGCCGTCCTCCCCCTACCTTGCAAGAAATGATTCAG
+ATGACAGCAGAAATTGCCGATGGCATGGCATACTTGAACGCCAAGAAGTTTGTGCACCGG
+GACCTGGCAGCTCGGAACTGCATGGTTGCCCATGATTTTACTGTCAAAATCGGAGACTTT
+GGAATGACGAGAGACATCTACGAGACAGATTACTATCGGAAAGGGGGCAAGGGGTTGCTG
+CCCGTGAGGTGGATGTCACCCGAGTCCCTGAAGGACGGAGTCTTCACTGCTTCTTCCGAC
+ATGTGGTCCTTTGGGGTGGTCCTTTGGGAAATCACCAGCCTGGCTGAGCAACCTTACCAA
+GGCCTGTCTAATGAACAGGTGTTGAAATTTGTCATGGATGGAGGCTATCTGGATCCCCCT
+GATAACTGTCCAGAGAGACTCACTGACCTGATGCGCATGTGCTGGCAGTTCAACCCCAAG
+ATGAGGCCGACCTTCCTGGAAATCGTCAACCTGCTCAAGGACGACCTCCACCCCAGCTTT
+CCGGAAGTTTCCTTCTTCTACAGCGAGGAGAACAAGGCTCCCGAGAGTGAAGAGCTGGAG
+ATGGAGTTCGAGGACATGGAGAATGTCCCCTTGGATCGTTCCTCTCACTGTCAGAGAGAA
+GAGGCTGGATGCCGGGAGGGAGGGTCCTCTCTGAGCATCAAACGGACCTATGATGAACAC
+ATCCCCTACACCCACATGAACGGGGGCAAGAAGAATGGGCGGGTCCTCACCCTGCCGAGG
+TCGAACCCTTCCTAA
+>ENSRNOT00000067448_rattusnorvegicus
+ATGGGCTCCGGGAGAGGATGTGAGACGACGGCGGTGCCGTTGCTGATGGCCGTGGCCGTT
+GCTGGTGGCACAGCCGGCCACCTGTACCCTGGAGAGGTGTGCCCGGGAATGGACATCCGG
+AACAACCTGACCAGGTTGCATGAGCTGGAGAACTGCTCGGTCATTGAGGGCCATCTGCAG
+ATCCTCTTGATGTTCAAGACCAGACCCGAAGATTTCCGAGACCTCAGTTTCCCCAAACTC
+ATCATGATCACAGACTACCTGCTTCTTTTCCGTGTCTATGGCCTAGAAAGTCTAAAAGAC
+CTCTTCCCAAACCTCACAGTCATCCGAGGCTCCCGTCTCTTCTTCAACTATGCCCTGGTC
+ATCTTCGAGATGGTCCACCTGAAGGAGCTGGGTCTTTACAACCTCATGAACATCACCCGG
+GGCTCTGTCCGCATCGAGAAGAATAATGAACTCTGCTACCTGGCCACTATCGACTGGTCC
+CGCATCCTGGATTCCGTGGAGGACAACTACATTGTACTGAACAAAGATGACAATGAGGAA
+TGTGGGGACGTCTGTCCAGGCACAGCCAAGGGCAAGACCAACTGCCCTGCCACCGTCATC
+AATGGGCAGTTTGTGGAACGGTGCTGGACACACAGTCATTGTCAGAAAGTTTGCCCAACC
+ATCTGTAAGTCACATGGCTGCACAGCTGAAGGCCTGTGCTGTCACAAGGAGTGCCTGGGC
+AACTGTTCAGAACCCGATGACCCTACCAAGTGTGTGGCCTGTCGAAACTTCTACCTGGAT
+GGTCAGTGTGTGGAGACCTGCCCACCACCCTACTATCACTTCCAGGATTGGCGCTGTGTA
+AACTTCAGCTTCTGCCAAGACCTTCACTACAAATGCAGGAACTCTCGGAAGCCTGGCTGT
+CACCAATACGTCATTCACAACAACAAGTGCATCCCCGAGTGCCCGTCTGGCTATACCATG
+AATTCCAGCAACTTGATGTGCACCCCGTGTCTGGGACCCTGTCCTAAGGTCTGCCAAATC
+CTCGAAGGCGAGAAGACCATTGATTCCGTGACATCTGCCCAGGAGCTCCGAGGCTGCACT
+GTGATCAATGGCAGCCTGATTATCAACATCCGAGGGGGCAACAACCTGGCAGCTGAACTA
+GAGGCTAACCTTGGCCTCATTGAAGAAATCTCAGGGTTCCTAAAGATCCGTCGCTCCTAT
+GCTCTGGTGTCACTTTCTTTCTTCAGGAAGCTACATCTGATTCGAGGAGAGACCTTGGAA
+ATTGGGAACTATTCTTTCTACGCCTTGGACAACCAGAACCTGAGGCAGCTGTGGGACTGG
+AACAAGCACAACCTCACGATCACTCAGGGCAAGCTCTTCTTCCACTACAACCCCAAACTC
+TGCCTGTCTGAGATCCACAAGATGGAGGAAGTGTCCGGAACCAAGGGCCGCCAGGAGAGG
+AACGACATTGCCCTGAAGACCAACGGGGACCAGGCATCCTGTGAAAATGAATTACTTAAA
+TTCTCTTTCATCCGGACGTCTTTTGACAAGATCTTGCTGAGGTGGGAGCCCTACTGGCCC
+CCCGACTTCCGAGATCTCCTGGGATTCATGCTGTTCTACAAAGAGGCCCCTTATCAGAAC
+GTGACAGAGTTTGACGGGCAGGATGCGTGTGGCTCCAACAGCTGGACTGTGGTGGATATT
+GACCCGCCCCAGAGGTCCAACGACCCTAAGTCTCAGACCCCAAGCCACCCTGGGTGGCTG
+ATGCGGGGCCTCAAACCCTGGACCCAGTATGCCATCTTTGTCAAGACCTTGGTTACCTTC
+TCTGATGAACGCCGGACCTATGGAGCCAAAAGTGATATCATCTATGTGCAAACAGATGCC
+ACCAATCCTTCCGTTCCCCTGGATCCCATATCAGTTTCCAACTCCTCATCTCAGATTATC
+TTAAAGTGGAAGCCCCCCTCGGACCCCAATGGCAACATCACACACTACCTGGTCTACTGG
+GAGAGGCAGGCGGAGGACAGCGAGCTGTTCGAGTTGGATTATTGTCTCAAAGGGCTGAAG
+CTCCCCTCACGCACCTGGTCCCCACCTTTTGAGTCTGACGATTCTCAAAAGCACAATCAG
+AGTGAGTATGACGACTCGGCCAGCGAGTGCTGCTCATGTCCTAAGACTGACTCTCAGATC
+CTGAAGGAGCTGGAGGAGTCTTCATTCAGGAAGACCTTCGAGGATTACCTGCACAACGTG
+GTTTTTGTTCCCAGAAAAACCTCTTCAGGCAATGGTGCTGAGGACACTAGGCCATCCCGA
+AAGCGAAGATCCCTTGAAGAGGTGGGCAATGTGACAGCCACTACACCCACACTTCCAGAT
+TTTCCCAACATCTCCTCCACCATCGCGCCCACAAGCCACGAAGAGCACAGACCATTTGAG
+AAAGTAGTAAACAAGGAGTCACTTGTCATCTCTGGCCTGAGACACTTCACTGGGTACCGC
+ATTGAGCTGCAGGCATGCAATCAGGACTCCCCAGAAGAGAGGTGCAGCGTGGCTGCCTAC
+GTCAGTGCCCGGACCATGCCTGAAGCTAAGGCAGATGACATCGTTGGCCCTGTGACCCAT
+GAAATCTTTGAGAACAATGTTGTACACTTAATGTGGCAAGAGCCAAAGGAACCTAATGGT
+CTGATTGTGCTATATGAAGTGAGCTATCGGCGATATGGTGATGAGGAGCTGCACCTCTGT
+GTCTCCCGGAAGCATTTTGCCCTGGAGCGGGGCTGCAGGCTTCGAGGGCTCTCTCCAGGA
+AACTACAGTGTTCGAGTCCGGGCTACCTCTCTGGCAGGAAATGGCTCCTGGACAGAACCC
+ACCTATTTTTATGTGACTGATTATTTAGATGTCCCATCAAATATTGCCAAAATTATCATC
+GGGCCCCTCATCTTCGTCTTCCTCTTCAGTGTCGTGATCGGAAGTATTTATCTATTCTTG
+AGGAAGAGGCAGCCAGATGGGCCAATGGGACCACTGTACGCTTCTTCAAACCCAGAGTAC
+CTCAGTGCCAGTGATGTCTTTCCATCTTCCGTATACGTTCCGGATGAGTGGGAGGTACCT
+CGAGAGAAGATCACCCTCCTCCGAGAGCTGGGGCAGGGATCCTTCGGTATGGTGTACGAA
+GGCAATGCCAAGGATATCATCAAGGGTGAGGTAGAGACCCGTGTTGCGGTGAAGACGGTC
+AATGAGTCAGCCAGTCTTCGAGAACGGATCGAGTTCCTCAATGAGGCATCAGTCATGAAG
+GGCTTCACCTGTCATCACGTGGTCCGCCTTCTTGGGGTGGTGTCCAAAGGCCAGCCCACA
+TTGGTAGTGATGGAACTGATGGCTCATGGAGACCTGAAAAGTCACCTCCGTTCTCTGCGG
+CCCGATGCTGAGAACAACCCAGGCCGTCCTCCCCCTACCTTGCAAGAAATGATTCAGATG
+ACAGCAGAAATTGCCGATGGCATGGCATACTTGAACGCCAAGAAGTTTGTGCACCGGGAC
+CTGGCAGCTCGGAACTGCATGGTTGCCCATGATTTTACTGTCAAAATCGGAGACTTTGGA
+ATGACGAGAGACATCTACGAGACAGATTACTATCGGAAAGGGGGCAAGGGGTTGCTGCCC
+GTGAGGTGGATGTCACCCGAGTCCCTGAAGGACGGAGTCTTCACTGCTTCTTCCGACATG
+TGGTCCTTTGGGGTGGTCCTTTGGGAAATCACCAGCCTGGCTGAGCAACCTTACCAAGGC
+CTGTCTAATGAACAGGTGTTGAAATTTGTCATGGATGGAGGCTATCTGGATCCCCCTGAT
+AACTGTCCAGAGAGACTCACTGACCTGATGCGCATGTGCTGGCAGTTCAACCCCAAGATG
+AGGCCGACCTTCCTGGAAATCGTCAACCTGCTCAAGGACGACCTCCACCCCAGCTTTCCG
+GAAGTTTCCTTCTTCTACAGCGAGGAGAACAAGGCTCCCGAGAGTGAAGAGCTGGAGATG
+GAGTTCGAGGACATGGAGAATGTCCCCTTGGATCGTTCCTCTCACTGTCAGAGAGAAGAG
+GCTGGATGCCGGGAGGGAGGGTCCTCTCTGAGCATCAAACGGACCTATGATGAACACATC
+CCCTACACCCACATGAACGGGGGCAAGAAGAATGGGCGGGTCCTCACCCTGCCGAGGTCG
+AACCCTTCCTAA
+>ENSSSCT00000014817_susscrofa
+GTGTGCCCAGGGATGGATATCCGGAATAACCTTACACGGCTGCACGAGTTGGCCAACTGC
+TCGGTCATCGAAGGACATTTGCAGATCCTGTTGATGTTCAAAACGCGGCCCGAGGATTTC
+CGAGACCTCAGTTTCCCCAAACTCATCATGATCACTGATTACTTGCTGCTCTTCCGGGTC
+TACGGGCTGGAGAGCCTGAAGGACCTGTTCCCCAACCTCACCGTCATCCGGGGCTCACGC
+CTCTTCTTTAACTATGCGCTGGTCATCTTTGAGATGGTTCACTTGAAGGAGCTTGGCCTC
+TACAATTTGATGAACATCACCAGGGGTGCTGTCCGCATCGAGAAGAACAATGAGCTCTGC
+TACCTGGCGACCATTGACTGGTCGCGCATCCTGGACTCTGTGGAGGATAATTACATTGTG
+CTGAACAAAGACGACAACGAGGAGTGTGGGGACATTTGCCCAGGCACTGCGAAGGGCAAG
+ACCAATTGCCCTGCCACCGTCATCAATGGGCAATTTGTCGAGCGGTGTTGGACGCACAGT
+CACTGCCAGAAAGTGTGCCCGACCATCTGTAAGTCGCACGGCTGCACTGCTGAGGGCCTC
+TGCTGTCACAGCGAGTGTTTGGGCAACTGCTCTGAGCCAGACGACCCCACCAAGTGCGTG
+GCCTGCCGCAACTTCTACCTGGACGGCAGATGCGTGGAGACCTGCCCGCCCCCCTACTAC
+CACTTCCAAGACTGGCGCTGCGTGAACTTCAGCTTCTGCCAGGACCTGCACAACAAATGC
+AAGAACTCAAGGAGGCAGGGCTGCCACCAGTACGTCATTCACAACAACAAGTGTATCCCT
+GAGTGCCCCTCAGGGTACACGATGAATTCCAGCAACTTGATGTGCACTCCGTGCCTAGGC
+CCCTGTCCCAAAGTGTGTCACCTCCTGGAAGGCGAGAAGACCATCGACTCAGTGACATCC
+GCCCAGGAGCTCCGAGGCTGCACCATTATCAACGGGAGCCTAATCATCAACATTCGAGGA
+GGCAACAACCTGGCAGCCGAACTAGAGGCCAACCTTGGACTCATTGAGGAGATTTCAGGG
+TACCTGAAAATCCGCCGATCCTATGCCCTCGTGTCACTTTCCTTCTTCCGGAAGTTGCGT
+CTGATCCGAGGGGAGACGTTGGAAATTGGGAACTATTCTTTCTATGCCTTGGACAACCAG
+AACCTAAGGCAACTGTGGGACTGGAGCAAACACAACCTCACCATCACTCAGGGGAAACTC
+TTCTTCCATTATAATCCCAAACTCTGCTTGTCGGAAATTCACAAGATGGAGGAAGTTTCT
+GGAACCAAGGGGCGCCAGGAGAGAAATGATATTGCCCTGAAGACCAATGGGGACCAGGCG
+TCCTGTGAAAATGAGTTACTTAAATTTTCTTACATTCGGACATCTTATGACAAGATCTTG
+CTGAAGTGGGAGCCGTATTGGCCCCCCGACTTCCGAGACCTCCTGGGGTTCATGCTCTTC
+TACAAAGAGGCCCCTTATCAGAACGTGACGGAGTTTGACGGGCAGGATGCGTGTGGCTCC
+AACAGCTGGACGGTGGTGGACATTGACCCGCCTACGAGGTCCAATGACCCCAAGTCCCAG
+AACCATCCTGGGTGGCTGATGCGTGGTCTCAAGCCCTGGACCCAGTATGCCATCTTTGTC
+AAGACTTTGGTCACCTTTTCTGATGAACGACGCACCTATGGAGCCAAGAGTGACATCATC
+TACGTCCAGACAGATGCCACAAGTAAGCATGTC
+