changeset 9:f4acbfe8d6fe draft

planemo upload for repository https://github.com/TGAC/earlham-galaxytools/tree/master/tools/gstf_preparation commit 2f56285b1ef694d732c8b2637e3e924f8a626e55
author earlhaminst
date Wed, 17 Oct 2018 07:31:29 -0400
parents 92f3966d5bc3
children e8e75a79de59
files gstf_preparation.py test-data/test2.fasta
diffstat 2 files changed, 55 insertions(+), 1298 deletions(-) [+]
line wrap: on
line diff
--- a/gstf_preparation.py	Wed May 16 20:03:57 2018 -0400
+++ b/gstf_preparation.py	Wed Oct 17 07:31:29 2018 -0400
@@ -264,10 +264,10 @@
 
     cur.execute('SELECT species, seq_region_name FROM transcript_species WHERE transcript_id=?',
                 (transcript_id, ))
-    results = cur.fetchone()
-    if not results:
-        return None
-    return results
+    row = cur.fetchone()
+    if not row:
+        return (None, None)
+    return row
 
 
 def fetch_gene_id_for_transcript(conn, transcript_id):
@@ -275,17 +275,18 @@
 
     cur.execute('SELECT gene_id FROM transcript WHERE transcript_id=?',
                 (transcript_id, ))
-    results = cur.fetchone()
-    if not results:
+    row = cur.fetchone()
+    if not row:
         return None
-    return results[0]
+    return row[0]
 
 
-def remove_id_version(s):
+def remove_id_version(s, force=False):
     """
-    Remove the optional '.VERSION' from an Ensembl id.
+    Remove the optional '.VERSION' from an id if it's an Ensembl id or if
+    `force` is True.
     """
-    if s.startswith('ENS'):
+    if force or s.startswith('ENS'):
         return s.split('.')[0]
     else:
         return s
@@ -358,7 +359,7 @@
                     print("Line %i in file '%s': %s" % (i, filename, e), file=sys.stderr)
 
         for unimplemented_feature, nlines in unimplemented_feature_nlines_dict.items():
-            print("Skipped %d lines in file '%s': '%s' is not an implemented feature type" % (nlines, filename, unimplemented_feature), file=sys.stderr)
+            print("Skipped %d lines in GFF3 file '%s': '%s' is not an implemented feature type" % (nlines, filename, unimplemented_feature), file=sys.stderr)
 
         join_dicts(gene_dict, transcript_dict, exon_parent_dict, cds_parent_dict, five_prime_utr_parent_dict, three_prime_utr_parent_dict)
         write_gene_dict_to_db(conn, gene_dict)
@@ -367,47 +368,68 @@
         with open(json_arg) as f:
             write_gene_dict_to_db(conn, json.load(f))
 
-    if options.longestCDS:
-        gene_transcripts_dict = dict()
-        for fasta_arg in options.fasta:
-            for entry in FASTAReader_gen(fasta_arg):
-                # Extract the transcript id by removing everything after the first space and then removing the version if it is an Ensembl id
-                transcript_id = remove_id_version(entry.header[1:].lstrip().split(' ')[0])
+    # Read the FASTA files a first time to:
+    # - determine for each file if we need to force the removal of the version
+    #   from the transcript id
+    # - fill gene_transcripts_dict when keeping only the longest CDS per gene
+    force_remove_id_version_file_list = []
+    gene_transcripts_dict = dict()
+    for fasta_arg in options.fasta:
+        force_remove_id_version = False
+        found_gene_transcript = False
+        for entry in FASTAReader_gen(fasta_arg):
+            # Extract the transcript id by removing everything after the first space and then removing the version if needed
+            transcript_id = remove_id_version(entry.header[1:].lstrip().split(' ')[0], force_remove_id_version)
 
-                if len(entry.sequence) % 3 != 0:
-                    print("Transcript '%s' in file '%s' has a coding sequence length which is not multiple of 3" % (transcript_id, fasta_arg), file=sys.stderr)
-                    continue
+            if len(entry.sequence) % 3 != 0:
+                continue
 
+            gene_id = fetch_gene_id_for_transcript(conn, transcript_id)
+            if not gene_id and not found_gene_transcript:
+                # We have not found a proper gene transcript in this file yet,
+                # try to force the removal of the version from the transcript id
+                transcript_id = remove_id_version(entry.header[1:].lstrip().split(' ')[0], True)
                 gene_id = fetch_gene_id_for_transcript(conn, transcript_id)
-                if not gene_id:
-                    print("Transcript '%s' in file '%s' not found in the gene feature information" % (transcript_id, fasta_arg), file=sys.stderr)
-                    continue
+                # Remember that we need to force the removal for this file
+                if gene_id:
+                    force_remove_id_version = True
+                    force_remove_id_version_file_list.append(fasta_arg)
+                    print("Forcing removal of id version in FASTA file '%s'" % fasta_arg, file=sys.stderr)
+            if not gene_id:
+                print("Transcript '%s' in FASTA file '%s' not found in the gene feature information" % (transcript_id, fasta_arg), file=sys.stderr)
+                continue
+            if options.longestCDS:
+                found_gene_transcript = True
+            else:
+                break
 
-                if gene_id in gene_transcripts_dict:
-                    gene_transcripts_dict[gene_id].append((transcript_id, len(entry.sequence)))
-                else:
-                    gene_transcripts_dict[gene_id] = [(transcript_id, len(entry.sequence))]
+            if gene_id in gene_transcripts_dict:
+                gene_transcripts_dict[gene_id].append((transcript_id, len(entry.sequence)))
+            else:
+                gene_transcripts_dict[gene_id] = [(transcript_id, len(entry.sequence))]
 
-        # For each gene, select the transcript with the longest sequence
-        # If more than one transcripts have the same longest sequence for a gene, the
-        # first one to appear in the FASTA file is selected
+    if options.longestCDS:
+        # For each gene, select the transcript with the longest sequence.
+        # If more than one transcript has the same longest sequence for a
+        # gene, the first one to appear in the FASTA file is selected.
         selected_transcript_ids = [max(transcript_id_lengths, key=lambda _: _[1])[0] for transcript_id_lengths in gene_transcripts_dict.values()]
 
     regions = [_.strip().lower() for _ in options.regions.split(",")]
     with open(options.of, 'w') as output_fasta_file, open(options.ff, 'w') as filtered_fasta_file:
         for fasta_arg in options.fasta:
+            force_remove_id_version = fasta_arg in force_remove_id_version_file_list
             for entry in FASTAReader_gen(fasta_arg):
-                transcript_id = remove_id_version(entry.header[1:].lstrip().split(' ')[0])
+                transcript_id = remove_id_version(entry.header[1:].lstrip().split(' ')[0], force_remove_id_version)
                 if options.longestCDS and transcript_id not in selected_transcript_ids:
                     continue
 
                 if len(entry.sequence) % 3 != 0:
-                    print("Transcript '%s' in file '%s' has a coding sequence length which is not multiple of 3" % (transcript_id, fasta_arg), file=sys.stderr)
+                    print("Transcript '%s' in FASTA file '%s' has a coding sequence length which is not multiple of 3" % (transcript_id, fasta_arg), file=sys.stderr)
                     continue
 
                 species_for_transcript, seq_region_for_transcript = fetch_species_and_seq_region_for_transcript(conn, transcript_id)
                 if not species_for_transcript:
-                    print("Transcript '%s' in file '%s' not found in the gene feature information" % (transcript_id, fasta_arg), file=sys.stderr)
+                    print("Transcript '%s' in FASTA file '%s' not found in the gene feature information" % (transcript_id, fasta_arg), file=sys.stderr)
                     continue
 
                 if options.headers:
--- a/test-data/test2.fasta	Wed May 16 20:03:57 2018 -0400
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,1265 +0,0 @@
->ENST00000338702_homosapiens
-ATGGAGAATCAAGAGAAGGCGAGTATCGCGGGCCACATGTTCGACGTAGTCGTGATCGGA
-GGTGGCATTTCAGGACTATCTGCTGCCAAACTCTTGACTGAATATGGCGTTAGTGTTTTG
-GTTTTAGAAGCTCGGGACAGGGTTGGAGGAAGAACATATACTATAAGGAATGAGCATGTT
-GATTACGTAGATGTTGGTGGAGCTTATGTGGGACCAACCCAAAACAGAATCTTACGCTTG
-TCTAAGGAGCTGGGCATAGAGACTTACAAAGTGAATGTCAGTGAGCGTCTCGTTCAATAT
-GTCAAGGGGAAAACATATCCATTTCGGGGCGCCTTTCCACCAGTATGGAATCCCATTGCA
-TATTTGGATTACAATAATCTGTGGAGGACAATAGATAACATGGGGAAGGAGATTCCAACT
-GATGCACCCTGGGAGGCTCAACATGCTGACAAATGGGACAAAATGACCATGAAAGAGCTC
-ATTGACAAAATCTGCTGGACAAAGACTGCTAGGCGGTTTGCTTATCTTTTTGTGAATATC
-AATGTGACCTCTGAGCCTCACGAAGTGTCTGCCCTGTGGTTCTTGTGGTATGTGAAGCAG
-TGCGGGGGCACCACTCGGATATTCTCTGTCACCAATGGTGGCCAGGAACGGAAGTTTGTA
-GGTGGATCTGGTCAAGTGAGCGAACGGATAATGGACCTCCTCGGAGACCAAGTGAAGCTG
-AACCATCCTGTCACTCACGTTGACCAGTCAAGTGACAACATCATCATAGAGACGCTGAAC
-CATGAACATTATGAGTGCAAATACGTAATTAATGCGATCCCTCCGACCTTGACTGCCAAG
-ATTCACTTCAGACCAGAGCTTCCAGCAGAGAGAAACCAGTTAATTCAGCGGCTTCCAATG
-GGAGCTGTCATTAAGTGCATGATGTATTACAAGGAGGCCTTCTGGAAGAAGAAGGATTAC
-TGTGGCTGCATGATCATTGAAGATGAAGATGCTCCAATTTCAATAACCTTGGATGACACC
-AAGCCAGATGGGTCACTGCCTGCCATCATGGGCTTCATTCTTGCCCGGAAAGCTGATCGA
-CTTGCTAAGCTACATAAGGAAATAAGGAAGAAGAAAATCTGTGAGCTCTATGCCAAAGTG
-CTGGGATCCCAAGAAGCTTTACATCCAGTGCATTATGAAGAGAAGAACTGGTGTGAGGAG
-CAGTACTCTGGGGGCTGCTACACGGCCTACTTCCCTCCTGGGATCATGACTCAATATGGA
-AGGGTGATTCGTCAACCCGTGGGCAGGATTTTCTTTGCGGGCACAGAGACTGCCACAAAG
-TGGAGCGGCTACATGGAAGGGGCAGTTGAGGCTGGAGAACGAGCAGCTAGGGAGGTCTTA
-AATGGTCTCGGGAAGGTGACCGAGAAAGATATCTGGGTACAAGAACCTGAATCAAAGGAC
-GTTCCAGCGGTAGAAATCACCCACACCTTCTGGGAAAGGAACCTGCCCTCTGTTTCTGGC
-CTGCTGAAGATCATTGGATTTTCCACATCAGTAACTGCCCTGGGGTTTGTGCTGTACAAA
-TACAAGCTCCTGCCACGGTCTTGA
->ENST00000542639_homosapiens
-ATGGGGAAGGAGATTCCAACTGATGCACCCTGGGAGGCTCAACATGCTGACAAATGGGAC
-AAAATGACCATGAAAGAGCTCATTGACAAAATCTGCTGGACAAAGACTGCTAGGCGGTTT
-GCTTATCTTTTTGTGAATATCAATGTGACCTCTGAGCCTCACGAAGTGTCTGCCCTGTGG
-TTCTTGTGGTATGTGAAGCAGTGCGGGGGCACCACTCGGATATTCTCTGTCACCAATGGT
-GGCCAGGAACGGAAGTTTGTAGGTGGATCTGGTCAAGTGAGCGAACGGATAATGGACCTC
-CTCGGAGACCAAGTGAAGCTGAACCATCCTGTCACTCACGTTGACCAGTCAAGTGACAAC
-ATCATCATAGAGACGCTGAACCATGAACATTATGAGTGCAAATACGTAATTAATGCGATC
-CCTCCGACCTTGACTGCCAAGATTCACTTCAGACCAGAGCTTCCAGCAGAGAGAAACCAG
-TTAATTCAGCGGCTTCCAATGGGAGCTGTCATTAAGTGCATGATGTATTACAAGGAGGCC
-TTCTGGAAGAAGAAGGATTACTGTGGCTGCATGATCATTGAAGATGAAGATGCTCCAATT
-TCAATAACCTTGGATGACACCAAGCCAGATGGGTCACTGCCTGCCATCATGGGCTTCATT
-CTTGCCCGGAAAGCTGATCGACTTGCTAAGCTACATAAGGAAATAAGGAAGAAGAAAATC
-TGTGAGCTCTATGCCAAAGTGCTGGGATCCCAAGAAGCTTTACATCCAGTGCATTATGAA
-GAGAAGAACTGGTGTGAGGAGCAGTACTCTGGGGGCTGCTACACGGCCTACTTCCCTCCT
-GGGATCATGACTCAATATGGAAGGGTGATTCGTCAACCCGTGGGCAGGATTTTCTTTGCG
-GGCACAGAGACTGCCACAAAGTGGAGCGGCTACATGGAAGGGGCAGTTGAGGCTGGAGAA
-CGAGCAGCTAGGGAGGTCTTAAATGGTCTCGGGAAGGTGACCGAGAAAGATATCTGGGTA
-CAAGAACCTGAATCAAAGGACGTTCCAGCGGTAGAAATCACCCACACCTTCTGGGAAAGG
-AACCTGCCCTCTGTTTCTGGCCTGCTGAAGATCATTGGATTTTCCACATCAGTAACTGCC
-CTGGGGTTTGTGCTGTACAAATACAAGCTCCTGCCACGGTCTTGA
->ENSPTRT00000040520_pantroglodytes
-ATGGAGAATCAAGAGAAGGCGAGTATCGCGGGCCACATGTTCGACGTAGTCGTGATCGGA
-GGTGGCATTTCAGGACTATCTGCTGCCAAACTCTTGACTGAATATGGCGTTAGTGTTTTA
-GTTTTAGAAGCTCGGGACAGGGTTGGAGGAAGAACATATACTATAAGGAATGAGCATGTT
-GATTACGTAGATGTTGGTGGAGCTTATGTGGGACCAACCCAAAACAGAATCTTACGCTTG
-TCTAAGGAGCTGGGCATAGAGACTTACAAAGTGAATGTCAGTGAGCGTCTCGTTCAATAT
-GTCAAGGGGAAAACATATCCATTTCGGGGCGCCTTTCCACCAGTATGGAATCCCATTGCA
-TATTTGGATTACAATAATCTGTGGCGGACAATAGATAACATGGGGAAGGAGATTCCAAAT
-GATGCACCCTGGGAGGCTCAACATGCTGACGAATGGGACAAAATGACCATGAAAGAGCTC
-ATTGACAAAATCTGCTGGACAAAGACTGCTAGGCGGTTTGCTTATCTTTTTGTGAATATC
-AATGTGACCTCTGAGCCTCACGAAGTGTCTGCCCTGTGGTTCTTGTGGTATGTGAAGCAG
-TGCGGGGGCACCACTCGGATATTCTCTGTCACCAATGGCGGCCAGGAACGGAAGTTTGTA
-GGTGGATCTGGTCAAGTGAGCGAACGGATAATGGACCTCCTTGGAGACCAAGTGAAGCTG
-AACCATCCTGTCACTCATGTTGACCAGTCAAGTGACAACATCATCATAGAGACACTGAAC
-CATGAACATTATGAGTGCAAATACGTAATTAATGCGATCCCTCCGACCTTGACTGCCAAG
-ATTCACTTCAGACCAGAGCTTCCAGCAGAGAGAAACCAGTTAATTCAGCGTCTTCCAATG
-GGAGCTATCATTAAGTGCATGATGTATTACAAGGAGGCCTTCTGGAAGAAGAAGGATTAC
-TGTGGCTGCATGATCATTGAAGATGAAGATGCCCCAATTTCAATAACCTTGGATGACACC
-AAGCCAGATGGGTCACTGCCTGCCATCATGGGCTTCATTCTTGCCCGGAAAGCTGATCGA
-CTTGCTAAGCTACATAAGGAAATAAGGAAGAAGAAAATCTGTGAGCTCTATGCCAAAGTG
-CTGGGATCCCAAGAAGCTTTACATCCAGTGCATTATGAAGAGAAGAACTGGTGTGAGGAG
-CAGTACTCTGGGGGCTGCTACACGGCCTACTTCCCTCCTGGGATCATGACTCAATATGGA
-AGGGTGATTCGTCAACCCGTGGGCAGGATTTTCTTTGCGGGCACAGAGACTGCCACAAAG
-TGGAGCGGCTACATGGAAGGGGCAGTTGAGGCTGGAGAACGAGCAGCTAGGGAGGTCTTA
-AATGGTCTCGGGAAGGTGACCGAGAAAGACATCTGGGTACAAGAACCTGAATCAAAGGAC
-GTTCCAGCGGTAGAAATCACGCACACCTTCTGGGAAAGGAACCTGCCCTCTGTTTCTGGC
-CTGCTGAAGATCATTGGATTTTCCACATCAGTAACTACCCTGGGGTTTGTGCTGTACAAA
-TACAAGCTCCTGCCACGGTCTTGA
->ENSSSCT00000013404_susscrofa
-ATGGAGCGTCAGGAGAAGGCGAACAACGCGGGCCACATGGTCGACGTAGTCGTGATAGGA
-GGCGGCATCTCAGGATTATCTGCTGCCAAACTCTTAAATGAATATGGAATTAATGTTTTG
-GTTTTAGAAGCCCGGGACAGAGTTGGAGGAAGAACATACACAGTGAGGAACGAAAATGTT
-GATTACGTGGACGTTGGTGGGGCTTATGTCGGACCGACCCAGAATAGGATCTTAAGGTTA
-TCTAAGGAACTGGGTTTAGAAACTTACAAAGTGAATGTAAATGAGTGTCTCGTTCAGTAT
-GTCAAGGGGAAATCTTATCCATTTCGGGGTGCCTTCCCTCCAGTCTGGAATCCCATTGCC
-TATCTGGATTACAACAACCTGTGGCGGACAATGGATGACATGGGAAAGAAGATTCCAGCT
-GATGCACCATGGGAGTCTCCGCATGCAGAGGAATGGGATAAGATGACCATGAAAGATCTC
-ATCGATAAAATCTGTTGGACAAAGACTGCTAAACGGTTTGCATCTCTCTTTGTAAATATC
-AATGTGACCTCCGAACCCCACGAAGTGTCTGCCCTGTGGTTTTTGTGGTATGTGAAGCAG
-TGTGGAGGCACCACCCGGATATTCTCTGTTACCAACGGGGGCCAGGAACGGAAGTTTGTA
-GGCGGATCTGGTCAAGTAAGCGAACGGATAATGCACCTCCTCGGGGACAGAGTGAAGCTG
-AGGTGTCCTGTCACCTATGTTGACCAGTCAGGTGACAACATCATCGTAGAGACATTGAAT
-CATGAACTTTATGAGTGCCAATACGTAATTAGTGCCATCCCTCCAACTCTGACTGCCAAG
-ATACACTTCAGACCGGAGCTTCCGTCAGAAAGAAACCAGTTAATTCAGCGTCTTCCGATG
-GGGGCTATCATTAAGTGCATGATGTATTACAAGGAGGCCTTTTGGAAGAAGAAGAATTAC
-TGTGGCTGTATGATCATCGAAGATGAGGAAGCTCCGATTTCAATAACTCTAGATGACACC
-AAGCCAGATGGATCGCTGCCCGCCATCATGGGCTTCATCCTTGCTCGAAAAGCTGACCGC
-CTTGCTAAGGTTCATAAAGAAATAAGAAAGCGGAAAATCTGTGAGCTCTACGCCAAAGTG
-CTAGGATCTCAAGAAGCTTTACATCCCGTGCACTATGAAGAGAAGAACTGGTGTGAGGAG
-CAGTACTCGGGGGGCTGCTACACTGCCTACTTCCCCCCTGGGATCATGACTCAGTATGGA
-AGGGTGATCCGCCAGCCCGTAGGCAGGATATTCTTTGCTGGCACCGAGACTGCCACACAA
-TGGAGCGGTTACATGGAAGGAGCAGTAGAAGCCGGCGAACGGGCGGCTAGAGAGATCTTG
-AATGCTTTGGGGAAGGTGTCAAAGAAAGACATATGGCTTCGAGAACCTGAATCAGAGGAT
-GTTCCAGCTTTTGAGATCACCCGCACCTTCTGGGAGAGAAACCTGCCTTCCGTGACCGGG
-CTGCTTAAGATCATCGGATTTTCCACCTCGGTAACTGCCCTGTGGCTTGCCGTGTACAAA
-TTCAGGCTGCTGACCCGATCCTGA
->ENSSSCT00000035258_susscrofa
-TCGCTGCCCGCCATCATGGGCTTCATCCTTGCTCGAAAAGCTGACCGCCTTGCTAAGGTT
-CATAAAGAAATAAGAAAGCGGAAAATCTGTGAGCTCTACGCCAAAGTGCTAGGATCTCAA
-GAAGCTTTACATCCCGTGCACTATGAAGAGAAGAACTGGTGTGAGGAGCAGTACTCGGGG
-GGCTGCTACACTGCCTACTTCCCCCCTGGGATCATGACTCAGTATGGAAGGGTGATCCGC
-CAGCCCGTAGGCAGGATATTCTTTGCTGGCACCGAGACTGCCACACAATGGAGCGGTTAC
-ATGGAAGGAGCAGTAGAAGCCGGCGAACGGGCGGCTAGAGAGGATGTTCCAGCTTTTGAG
-ATCACCCGCACCTTCTGGGAGAGAAACCTGCCTTCCGTGACCGGGCTGCTTAAGATCATC
-GGATTTTCCA
->ENSSSCT00000032764_susscrofa
-ATGGATGACATGGGAAAGAAGATTCCAGCTGATGCACCATGGGAGTCTCCGCATGCAGAG
-GAATGGGATAAGATGACCATGAAAGATCTCATCGATAAAATCTGTTGGACAAAGACTGCT
-AAACGGTTTGCATCTCTCTTTGTAAATATCAATGTGACCTCCGAACCCCACGAAGTGTCT
-GCCCTGTGGTTTTTGTGGTATGTGAAGCAGTGTGGAGGCACCACCCGGATATTCTCTGTT
-ACCAACGGGGGCCAGGAACGGAAGTTTGTAGGCGGATCTGGTCAAGTAAGCGAACGGATA
-ATGCACCTCCTCGGGGACAGAGTGAAGCTGAGGTGTCCTGTCACCTATGTTGACCAGTCA
-GGTGACAACATCATCGTAGAGACATTGAATCATGAACTTTATGAGTGCCAATACGTAATT
-AGTGCCATCCCTCCAACTCT
->ENSCAFT00000022939_canisfamiliaris
-ATGGCGAGTAGAGAGAAGACGAGTATCGAGGGCCACATGTTTGACGTAGTCGTGATAGGA
-GGCGGCATCTCAGGATTGTCTGCTGCCAAACTCTTAGCCGAACATGAAGTTGATGTCTTA
-GTTTTAGAAGCACGAGATAGAGTTGGAGGAAGAACATACACCGTGAGGAATGAACATGTC
-GATTACGTAGATGTTGGTGGGGCTTATGTAGGACCAACTCAGAACAGAATCTTACGACTA
-TCTAAGGAGCTGGGTCTAGAGACTTACAAAGTGAACGTAAATGAGCGTCTTGTACAGTAT
-GTCAAGGGGAAAACTTACCCATTCCGAGGAGCCTTTCCTCCGGTATGGAATCCTATCGCA
-TATTTGGATTACAACAACCTGTGGCGGACAATGGATAACATGGGGAAGGAGATTCCAGCA
-GATGCACCATGGGAGGCCCCACATGCCGAGGAATGGGACAAGATGACTATGAAGGATCTT
-ATCGATAAAATCTGCTGGACAAAGACTGCTAGGAGGTTTGCATCCCTCTTTGTGAATATC
-AATGTGACCTCTGAGCCCCACGAGGTGTCTGCGCTCTGGTTCCTGTGGTATGTGAAGCAG
-TGCGGAGGTACCACTCGGATATTCTCGGTGACCAATGGAGGCCAGGAACGGAAGTTTGTG
-GGAGGATCCGGTCAAGTGAGTGAACGGATAATGGAGCGCCTTGGGGACAGAGTCAAGCTG
-AAGCGCCCTGTCACCTATGTTGACCAGTCAGATGACAACATCATCATAGAGACACTGAAT
-CATGAACTTTATGAGTGCAAATACGTGATTAGTGCCATCCCTCCAACTTTGACTGCCAAG
-ATCCACTTCAGACCAGAGCTTCCATCAGAGAGAAATCAGTTAATTCAGCGTCTTCCAATG
-GGAGCTATCATCAAGTGTATGATGTATTACAAGGAGGCCTTTTGGAAGAAGAAGGATTAC
-TGTGGCTGTATGATCATTGAAGACGAGGAAGCTCCAATTTCAATAACCCTGGATGACACC
-AAGCCAGATGGATCACTGCCCGCTATCATGGGCTTCATACTTGCCAGAAAAGCTGACCGA
-CTTGCCAAGCTCCATAAAGAAATAAGGAAGAGGAAAATCTGTGAGCTCTATGCCAAAGTG
-CTAGGATCCCAAGAAGCTTTACAACCCGTACACTATGAAGAGAAGAACTGGTGCGAGGAG
-CAGTACTCCGGGGGCTGCTATACCGCCTACTTCCCCCCTGGGATCATGACTCACTACGGA
-AGGGTGATCCGCCAGCCATTTGGCAGGATTTACTTTGCTGGCACTGAGACGGCAACACAC
-TGGAGCGGTTATATGGAAGGAGCTGTAGAGGCTGGGGAACGGACAGCTAGAGAGGTCTTA
-AATGCTCTCGGGAGGGTGGCAGAGAAAGACCTGAAGACCCAGGAACCTGAATCAAAGGAT
-GTTCCAGCTATGGAAATCACCCACACCTTCTGGGAGAGGAACCTGCCATCGGTGACAGGC
-CTGCTGAAGCTCATTGGATTTACCACATCAGTAACTGCCCTGTGGATTGTGGCGTACAAA
-TTCAGGCTGCTGAGACGATCCTGA
->ENSMUST00000026013_musmusculus
-ATGACGGATCTGGAGAAGCCCAGTATCACAGGCCACATGTTCGACGTAGTCGTGATTGGA
-GGCGGCATCTCAGGATTGGCTGCTGCCAAACTATTGTCAGAATACAAAATTAATGTCTTG
-GTTCTGGAAGCCCGGGATAGAGTTGGAGGAAGAACATATACTGTGAGGAATGAGCATGTT
-AAATGGGTAGATGTTGGTGGAGCTTATGTGGGACCAACCCAGAACAGAATCTTACGCTTG
-TCTAAGGAGCTAGGCATAGAGACCTATAAAGTGAATGTCAATGAGCGTCTAGTTCAATAT
-GTCAAGGGGAAAACTTACCCATTCCGTGGTGCATTTCCACCTGTGTGGAACCCCTTGGCA
-TATTTGGATTACAACAACCTGTGGAGGACAATGGATGATATGGGAAAAGAGATCCCTGTT
-GATGCACCATGGCAAGCAAGACATGCTGAGGAATGGGACAAGATAACCATGAAAGATCTC
-ATTGATAAAATCTGTTGGACAAAAACTGCTCGAGAATTTGCTTATCTTTTTGTGAACATT
-AATGTGACTTCTGAGCCTCATGAGGTATCTGCCCTGTGGTTCTTGTGGTATGTGAGGCAG
-TGTGGAGGTACCTCTCGGATATTCTCAGTCACCAATGGCGGCCAGGAACGGAAATTTGTA
-GGTGGCTCTGGCCAAATAAGTGAACAGATAATGGTCCTCCTTGGGGATAAAGTGAAGCTG
-AGCTCTCCTGTTACTTATATTGACCAAACAGATGACAACATCATTATAGAAACACTGAAT
-CATGAGCACTATGAGTGCAAATATGTAATTAGTGCCATCCCACCGGTTTTGACTGCCAAG
-ATCCACTTTAAACCAGAGCTTCCACCTGAGAGAAACCAATTAATTCAGCGTCTTCCAATG
-GGGGCTGTCATCAAGTGCATGGTGTATTACAAGGAAGCCTTCTGGAAGAAAAAGGACTAT
-TGTGGCTGCATGATAATTGAAGATGAGGAGGCTCCAATTTCAATCACTCTGGATGACACT
-AAACCAGATGGGTCAATGCCTGCCATCATGGGCTTCATACTTGCCCGGAAAGCTGAACGA
-CTTGCTAAACTACATAAAGACATAAGGAAGAGGAAAATCTGTGAGCTGTATGCCAAAGTT
-CTGGGATCTCAAGAAGCTTTATCTCCCGTCCATTATGAAGAGAAGAACTGGTGTGAGGAG
-CAGTACTCCGGGGGCTGCTACACAGCCTACTTCCCTCCTGGTATCATGACTCTGTATGGA
-AGGGTGATTCGGCAGCCAGTAGGCAGGATTTACTTTGCAGGCACAGAGACAGCAACACAG
-TGGAGTGGCTACATGGAAGGTGCAGTTGAAGCTGGAGAACGAGCAGCTAGAGAGGTCTTG
-AATGCTCTAGGAAAAGTTGCCAAGAAGGATATATGGGTTCAAGAGCCTGAGTCCAAGGAT
-GTTCCAGCTCTTGAAATTACCCACACCTTCTTAGAGAGGAACCTGCCTTCCGTGCCTGGT
-CTGCTCAAGATCACTGGTTTTTCCACTTCTGTGGCTCTTCTCTGCTTTGTATTGTACAAG
-TTTAAACAGCCCCAGTCCTGA
->ENSRNOT00000066674_rattusnorvegicus
-ATGACGGATCTGGAGAAGCCCAATCTCGCAGGCCACATGTTCGACGTAGTCGTGATTGGA
-GGCGGCATCTCAGGATTGGCTGCTGCCAAACTGTTGTCTGAATACAAAATTAATGTCTTG
-GTTTTGGAAGCCCGGGATAGAGTTGGAGGAAGAACATATACTGTGAGGAATGAGCATGTC
-AAATGGGTAGATGTTGGTGGAGCCTATGTGGGACCAACCCAGAACAGAATCTTACGCTTG
-TCTAAGGAGCTAGGCATAGAGACCTATAAAGTGAATGTCAATGAGCGTCTAGTTCAATAT
-GTCAAGGGGAAAACTTACCCATTCCGTGGTGCATTCCCACCTGTGTGGAACCCCTTGGCA
-TATTTGGATTACAACAACCTATGGAGAACAATGGATGAAATGGGAAAAGAGATCCCCGTT
-GATGCACCGTGGCAAGCAAGACACGCTCAGGAATGGGACAAGATGACCATGAAAGATCTC
-ATTGATAAAATCTGTTGGACAAAAACTGCTCGGGAATTTGCGTATCTTTTTGTGAACATT
-AATGTGACTTCTGAGCCTCATGAGGTATCTGCCCTGTGGTTCCTGTGGTATGTGAGGCAG
-TGTGGGGGCACTGCTCGGATATTCTCAGTTACCAATGGCGGCCAGGAACGGAAATTTGTA
-GGTGGATCTGGCCAAGTAAGTGAACAGATAATGGGTCTCCTTGGAGATAAAGTGAAGCTG
-AGCTCTCCTGTTACTTATATTGACCAAACAGATGACAACATCATTGTAGAAACACTGAAT
-CATGAACACTATGAGTGCAAATACGTAATTAGTGCCATCCCACCGATTTTGACTGCCAAG
-ATCCACTTTAAACCAGAGCTTCCACCTGAGAGAAACCAATTAATTCAGCGTCTTCCAATG
-GGGGCTGTTATCAAGTGCATGGTGTATTACAAGGAAGCCTTCTGGAAGAAAAAGGACTAT
-TGTGGCTGCATGATCATTGAAGATGAGGAGGCTCCAATCGCCATCACTCTGGATGACACT
-AAACCAGATGGGTCACTGCCTGCCATCATGGGCTTCATACTTGCCCGGAAAGCTGATCGA
-CTTGCTAAACTACATAAAGACATAAGGAAGAGGAAAATCTGTGAGCTGTATGCCAAAGTT
-CTGGGATCTCAAGAAGCATTATATCCAGTCCATTATGAAGAGAAGAACTGGTGTGAGGAG
-CAGTACTCCGGGGGCTGCTACACAGCCTACTTCCCTCCTGGTATCATGACCCAGTATGGA
-AGGGTGATTCGCCAGCCAGTAGGTAGGATTTACTTTGCAGGCACAGAGACAGCAACACAG
-TGGAGTGGCTACATGGAAGGAGCAGTTGAAGCTGGAGAACGAGCAGCTAGAGAGGTGTTG
-AATGCTCTAGGAAAAGTCGCGAAGAAGGATATATGGGTTGAAGAACCCGAGTCCAAGGAT
-GTTCCAGCCATTGAAATTACCCACACCTTCTTAGAGAGGAACCTGCCTTCCGTGCCTGGT
-CTGCTCAAGATCACTGGTGTTTCCACTTCTGTGGCTCTTCTCTGCTTTGTATTGTACAAG
-ATTAAGAAGCTCCCATGCTGA
->ENSPTRT00000040521_pantroglodytes
-ATGAGCAACAAATGCGACGTGGTCGTGGTGGGGGGCGGCATCTCAGGTAAGGCAGCAGCC
-AAACTTCTGCATGACTCTGGACTGAATGTGGTTGTTCTGGAAGCCCGGGACCGTGTGGGA
-GGCAGGACTTACACTCTTAGGAACCAAAAGGTTAAATATGTGGACCTTGGAGGATCCTAT
-GTTGGACCAACCCAGAATCGTATCTTGAGATTAGCCAAGGAGCTAGGATTGGAGACCTAC
-AAAGTGAATGAGGTTGAGCGTCTGATCCACCATGTAAAGGGCAAATCATACCCCTTCAGG
-GGGCCGTTCCCACCTGTATGGAATCCAATTACCTACTTAGATCATAACAACTTTTGGAGG
-ACAATGGATGACATGGGGCGAGAGATTCCGAGTGATGCCCCATGGAAGGCTCCCCTTGCA
-GAAGAGTGGGACAACATGACAATGAAGGAGCTACTGGACAAGCTCTGCTGGACAGAATCT
-GCAAAGCAGCTTGCCACTCTCTTTGTGAACCTGTGTGTCACTGCAGAGACCCATGAGGTC
-TCTGCTCTCTGGTTCCTGTGGTATGTGAAGCAGTGTGGAGGCACAACAAGAATCATCTCG
-ACAACGAATGGAGGACAGGAGAGGAAATTTGTGGGCGGATCTGGTCAAGTGAGCGAGCGG
-ATAATGGACCTCCTTGGAGACCGAGTGAAGCTGGAGAGGCCTGTGATCTACATTGACCAG
-ACAAGAGAAAATGTCCTTGTGGAGACCCTAAACCATGAGATGTATGAGGCTAAATATGTG
-ATTAGTGCTATTCCTCCTACTCTGGGCATGAAGATTCACTTCAATCCCCCTCTGCCAATG
-ATGAGAAACCAGATGATCACTCGTGTGCCTTTGGGTTCAGTCATCAAGTGTATAGTTTAT
-TATAAAGAGCCTTTCTGGAGGAAAAAGGATTACTGTGGAACCATGATTATTGATGGAGAG
-GAAGCTCCAGTTGCCTACACGTTAGATGATACCAAACCTGAAGGCAACTATGCTGCCATA
-ATGGGATTTATCCTGGCCCACAAAGCCAGAAAACTGGCACGTCTTACCAAAGAGGAAAGG
-TTGAAGAAACTTTGTGAACTCTATGCCAAGGTTCTGGGTTCCCCAGAAGCTCTGGAGCCA
-GTGCATTATGAAGAAAAGAACTGGTGTGAGGAGCAGTACTCTGGGGGCTGCTACACAACT
-TACTTCCCCCCTGGGATCCTGACTCAATATGGAAGGGTTCTACGCCAGCCAGTGGACAGG
-ATTTACTTTGCAGGCACCGAGACTGCCACACACTGGAGCGGCTACATGGAGGGGGCTGTA
-GAGGCCGGGGAGAGAGCAGCCCGAGAGATCCTGCATGCCATGGGGAAGATTCCAGAGGAT
-GAAATCTGGCAGTCAGAACCAGAGTCTGTGGATGTCCCTGCACAGCCCATCACCACGACC
-TTTTTGGAGAGACATTTGCCCTCCGTGCCAGGCCTGCTCAGGCTGATTGGATTGACCACC
-ATCTTTTCAGCAACGGCTCTTGGCTTCCTGGCCCACAAAAGGGGGCTACTTGTGCGAGTC
-TAA
->ENST00000378069_homosapiens
-ATGAGCAACAAATGCGACGTGGTCGTGGTGGGGGGCGGCATCTCAGGTATGGCAGCAGCC
-AAACTTCTGCATGACTCTGGACTGAATGTGGTTGTTCTGGAAGCCCGGGACCGTGTGGGA
-GGCAGGACTTACACTCTTAGGAACCAAAAGGTTAAATATGTGGACCTTGGAGGATCCTAT
-GTTGGACCAACCCAGAATCGTATCTTGAGATTAGCCAAGGAGCTAGGATTGGAGACCTAC
-AAAGTGAATGAGGTTGAGCGTCTGATCCACCATGTAAAGGGCAAATCATACCCCTTCAGG
-GGGCCATTCCCACCTGTATGGAATCCAATTACCTACTTAGATCATAACAACTTTTGGAGG
-ACAATGGATGACATGGGGCGAGAGATTCCGAGTGATGCCCCATGGAAGGCTCCCCTTGCA
-GAAGAGTGGGACAACATGACAATGAAGGAGCTACTGGACAAGCTCTGCTGGACTGAATCT
-GCAAAGCAGCTTGCCACTCTCTTTGTGAACCTGTGTGTCACTGCAGAGACCCATGAGGTC
-TCTGCTCTCTGGTTCCTGTGGTATGTGAAGCAGTGTGGAGGCACAACAAGAATCATCTCG
-ACAACAAATGGAGGACAGGAGAGGAAATTTGTGGGCGGATCTGGTCAAGTGAGTGAGCGG
-ATAATGGACCTCCTTGGAGACCGAGTGAAGCTGGAGAGGCCTGTGATCTACATTGACCAG
-ACAAGAGAAAATGTCCTTGTGGAGACCCTAAACCATGAGATGTATGAGGCTAAATATGTG
-ATTAGTGCTATTCCTCCTACTCTGGGCATGAAGATTCACTTCAATCCCCCTCTGCCAATG
-ATGAGAAACCAGATGATCACTCGTGTGCCTTTGGGTTCAGTCATCAAGTGTATAGTTTAT
-TATAAAGAGCCTTTCTGGAGGAAAAAGGATTACTGTGGAACCATGATTATTGATGGAGAA
-GAAGCTCCAGTTGCCTACACGTTGGATGATACCAAACCTGAAGGCAACTATGCTGCCATA
-ATGGGATTTATCCTGGCCCACAAAGCCAGAAAACTGGCACGTCTTACCAAAGAGGAAAGG
-TTGAAGAAACTTTGTGAACTCTATGCCAAGGTTCTGGGTTCCCTAGAAGCTCTGGAGCCA
-GTGCATTATGAAGAAAAGAACTGGTGTGAGGAGCAGTACTCTGGGGGCTGCTACACAACT
-TATTTCCCCCCTGGGATCCTGACTCAATATGGAAGGGTTCTACGCCAGCCAGTGGACAGG
-ATTTACTTTGCAGGCACCGAGACTGCCACACACTGGAGCGGCTACATGGAGGGGGCTGTA
-GAGGCCGGGGAGAGAGCAGCCCGAGAGATCCTGCATGCCATGGGGAAGATTCCAGAGGAT
-GAAATCTGGCAGTCAGAACCAGAGTCTGTGGATGTCCCTGCACAGCCCATCACCACCACC
-TTTTTGGAGAGACATTTGCCCTCCGTGCCAGGCCTGCTCAGGCTGATTGGATTGACCACC
-ATCTTTTCAGCAACGGCTCTTGGCTTCCTGGCCCACAAAAGGGGGCTACTTGTGAGAGTC
-TAA
->ENSRNOT00000044009_rattusnorvegicus
-ATGAGCAACAAATGCGATGTGATCGTGGTGGGGGGCGGCATCTCAGGTATGGCAGCAGCC
-AAACTTTTGCATGACTGTGGCCTCAGTGTGGTGGTTCTGGAAGCACGAGACCGTGTGGGA
-GGCAGGACTTACACAATTAGGAATAAAAATGTTAAATATGTGGACCTTGGAGGATCTTAT
-GTTGGGCCGACCCAGAATCGTATCTTACGATTGGCCAAAGAGCTAGGATTGGAGACCTAT
-AAAGTGAATGAAGTTGAGCGGCTGATCCACTTTGTAAAGGGAAAATCATATGCCTTCAGG
-GGCCCATTCCCACCAGTGTGGAATCCAATCACTTACCTAGATTATAACAACCTCTGGAGA
-ACAATGGATGAGATGGGCCAAGAGATTCCCAGTGATGCTCCATGGAAGGCACCCCTTGCT
-GAAGAGTGGGACTACATGACAATGAAAGAGTTGCTAGATAAGATCTGCTGGACCAACTCT
-ACAAAGCAGATTGCCACACTCTTTGTGAACCTATGTGTAACTGCGGAGACCCATGAGGTT
-TCTGCACTGTGGTTCCTGTGGTATGTGAAGCAGTGTGGGGGTACAACCAGAATCATATCA
-ACAACCAATGGAGGACAGGAGAGGAAATTTATTGGTGGATCTGGTCAAGTGAGTGAGCGG
-ATAAAGGATATCCTTGGGGACAGAGTGAAGCTGGAGAGGCCGGTGATCCACATTGACCAG
-ACAGGAGAAAATGTTGTTGTGAAAACCCTAAACCATGAAATATATGAGGCTAAATATGTG
-ATTAGTGCCATCCCACCTGTTTTGGGCATGAAGATTCACCATAGTCCTCCTCTGCCCATT
-CTAAGAAACCAGCTGATTACTCGTGTGCCTTTGGGTTCAGTTATTAAGTGCATGGTTTAT
-TATAAAGAACCCTTCTGGAGGAAAAAGGATTTCTGTGGAACCATGGTTATTGAAGGAGAG
-GAAGCTCCAATTGCGTACACATTGGATGATACCAAGCCAGATGGCAGCTGTGCTGCTATA
-ATGGGATTTATCCTTGCTCACAAAGCTAGAAAACTGGTACGCCTTACTAAAGAAGAAAGA
-CTGAGGAAGCTCTGTGAGCTATACGCGAAAGTTCTGAACTCTCAAGAAGCTCTGCAGCCA
-GTCCATTATGAAGAGAAGAACTGGTGTGAGGAGCAGTACTCCGGGGGCTGCTACACAGCC
-TACTTCCCTCCTGGCATCTTGACCCAGTATGGAAGGGTTCTACGCCAGCCAGTGGGCAAG
-ATTTTCTTTGCAGGCACCGAGACAGCTTCACATTGGAGTGGCTACATGGAGGGGGCTGTA
-GAGGCTGGAGAGAGAGCTGCCAGAGAGATTCTTCATGCCATTGGGAAGATTCCAGAGGAT
-GAAATTTGGCAGCCAGAACCAGAATCTGTGGATGTCCCAGCAAGACCCATTACCAACACC
-TTCCTGGAGAGACACTTGCCTTCTGTACCAGGTCTACTAAAGCTGCTTGGATTGACCACC
-ATCTTGTCAGCAACAGCTCTTGGTTTCCTGGCCCACAAAAAGGGTCTGTTTGTACGTTTC
-TAA
->ENSMUST00000040820_musmusculus
-ATGAGCAACAAAAGCGATGTGATCGTGGTGGGGGGCGGCATCTCAGGTATGGCGGCAGCC
-AAACTTCTGCATGATTGTGGCCTCAGTGTGGTGGTTCTGGAAGCACGGGACCGTGTAGGA
-GGCAGGACTTACACAATTAGGAATAAAAACGTTAAATATGTGGACCTTGGAGGATCTTAT
-GTTGGGCCAACCCAGAATCGTATCTTACGATTGGCCAAAGAGCTAGGATTGGAGACCTAT
-AAAGTTAATGAAGTTGAGCGGCTGATACACTTTGTAAAGGGAAAATCATATGCCTTCAGG
-GGCCCATTTCCACCAGTATGGAATCCTATCACCTACCTAGATAATAACAACCTCTGGAGG
-ACAATGGATGAGATGGGCCAAGAGATTCCCAGTGATGCTCCATGGAAAGCACCCCTTGCT
-GAAGAGTGGGACTACATGACAATGAAAGAATTGCTAGATAAGATCTGCTGGACCAAATCT
-ACAAAGCAGATTGCCACGCTCTTTGTGAACCTGTGTGTAACTGCAGAGACCCATGAGGTC
-TCTGCACTATGGTTCCTGTGGTATGTGAAGCAGTGTGGAGGTACAACCAGAATCATCTCA
-ACAACCAATGGAGGACAGGAGAGGAAATTTATTGGTGGATCTGGTCAAGTGAGTGAACGG
-ATAAAGGATATACTTGGGGACCGAGTGAAGCTGGAGAGGCCTGTGATCCACATTGACCAG
-ACAGGGGAAAATGTTATTGTGAAAACCCTAAACCATGAAATATATGAGGCTAAATATGTG
-ATTAGTGCCATTCCACCTGCTTTGGGCATGAAGATTCACTATAGTCCTCCTCTGCCCATG
-CTAAGAAACCAGCTGATCTCTCGTGTGCCTTTGGGTTCAGTTATTAAATGCATGGTTTAT
-TACAAAGAGCCCTTCTGGAGGAAAAAGGATTTCTGTGGAACCATGGTTATCGAAGGAGAG
-GAAGCTCCAATTGCATACACATTGGATGATACCAAACCAGATGGCACCTATGCTGCTATA
-ATGGGATTTATCCTTGCTCACAAAGCTAGAAAACTGGTACGTCTCACCAAAGAAGAAAGA
-CTGAGGAAACTTTGTGAGCTATATGCAAAAGTGCTGAACTCCCAAGAAGCTCTGCAGCCC
-GTCCATTATGAAGAGAAGAACTGGTGTGAGGAACAGTATTCTGGGGGCTGCTACACAACC
-TACTTCCCTCCCGGCATCTTGACCCAGTATGGAAGGGTTCTACGTCAGCCAGTGGGCAAG
-ATTTTCTTTGCAGGCACTGAAACAGCCTCACACTGGAGCGGCTACATGGAGGGGGCTGTG
-GAGGCTGGGGAGAGAGCAGCCAGAGAGATTCTTCATGCCATTGGGAAGATTCCAGAAGAT
-GAAATTTGGCAGCCAGAACCAGAATCTTTGGATGTCCCTGCACGACCCATTACCAGTACC
-TTCCTGGAGAGACACCTGCCTTCTGTACCAGGCCTGCTAAAGCTGTTTGGATTGACCACC
-ATCTTGTCAGCAACAGCTCTTGGTTTCCTGGCCCACAAAAGGGGCCTGTTTGTACATTTT
-TAA
->ENSMUST00000168613_musmusculus
-ATGAGCAACAAAAGCGATGTGATCGTGGTGGGGGGCGGCATCTCAGGTATGGCGGCAGCC
-AAACTTCTGCATGATTGTGGCCTCAGTGTGGTGGTTCTGGAAGCACGGGACCGTGTAGGA
-GGCAGGACTTACACAATTAGGAATAAAAACGTTAAATATGTGGACCTTGGAGGATCTTAT
-GTTGGGCCAACCCAGAATCGTATCTTACGATTGGCCAAAGAGCTAGGATTGGAGACCTAT
-AAAGTTAATGAAGTTGAGCGGCTGATACACTTTGTAAAGGGAAAATCATATGCCTTCAGG
-GGCCCATTTCCACCAGTATGGAATCCTATCACCTACCTAGATAATAACAACCTCTGGAGG
-ACAATGGATGAGATGGGCCAAGAGATTCCCAGTGATGCTCCATGGAAAGCACCCCTTGCT
-GAAGAGTGGGACTACATGACAATGAAAGAATTGCTAGATAAGATCTGCTGGACCAAATCT
-ACAAAGCAGATTGCCACGCTCTTTGTGAACCTGTGTGTAACTGCAGAGACCCATGAGGTC
-TCTGCACTATGGTTCCTGTGGTATGTGAAGCAGTGTGGAGGTACAACCAGAATCATCTCA
-ACAACCAATGGAGGACAGGGGAAAATGTTATTGTGA
->ENSMUST00000163344_musmusculus
-ATGAGCAACAAAAGCGATGTGATCGTGGTGGGGGGCGGCATCTCAGGTATGGCGGCAGCC
-AAACTTCTGCATGATTGTGGCCTCAGTGTGGTGGTTCTGGAAGCACGGGACCGTGTAGGA
-GGCAGGACTTACACAATTAGGAATAAAAACGTTAAATATGTGGACCTTGGAGGATCTTAT
-GTTGGGCCAACCCAGAATCGTATCTTACGATTGGCCAAAGAGCTAGGATTGGAGACCTAT
-AAAGTTAATGAAGTTGAGCGGCTGATACACTTTGTAAAGATCTACAAAGCAGATTGCCAC
-GCTCTTTGTGAACCTGTGTGTAACTGCAGAGACCCATGA
->ENSMUST00000173143_musmusculus
-ATGAGCAACAAAAGCGATGTGATCGTGGTGGGGGGCGGCATCTCAGAAAAACCTGCTAAT
-TCTAGTCAGTTTACAAGCTCATTGTGGAGGAGAATTGAAAAACTGTGA
->ENSSSCT00000033745_susscrofa
-ATGGCAGCGGCCAAACTTCTGCATGACTCTGGCCTGAGTGTGATTGTTCTGGAAGCCCGG
-GACCGCGTGGGAGGCAGGACTTACACCGTCAGGAACCAACAAGTTAAATATGTGGACCTT
-GGAGGATCTTATGTTGGGCCAACTCAGAATCGCATCTTAAGATTGTCCAAGGAGCTAGGA
-TTGGAGACCTACAAAGTGAATGAAGTGGAGCGTCTGATTCACTATGTAAAGGGCAAATCC
-TACCCCTTCAGGGGCCCATTACCACCTGTGAGGAATCCGATTACCTTCCTAGATCTTAAC
-AACCTTTGGAGGACGGTGGATGACATGGGACGAGAGATTCCCAGTGATGCCCCATGGAAG
-GCGCCCCTTGCAGAACAGTGGGACCAGATGACAATGAAGGAGCTGTTGGACAAGCTCTGC
-TGGACTGAATCTTCGAAGCAGCTGGCCACCCTTTTTGTGAACCTGTGTGTCACCGCGGAG
-ACCCATGAGGTCTCTGCTCTCTGGTTCCTGTGGTATGTGAAGCAGTGTGGAGGCACCACC
-AGGATCATCTCAACAACTAACGGAGGGCAGGAGAGGAAATTTGTGGGCGGATCTGGTCAA
-GTGACCGAGCGGATAAAGGACCTCCTTGGAGACCGAGTGAAGCTGGAGAGGCCTGTGGTC
-CACATTGACCAGACAGGAGAAAATGTCCTCGTGGAGACCCTAAACCACGAGGTGTACGAG
-GCTAAGTATGTGATTAGCGCCATTCCTCCTGTCCTGGGCATGAAGATTCATTTCAGTCCC
-CCTCTGCCAATGATGAGAAACCAGCTCATCACTCGTGTACCTCTGGGCTCTGTCATCAAG
-TGTATAGTTTATTACAAAGAGCCCTTCTGGAGGCATAAGGATTACTGTGGAAGCATGATT
-ATTGAAGGAGAGGAAGCTCCAATCGCCTACACGTTGGATGATTCCAAGCCTGATGGCAGC
-TGTGCCGCCATCATAGGATTTATCCTTGCCCACAAAGCCAGAAAACTGGCCCGTCTTACC
-AAAGAAGAAAGGCTGAAGAAACTTTGCGACCTCTATGCAAAAGTTCTGGGTTCAAAAGAA
-GCTTTGAACCCCGTGCACTATGAAGAGAAGAACTGGTGCGAGGAGCAGTACTCGGCGGGC
-TGCTACACGACCTACTTCCCCCCTGGGATCATGACTCAGTATGGAAGGGTTCTACGCCAG
-CCAGTCGGCAGGATTTATTTCGCCGGCACGGAGACTGCCACGCACTGGAGTGGCTACATG
-GAGGGGGCCGTGGAGGCCGGAGAGAGAGCGGCCCGAGAGATCCTGCATGCTATGGGAAAG
-ATCCCAGAAGATGAAATCTGGCAGTCTGAACCAGAGTCCGTGGATGTGCCTGCGAAGCCC
-ATTACCACGACCTTCTTGGAGAGACACTTGCCCTCGGTGCCCGGCCTGCTGAGGCTGATT
-GGATTGACCGCCATCTTTTCAGCCACTGCTCTCGGCTACCTGGCCCACAAAAGGGGGCTA
-CTCGTGCGGGTCTGA
->ENSSSCT00000023183_susscrofa
-ATGGCAGCGGCCAAACTTCTGCATGACTCTGGCCTGAGTGTGATTGTTCTGGAAGCCCGG
-GACCGCGTGGGAGGCAGGACTTACACCGTCAGGAACCAACAAGTTAAATATGTGGACCTT
-GGAGGATCTTATGTTGGGCCAACTCAGAATCGCATCTTAAGATTGTCCAAGGAGCTAGGA
-TTGGAGACCTACAAAGTGAATGAAGTGGAGCGTCTGATTCACTATATCAAAGGCAAATCC
-TACCCCTTCAGGGGCCCATTACCACCTGTGAGGAATCCGATTACCTTCCTAGATCTTAAC
-AACCTTTGGAGGACGGTGGATGACATGGGACGAGAGATTCCCAGTGATGCCCCATGGAAG
-GCGCCCCTTGCAGAACAGTGGGACCAGATGACAATGAAGGAGCTGTTGGACAAGCTCTGC
-TGGACTGAATCTTCGAAGCAGCTGGCCACCCTTTTTGTGAACCTGTGTGTCACCGCGGAG
-ACCCATGAGGTCTCTGCTCTCTGGTTCCTGTGGTATGTGAAGCAGTGTGGAGGCACCACC
-AGGATCATCTCAACAACTAACGGAGGGCAGGAGAGGAAATTTGTGGGCGGATCTGGTCAA
-GTGACCGAGCGGATAAAGGACCTCCTTGGAGACCGAGTGAAGCTGGAGAGGCCTGTGGTC
-CACATTGACCAGACAGGAGAAAATGTCCTCGTGGAGACCCTAAACCACGAGGTGTACGAG
-GCTAAGTATGTGATTAGCGCCATTCCTCCTGTCCTGGGCATGAAGATTCATTTCAGTCCC
-CCTCTGCCAATGATGAGAAACCAGCTCATCACTCGTGTACCTCTGGGCTCTGTCATCAAG
-TGTATAGTTTATTACAAAGAGCCCTTCTGGAGGCATAAGGATTACTGTGGAAGCATGATT
-ATTGAAGGAGAGGAAGCTCCAATCGCCTACACGTTGGATGATTCCAAGCCTGATGGCAGC
-TGTGCCGCCATCATAGGATTTATCCTTGCCCACAAAGCCAGAAAACTGGCCCGTCTTACC
-AAAGAAGAAAGGCTGAAGAAACTTTGCGACCTCTATGCAAAAGTTCTGGGTTCAAAAGAA
-GCTTTGAACCCCGTGCACTATGAAGAGAAGAACTGGTGCGAGGAGCAGTACTCGGCGGGC
-TGCTACACGACCTACTTCCCCCCTGGGATCATGACTCAGTATGGAAGGGTTCTACGCCAG
-CCAGTCGGCAGGATTTATTTCGCCGGCACGGAGACTGCCACGCACTGGAGTGGCTACATG
-GAGGGGGCCGTGGAGGCCGGAGAGAGAGCGGCCCGAGAGATCCTGCATGCTATGGGAAAG
-ATCCCAGAAGATGAAATCTGGCAGTCTGAACCAGAGTCCGTGGATGTGCCTGCGAAGCCC
-ATTACCACGACCTTCTTGGAGAGACACTTGCCCTCGGTGCCCGGCCTGCTGAGGCTGATT
-GGATTGACCGCCATCTTTTCAGCCACTGCTCTCGGCTACCTGGCCCACAAAAGGGGGCTA
-CTCGTGCGGGTCTGA
->ENSCAFT00000022963_canisfamiliaris
-ATGAGCGGCAAGTGCGACGTGGTCATGGTGGGGGGCGGCATCTCAGGCATGGCAGCAGCC
-AAACTTCTGCATGATTTTGGCCTGAACGTGGTTGTTCTGGAGGCCCGGGACCGAGTGGGA
-GGCAGGACTTACACCATCAGGAACCAAAAGGTTAAATATTTGGACCTTGGAGGATCTTAT
-GTTGGGCCAACTCAGAATTGTATCTTAAGGTTAGCCAAGGAGCTAGGATTGGAGACCTAC
-AAAGTGAATGAAGTAGAGCGTCTCATCCATCATGTAAAGGGCAAATCGTACCCCTTCAGG
-GGCCCCTTCCCACCTGTATGGAACCCAATTGCATACCTAGATCATAACAACCTCTGGAGG
-ACGATGGACGACATGGGGCGAGAGATTCCCAGTGATGCCCCATGGAAGGCACCTCTTGCG
-GAGGAGTGGGACCACATGACAATGAAGGAGCTTCTGGACAAGATCTGCTGGACAGAATCT
-GCCAAGCAACTTGCTACTCTCTTTGTGAATCTGTGTGTCACTGCAGAGACCCATGAGGTC
-TCTGCTCTCTGGTTCCTGTGGTATGTGAAGCAGTGTGGAGGCACGACCAGGATCATCTCA
-ACAACCAATGGAGGGCAGGAGAGAAAATTTGTGGGCGGATCTGGTCAAGTGAGTGAACGG
-ATAATGGACCTCCTTGGAGACCAAGTGAAGCTGGAGAGGCCTGTGACCCACATTGACCAG
-ACAGGAGAAAATGTCCTTGTGGAGACCCTAAACCATGAGGTGTATGAGGCTAAGTATGTG
-ATTAGTGCCATTCCTCCTACTCTGGGCATGAAGATTCATTTCAACCCCCCTCTGCCAATG
-ATGAGAAACCAGCTGATCACTCGTGTGCCTTTGGGCTCAGTCATCAAGTGCATAGTTTAT
-TATAAAGAGCCCTTCTGGAGGAAAAAGGATTACTGTGGAACCATGATTATCGAAGGAGAG
-GAAGCTCCAATTGCTTACACGTTGGATGATACCAAACCTGATGGCAACTATGCCGCCATA
-ATGGGATTTATCCTTGCCCACAAAGCCAGAAAACTGGCACGTCTTACCAAAGATGAAAGG
-ATGAAGAAACTTTGTGAGCTCTATGCAAAAGTCCTGGGTTCCCAAGAAGCTTTGCAGCCC
-GTACACTACGAAGAGAAGAACTGGTGCGAGGAGCAGTACTCCGGGGGCTGCTACACCACC
-TACTTTCCCCCTGGGATCATGACTCAATATGGAAGGGTTCTACGACAGCCTGTGGGCAGG
-ATTTATTTTGCAGGCACGGAGACTGCCACCCACTGGAGTGGCTACATGGAGGGCGCTGTG
-GAGGCTGGAGAGAGAGCGGCCCGAGAGATCCTGCATGCCATGGGGAAGATCCCAGAGGAT
-GAAATCTGGCAGTCAGAACCAGAATCAGTGGATGTCCCTGCGCAGCCCATCACCACGACC
-TTCTTGGAGAGACATTTGCCCTCTGTGCCAGGCCTGCTGAGGCTGATCGGATTGACCGCC
-ATCTTTTCTGCAACTGCTCTTGGCGTCCTGGCACACAAAAGGGGTCTGCTTGTGCGGGTC
-TAA
->ENSPTRT00000034846_pantroglodytes
-ATGGACCCGGAATGCGCCCAGCTGCTCCCGGCTCTCTGTGCTGTTCTGGTAGATCCCAGG
-CAGCCGGTGGCAGATGACACCTGTTTGGAGAAGCTCCTGGACTGGTTTAAAACGGTCACT
-GAAGGAGAGTCCAGTGTCGTGCTGCTGCAGGAGCACCCCTGCCTGGTGGAGCTGCTGTCC
-CATGTGCTGAAAGTCCAGGACCTGAGTTCTGGGGTCCTCTCCTTCTCACTCCGCCTGGCA
-GGAACCTTCGCAGCCCAGGAAAACTGCTTCCAGTATCTTCAGCAGGGGGAGTTACTACCA
-GGGCTCTTTGGGGAGGCAGGACCCCTCGGCCGAGCAGCCTGGGCCGTCCCCACCGTGCGC
-AGCGGCTGGATCCAGGGCCTGCGCTCCCTGGCACAGCACCCCAGCGCCCTGCGCTTCCTG
-GCCGACCACGGTGCGGTCGACACCATCTTCTCCCTTCAGGGAGACTCCAGCCTGTTTGTG
-GCCTCGGCGGCCAGTCAGCTCCTGGTACACGTCCTGGCTTTGTCCATGCAAGGTGGAGCC
-GAGGGACAGCCCTGCCTGCCGGGGGGTGACTGGCCCGCGTGTGCCCAGAGGATCATGGAT
-CACGTTGAAGAGTCCTTGTGCTCCGCGGCCACCCCCAAGGTCACTCAGGCCCTGAACGTC
-CTGACCACAACCTTCGGGCGCTGCCAGAGCCCCTGGACGGAAGCCCTGTGGGTGCGGCTG
-AGTCCCCGCGTGGCGTGTCTGCTGGAGAGAGACCCCATCCCCGCCGCACACTCGTTCGTG
-GACCTGCTTCTCTGTGTGGCTCGTTCTCCCGTGTTCAGTTCTTCCGACGGCAGCCTGTGG
-GAGACAGTGGCGCGGGCTCTGAGCTGCCTGGGTCCCACCCACATGGGACCCCTGGCTTTG
-GGGATCCTGAAGCTCGAGCACTGTCCACAGGCACTGAGGACCCAGGCCTTCCAGGTCCTT
-CTCCAGCCCCTGGCCTGTGTCCTGAAGGCCACGGTTCAGGCCCCCGGACCCCCAGGCTTG
-CTGGACGGGACGGCAGACGATGCCACGACGGTGGACACACTCCTGGCCTCCAAGTCGTCC
-TGCGCGGGCCTCCTGTGCCGCACCCTGGCTCACCTGGAGGAGCTGCAGCCGCTGCCCCAG
-CGCCCTTCACCGTGGCCCCAGGCGTCTCTACTGGGGGCTACAGTGACTGTCCTGCGGCTC
-TGTGACGGCTCAGCTGCCCCTGCCTCCAGTGTGGGGGGCCACCTCTGTGGGACCCTGGCG
-GGCTGCGTCCGGGTCCAGCGAGCAGCCCTCGACTTCCTGGGGACACTGTCACAGGGGACA
-GGCCCCCAGGAGCTGGTGACGCAGGCGCTTGCTGTCCTCCTGGAGTGCCTCGAGAGCCCC
-GGCTCCAGCCCCACGGTTCTGAAGAAGGCCTTCCAGGCCACGCTCAGGTGGCTCCTGAGC
-TCACCCAAGACCCCCGGCTGCTCTGATCTCGGCCCCCTCATCCCGCAGTTCCTCAGAGAG
-CTGTTCCCTGTGCTGCAGAAACGCCTGTGCCACCCCTGCTGGGAGGTGAGGGACTCCGCC
-CTCGAGTTCCTGACCCAGCTGAGCAGGCACTGGGGAGGACAGGCCGACTTCAGATGCGCA
-CTCTTGGCTTCAGAGGTGCCTGAGCTGGCCCTGCAGCTCCTCCAGGACCCTGAGAGTTAT
-GTCCGAGCGAGCGCGGTGACCGCCATGGGGCAGCTGTCCAGCCAGGGCCTGCACGCCCCC
-ACCAGCCCTGAGCATGCAGAGGCCCGGCAGAGCCTGTTCCCGGAGCTCCTGCACATCCTC
-TCCGTAGACTCGGAGGGCTTCCCACGGCGGGCGGTCATGCAAGTCTTCACTGAGTGGCTG
-CGGGACGGCCACGCCGACGCGGCCCGGGACACGGAGCAGTTCGTGGCCACTGTGCTGCAG
-GTGGCGAGCCGGGACCTGGACTGGGAGGTCCGCGCCCAGGGCCTGGAGCTGGCCCTCGTG
-TTCCTGGGCCAGACTTTGGGGCCGCCGCGTACCCACTGCCCCTATGCCGTGGCCCTACCC
-GAGGTGGCCCCAGCCCAGCCACTCACCGAGGCACTGAGGGCTCTCTGCCACGTGGGGCTC
-TTTGACTTCGCCTTTTGTGCCTTGTTTGACTGCGACCGCCCTGTGGCGCAGAAGTCTTGT
-GACCTCCTTCTCTTCCTGAGGGACAAGATTGCTTCCTACAGCAGCCTGCGGGAGGCCAGG
-GGCGGCCCCAACACTGCCTCCGCAGAGGCCACCCTGCCGAGGTGGCGGGCGGGTGAGCAG
-GCCCAGCCCCCAGGGGACCAGGAGCCTGAGGCTGTGCTGGCCATGCTCAGGTCCCTAGAC
-CTGGAGGGCCTGCGGAGCACACTGGCCGAGAGCAGCGACCACGTGGAGAAGAGTCCCCAG
-TCCCTCCTGCAGGACATGCTGGCCACGGGAGGCTTCCTGCAGGGGGATGAGGCCGACTGC
-TACTGA
->ENST00000340611_homosapiens
-ATGGACCCAGAATGCGCCCAGCTGCTCCCGGCTCTCTGTGCTGTTCTGGTAGATCCCAGG
-CAGCCGGTGGCAGATGACACCTGTTTGGAGAAGCTCCTGGACTGGTTTAAAACGGTCACT
-GAAGGAGAGTCCAGTGTCGTGCTGCTGCAGGAGCACCCCTGCCTGGTGGAGCTGCTGTCC
-CATGTGCTGAAAGTCCAGGACCTGAGTTCTGGGGTCCTCTCCTTCTCACTGCGCCTGGCA
-GGAACCTTCGCAGCCCAGGAAAACTGCTTCCAGTATCTTCAGCAGGGGGAGTTACTACCA
-GGGCTCTTTGGGGAGCCAGGACCCCTCGGCCGAGCAACCTGGGCCGTCCCCACCGTGCGC
-AGCGGCTGGATCCAGGGCCTGCGCTCCCTGGCACAGCACCCCAGCGCCCTGCGCTTCCTG
-GCCGACCATGGTGCGGTCGACACCATCTTCTCCCTGCAGGGAGACTCCAGCCTGTTTGTG
-GCCTCGGCGGCCAGTCAGCTCCTGGTGCACGTCCTGGCTTTGTCCATGCGAGGTGGAGCC
-GAGGGGCAGCCCTGCCTGCCGGGGGGTGACTGGCCCGCGTGTGCCCAGAAGATCATGGAT
-CACGTTGAAGAGTCCTTGTGCTCCGCGGCCACCCCCAAGGTCACTCAGGCCCTGAACGTC
-CTGACCACGACCTTCGGGCGCTGCCAGAGCCCCTGGACGGAAGCCCTGTGGGTGCGGCTG
-AGTCCCCGCGTGGCCTGTCTGCTGGAGAGAGACCCCATCCCCGCCGCACACTCGTTCGTG
-GACCTGCTTCTCTGTGTGGCTCGTTCTCCCGTGTTCAGTTCTTCCGACGGCAGCCTGTGG
-GAGACAGTGGCGCGGGCTCTGAGCTGCCTGGGTCCCACCCACATGGGACCCCTGGCTTTG
-GGGATCCTGAAGCTCGAGCACTGTCCACAGGCACTGAGGACCCAGGCCTTCCAGGTCCTT
-CTCCAGCCCCTGGCCTGTGTCCTGAAGGCCACGGTTCAGGCCCCCGGACCCCCAGGCTTG
-CTGGACGGGACGGCAGACGATGCCACGACGGTGGACACACTCCTGGCCTCCAAGTCGTCC
-TGCGCCGGCCTCCTGTGCCGCACCCTGGCTCACCTGGAGGAGCTGCAGCCGCTGCCCCAG
-CGCCCTTCACCGTGGCCCCAGGCGTCTCTACTGGGGGCTACAGTGACTGTCCTGCGGCTC
-TGTGACGGCTCGGCTGCCCCTGCCTCCAGTGTGGGGGGCCACCTCTGTGGGACCCTGGCG
-GGCTGCGTCCGGGTCCAGCGAGCAGCCCTCGACTTCCTGGGGACGCTGTCACAGGGGACA
-GGCCCCCAGGAGCTGGTGACGCAGGCGCTTGCTGTCCTCCTGGAGTGCCTCGAGAGCCCC
-GGCTCCAGCCCCACGGTTCTGAAGAAGGCCTTCCAGGCCACGCTCAGGTGGCTCCTGAGC
-TCACCCAAGACCCCCGGCTGCTCTGATCTCGGCCCCCTCATCCCGCAGTTCCTCAGAGAG
-CTGTTCCCTGTGCTGCAGAAACGCCTGTGCCACCCCTGCTGGGAGGTGAGGGACTCCGCC
-CTCGAGTTCCTGACCCAGCTGAGCAGGCACTGGGGAGGACAGGCTGACTTCAGATGCGCA
-CTCTTGGCTTCAGAGGTGCCTCAGCTGGCCCTGCAGCTCCTCCAGGACCCTGAGAGTTAT
-GTCCGAGCGAGTGCAGTGACCGCCATGGGGCAGCTGTCCAGCCAGGGCCTGCACGCCCCC
-ACCAGCCCTGAGCATGCAGAGGCCCGGCAGAGCCTGTTCCTGGAGCTCCTGCACATCCTC
-TCCGTAGACTCGGAGGGCTTCCCACGGCGGGCGGTCATGCAAGTCTTCACTGAGTGGCTG
-CGGGACGGCCACGCCGACGCGGCCCAGGACACGGAGCAGTTCGTGGCCACTGTGCTGCAG
-GCGGCGAGCCGAGACCTGGACTGGGAGGTCCGCGCCCAGGGCCTGGAGCTGGCCCTCGTG
-TTCCTGGGCCAGACTTTGGGGCCGCCGCGTACCCACTGCCCCTATGCCGTGGCCCTACCC
-GAGGTGGCCCCAGCCCAGCCACTCACCGAGGCACTGAGGGCTCTCTGCCACGTGGGGCTC
-TTTGACTTCGCCTTTTGTGCCTTGTTTGACTGCGACCGCCCTGTGGCGCAGAAGTCTTGT
-GACCTCCTTCTCTTCCTGAGGGACAAGATTGCTTCCTACAGCAGCCTGCGGGAGGCCAGG
-GGCAGCCCCAACACTGCCTCCGCAGAGGCCACCCTGCCGAGGTGGCGGGCGGGTGAGCAG
-GCCCAGCCCCCAGGGGACCAGGAGCCTGAGGCTGTGCTGGCCATGCTCAGGTCCCTAGAC
-CTGGAGGGCCTGCGGAGCACGCTGGCCGAGAGCAGCGACCACGTGGAAAAGAGTCCCCAG
-TCCCTCCTGCAGGACATGCTGGCCACGGGAGGCTTCCTGCAGGGGGACGAGGCCGACTGC
-TACTGA
->ENST00000421712_homosapiens
-ATGGACCCAGAATGCGCCCAGCTGCTCCCGGCTCTCTGTGCTGTTCTGGTAGATCCCAGG
-CAGCCGGTGGCAGATGACACCTGTTTGGAGAAGCTCCTGGACTGGTTTAAAACGGTCACT
-GAAGGAGAGTCCAGTGTCGTGCTGCTGCAGGAGCACCCCTGCCTGGTGGAGCTGCTGTCC
-CATGTGCTGAAAGTCCAGGACCTGAGTTCTGGGGTCCTCTCCTTCTCACTGCGCCTGGCA
-GGAACCTTCGCAGCCCAGGAAAACTGCTTCCAGTATCTTCAGGTGCGGTCGACACCATCT
-TCTCCCTGCAGGGAGACTCCAGCCTGTTTGTGGCCTCGGCGGCCAGTCAGCTCCTGGTGC
-ACGTCCTGGCTTTGTCCATGCGAGGTGGAGCCGAGGGGCAGCCCTGCCTGCCGGGGGGTG
-ACTGGCCCGCGTGTGCCCAGAAGATCATGGATCACGTTGAAGAGTCCTTGTGCTCCGCGG
-CCACCCCCAAGGTCACTCAGGCCCTGA
->ENSRNOT00000064726_rattusnorvegicus
-ATGGACGCAGAATGCTCCAGGCTCCTCCCGGCTCTCTGTGCTGTTTTGGCAGATCCTAGA
-CAGCTGGTGGCAGATGACACCTGCTTGGAGAAACTACTGGACTGGTTTAAAACAGTGACA
-GAGGCAGAGCCCAGCCTCCAACTACTGCAGGACCACCCCTGCCTAATGGAGCTCCTGTCC
-CATGTGCTGAAGCCACAGGATGTGAGCCCTAGGGTCCTCTCCTTTGCTCTGCGCCTCGTT
-GGGGTCTTTGCGGCCCAGGAGGACTGTTTCCAGTACCTTCAGCAGGGGGAGTTGTTGCTG
-GGGCTCTTTGGGGAGACAGGTGCCCTTAGCTGGGCAGCCTGGAGCATCCCCAGTGTGCGC
-AGCGGCTGGATCCAGGGCCTGTGCTCCCTGGCACACCACCCCAGTGCCCTGCACTTCCTG
-GCTGACAGTGGTGCTGTGGACACGATCTTCTCCTTGCAAGGAGACCCCAGCCTGTTTGTA
-GCCTCAGCAGCCAGCCAGCTCCTAGTACACATCCTGGCTCTGTCAATGCAAGGCGGAGCT
-CCAGGGTCCCCCGTCCCTGAAGCCGTTGCCTGGCCTGTCTGTGCCCAGAAGATCATGAAC
-CATGTAGAAGAGTCCTTGCATTCCAAAGCCACCCCACAGGTCACACAGGCCTTGAATGTC
-CTGACGACGACCTTCGGGCGCTGCCACAACCCCTGGACAGGGGTCCTCTGGGAGCGGCTA
-AGTCCCCCTGTTGCCCGCCTGTTTGAGAGAGACCCCATTCCTGCCACACACTCGCTCATG
-GACCTGCTTCTCAGTGTGGCCAGGTCTCCTGTGTTGAACTTTGCAGCCTGTGGCCTGTGG
-GAGATGCTGGCCCAGACTCTGAGCCGCCTGAGCCCCACCCAAGCTGGGCCTCTAGCTCTG
-GGGACCCTGAAACTTCAGCATTGTCCCCAGGAACTGAGGACCCAGGCCTTTAGAGTCCTC
-CTTCAGCCACTGGCCTGCATCCTGAAAGCTACCACTCAGGCCCCTGGACCTCCAGGCTTG
-CTGGACGGGACTGCGGGTAGCTTGCTGACTGTGGATGCACTCTTATCTTCAAAGTCGGCC
-TGTGTGGGGCTCCTCTGCCAGACTCTGGCGCACCTGGAGGAGCTGCAGATGCTGCCCCAG
-TGCCCCTCACCGTGGCCACAGGTGCCTCTGCTGCAAGCTGCTGTGACGATATTGCGTCTC
-TCTGACGGCTCGGCGGACCCCAGTTCCAGTGCAGGAGGCCGTCTCTGTGGGGCGCTGGGT
-GGCTGTGTTCGTGTCCAGCGAGCAGCCCTTGACTTCTTGGGGACGCTGTCTCTGGGGACA
-AGCCCCCTGGAATTGGTGCTGGAGGTATTTGCTGTCCTCCTGAAGACCCTGGAGAGCCCA
-GAGTCCAGCCCCATGGTCCTAAAGAAGGCCTTCCAGGCCACACTCAGATGGCTCCAGAGC
-CCACACAAGACCCCCAGCGGCTCTGATCTCAGCCCCGATGCCTTGCTGTTCCTCGGAGAG
-CTATTCCCCATACTACAGAAGCGCCTGTGCAGCCCGTGTTGGGAGGTGAGGGACTCAGCC
-CTGGAGTTCCTGACGCATCTGATCCGGGACTGGGGAGGGCAGGCTGACTTCAGAGAGGCA
-CTGCATTCTTCAGAAGTACCCACACTTGCCCGCCAGCTCCTCCAAGACCCTGAGAGTTAT
-GTCCGAGCAAGTGCAGTGGGTGCCGCTGGGCAGCTCTCCAGCCAGGGCCTTCAGGCCACT
-CCCGCCAACCAGCAGGGCCTACTCATGGACCTCATGCATATCCTGTCCACGGACTCAGAG
-GGCTTCCCTCGAAGAGCTGTGTTACGGGTCTTTACTGAATGGCTGAGGGATGGCCATGCT
-GATGTGGTTCGAGACACAGAGTGGTTCGTGGCCACTGTTCTCCAGGCAGTGAGCCGGGAT
-CTGGACTGGGAGGTCCGAGTGCAGGGCTTGGAGCTGGCACAGGTATTCCTCATCCAGGCA
-ATGGGGCAGCCTAGACTCCACTGTCCCTATACAGTAGGCCTGCCTGGGGCCACCTCTTCC
-CGCCCACACCTGGAATTCTTGCAGACTCTCTGCCGTCTGCCACTCTTTGAGTTTGCCTTT
-TGTGCCTTGCTTGACTGTGACCGCCCGGTGGCCCAAAAAGCCTGTGACCTGCTCCTCTTC
-TTGAGGGACAAGACAGTTTCCTGCAGTAACCCTCAGGAGGCCGGGGACAGCCCCAACTCA
-GCCTCAGTGGAGGCTGCCCTGCAGAGGTGGCGGGAAGGTGAGCAGGCTCAGCCCCTAGGG
-GACCTGGAGCCTGAAGCCATGCTGGCCATCCTCAGGTCCTTAGACCTGGAGGGCCTGCAG
-GGCAGGCTGGCCAAGAGCAGTGACCATGTGGAGAAGAGCCCACAGTCCCTGCTGCAGGAC
-ATGCTGGCCACGGTGGGCGTGTTGGAGGAGAATGAAGCTGACTGCTACTAA
->ENSMUST00000041588_musmusculus
-ATGGACCCAGAATGCTCCAGGCTCCTCCCGGCTCTCTGTGCTGTTTTGGCAGATCCCAGA
-CAGCTGGTGGCAGATGACACCTGCTTGGAGAAACTGCTGGACTGGTTTAAAACAGTGACA
-GAGGCAGAGTCTAGCCTCCAACTACTACAGGACCATCCCTGCTTAATGGAGCTCCTGTCC
-CATGTGCTGAAGCCACAGGACGTGAGCCCTAGGGTCCTCTCCTTTGCTCTGCGCCTTGTT
-GGGGTCTTCGCAGCCCAGGAAGACTGTTTTGAGTACCTTCAGCAGGGAGAGTTGTTGCTG
-GGGCTCTTTGGGGAGTCAGGTGCCCCCGGCTGGGCAGCCTGGAGCATCCCAAGTGTGCGC
-AGCGGCTGGATCCAGGGTCTGTGCTACCTGGCACACCACCCTAGCGCCCTGCACTTCCTG
-GCTGACAGTGGTGCTGTGGACACGCTCTTCTCCTTGCAGGGAGACCCCAGCCTGTTCGTC
-GCCTCAGCAGCCAGCCAGCTCCTAGTACATATCCTGGCTCTGTCCATGCAAGGTGGAGCC
-CCAGGGTCCCCCGTCCCTGAAGCTGCTGCTTGGCCTATGTGTGCCCAGAAGATTGTGAAC
-CATGTGGATGAGTCCCTGCATGCCAAAGCCACCCCCCAGGTCACACAGGCCTTGAATGTC
-CTGACTACGACCTTCGGGCGCTGCCATAACCCCTGGACAGGGGTCCTCTGGGAGCGGCTA
-AGTCCCCCTGTTGCCCGCCTGTTTGAGAGAGACCCCATTCCAGCCGTGCACGCGCTCATG
-GACCTTCTTCTTAGTGTGGCCAGGTCGCCTGTGTTGAATTTTGCAGCCTGTGGCCTGTGG
-GAGATGCTGGCCCAGACTCTGAGCCGCCTGAGCCCCATACAAGCTGGGCCTCTAGCCCTG
-GGGACCCTGAAACTTCAGCACTGTCCCCAGGAATTGAGGACCCAGGCCTTTGGAGTCCTC
-CTACAGCCACTGGCCTGTATCCTGAAAGCTACCACTCAGGCCCCTGGACCTCCAGGCTTG
-CTGGATGGGACTGTGGGTAGCTTGCTGACTGTGGATATACTCTTGGCTTCAAAGTCAGCC
-TGTGTGGGACTCCTTTGCCAGACTCTGGCTCACCTGGAGGAGCTGCAGATGCTGCCCCAG
-TGCCCCTCACCCTGGCCACAGGTGCATCTGCTGCAAGCTGCTTTGACTATATTGCATCTC
-TGTGATGGCTCAGCGGACCCCAGCTCCAGTGCAGGAGGCCGTCTCTGTGGGACTCTGGGT
-GGCTGTGTTCGTGTCCAGCGAGCAGCCCTTGACTTCTTGGGGACCCTGTCTCAGGGGACA
-AGCCCCCTGGAGTTGGTTCTGGAGGTATTTGCTGTTCTCCTGAAGACCCTGGAGAGCCCA
-GAGTCCAGCCCCATGGTCCTAAAGAAGGCCTTCCAGGCCACACTCAGATGGCTCCAGAAC
-CCACACAAGACCCCCAGCAGCTCTGATCTCAGCTCCGACGCCCTGCTGTTTCTCGGAGAG
-CTGTTCCCCATACTACAGAAGCGCCTATGCAGCCCATGTTGGGAGGTGAGGGACTCTGCC
-CTGGAGTTCCTGACGCATCTGATCCGACACTGGGGAGGGCAGGCTGACTTCAGAGAGGCA
-CTGCGTTCCTCAGAAGTACCCACACTTGCCCTCCAGCTTCTCCAAGACCCAGAGAGTTAC
-GTCCGAGCAAGTGCCGTGGGTGCCGCTGGGCAGCTCTCCAGCCAGGGTCTGCAGGCCGCT
-CCCGCTAGCCCCGAGAACTCGCAGGCCCAACAGGGCCTACTCATGGACCTTATGCATATC
-CTGTCCACTGACTCAGAGGGCTTCCCTCGAAGGGCTGTGTTACGGGTCTTCACGGACTGG
-CTGAGGGATGGCCATGCTGACGTGGTTCGAGACACGGAGTGGTTCGTGGCCACTGTTCTC
-CAGGCAGTGAGCCGGGATCTGGACTGGGAGGTCCGAGTGCAGGGTTTGGAGCTGGCACGG
-GTGTTCCTCACCCAGGCACTGGGCCAGCCCAGCCTCCACTGTCCCTATACAGTGGGCCTG
-CCCAGGGCCTCCTCTCCCCGCCCACACCCGGAATTCTTGCAGACTCTCTGCCGTCTGCCG
-CTCTTTGAGTTTGCCTTTTGTGCCTTGCTTGACTGTGACCGACCGGTGGCCCAAAAGGCC
-TGTGACCTGCTCCTCTTCTTGAGGGACAAGACAGTTCCCTGCAGTAGCCCTCGGGAGGCA
-GGGGACAGCCCCAACTCAGCCTCAGTGGAGGCTGCCCTGCAGAGGTGGCGGGAAGGAGAG
-CAGGCCCAGCCCCTAGGGGACCTGGATCCTGAGGCCATGCTAGCCATCCTCAGGGCCTTA
-GACCTGGAGGGCCTGCAGGGCAGGCTGGCCAAGAGCAGCGACCATGTGGAGAAGAGCCCA
-CAGTCCCTGCTGCAGGACATGCTGGCCACGGTGGGTGTGTTGGAGGAGAACGAAGCTGAC
-TGCTACTAA
->ENSMUST00000153440_musmusculus
-ATGGACCCAGAATGCTCCAGGCTCCTCCCGGCTCTCTGTGCTGTTTTGGCAGATCCCAGA
-CAGCTGGTGGCAGATGACACCTGCTTGGAGAAACTGCTGGACTGGTTTAAAACAGTGACA
-GAGGCAGAGTCTAGCCTCCAACTACTACAGGACCATCCCTGCTTAATGGAGCTCCTGTCC
-CATGTGCTGAAGCCACAGGACGTGAGCCCTAGGGTCCTCTCCTTTGCTCTGCGCCTTGTT
-GGGGTCTTCGCAGCCCAGGAAGACTGTTTTGAGTACCTTCAGCAGGGAGAGTTGTTGCTG
-GGGCTCTTTGGGGAGTCAGGTGCCCCCGGCTGGGCAGCCTGGAGCATCCCAAGTGTGCGC
-AGCGGCTGGATCCAGGGTCTGTGCTACCTGGCACACCACCCTAGCGCCCTGCACTTCCTG
-GCTGACAGTGGTGCTGTGGACACGCTCTTCTCCTTGCAGGGAGACCCCAGCCTGTTCGTC
-GCCTCAGCAGCCAGCCAGCTCCTAGTACATATCCTGGCTCTGTCCATGCAAGGTGGAGCC
-CCAGGGTCCCCCGTCCCTGAAGCTGCTGCTTGGCCTATGTGTGCCCAGAAGATTGTGAAC
-CATGTGGATGAGTCCCTGCATGCCAAAGCCACCCCCCAGGTCACACAGGCCTTGAATGTC
-CTGACTACGACCTTCGGGCGCTGCCATAACCCCTGGACAGGGGTCCTCTGGGAGCGGCTA
-AGTCCCCCTGTTGCCCGCCTGTTTGAGAGAGACCCCATTCCAGCCGTGCACGCGCTCATG
-GACCTTCTTCTTAGTGTGGCCAGGTCGCCTGTGTTGAATTTTGCAGCCTGTGGCCTGTGG
-GAGATGCTGGCCCAGACTCTGAGCCGCCTGAGCCCCATACAAGCTGGGCCTCTAGCCCTG
-GGGACCCTGAAACTTCAGCACTGGCTTGCTGGATGGGACTGTGGGTAG
->ENSMUST00000110806_musmusculus
-ATGGACCCAGAATGCTCCAGGCTCCTCCCGGCTCTCTGTGCTGTTTTGGCAGATCCCAGA
-CAGCTGGTGGCAGATGACACCTGCTTGGAGAAACTGCTGGACTGGTTTAAAACAGTGACA
-GAGGCAGAGTCTAGCCTCCAACTACTACAGGACCATCCCTGCTTAATGGAGCTCCTGTCC
-CATGTGCTGAAGCCACAGGACGTGAGCCCTAGGGTCCTCTCCTTTGCTCTGCGCCTTGTT
-GGGGTCTTCGCAGCCCAGGAAGACTGTTTTGAGTACCTTCAGCAGGGAGAGTTGTTGCTG
-GGGCTCTTTGGGGAGTCAGGTGCCCCCGGCTGGGCAGCCTGGAGCATCCCAAGTGTGCGC
-AGCGGCTGGATCCAGGGTCTGTGCTACCTGGCACACCACCCTAGCGCCCTGCACTTCCTG
-GCTGACAGTGGTGCTGTGGACACGCTCTTCTCCTTGCAGGGAGACCCCAGCCTGTTCGTC
-GCCTCAGCAGCCAGCCAGCTCCTAGTACATATCCTGGCTCTGTCCATGCAAGGTGGAGCC
-CCAGGGTCCCCCGTCCCTGAAGCTGCTGCTTGGCCTATGTGTGCCCAGAAGATTGTGAAC
-CATGTGGATGAGTCCCTGCATGCCAAAGCCACCCCCCAGGTCACACAGGCCTTGAATGTC
-CTGACTACGACCTTCGGGCGCTGCCATAACCCCTGGACAGGGGTCCTCTGGGAGCGGCTA
-AGTCCCCCTGTTGCCCGCCTGTTTGAGAGAGACCCCATTCCAGCCGTGCACGCGCTCATG
-GACCTTCTTCTTAGTGTGGCCAGGTCGCCTGTGTTGAATTTTGCAGCCTGTGGCCTGTGG
-GAGATGCTGGCCCAGACTCTGAGCCGCCTGAGCCCCATACAAGCTGGGCCTCTAGCCCTG
-GGGACCCTGAAACTTCAGCACTGTCCCCAGGAATTGAGGACCCAGGCCTTTGGAGTCCTC
-CTACAGCCACTGGCCTGTATCCTGAAAGCTACCACTCAGGCCCCTGGACCTCCAGGCTTG
-CTGGATGGGACTGTGGGTAGCTTGCTGACTGTGGATATACTCTTGGCTTCAAAGTCAGCC
-TGTGTGGGACTCCTTTGCCAGACTCTGGCTCACCTGGAGGAGCTGCAGATGCTGCCCCAG
-TGCCCCTCACCCTGGCCACAGGTGCATCTGCTGCAAGCTGCTTTGACTATATTGCATCTC
-TGTGATGGCTCAGCGGACCCCAGCTCCAGTGCAGGAGGCCGTCTCTGTGGGACTCTGGGT
-GGCTGTGTTCGTGTCCAGCGAGCAGCCCTTGACTTCTTGGGGACCCTGTCTCAGGGGACA
-AGCCCCCTGGAGTTGGTTCTGGAGGTATTTGCTGTTCTCCTGAAGACCCTGGAGAGCCCA
-GAGTCCAGCCCCATGGTCCTAAAGAAGGCCTTCCAGGCCACACTCAGATGGCTCCAGAAC
-CCACACAAGACCCCCAGCAGCTCTGATCTCAGCTCCGACGCCCTGCTGTTTCTCGGAGAG
-CTGTTCCCCATACTACAGAAGCGCCTATGCAGCCCATGTTGGGAGGTGAGGGACTCTGCC
-CTGGAGTTCCTGACGCATCTGATCCGACACTGGGGAGGGCAGGCTGACTTCAGAGAGGCA
-CTGCGTTCCTCAGAAGTACCCACACTTGCCCTCCAGCTTCTCCAAGACCCAGAGAGTTAC
-GTCCGAGCAAGTGCCGTGGGTGCCGCTGGGCAGCTCTCCAGCCAGGGTCTGCAGGCCGCT
-CCCGCTAGCCCCGAGAACTCGCAGGCCCAACAGGTAGACACAGGGAGTTGGTGA
->ENSMUST00000100505_musmusculus
-ATGGTGCATTTTGCACTCTCGGGCCTAATTCCCGTAGCGGAGGGATGCGGGGGCGGGATT
-AGAACCCCTAGGCTAACTCGCAGTCGCCGAGAGCGCACCTCTTACCCGGATTTGGGAGGA
-ACTGCCTGCCTGATCATGGACCCAGAATGCTCCAGGCTCCTCCCGGCTCTCTGTGCTGTT
-TTGGCAGATCCCAGACAGCTGGTGGCAGATGACACCTGCTTGGAGAAACTGCTGGACTGG
-TTTAAAACAGTGACAGAGGCAGAGTCTAGCCTCCAACTACTACAGGACCATCCCTGCTTA
-ATGGAGCTCCTGTCCCATGTGCTGAAGCCACAGGACGTGAGCCCTAGGGTCCTCTCCTTT
-GCTCTGCGCCTTGTTGGGGTCTTCGCAGCCCAGGAAGACTGTTTTGAGTACCTTCAGCAG
-GGAGAGTTGTTGCTGGGGCTCTTTGGGGAGTCAGGTGCCCCCGGCTGGGCAGCCTGGAGC
-ATCCCAAGTGTGCGCAGCGGCTGGATCCAGGGTCTGTGCTACCTGGCACACCACCCTAGC
-GCCCTGCACTTCCTGGCTGACAGTGGTGCTGTGGACACGCTCTTCTCCTTGCAGGGAGAC
-CCCAGCCTGTTCGTCGCCTCAGCAGCCAGCCAGCTCCTAGTACATATCCTGGCTCTGTCC
-ATGCAAGGTGGAGCCCCAGGGTCCCCCGTCCCTGAAGCTGCTGCTTGGCCTATGTGTGCC
-CAGAAGATTGTGAACCATGTGGATGAGTCCCTGCATGCCAAAGCCACCCCCCAGGTCACA
-CAGGCCTTGAATGTCCTGACTACGACCTTCGGGCGCTGCCATAACCCCTGGACAGGGGTC
-CTCTGGGAGCGGCTAAGTCCCCCTGTTGCCCGCCTGTTTGAGAGAGACCCCATTCCAGCC
-GTGCACGCGCTCATGGACCTTCTTCTTAGTGTGGCCAGGTCGCCTGTGTTGAATTTTGCA
-GCCTGTGGCCTGTGGGAGATGCTGGCCCAGACTCTGAGCCGCCTGAGCCCCATACAAGCT
-GGGCCTCTAGCCCTGGGGACCCTGAAACTTCAGCACTGTCCCCAGGAATTGAGGACCCAG
-GCCTTTGGAGTCCTCCTACAGCCACTGGCCTGTATCCTGAAAGCTACCACTCAGGCCCCT
-GGACCTCCAGGCTTGCTGGATGGGACTGTGGGTAGCTTGCTGACTGTGGATATACTCTTG
-GCTTCAAAGTCAGCCTGTGTGGGACTCCTTTGCCAGACTCTGGCTCACCTGGAGGAGCTG
-CAGATGCTGCCCCAGTGCCCCTCACCCTGGCCACAGGTGCATCTGCTGCAAGCTGCTTTG
-ACTATATTGCATCTCTGTGATGGCTCAGCGGACCCCAGCTCCAGTGCAGGAGGCCGTCTC
-TGTGGGACTCTGGGTGGCTGTGTTCGTGTCCAGCGAGCAGCCCTTGACTTCTTGGGGACC
-CTGTCTCAGGGGACAAGCCCCCTGGAGTTGGTTCTGGAGGTATTTGCTGTTCTCCTGAAG
-ACCCTGGAGAGCCCAGAGTCCAGCCCCATGGTCCTAAAGAAGGCCTTCCAGGCCACACTC
-AGATGGCTCCAGAACCCACACAAGACCCCCAGCAGCTCTGATCTCAGCTCCGACGCCCTG
-CTGTTTCTCGGAGAGCTGTTCCCCATACTACAGAAGCGCCTATGCAGCCCATGTTGGGAG
-GTGAGGGACTCTGCCCTGGAGTTCCTGACGCATCTGATCCGACACTGGGGAGGGCAGGCT
-GACTTCAGAGAGGCACTGCGTTCCTCAGAAGTACCCACACTTGCCCTCCAGCTTCTCCAA
-GACCCAGAGAGTTACGTCCGAGCAAGTGCCGTGGGTGCCGCTGGGCAGCTCTCCAGCCAG
-GGTCTGCAGGCCGCTCCCGCTAGCCCCGAGAACTCGCAGGCCCAACAGGGCCTACTCATG
-GACCTTATGCATATCCTGTCCACTGACTCAGAGGGCTTCCCTCGAAGGGCTGTGTTACGG
-GTCTTCACGGACTGGCTGAGGGATGGCCATGCTGACGTGGTTCGAGACACGGAGTGGTTC
-GTGGCCACTGTTCTCCAGGCAGTGAGCCGGGATCTGGACTGGGAGGTCCGAGTGCAGGGT
-TTGGAGCTGGCACGGGTGTTCCTCACCCAGGCACTGGGCCAGCCCAGCCTCCACTGTCCC
-TATACAGTGGGCCTGCCCAGGGCCTCCTCTCCCCGCCCACACCCGGAATTCTTGCAGACT
-CTCTGCCGTCTGCCGCTCTTTGAGTTTGCCTTTTGTGCCTTGCTTGACTGTGACCGACCG
-GTGGCCCAAAAGGCCTGTGACCTGCTCCTCTTCTTGAGGGACAAGACAGTTCCCTGCAGT
-AGCCCTCGGGAGGCAGGGGACAGCCCCAACTCAGCCTCAGTGGAGGCTGCCCTGCAGAGG
-TGGCGGGAAGGAGAGCAGGCCCAGCCCCTAGGGGACCTGGATCCTGAGGCCATGCTAGCC
-ATCCTCAGGGCCTTAGACCTGGAGGGCCTGCAGGGCAGGCTGGCCAAGAGCAGCGACCAT
-GTGGAGAAGAGCCCACAGTCCCTGCTGCAGGACATGCTGGCCACGGTGGGTGTGTTGGAG
-GAGAACGAAGCTGACTGCTACTAA
->ENSCAFT00000025950_canisfamiliaris
-ATGGACCCAGAGTGCTCCCAGCTCCTCCCGGCCCTCTGTGCAGTTCTGGCAGACCCCAGG
-CAGCCCGTGGCAGATGACACCTGTTTGGAGAAGCTGCTGGATTGGTTTAAAACGATAACC
-AAAGCTGGGTCCAGTCTCCTGTTATTACAGGAGAACCCCTGTCTGGTGGAGCTGCTGTGT
-CACGTGCTGAAACCCCAGGACCTGAGTTCCAGAGTCCTCTCCTTCTCTCTCCGCCTCGCA
-GGGGTATTTGCAGCCCAGGAAGATTGCTTCCAGTATCTTCAGCAGGGGGAGTTGCTGCCC
-AGGCTCTTTGGGGAGCCAGGGCCCCTGGGAGGAGCTGCCTGGACTGCCCCCTCAGTGCGC
-AGTGGCTGGATCCAGGGCCTGCGCTCCCTGGCACAGCATCCTAGTGCCCTGCATTTCCTG
-GCTGACTGTGGTGCCGTTGACACCATCTTCTCCCTGCAGGGAGATTCCAGCCTGTTTGTG
-GCCTCGGCAGCTGGGCAGCTCCTGGTGCACATCCTGGGCTTGTCCATGCAAGGCCTAGCC
-GAGGGACACCCCAGCCTGCAGGCTGGTGATTGGCCAGTGTGTGCCCAGAAGATCGTGGGT
-CACATAGAAGAGTCCCTGCACTCCACAGCCGTCCCGCAGATCACACAGGCTCTAAACGTC
-CTGACTACCACGTTCGGGCACTGCCATGACCCTTGGACACAAGTTCTGTGGGTACGGCTG
-AGTCCCCTAGTAGGCAGTCTACTTGAGAAAGACCCTGTCCCAGCTGCACACTCGCTCGTG
-GACCTCCTCCTCAGTGTGGCCCGTTCTCCTGGGCTGAGCTCTTCTAGCTGCGGCCTGTGG
-GAGACTCTGGCTCAGACTCTGAACCATCTGAGCCCTACCCAAGCAGGGCCGCTGGCGTTA
-GGGATCCTGAAACTGCAGGACTGTCCACAGGTGCTAAGGGCCCAGGCCTTTGTCATTCTT
-CTCCAGCCTCTGGCCTGCGTCCTTAAAGCCACGGGTCAGGACCCCGGACCCTCAGGTGTG
-CTGGACAGTGCCACAGGTGACTCTCTGACAGTGGACGTGCTCCTCTCCTCCAAGGCGGCC
-TGTGTGGGTCTCCTGTGCCGGACTCTGGCCCACCTGGAGCTGCTGCAGCCGCTACCCCAG
-CGCCCCTGCCCCTGGCCTCAGGAGCCCCTGCTTGGGGCCGCGGTGACCCTGCTGCAGTTA
-TGCAGGGGCTCAGCAAGCCCTGCCTCTGACGTGGGGCGCCACCTCTGCGCGCTCCTGCTG
-GGCTGCGTGCGGGTGCAGCGAGCGGCCCTGGATTTCCTGGGGACGCTGTCTCAGGGGACA
-GGCCCCCAAGAGCTGGTGACGGAGGTGTTTGCTGTCCTTCTGGAATATCTCAGGAGCCCA
-GACTCCAGCCCCACGGTTCTGAAGAAAGCCTTCCAGGCCACATTCAGGTGGCTCCTGAGC
-TCACCCAAGACCCCCGGCTGCTGTGATCTAGAACCCCATGCCCTGCTGGTCCTGAGAGAG
-CTGCTTCCTGTGCTGCAGAAGCGTCTGTGCAGCCCCTGCTGGGAGGTGAGGGACTCCGGC
-CTCGAGTTCCTGACTCAGATGACCAGACACTGGGGAGGGCAGGCTGGCTTCAGACATGCA
-CTCCTCGCTTCGGAGGTGCCCAAGCTTACCGAGCAGCTCCTACGAGACCCTGAGAGTTAC
-GTCCGTGCCAGTGCAGTGACCGTCATGGGGCAGCTCTCCAGCCAGGGGCTGCATGTCACC
-CCTGTGAGCCCTGAGCATCCAGGGGGCCAGCAGAAGAGTCTGCTCGTGGAGCTTCTGCAT
-ATCCTCTCCACAGATTCAGAGGGATTCCCGCGGAGAGCCGTCATGCAGGTCTTCACCCAG
-TGGCTGAGGGACCACCATGCCGACGTGGCGGGGGACACGGAACAGTTTATGGCCAGGGTG
-CTCCAGGTCGCCAGCCAGGATCTGGACTGGGAGGTCCGGGCCCAGGGCCTGGAGCTGGCG
-CTGGTATTCCTGGAGCAGACGCTGGGCCAGTTCCACTCCCACTGTCCCTATGCTGTGACC
-CCACCCGTGGCGGCCCCAGCTGGCTCGCTGGCCCAGGCCCTGCAGCCACTATGCCGAGTG
-CGGCTCTTTGAGTTTGCCTTCCGTGCCTTGTTTGACTGTGACCGACCTGTGGCTCAGAAG
-TCCTGTGATCTCCTCCTCTTCCTGAGGGCCAAGACTGCTTCTTCCTCTGGTAGCCTGGAG
-GAGTCCAGGAGCGGCCCAGATGTGGCCTCTGTGGAGGCTGCCTTGCAGAGGTGGCAGGCA
-GGTGATCAGGGCCAGCCCCTGGGGGACCTGGAGCCCGAGGTCGTGCTGGCTGTGCTGAGG
-TCTGTGGACCTGGAAGGCCTTCGGGGTGCATTAGCCGAGGGCAGTGACCACATGGAGAAG
-AGCCCTCAGTCACTCCTGCAGGACATGCTGGCCACGGTGGGCGTCCTGGGAGAGAACGAG
-GCCGACTGCTACTGA
->ENSSSCT00000008295_susscrofa
-ATGGACCCGGAGTGCTCCCGGCTCCTCCCGGCTCTCTGTGCCGTCCTGGCAGACCCCCGG
-CAGCCTGTGGCAGATGATACTTGCTTGGAGAAGCTGCTGGACTGGTTTAAAACAATAACT
-GAAGCAGGGTCCAGTCTCCTGGTGCTACAGGAAAATCCCTGCCTGGTGGAGCTGCTGTTC
-GACGTGCTGAAACCCCAGGACCTGAGTCCCAGAGTCCTCTCCTTCTCACTCCGCCTCGCA
-GGCATGTTCGCAGCCCAGGAAGACTGCTTCCAGTACCTTCAGCAGGGGGAGTTGCTGCCC
-AGGCTGTTTGGGGAGGCGGGCCCCCTGGGAGGAGCGGCCTGGACGGCCCCGACCGTGCGC
-AGCGGCTGGATCCAGGGCCTGCGCTCCCTGGCGCAGCACCCTCGCGCCCTGCCCTTCCTT
-GCCGACTGTGGTGCCGTTGACACCATCTTCTCCCTGCAGGGAGATTCCAGCCTGTTTGTG
-GCCTCGGCAGCCGGGCAGCTCCTGGTGCACATCCTGGACTTGGCGATGCGAGCCCCGCCC
-CGGGGACACCCCGGCCCGCAGGCGTGTGACGGGCCAGCGTGCGCCCAGAAGATCGTGTGT
-CACCTCGAAGACTCCCTGCGCGCCGCAGCCGCCCCGCAGCTCACGCAGGCCCTGAATGTC
-CTGACCACCACGTTCGGGCACTGCCACGGCCTTTGGACGCCGGGCCTTTGGGGGCGGCTG
-AGCCCTCTTGTGGGGCACCTGCTCGAGAAAGACCCCGTCCCAGCCTCGCACGCGCTCGTG
-GACCTCCTCCTCAGCGTGGCCCGGTCCCCTGTGCTGAGTTCTGAGAGTGGCCCGTGGGAG
-ACTTTGGCGCTGACTCTGAGCCGCTTGAGCCCGATGCAAGCAGGGCCTCTGGCTTTGGGG
-ATCCTGAAGCTGCAGGACTGCCCACAGGCCTTGAGGACCCAGGCCTCTGGCGTCCTCCTC
-CAGCCCCTGGCCTGTGTCCTGAAAGCTGCTGTGCAGGGCCCCGGACGCCCAGGTAGGCTG
-CTGGGGAAGGGGGGCAGGTGCAGGATGGCAGGACCGTGGGGGCCTGAGCGCATCCTTGGG
-GCCGGCGCAGGCTGTCATCCCAGGTGTGACTGCTGCTCCTGTTGCCACCCTGGAANCAGT
-GCCCTTGGCCTGGCCCAAGAGGCCCGCCTGAGGCTGTGTGACAATGCTGCGATCCCCCGC
-TCTGACCTGGGGGGCCAATTCTGTGGCCACCTGGTGGCCTGTGTCCGAGTCCAGCGAGCG
-GCCCTGGATTTCCTGGGGACGCTGTCTCAGAGGGCGGGCCCCCAAGAGCTGGTGACGCAG
-GTTTCTGCTGTCCTCCTGGAGTACCTTTCAGGCCCTGACTCCAGCCCCACGGTTCTGAAG
-AAGGCCTTCCAGGCCTCACTCGGGTGGCTCCTGAGCTCACCCAAGACCCCCGGCTGCTGC
-GATCTGGACCCCCACGCCCAGCAGTTCCTCAGAGAGCTGCTCCCTGTGCTGCAGAAGCGC
-CTGTGCAGCCCCTGCTGGGAGGTGAGGGACTCAGGCCTTGAGTTCCTGACCCAGATGGCC
-AGACACTGGGGAGGGCAGGCCGCCTTCAGACAGGTGCTCCTTGCTTCCGAGGTGCCCAGG
-CTCACCAGGCAGCTCCTGCAAGACCCCGAGAGTTACGTCCGCGCAAGCGCAGTGACCGCC
-ACAGGGCAGCTGTCTAGCTGGGGGCTGCATGCTGCCCCCGCCGGCCCTGAGCACCCAGGG
-GTCCAGCAGAAGAGCCTCCTGTCGGAGCTCCTGCACGTCCTCGCCACAGACTCGGAGGGC
-TTCCCCCGGAGGGCCGTCATGCAGGTCTTCACCGAGTGGCTGAGGGGCGGCCATGCTGAC
-GTGGCCGAGGACCCAGAGCAGTTTGTGGCCGGAGTGCTCCAGGCCGCGAGCAGGGACCTG
-GACTGGGAGGTCCGGGCCCAGGGCCTCGAGCTGGCGCTGGTGTTCCTGGAGCAGCTGCTG
-GGCCCGCCCGGCGTGCGCTGTCCCTACGCCGTGGCCCTGCCCAAGGCAGCCCCGCCTGGC
-ACGCTGGCCCAGGCCTTGCAGGCACTGTGCCGAGTGCAGCTCTTCGAGTTCGCCTTCCGT
-GCCTTGTTCGACTGCGACCGACCTGTGGCGCAGAAGTCCTGTGACCTCCTCCTCTTCCTG
-AAGGCCAAGGCCACTTCCTGCGGCACCCCCCAGGAGGAACGGGACAGCCCCGACGTGTCC
-TCCGTGGAGGCCACACTGCAGAAGTGGCAGGCAGGGGAGCACGGACACCCCCTGGGGGAC
-CTGGAGCCCGCGGCTGTTGTGGCCGTGCTCAGGTCCATGGACTTGGAAGGCCTTCAGGAC
-ACACTGGCCGAGAGCAGTGACCACGTGGAGAGGAGCCCCCAGTCGCTCCTGCAGGACATG
-CTGGCCACCGTGGGCGTCCTCGGGGAGAATGAGGCCGACTGCTACTGA
->ENSPTRT00000019089_pantroglodytes
-ATAGGCACCGGGGGCCGGCGGGGGGCGGCGGCCGCGCCGCTGCTGGTGGCGGTGGCCGCG
-CTTCTACTGGGCGCCGCGGGCCACCTGTACCCCGGAGAGGTGTGTCCCGGCATGGATATC
-CGGAACAACCTCACTAGGTTGCATGAGCTGGAGAATTGCTCTGTCATCGAAGGACACTTG
-CAGATACTCTTGATGTTCAAAACGAGGCCCGAAGATTTCCGAGACCTCAGTTTCCCCAAA
-CTCATAATGATCACTGATTACTTGCTGCTCTTCCGGGTCTATGGGCTCGAGAGCCTGAAG
-GACCTGTTCCCCAACCTCACGGTCATCCGGGGGTCACGACTGTTCTTTAACTACGCGCTG
-GTCATCTTCGAGATGGTTCACCTCAAGGAACTCGGCCTCTACAACCTGATGAACATCACC
-CGGGGTTCTGTCCGCATCGAGAAGAACAATGAGCTCTGTTACTTGGCCACTATCGACTGG
-TCCCGTATCCTGGATTCCGTGGAGGATAATTACATCGTGTTGAACAAAGATGACAACGAG
-GAGTGTGGAGACATCTGTCCGGGTACCGCGAAGGGCAAGACCAACTGCCCCGCCACCGTC
-ATCAACGGGCAGTTTGTCGAACGATGTTGGACTCACAGTCACTGCCAGAAAGTTTGCCCG
-ACCATCTGTAAGTCACACGGCTGCACCGCCGAAGGCCTCTGTTGCCACAGCGAGTGCCTG
-GGCAACTGTTCTCAGCCCGACGACCCCACCAAGTGCGTGGCCTGCCGCAACTTCTACCTG
-GACGGCAGGTGTGTGGAGACCTGCCCGCCCCCGTACTACCACTTCCAGGACTGGCGCTGT
-GTGAACTTCAGCTTCTGCCAGGACCTGCACCACAAATGCAAGAACTCGCGGAGGCAGGGC
-TGCCACCAGTACGTCATTCACAACAACAAGTGCATCCCTGAGTGTCCCTCCGGGTACACG
-ATGAATTCCAGCAACTTGCTGTGCACCCCATGCCTGGGTCCCTGTCCCAAGGTGTGCCAC
-CTCCTAGAAGGCGAGAAGACCATCGACTCGGTGACGTCTGCCCAGGAGCTCCGAGGATGC
-ACCGTCATCAACGGGAGTCTGATCATCAACATTCGAGGAGGCAACAATCTGGCAGCTGAG
-CTAGAAGCCAACCTCGGCCTCATTGAAGAAATTTCAGGGTATCTAAAAATCCGCCGATCC
-TACGCTCTGGTGTCACTTTCCTTCTTCCGGAAGTTACGTCTGATTCGAGGAGAGACCTTG
-GAAATCGGGAACTACTCCTTCTATGCCTTGGACAACCAGAACCTAAGGCAGCTCTGGGAT
-TGGAGCAAACACAACCTCACCATCACTCAGGGGAAACTCTTCTTCCACTATAACCCCAAA
-CTCTGCTTGTCAGAAATCCACAAGATGGAAGAAGTTTCAGGAACCAAGGGGCGCCAGGAG
-AGAAACGACATTGCCCTGAAGACCAATGGGGACCAGGCATCCTGTGAAAATGAGTTACTT
-AAATTTTCTTACATTCGGACATCTTTTGACAAGATCTTGCTGAGATGGGAGCCGTACTGG
-CCCCCCGACTTCCGAGACCTCTTGGGGTTCATGCTGTTCTACAAAGAGGCCCCTTATCAA
-AATGTGACGGAGTTCGACGGGCAGGATGCATGTGGTTCCAACAGTTGGACGGTGGTAGAC
-ATTGACCCACCCCTGAGGTCCAACGACCCCAAATCACAGAACCACCCAGGGTGGCTGATG
-CGGGGTCTGAAGCCCTGGACCCAGTATGCCATCTTCGTGAAGACCCTGGTCACCTTTTCG
-GATGAACGCCGGACCTATGGGGCCAAGAGTGACATCATTTATGTCCAGACAGATGCCACC
-AACCCCTCCGTGCCCCTGGATCCAATCTCAGTGTCTAACTCATCATCCCAGATTATTTTG
-AAGTGGAAACCCCCCTCCGACCCCAATGGCAACATCACCCACTACCTGGTTTTCTGGGAG
-AGGCAGGCGGAAGACAGTGAGCTGTTCGAACTGGATTATTGCCTCAAATGGTGTGTGTGG
-TGTGTGTGTGTGGTTGTTTGTTTGTGGAGTGTGTGTGAGTATGAGGATTCGGCCGGCGAA
-TGCTGCTCCTGTCCAAAGACAGACTCTCAGATCCTGAAGGAGCTGGAGGAGTCCTCGTTT
-AGGAAGACGTTTGAGGATTACCTGCACAACGTGGTTTTCGTCCCCAGAAAAACCTCTTCA
-GGCACTGGTGCCGAGGACCCTAGGCCATCTCGGAAACGCAGGTCCCTTGGCGATGTTGGG
-AATGTGACGGTGGCCGTGCCCACGGTGGCAGCTTTCCCCAACACTTCCTCGACCAGCGTG
-CCCACGAGTCCGGAGGAGCACAGGCCTTTTGAGAAGGTGGTGAACAAGGAGTCGCTGGTC
-ATCTCCGGCTTGCGACACTTCACGGGCTATCGCATCGAGCTGCAGGCTTGCAACCAGGAC
-ACCCCTGAGGAACGGTGCAGTGTGGCAGCCTACGTCAGTGCCAGGACCATGCCTGAAGCC
-AAGGCTGATGACATTGTCGGCCCTGTGACGCATGAAATCTTTGAGAACAACGTTGTCCAC
-TTGATGTGGCAGGAGCCGAAGGAGCCCAATGGTCTGATCGTGCTGTATGAAGTGAGTTAT
-CGGCGATATGGTGATGAGGAGCTGCATCTCTGCGTCTCCCGCAAGCACTTCGCTCTGGAG
-CGGGGCTGCAGGCTGCGTGGGCTGTCACCGGGGAACTACAGCGTGCGAGTCCGGGCCACC
-TCCCTTGCGGGCAACGGCTCTTGGACGGAACCCACCTATTTCTACGTGACAGACTATTTA
-GATGTCCCGTCAAATATTGCAAAAATTATCATCGGCCCCCTCATCTTTGTCTTTCTCTTC
-AGTGTTGTGATTGGAAGTATTTATCTATTCCTGAGAAAGAGGCAGCCAGATGGGCCGCTG
-GGACCGCTTTACGCTTCTTCAAACCCTGAGTATCTCAGTGCCAGTGATGTGTTTCCATGC
-TCTGTGTACGTGCCGGACGAGTGGGAGGTGCCTCGAGAGAAGATCACCCTCCTTCGAGAG
-CTGGGGCAGGGCTCCTTCGGCATGGTGTATGAGGGCAATGCCAGGGACATCATCAAGGGT
-GAGGCAGAGACCCGCGTGGCGGTGAAGACGGTCAACGAGTCAGCCAGTCTCCGAGAGCGG
-ATTGAGTTCCTCAATGAGGCCTCGGTCATGAAGGGCTTCACCTGCCATCATGTGGTGCGC
-CTCCTGGGAGTGGTGTCCAAGGGCCAGCCCACACTGGTGGTGATGGAGCTGATGGCTCAC
-GGAGACCTGAAGAGCTACCTCCGTTCTCTGCGGCCAGAGGCTGAGAATAATCCCGGCCGC
-CCTCCCCCTACCCTTCAAGAGATGATTCAGATGGCGGCAGAGATTGCTGATGGGATGGCC
-TACCTGAACGCCAAGAAGTTTGTGCATCGGGACCTGGCAGCGAGAAACTGCATGGTCGCC
-CATGATTTTACTGTCAAAATTGGAGACTTTGGAATGACCAGAGACATCTATGAAACGGAT
-TACTACCGGAAAGGGGGCAAGGGTCTGCTCCCTGTACGGTGGATGGCGCCAGAGTCCCTG
-AAGGATGGGGTCTTCACCACTTCTTCTGACATGTGGTCCTTTGGCGTGGTCCTTTGGGAA
-ATCACCAGCTTGGCAGAACAGCCTTACCAAGGCCTGTCTAATGAACAGGTGTTGAAATTT
-GTCATGGATGGAGGGTATCTGGATCAACCCGACAACTGTCCAGAGAGAGTCACTGACCTC
-ATGCGCATGTGCTGGCAATTCAACCCCAAGATGAGGCCAACCTTCCTGGAGATTGTCAAC
-CTGCTCAAGGACGACCTGCACCCCAGCTTTCCGGAGGTGTCGTTCTTCCACAGCGAGGAG
-AACAAGGCTCCCGAGAGCGAGGAGCTGGAGATGGAGTTTGAGGACATGGAGAATGTGCCC
-CTGGACCGTTCCTCGCACTGTCAGAGGGAGGAGGCGGGGGGCCGGGATGGAGGGTCCTCA
-CTAGGTTTCAAGCGGAGCTACGAGGAACACATCCCTTACACACACATGAACGGAGGCAAG
-AAAAACGGGCGGATTCTGACCTTGCCTCGGTCCAATCCTTCCTAA
->ENST00000341500_homosapiens
-ATGGCCACCGGGGGCCGGCGGGGGGCGGCGGCCGCGCCGCTGCTGGTGGCGGTGGCCGCG
-CTGCTACTGGGCGCCGCGGGCCACCTGTACCCCGGAGAGGTGTGTCCCGGCATGGATATC
-CGGAACAACCTCACTAGGTTGCATGAGCTGGAGAATTGCTCTGTCATCGAAGGACACTTG
-CAGATACTCTTGATGTTCAAAACGAGGCCCGAAGATTTCCGAGACCTCAGTTTCCCCAAA
-CTCATCATGATCACTGATTACTTGCTGCTCTTCCGGGTCTATGGGCTCGAGAGCCTGAAG
-GACCTGTTCCCCAACCTCACGGTCATCCGGGGATCACGACTGTTCTTTAACTACGCGCTG
-GTCATCTTCGAGATGGTTCACCTCAAGGAACTCGGCCTCTACAACCTGATGAACATCACC
-CGGGGTTCTGTCCGCATCGAGAAGAACAATGAGCTCTGTTACTTGGCCACTATCGACTGG
-TCCCGTATCCTGGATTCCGTGGAGGATAATTACATCGTGTTGAACAAAGATGACAACGAG
-GAGTGTGGAGACATCTGTCCGGGTACCGCGAAGGGCAAGACCAACTGCCCCGCCACCGTC
-ATCAACGGGCAGTTTGTCGAACGATGTTGGACTCATAGTCACTGCCAGAAAGTTTGCCCG
-ACCATCTGTAAGTCACACGGCTGCACCGCCGAAGGCCTCTGTTGCCACAGCGAGTGCCTG
-GGCAACTGTTCTCAGCCCGACGACCCCACCAAGTGCGTGGCCTGCCGCAACTTCTACCTG
-GACGGCAGGTGTGTGGAGACCTGCCCGCCCCCGTACTACCACTTCCAGGACTGGCGCTGT
-GTGAACTTCAGCTTCTGCCAGGACCTGCACCACAAATGCAAGAACTCGCGGAGGCAGGGC
-TGCCACCAGTACGTCATTCACAACAACAAGTGCATCCCTGAGTGTCCCTCCGGGTACACG
-ATGAATTCCAGCAACTTGCTGTGCACCCCATGCCTGGGTCCCTGTCCCAAGGTGTGCCAC
-CTCCTAGAAGGCGAGAAGACCATCGACTCGGTGACGTCTGCCCAGGAGCTCCGAGGATGC
-ACCGTCATCAACGGGAGTCTGATCATCAACATTCGAGGAGGCAACAATCTGGCAGCTGAG
-CTAGAAGCCAACCTCGGCCTCATTGAAGAAATTTCAGGGTATCTAAAAATCCGCCGATCC
-TACGCTCTGGTGTCACTTTCCTTCTTCCGGAAGTTACGTCTGATTCGAGGAGAGACCTTG
-GAAATTGGGAACTACTCCTTCTATGCCTTGGACAACCAGAACCTAAGGCAGCTCTGGGAC
-TGGAGCAAACACAACCTCACCATCACTCAGGGGAAACTCTTCTTCCACTATAACCCCAAA
-CTCTGCTTGTCAGAAATCCACAAGATGGAAGAAGTTTCAGGAACCAAGGGGCGCCAGGAG
-AGAAACGACATTGCCCTGAAGACCAATGGGGACCAGGCATCCTGTGAAAATGAGTTACTT
-AAATTTTCTTACATTCGGACATCTTTTGACAAGATCTTGCTGAGATGGGAGCCGTACTGG
-CCCCCCGACTTCCGAGACCTCTTGGGGTTCATGCTGTTCTACAAAGAGGCCCCTTATCAG
-AATGTGACGGAGTTCGACGGGCAGGATGCGTGTGGTTCCAACAGTTGGACGGTGGTAGAC
-ATTGACCCACCCCTGAGGTCCAACGACCCCAAATCACAGAACCACCCAGGGTGGCTGATG
-CGGGGTCTCAAGCCCTGGACCCAGTATGCCATCTTTGTGAAGACCCTGGTCACCTTTTCG
-GATGAACGCCGGACCTATGGGGCCAAGAGTGACATCATTTATGTCCAGACAGATGCCACC
-AACCCCTCTGTGCCCCTGGATCCAATCTCAGTGTCTAACTCATCATCCCAGATTATTCTG
-AAGTGGAAACCACCCTCCGACCCCAATGGCAACATCACCCACTACCTGGTTTTCTGGGAG
-AGGCAGGCGGAAGACAGTGAGCTGTTCGAGCTGGATTATTGCCTCAAAGGGCTGAAGCTG
-CCCTCGAGGACCTGGTCTCCACCATTCGAGTCTGAAGATTCTCAGAAGCACAACCAGAGT
-GAGTATGAGGATTCGGCCGGCGAATGCTGCTCCTGTCCAAAGACAGACTCTCAGATCCTG
-AAGGAGCTGGAGGAGTCCTCGTTTAGGAAGACGTTTGAGGATTACCTGCACAACGTGGTT
-TTCGTCCCCAGGCCATCTCGGAAACGCAGGTCCCTTGGCGATGTTGGGAATGTGACGGTG
-GCCGTGCCCACGGTGGCAGCTTTCCCCAACACTTCCTCGACCAGCGTGCCCACGAGTCCG
-GAGGAGCACAGGCCTTTTGAGAAGGTGGTGAACAAGGAGTCGCTGGTCATCTCCGGCTTG
-CGACACTTCACGGGCTATCGCATCGAGCTGCAGGCTTGCAACCAGGACACCCCTGAGGAA
-CGGTGCAGTGTGGCAGCCTACGTCAGTGCGAGGACCATGCCTGAAGCCAAGGCTGATGAC
-ATTGTTGGCCCTGTGACGCATGAAATCTTTGAGAACAACGTCGTCCACTTGATGTGGCAG
-GAGCCGAAGGAGCCCAATGGTCTGATCGTGCTGTATGAAGTGAGTTATCGGCGATATGGT
-GATGAGGAGCTGCATCTCTGCGTCTCCCGCAAGCACTTCGCTCTGGAACGGGGCTGCAGG
-CTGCGTGGGCTGTCACCGGGGAACTACAGCGTGCGAATCCGGGCCACCTCCCTTGCGGGC
-AACGGCTCTTGGACGGAACCCACCTATTTCTACGTGACAGACTATTTAGACGTCCCGTCA
-AATATTGCAAAAATTATCATCGGCCCCCTCATCTTTGTCTTTCTCTTCAGTGTTGTGATT
-GGAAGTATTTATCTATTCCTGAGAAAGAGGCAGCCAGATGGGCCGCTGGGACCGCTTTAC
-GCTTCTTCAAACCCTGAGTATCTCAGTGCCAGTGATGTGTTTCCATGCTCTGTGTACGTG
-CCGGACGAGTGGGAGGTGTCTCGAGAGAAGATCACCCTCCTTCGAGAGCTGGGGCAGGGC
-TCCTTCGGCATGGTGTATGAGGGCAATGCCAGGGACATCATCAAGGGTGAGGCAGAGACC
-CGCGTGGCGGTGAAGACGGTCAACGAGTCAGCCAGTCTCCGAGAGCGGATTGAGTTCCTC
-AATGAGGCCTCGGTCATGAAGGGCTTCACCTGCCATCACGTGGTGCGCCTCCTGGGAGTG
-GTGTCCAAGGGCCAGCCCACGCTGGTGGTGATGGAGCTGATGGCTCACGGAGACCTGAAG
-AGCTACCTCCGTTCTCTGCGGCCAGAGGCTGAGAATAATCCTGGCCGCCCTCCCCCTACC
-CTTCAAGAGATGATTCAGATGGCGGCAGAGATTGCTGACGGGATGGCCTACCTGAACGCC
-AAGAAGTTTGTGCATCGGGACCTGGCAGCGAGAAACTGCATGGTCGCCCATGATTTTACT
-GTCAAAATTGGAGACTTTGGAATGACCAGAGACATCTATGAAACGGATTACTACCGGAAA
-GGGGGCAAGGGTCTGCTCCCTGTACGGTGGATGGCACCGGAGTCCCTGAAGGATGGGGTC
-TTCACCACTTCTTCTGACATGTGGTCCTTTGGCGTGGTCCTTTGGGAAATCACCAGCTTG
-GCAGAACAGCCTTACCAAGGCCTGTCTAATGAACAGGTGTTGAAATTTGTCATGGATGGA
-GGGTATCTGGATCAACCCGACAACTGTCCAGAGAGAGTCACTGACCTCATGCGCATGTGC
-TGGCAATTCAACCCCAAGATGAGGCCAACCTTCCTGGAGATTGTCAACCTGCTCAAGGAC
-GACCTGCACCCCAGCTTTCCAGAGGTGTCGTTCTTCCACAGCGAGGAGAACAAGGCTCCC
-GAGAGTGAGGAGCTGGAGATGGAGTTTGAGGACATGGAGAATGTGCCCCTGGACCGTTCC
-TCGCACTGTCAGAGGGAGGAGGCGGGGGGCCGGGATGGAGGGTCCTCGCTGGGTTTCAAG
-CGGAGCTACGAGGAACACATCCCTTACACACACATGAACGGAGGCAAGAAAAACGGGCGG
-ATTCTGACCTTGCCTCGGTCCAATCCTTCCTAA
->ENST00000302850_homosapiens
-ATGGCCACCGGGGGCCGGCGGGGGGCGGCGGCCGCGCCGCTGCTGGTGGCGGTGGCCGCG
-CTGCTACTGGGCGCCGCGGGCCACCTGTACCCCGGAGAGGTGTGTCCCGGCATGGATATC
-CGGAACAACCTCACTAGGTTGCATGAGCTGGAGAATTGCTCTGTCATCGAAGGACACTTG
-CAGATACTCTTGATGTTCAAAACGAGGCCCGAAGATTTCCGAGACCTCAGTTTCCCCAAA
-CTCATCATGATCACTGATTACTTGCTGCTCTTCCGGGTCTATGGGCTCGAGAGCCTGAAG
-GACCTGTTCCCCAACCTCACGGTCATCCGGGGATCACGACTGTTCTTTAACTACGCGCTG
-GTCATCTTCGAGATGGTTCACCTCAAGGAACTCGGCCTCTACAACCTGATGAACATCACC
-CGGGGTTCTGTCCGCATCGAGAAGAACAATGAGCTCTGTTACTTGGCCACTATCGACTGG
-TCCCGTATCCTGGATTCCGTGGAGGATAATTACATCGTGTTGAACAAAGATGACAACGAG
-GAGTGTGGAGACATCTGTCCGGGTACCGCGAAGGGCAAGACCAACTGCCCCGCCACCGTC
-ATCAACGGGCAGTTTGTCGAACGATGTTGGACTCATAGTCACTGCCAGAAAGTTTGCCCG
-ACCATCTGTAAGTCACACGGCTGCACCGCCGAAGGCCTCTGTTGCCACAGCGAGTGCCTG
-GGCAACTGTTCTCAGCCCGACGACCCCACCAAGTGCGTGGCCTGCCGCAACTTCTACCTG
-GACGGCAGGTGTGTGGAGACCTGCCCGCCCCCGTACTACCACTTCCAGGACTGGCGCTGT
-GTGAACTTCAGCTTCTGCCAGGACCTGCACCACAAATGCAAGAACTCGCGGAGGCAGGGC
-TGCCACCAGTACGTCATTCACAACAACAAGTGCATCCCTGAGTGTCCCTCCGGGTACACG
-ATGAATTCCAGCAACTTGCTGTGCACCCCATGCCTGGGTCCCTGTCCCAAGGTGTGCCAC
-CTCCTAGAAGGCGAGAAGACCATCGACTCGGTGACGTCTGCCCAGGAGCTCCGAGGATGC
-ACCGTCATCAACGGGAGTCTGATCATCAACATTCGAGGAGGCAACAATCTGGCAGCTGAG
-CTAGAAGCCAACCTCGGCCTCATTGAAGAAATTTCAGGGTATCTAAAAATCCGCCGATCC
-TACGCTCTGGTGTCACTTTCCTTCTTCCGGAAGTTACGTCTGATTCGAGGAGAGACCTTG
-GAAATTGGGAACTACTCCTTCTATGCCTTGGACAACCAGAACCTAAGGCAGCTCTGGGAC
-TGGAGCAAACACAACCTCACCATCACTCAGGGGAAACTCTTCTTCCACTATAACCCCAAA
-CTCTGCTTGTCAGAAATCCACAAGATGGAAGAAGTTTCAGGAACCAAGGGGCGCCAGGAG
-AGAAACGACATTGCCCTGAAGACCAATGGGGACCAGGCATCCTGTGAAAATGAGTTACTT
-AAATTTTCTTACATTCGGACATCTTTTGACAAGATCTTGCTGAGATGGGAGCCGTACTGG
-CCCCCCGACTTCCGAGACCTCTTGGGGTTCATGCTGTTCTACAAAGAGGCCCCTTATCAG
-AATGTGACGGAGTTCGACGGGCAGGATGCGTGTGGTTCCAACAGTTGGACGGTGGTAGAC
-ATTGACCCACCCCTGAGGTCCAACGACCCCAAATCACAGAACCACCCAGGGTGGCTGATG
-CGGGGTCTCAAGCCCTGGACCCAGTATGCCATCTTTGTGAAGACCCTGGTCACCTTTTCG
-GATGAACGCCGGACCTATGGGGCCAAGAGTGACATCATTTATGTCCAGACAGATGCCACC
-AACCCCTCTGTGCCCCTGGATCCAATCTCAGTGTCTAACTCATCATCCCAGATTATTCTG
-AAGTGGAAACCACCCTCCGACCCCAATGGCAACATCACCCACTACCTGGTTTTCTGGGAG
-AGGCAGGCGGAAGACAGTGAGCTGTTCGAGCTGGATTATTGCCTCAAAGGGCTGAAGCTG
-CCCTCGAGGACCTGGTCTCCACCATTCGAGTCTGAAGATTCTCAGAAGCACAACCAGAGT
-GAGTATGAGGATTCGGCCGGCGAATGCTGCTCCTGTCCAAAGACAGACTCTCAGATCCTG
-AAGGAGCTGGAGGAGTCCTCGTTTAGGAAGACGTTTGAGGATTACCTGCACAACGTGGTT
-TTCGTCCCCAGAAAAACCTCTTCAGGCACTGGTGCCGAGGACCCTAGGCCATCTCGGAAA
-CGCAGGTCCCTTGGCGATGTTGGGAATGTGACGGTGGCCGTGCCCACGGTGGCAGCTTTC
-CCCAACACTTCCTCGACCAGCGTGCCCACGAGTCCGGAGGAGCACAGGCCTTTTGAGAAG
-GTGGTGAACAAGGAGTCGCTGGTCATCTCCGGCTTGCGACACTTCACGGGCTATCGCATC
-GAGCTGCAGGCTTGCAACCAGGACACCCCTGAGGAACGGTGCAGTGTGGCAGCCTACGTC
-AGTGCGAGGACCATGCCTGAAGCCAAGGCTGATGACATTGTTGGCCCTGTGACGCATGAA
-ATCTTTGAGAACAACGTCGTCCACTTGATGTGGCAGGAGCCGAAGGAGCCCAATGGTCTG
-ATCGTGCTGTATGAAGTGAGTTATCGGCGATATGGTGATGAGGAGCTGCATCTCTGCGTC
-TCCCGCAAGCACTTCGCTCTGGAACGGGGCTGCAGGCTGCGTGGGCTGTCACCGGGGAAC
-TACAGCGTGCGAATCCGGGCCACCTCCCTTGCGGGCAACGGCTCTTGGACGGAACCCACC
-TATTTCTACGTGACAGACTATTTAGACGTCCCGTCAAATATTGCAAAAATTATCATCGGC
-CCCCTCATCTTTGTCTTTCTCTTCAGTGTTGTGATTGGAAGTATTTATCTATTCCTGAGA
-AAGAGGCAGCCAGATGGGCCGCTGGGACCGCTTTACGCTTCTTCAAACCCTGAGTATCTC
-AGTGCCAGTGATGTGTTTCCATGCTCTGTGTACGTGCCGGACGAGTGGGAGGTGTCTCGA
-GAGAAGATCACCCTCCTTCGAGAGCTGGGGCAGGGCTCCTTCGGCATGGTGTATGAGGGC
-AATGCCAGGGACATCATCAAGGGTGAGGCAGAGACCCGCGTGGCGGTGAAGACGGTCAAC
-GAGTCAGCCAGTCTCCGAGAGCGGATTGAGTTCCTCAATGAGGCCTCGGTCATGAAGGGC
-TTCACCTGCCATCACGTGGTGCGCCTCCTGGGAGTGGTGTCCAAGGGCCAGCCCACGCTG
-GTGGTGATGGAGCTGATGGCTCACGGAGACCTGAAGAGCTACCTCCGTTCTCTGCGGCCA
-GAGGCTGAGAATAATCCTGGCCGCCCTCCCCCTACCCTTCAAGAGATGATTCAGATGGCG
-GCAGAGATTGCTGACGGGATGGCCTACCTGAACGCCAAGAAGTTTGTGCATCGGGACCTG
-GCAGCGAGAAACTGCATGGTCGCCCATGATTTTACTGTCAAAATTGGAGACTTTGGAATG
-ACCAGAGACATCTATGAAACGGATTACTACCGGAAAGGGGGCAAGGGTCTGCTCCCTGTA
-CGGTGGATGGCACCGGAGTCCCTGAAGGATGGGGTCTTCACCACTTCTTCTGACATGTGG
-TCCTTTGGCGTGGTCCTTTGGGAAATCACCAGCTTGGCAGAACAGCCTTACCAAGGCCTG
-TCTAATGAACAGGTGTTGAAATTTGTCATGGATGGAGGGTATCTGGATCAACCCGACAAC
-TGTCCAGAGAGAGTCACTGACCTCATGCGCATGTGCTGGCAATTCAACCCCAAGATGAGG
-CCAACCTTCCTGGAGATTGTCAACCTGCTCAAGGACGACCTGCACCCCAGCTTTCCAGAG
-GTGTCGTTCTTCCACAGCGAGGAGAACAAGGCTCCCGAGAGTGAGGAGCTGGAGATGGAG
-TTTGAGGACATGGAGAATGTGCCCCTGGACCGTTCCTCGCACTGTCAGAGGGAGGAGGCG
-GGGGGCCGGGATGGAGGGTCCTCGCTGGGTTTCAAGCGGAGCTACGAGGAACACATCCCT
-TACACACACATGAACGGAGGCAAGAAAAACGGGCGGATTCTGACCTTGCCTCGGTCCAAT
-CCTTCCTAA
->ENST00000600492_homosapiens
-TACAAAGAGGCCCCTTATCAGAATGTGACGGAGTTCGACGGGCAGGATGCGTGTGGTTCC
-AACAGTTGGACGGTGGTAGACATTGACCCACCCCTGAGGTCCAACGACCCCAAATCACAG
-AACCACCCAGGGTGGCTGATGCGGGGTCTCAAGCCCTGGACCCAGTATGCCATCTTTGTG
-AAGACCCTGGTCACCTTTTCGGATGAACGCCGGACCTATGGGGCCAAGAGTGACATCATT
-TATGTCCAGACAGATGCCACCAACCCCTCTGTGCCCCTGGATCCAATCTCAGTGTCTAAC
-TCATCATCCCAGATTATTCTGAAGTGGAAACCACCCTCCGACCCCAATGGCAACATCACC
-CACTACCTGGTTTTCTGGGAGAGGCAGGCGGAAGACAGTGAGCTGTTCGAGCTGGATTAT
-TGCCTCAAAGGGCGAGTCCAGTCATCAGCTCCGCTGTAA
->ENSMUST00000208839_musmusculus
-NAGACAGATTACTATCGGAAAGGGGGCAAGGGACTGCTTCCTGTGAGGTGGATGTCACCT
-GAGTCCCTGAAGGATGGAGTCTTTACTGCTTCTTCTGATATGTGGTCCTTTGGGGTGGTC
-CTTTGGGAAATCACTAGCCTGGCTGAGCAACCTTATCAAGGCCTGTCTAATGAACAGGTG
-TTGAAGTTTGTCATGGATGGAGGCTATCTGGATCCCCCTGATAACTGTCCAGAGAGACTG
-AGATATGAGATAAAGACACACTGGCCACCCTGA
->ENSMUST00000091291_musmusculus
-ATGGGCTTCGGGAGAGGATGTGAGACGACGGCTGTGCCATTGCTGGTGGCCGTGGCCGCG
-TTGCTGGTGGGCACAGCCGGCCACCTGTACCCTGGAGAGGTGTGCCCTGGTATGGACATC
-CGGAACAACCTGACCAGGCTACATGAGCTGGAGAACTGCTCAGTCATTGAGGGCCATCTG
-CAGATCCTCCTGATGTTCAAGACCAGACCCGAAGATTTCCGAGACCTCAGTTTCCCCAAA
-CTCATCATGATCACAGATTACCTGCTTCTCTTCCGTGTCTATGGTCTGGAAAGTCTGAAA
-GACCTCTTCCCAAATCTCACAGTCATCCGAGGCTCCCGTCTCTTCTTCAACTATGCCCTG
-GTTATCTTCGAGATGGTCCACCTGAAGGAGCTGGGGCTTTATAACCTCATGAACATCACC
-CGGGGCTCTGTCCGCATCGAGAAGAATAATGAGCTCTGCTACCTGGCCACTATCGACTGG
-TCCCGTATCCTGGATTCTGTGGAGGACAACTACATTGTACTGAACAAAGATGACAACGAG
-GAATGTGGGGATGTCTGTCCAGGCACCGCCAAGGGCAAGACCAACTGTCCTGCCACTGTC
-ATCAATGGGCAGTTTGTGGAACGGTGCTGGACACACAGTCATTGTCAGAAAGTTTGCCCA
-ACCATCTGTAAGTCACATGGCTGCACAGCTGAAGGCCTGTGCTGCCACAAAGAGTGCCTG
-GGCAACTGTTCGGAACCTGATGACCCCACCAAGTGTGTGGCCTGTCGCAACTTCTATCTG
-GATGGTCAGTGTGTGGAGACCTGCCCGCCACCCTACTATCACTTCCAGGACTGGCGCTGT
-GTGAACTTCAGCTTCTGCCAAGACCTTCACTTCAAATGCAGGAACTCTCGGAAGCCTGGC
-TGCCACCAATACGTCATTCACAACAATAAGTGCATCCCCGAGTGCCCGTCTGGCTATACC
-ATGAATTCCAGCAACTTGATGTGCACCCCATGTCTGGGACCCTGCCCTAAGGTCTGCCAA
-ATCCTCGAAGGTGAGAAGACCATTGATTCTGTGACATCTGCCCAGGAGCTCCGAGGCTGC
-ACTGTGATCAACGGTAGCCTGATCATCAACATCCGAGGGGGCAACAACCTGGCAGCTGAG
-CTGGAGGCTAACCTTGGCCTCATTGAAGAAATTTCGGGATTTCTAAAGATCCGCCGCTCC
-TATGCTCTGGTATCACTTTCTTTCTTCAGGAAGCTACATCTGATTCGAGGAGAGACCTTG
-GAAATTGGGAACTATTCTTTTTATGCCTTGGACAACCAGAACCTGAGGCAACTCTGGGAC
-TGGAGCAAACACAACCTCACCATCACTCAGGGCAAGCTCTTCTTCCATTACAACCCGAAA
-CTCTGCTTGTCTGAAATTCACAAGATGGAAGAAGTCTCCGGAACTAAGGGCCGTCAGGAG
-AGGAACGACATTGCCCTGAAGACCAATGGGGACCAGGCATCGTGTGAAAATGAATTGCTT
-AAATTTTCTTTCATTCGGACATCTTTTGACAAGATCCTGTTGAGGTGGGAACCCTACTGG
-CCCCCCGACTTCCGAGATCTCCTGGGATTCATGTTGTTCTACAAAGAGGCCCCTTATCAG
-AATGTGACAGAGTTTGATGGGCAGGATGCTTGTGGCTCCAACAGCTGGACTGTGGTGGAT
-ATTGACCCGCCCCAGAGGTCCAACGACCCCAAGTCTCAGACCCCAAGCCACCCTGGGTGG
-CTGATGCGGGGCCTCAAACCCTGGACCCAATACGCCATCTTTGTGAAGACCTTGGTTACC
-TTCTCTGATGAACGGCGGACCTATGGAGCCAAAAGTGATATCATCTATGTGCAAACAGAT
-GCCACTAATCCTTCTGTCCCCCTGGATCCCATATCAGTTTCTAATTCCTCATCTCAGATT
-ATCTTAAAGTGGAAGCCCCCCTCTGACCCCAATGGCAACATCACACACTACCTGGTGTAC
-TGGGAGAGGCAAGCAGAGGACAGCGAGCTGTTTGAGCTGGATTATTGTCTCAAAGGGCTG
-AAGCTCCCTTCACGGACCTGGTCCCCACCCTTTGAGTCTGATGATTCTCAGAAGCACAAT
-CAGAGTGAGTATGACGACTCGGCCAGTGAGTGCTGCTCATGCCCTAAGACTGACTCTCAG
-ATCCTGAAGGAGCTGGAGGAGTCTTCATTCAGGAAGACCTTCGAGGATTACCTGCACAAC
-GTGGTTTTTGTCCCCAGGCCATCCCGAAAGCGAAGATCCCTTGAAGAGGTGGGGAATGTG
-ACAGCCACCACACTCACACTTCCAGATTTCCCCAACGTCTCCTCTACCATTGTGCCCACA
-AGTCAGGAGGAGCACAGGCCATTTGAGAAAGTGGTGAACAAGGAGTCACTTGTCATCTCT
-GGCCTGAGACACTTCACTGGGTACCGCATTGAGCTGCAGGCATGCAATCAAGATTCCCCA
-GATGAGAGGTGCAGTGTGGCTGCCTACGTCAGTGCCCGGACCATGCCTGAAGCTAAGGCA
-GATGACATCGTTGGCCCTGTGACTCATGAAATCTTTGAGAACAATGTTGTACACTTAATG
-TGGCAAGAGCCAAAGGAACCTAATGGTCTGATTGTGCTATATGAAGTGAGCTATCGCCGA
-TATGGTGATGAGGAGCTGCACCTCTGTGTCTCCCGGAAGCATTTTGCCCTGGAGCGGGGC
-TGCAGGCTGCGAGGGCTCTCCCCAGGAAACTACAGTGTTCGAGTCCGGGCTACCTCTCTG
-GCAGGAAATGGCTCCTGGACAGAACCCACCTATTTTTATGTGACTGATTATTTAGATGTC
-CCATCAAATATTGCCAAAATTATCATTGGACCCCTCATCTTTGTCTTCCTCTTCAGTGTT
-GTGATTGGAAGTATTTATCTATTTCTGAGAAAGAGGCAGCCGGATGGGCCAATGGGACCA
-CTGTATGCATCTTCAAACCCTGAGTACCTCAGTGCCAGTGATGTGTTTCCATCTTCTGTG
-TACGTGCCGGACGAGTGGGAGGTGCCTCGAGAGAAGATCACCCTTCTTCGAGAGCTGGGG
-CAGGGATCCTTTGGTATGGTGTATGAAGGCAATGCCAAGGATATCATCAAGGGTGAGGCA
-GAGACCCGTGTTGCGGTTAAGACTGTCAATGAGTCAGCCAGTCTTCGAGAACGGATCGAG
-TTCCTCAATGAGGCATCAGTCATGAAGGGATTCACCTGCCATCATGTGGTCCGCCTTCTT
-GGGGTGGTATCCAAAGGACAGCCAACGCTGGTAGTGATGGAATTGATGGCTCATGGAGAC
-CTGAAAAGTCACCTCCGTTCTCTGAGGCCAGATGCTGAGAATAACCCAGGCCGCCCTCCC
-CCTACCTTGCAAGAAATGATTCAGATGACAGCAGAAATTGCTGATGGCATGGCATACTTG
-AACGCCAAGAAGTTTGTGCACCGGGACCTGGCAGCTCGAAACTGCATGGTTGCCCATGAT
-TTTACTGTCAAAATTGGAGACTTTGGAATGACAAGGGACATCTACGAGACAGATTACTAT
-CGGAAAGGGGGCAAGGGACTGCTTCCTGTGAGGTGGATGTCACCTGAGTCCCTGAAGGAT
-GGAGTCTTTACTGCTTCTTCTGATATGTGGTCCTTTGGGGTGGTCCTTTGGGAAATCACT
-AGCCTGGCTGAGCAACCTTATCAAGGCCTGTCTAATGAACAGGTGTTGAAGTTTGTCATG
-GATGGAGGCTATCTGGATCCCCCTGATAACTGTCCAGAGAGACTCACTGACCTGATGCGC
-ATGTGCTGGCAGTTCAACCCCAAGATGAGGCCAACCTTCCTGGAAATCGTCAACCTGCTC
-AAGGATGACCTCCACCCCAGCTTTCCAGAAGTTTCCTTCTTCTACAGCGAGGAGAACAAG
-GCTCCTGAGAGTGAGGAGCTGGAGATGGAGTTTGAAGACATGGAGAATGTCCCGTTGGAT
-CGTTCCTCTCACTGTCAGAGAGAAGAGGCTGGGGGCCGGGAGGGAGGGTCCTCACTGAGC
-ATCAAACGGACCTATGATGAACACATCCCCTATACCCACATGAATGGGGGCAAGAAGAAC
-GGACGTGTCCTTACCCTGCCAAGGTCAAACCCTTCCTAA
->ENSMUST00000207100_musmusculus
-AGGTCCAACGACCCCAAGTCTCAGACCCCAAGCCACCCTGGGTGGCTGATGCGGGGCCTC
-AAACCCTGGACCCAATACGCCATCTTTGTGAAGACCTTGGTTACCTTCTCTGATGAACGG
-CGGACCTATGGAGCCAAAAGTGATATCATCTATGTGCAAACAGATGCCACTAATCCTTCT
-GTCCCCCTGGATCCCATATCAGTTTCTAATTCCTCATCTCAGATTATCTTAAAGTGGAAG
-CCCCCCTCTGACCCCAATGGCAACATCACACACTACCTGGTGTACTGGGAGAGGCAAGCA
-GAGGACAGCGAGCTGTTTGAGCTGGATTATTGTCTCAAAGGGCTGAAGCTCCCTTCACGG
-ACCTGGTCCCCACCCTTTGAGTCTGATGATTCTCAGAAGCACAATCAGAGTGAGTATGAC
-GACTCGGCCAGTGAGTGCTGCTCATGCCCTAAGACTGACTCTCAGATCCTGAAGGAGCTG
-GAGGAGTCTTCATTCAGGAAGACCTTCGAGGATTACCTGCACAACGTGGTTTTTGTCCCC
-AGAAAAACCTCTTCAGGCAATGGTGCCGAGGACAGTAGGCCATCCCGAAAGCGAAGATCC
-CTTGAAGAGGTGGGGAATGTGACAGCCACCACACTCACACTTCCAGATTTCCCCAACGTC
-TCCTCTACCATT
->ENSRNOT00000041155_rattusnorvegicus
-ATGGGCTCCGGGAGAGGATGTGAGACGACGGCGGTGCCGTTGCTGATGGCCGTGGCCGCG
-TTGCTGGTGGGCACAGCCGGCCACCTGTACCCTGGAGAGGTGTGCCCGGGAATGGACATC
-CGGAACAACCTGACCAGGTTGCATGAGCTGGAGAACTGCTCGGTCATTGAGGGCCATCTG
-CAGATCCTCTTGATGTTCAAGACCAGACCCGAAGATTTCCGAGACCTCAGTTTCCCCAAA
-CTCATCATGATCACAGACTACCTGCTTCTTTTCCGTGTCTATGGCCTAGAAAGTCTAAAA
-GACCTCTTCCCAAACCTCACAGTCATCCGAGGCTCCCGTCTCTTCTTCAACTATGCCCTG
-GTCATCTTCGAGATGGTCCACCTGAAGGAGCTGGGTCTTTACAACCTCATGAACATCACC
-CGGGGCTCTGTCCGCATCGAGAAGAATAATGAACTCTGCTACCTGGCCACTATCGACTGG
-TCCCGCATCCTGGATTCCGTGGAGGACAACTACATTGTACTGAACAAAGATGACAATGAG
-GAATGTGGGGACGTCTGTCCAGGCACAGCCAAGGGCAAGACCAACTGCCCTGCCACCGTC
-ATCAATGGGCAGTTTGTGGAACGGTGCTGGACACACAGTCATTGTCAGAAAGTTTGCCCA
-ACCATCTGTAAGTCACATGGCTGCACAGCTGAAGGCCTGTGCTGTCACAAGGAGTGCCTG
-GGCAACTGTTCAGAACCCGATGACCCTACCAAGTGTGTGGCCTGTCGAAACTTCTACCTG
-GATGGTCAGTGTGTGGAGACCTGCCCACCACCCTACTATCACTTCCAGGATTGGCGCTGT
-GTAAACTTCAGCTTCTGCCAAGACCTTCACTACAAATGCAGGAACTCTCGGAAGCCTGGC
-TGTCACCAATACGTCATTCACAACAACAAGTGCATCCCCGAGTGCCCGTCTGGCTATACC
-ATGAATTCCAGCAACTTGATGTGCACCCCGTGTCTGGGACCCTGTCCTAAGGTCTGCCAA
-ATCCTCGAAGGCGAGAAGACCATTGATTCCGTGACATCTGCCCAGGAGCTCCGAGGCTGC
-ACTGTGATCAATGGCAGCCTGATTATCAACATCCGAGGGGGCAACAACCTGGCAGCTGAA
-CTAGAGGCTAACCTTGGCCTCATTGAAGAAATCTCAGGGTTCCTAAAGATCCGTCGCTCC
-TATGCTCTGGTGTCACTTTCTTTCTTCAGGAAGCTACATCTGATTCGAGGAGAGACCTTG
-GAAATTGGGAACTATTCTTTCTACGCCTTGGACAACCAGAACCTGAGGCAGCTGTGGGAC
-TGGAACAAGCACAACCTCACGATCACTCAGGGCAAGCTCTTCTTCCACTACAACCCCAAA
-CTCTGCCTGTCTGAGATCCACAAGATGGAGGAAGTGTCCGGAACCAAGGGCCGCCAGGAG
-AGGAACGACATTGCCCTGAAGACCAACGGGGACCAGGCATCCTGTGAAAATGAATTACTT
-AAATTCTCTTTCATCCGGACGTCTTTTGACAAGATCTTGCTGAGGTGGGAGCCCTACTGG
-CCCCCCGACTTCCGAGATCTCCTGGGATTCATGCTGTTCTACAAAGAGGCCCCTTATCAG
-AACGTGACAGAGTTTGACGGGCAGGATGCGTGTGGCTCCAACAGCTGGACTGTGGTGGAT
-ATTGACCCGCCCCAGAGGTCCAACGACCCTAAGTCTCAGACCCCAAGCCACCCTGGGTGG
-CTGATGCGGGGCCTCAAACCCTGGACCCAGTATGCCATCTTTGTCAAGACCTTGGTTACC
-TTCTCTGATGAACGCCGGACCTATGGAGCCAAAAGTGATATCATCTATGTGCAAACAGAT
-GCCACCAATCCTTCCGTTCCCCTGGATCCCATATCAGTTTCCAACTCCTCATCTCAGATT
-ATCTTAAAGTGGAAGCCCCCCTCGGACCCCAATGGCAACATCACACACTACCTGGTCTAC
-TGGGAGAGGCAGGCGGAGGACAGCGAGCTGTTCGAGTTGGATTATTGTCTCAAAGGGCTG
-AAGCTCCCCTCACGCACCTGGTCCCCACCTTTTGAGTCTGACGATTCTCAAAAGCACAAT
-CAGAGTGAGTATGACGACTCGGCCAGCGAGTGCTGCTCATGTCCTAAGACTGACTCTCAG
-ATCCTGAAGGAGCTGGAGGAGTCTTCATTCAGGAAGACCTTCGAGGATTACCTGCACAAC
-GTGGTTTTTGTTCCCAGAAAAACCTCTTCAGGCAATGGTGCTGAGGACACTAGGCCATCC
-CGAAAGCGAAGATCCCTTGAAGAGGTGGGCAATGTGACAGCCACTACACCCACACTTCCA
-GATTTTCCCAACATCTCCTCCACCATCGCGCCCACAAGCCACGAAGAGCACAGACCATTT
-GAGAAAGTAGTAAACAAGGAGTCACTTGTCATCTCTGGCCTGAGACACTTCACTGGGTAC
-CGCATTGAGCTGCAGGCATGCAATCAGGACTCCCCAGAAGAGAGGTGCAGCGTGGCTGCC
-TACGTCAGTGCCCGGACCATGCCTGAAGCTAAGGCAGATGACATCGTTGGCCCTGTGACC
-CATGAAATCTTTGAGAACAATGTTGTACACTTAATGTGGCAAGAGCCAAAGGAACCTAAT
-GGTCTGATTGTGCTATATGAAGTGAGCTATCGGCGATATGGTGATGAGGAGCTGCACCTC
-TGTGTCTCCCGGAAGCATTTTGCCCTGGAGCGGGGCTGCAGGCTTCGAGGGCTCTCTCCA
-GGAAACTACAGTGTTCGAGTCCGGGCTACCTCTCTGGCAGGAAATGGCTCCTGGACAGAA
-CCCACCTATTTTTATGTGACTGATTATTTAGATGTCCCATCAAATATTGCCAAAATTATC
-ATCGGGCCCCTCATCTTCGTCTTCCTCTTCAGTGTCGTGATCGGAAGTATTTATCTATTC
-TTGAGGAAGAGGCAGCCAGATGGGCCAATGGGACCACTGTACGCTTCTTCAAACCCAGAG
-TACCTCAGTGCCAGTGATGTCTTTCCATCTTCCGTATACGTTCCGGATGAGTGGGAGGTA
-CCTCGAGAGAAGATCACCCTCCTCCGAGAGCTGGGGCAGGGATCCTTCGGTATGGTGTAC
-GAAGGCAATGCCAAGGATATCATCAAGGGTGAGGTAGAGACCCGTGTTGCGGTGAAGACG
-GTCAATGAGTCAGCCAGTCTTCGAGAACGGATCGAGTTCCTCAATGAGGCATCAGTCATG
-AAGGGCTTCACCTGTCATCACGTGGTCCGCCTTCTTGGGGTGGTGTCCAAAGGCCAGCCC
-ACATTGGTAGTGATGGAACTGATGGCTCATGGAGACCTGAAAAGTCACCTCCGTTCTCTG
-CGGCCCGATGCTGAGAACAACCCAGGCCGTCCTCCCCCTACCTTGCAAGAAATGATTCAG
-ATGACAGCAGAAATTGCCGATGGCATGGCATACTTGAACGCCAAGAAGTTTGTGCACCGG
-GACCTGGCAGCTCGGAACTGCATGGTTGCCCATGATTTTACTGTCAAAATCGGAGACTTT
-GGAATGACGAGAGACATCTACGAGACAGATTACTATCGGAAAGGGGGCAAGGGGTTGCTG
-CCCGTGAGGTGGATGTCACCCGAGTCCCTGAAGGACGGAGTCTTCACTGCTTCTTCCGAC
-ATGTGGTCCTTTGGGGTGGTCCTTTGGGAAATCACCAGCCTGGCTGAGCAACCTTACCAA
-GGCCTGTCTAATGAACAGGTGTTGAAATTTGTCATGGATGGAGGCTATCTGGATCCCCCT
-GATAACTGTCCAGAGAGACTCACTGACCTGATGCGCATGTGCTGGCAGTTCAACCCCAAG
-ATGAGGCCGACCTTCCTGGAAATCGTCAACCTGCTCAAGGACGACCTCCACCCCAGCTTT
-CCGGAAGTTTCCTTCTTCTACAGCGAGGAGAACAAGGCTCCCGAGAGTGAAGAGCTGGAG
-ATGGAGTTCGAGGACATGGAGAATGTCCCCTTGGATCGTTCCTCTCACTGTCAGAGAGAA
-GAGGCTGGATGCCGGGAGGGAGGGTCCTCTCTGAGCATCAAACGGACCTATGATGAACAC
-ATCCCCTACACCCACATGAACGGGGGCAAGAAGAATGGGCGGGTCCTCACCCTGCCGAGG
-TCGAACCCTTCCTAA
->ENSRNOT00000067448_rattusnorvegicus
-ATGGGCTCCGGGAGAGGATGTGAGACGACGGCGGTGCCGTTGCTGATGGCCGTGGCCGTT
-GCTGGTGGCACAGCCGGCCACCTGTACCCTGGAGAGGTGTGCCCGGGAATGGACATCCGG
-AACAACCTGACCAGGTTGCATGAGCTGGAGAACTGCTCGGTCATTGAGGGCCATCTGCAG
-ATCCTCTTGATGTTCAAGACCAGACCCGAAGATTTCCGAGACCTCAGTTTCCCCAAACTC
-ATCATGATCACAGACTACCTGCTTCTTTTCCGTGTCTATGGCCTAGAAAGTCTAAAAGAC
-CTCTTCCCAAACCTCACAGTCATCCGAGGCTCCCGTCTCTTCTTCAACTATGCCCTGGTC
-ATCTTCGAGATGGTCCACCTGAAGGAGCTGGGTCTTTACAACCTCATGAACATCACCCGG
-GGCTCTGTCCGCATCGAGAAGAATAATGAACTCTGCTACCTGGCCACTATCGACTGGTCC
-CGCATCCTGGATTCCGTGGAGGACAACTACATTGTACTGAACAAAGATGACAATGAGGAA
-TGTGGGGACGTCTGTCCAGGCACAGCCAAGGGCAAGACCAACTGCCCTGCCACCGTCATC
-AATGGGCAGTTTGTGGAACGGTGCTGGACACACAGTCATTGTCAGAAAGTTTGCCCAACC
-ATCTGTAAGTCACATGGCTGCACAGCTGAAGGCCTGTGCTGTCACAAGGAGTGCCTGGGC
-AACTGTTCAGAACCCGATGACCCTACCAAGTGTGTGGCCTGTCGAAACTTCTACCTGGAT
-GGTCAGTGTGTGGAGACCTGCCCACCACCCTACTATCACTTCCAGGATTGGCGCTGTGTA
-AACTTCAGCTTCTGCCAAGACCTTCACTACAAATGCAGGAACTCTCGGAAGCCTGGCTGT
-CACCAATACGTCATTCACAACAACAAGTGCATCCCCGAGTGCCCGTCTGGCTATACCATG
-AATTCCAGCAACTTGATGTGCACCCCGTGTCTGGGACCCTGTCCTAAGGTCTGCCAAATC
-CTCGAAGGCGAGAAGACCATTGATTCCGTGACATCTGCCCAGGAGCTCCGAGGCTGCACT
-GTGATCAATGGCAGCCTGATTATCAACATCCGAGGGGGCAACAACCTGGCAGCTGAACTA
-GAGGCTAACCTTGGCCTCATTGAAGAAATCTCAGGGTTCCTAAAGATCCGTCGCTCCTAT
-GCTCTGGTGTCACTTTCTTTCTTCAGGAAGCTACATCTGATTCGAGGAGAGACCTTGGAA
-ATTGGGAACTATTCTTTCTACGCCTTGGACAACCAGAACCTGAGGCAGCTGTGGGACTGG
-AACAAGCACAACCTCACGATCACTCAGGGCAAGCTCTTCTTCCACTACAACCCCAAACTC
-TGCCTGTCTGAGATCCACAAGATGGAGGAAGTGTCCGGAACCAAGGGCCGCCAGGAGAGG
-AACGACATTGCCCTGAAGACCAACGGGGACCAGGCATCCTGTGAAAATGAATTACTTAAA
-TTCTCTTTCATCCGGACGTCTTTTGACAAGATCTTGCTGAGGTGGGAGCCCTACTGGCCC
-CCCGACTTCCGAGATCTCCTGGGATTCATGCTGTTCTACAAAGAGGCCCCTTATCAGAAC
-GTGACAGAGTTTGACGGGCAGGATGCGTGTGGCTCCAACAGCTGGACTGTGGTGGATATT
-GACCCGCCCCAGAGGTCCAACGACCCTAAGTCTCAGACCCCAAGCCACCCTGGGTGGCTG
-ATGCGGGGCCTCAAACCCTGGACCCAGTATGCCATCTTTGTCAAGACCTTGGTTACCTTC
-TCTGATGAACGCCGGACCTATGGAGCCAAAAGTGATATCATCTATGTGCAAACAGATGCC
-ACCAATCCTTCCGTTCCCCTGGATCCCATATCAGTTTCCAACTCCTCATCTCAGATTATC
-TTAAAGTGGAAGCCCCCCTCGGACCCCAATGGCAACATCACACACTACCTGGTCTACTGG
-GAGAGGCAGGCGGAGGACAGCGAGCTGTTCGAGTTGGATTATTGTCTCAAAGGGCTGAAG
-CTCCCCTCACGCACCTGGTCCCCACCTTTTGAGTCTGACGATTCTCAAAAGCACAATCAG
-AGTGAGTATGACGACTCGGCCAGCGAGTGCTGCTCATGTCCTAAGACTGACTCTCAGATC
-CTGAAGGAGCTGGAGGAGTCTTCATTCAGGAAGACCTTCGAGGATTACCTGCACAACGTG
-GTTTTTGTTCCCAGAAAAACCTCTTCAGGCAATGGTGCTGAGGACACTAGGCCATCCCGA
-AAGCGAAGATCCCTTGAAGAGGTGGGCAATGTGACAGCCACTACACCCACACTTCCAGAT
-TTTCCCAACATCTCCTCCACCATCGCGCCCACAAGCCACGAAGAGCACAGACCATTTGAG
-AAAGTAGTAAACAAGGAGTCACTTGTCATCTCTGGCCTGAGACACTTCACTGGGTACCGC
-ATTGAGCTGCAGGCATGCAATCAGGACTCCCCAGAAGAGAGGTGCAGCGTGGCTGCCTAC
-GTCAGTGCCCGGACCATGCCTGAAGCTAAGGCAGATGACATCGTTGGCCCTGTGACCCAT
-GAAATCTTTGAGAACAATGTTGTACACTTAATGTGGCAAGAGCCAAAGGAACCTAATGGT
-CTGATTGTGCTATATGAAGTGAGCTATCGGCGATATGGTGATGAGGAGCTGCACCTCTGT
-GTCTCCCGGAAGCATTTTGCCCTGGAGCGGGGCTGCAGGCTTCGAGGGCTCTCTCCAGGA
-AACTACAGTGTTCGAGTCCGGGCTACCTCTCTGGCAGGAAATGGCTCCTGGACAGAACCC
-ACCTATTTTTATGTGACTGATTATTTAGATGTCCCATCAAATATTGCCAAAATTATCATC
-GGGCCCCTCATCTTCGTCTTCCTCTTCAGTGTCGTGATCGGAAGTATTTATCTATTCTTG
-AGGAAGAGGCAGCCAGATGGGCCAATGGGACCACTGTACGCTTCTTCAAACCCAGAGTAC
-CTCAGTGCCAGTGATGTCTTTCCATCTTCCGTATACGTTCCGGATGAGTGGGAGGTACCT
-CGAGAGAAGATCACCCTCCTCCGAGAGCTGGGGCAGGGATCCTTCGGTATGGTGTACGAA
-GGCAATGCCAAGGATATCATCAAGGGTGAGGTAGAGACCCGTGTTGCGGTGAAGACGGTC
-AATGAGTCAGCCAGTCTTCGAGAACGGATCGAGTTCCTCAATGAGGCATCAGTCATGAAG
-GGCTTCACCTGTCATCACGTGGTCCGCCTTCTTGGGGTGGTGTCCAAAGGCCAGCCCACA
-TTGGTAGTGATGGAACTGATGGCTCATGGAGACCTGAAAAGTCACCTCCGTTCTCTGCGG
-CCCGATGCTGAGAACAACCCAGGCCGTCCTCCCCCTACCTTGCAAGAAATGATTCAGATG
-ACAGCAGAAATTGCCGATGGCATGGCATACTTGAACGCCAAGAAGTTTGTGCACCGGGAC
-CTGGCAGCTCGGAACTGCATGGTTGCCCATGATTTTACTGTCAAAATCGGAGACTTTGGA
-ATGACGAGAGACATCTACGAGACAGATTACTATCGGAAAGGGGGCAAGGGGTTGCTGCCC
-GTGAGGTGGATGTCACCCGAGTCCCTGAAGGACGGAGTCTTCACTGCTTCTTCCGACATG
-TGGTCCTTTGGGGTGGTCCTTTGGGAAATCACCAGCCTGGCTGAGCAACCTTACCAAGGC
-CTGTCTAATGAACAGGTGTTGAAATTTGTCATGGATGGAGGCTATCTGGATCCCCCTGAT
-AACTGTCCAGAGAGACTCACTGACCTGATGCGCATGTGCTGGCAGTTCAACCCCAAGATG
-AGGCCGACCTTCCTGGAAATCGTCAACCTGCTCAAGGACGACCTCCACCCCAGCTTTCCG
-GAAGTTTCCTTCTTCTACAGCGAGGAGAACAAGGCTCCCGAGAGTGAAGAGCTGGAGATG
-GAGTTCGAGGACATGGAGAATGTCCCCTTGGATCGTTCCTCTCACTGTCAGAGAGAAGAG
-GCTGGATGCCGGGAGGGAGGGTCCTCTCTGAGCATCAAACGGACCTATGATGAACACATC
-CCCTACACCCACATGAACGGGGGCAAGAAGAATGGGCGGGTCCTCACCCTGCCGAGGTCG
-AACCCTTCCTAA
->ENSSSCT00000014817_susscrofa
-GTGTGCCCAGGGATGGATATCCGGAATAACCTTACACGGCTGCACGAGTTGGCCAACTGC
-TCGGTCATCGAAGGACATTTGCAGATCCTGTTGATGTTCAAAACGCGGCCCGAGGATTTC
-CGAGACCTCAGTTTCCCCAAACTCATCATGATCACTGATTACTTGCTGCTCTTCCGGGTC
-TACGGGCTGGAGAGCCTGAAGGACCTGTTCCCCAACCTCACCGTCATCCGGGGCTCACGC
-CTCTTCTTTAACTATGCGCTGGTCATCTTTGAGATGGTTCACTTGAAGGAGCTTGGCCTC
-TACAATTTGATGAACATCACCAGGGGTGCTGTCCGCATCGAGAAGAACAATGAGCTCTGC
-TACCTGGCGACCATTGACTGGTCGCGCATCCTGGACTCTGTGGAGGATAATTACATTGTG
-CTGAACAAAGACGACAACGAGGAGTGTGGGGACATTTGCCCAGGCACTGCGAAGGGCAAG
-ACCAATTGCCCTGCCACCGTCATCAATGGGCAATTTGTCGAGCGGTGTTGGACGCACAGT
-CACTGCCAGAAAGTGTGCCCGACCATCTGTAAGTCGCACGGCTGCACTGCTGAGGGCCTC
-TGCTGTCACAGCGAGTGTTTGGGCAACTGCTCTGAGCCAGACGACCCCACCAAGTGCGTG
-GCCTGCCGCAACTTCTACCTGGACGGCAGATGCGTGGAGACCTGCCCGCCCCCCTACTAC
-CACTTCCAAGACTGGCGCTGCGTGAACTTCAGCTTCTGCCAGGACCTGCACAACAAATGC
-AAGAACTCAAGGAGGCAGGGCTGCCACCAGTACGTCATTCACAACAACAAGTGTATCCCT
-GAGTGCCCCTCAGGGTACACGATGAATTCCAGCAACTTGATGTGCACTCCGTGCCTAGGC
-CCCTGTCCCAAAGTGTGTCACCTCCTGGAAGGCGAGAAGACCATCGACTCAGTGACATCC
-GCCCAGGAGCTCCGAGGCTGCACCATTATCAACGGGAGCCTAATCATCAACATTCGAGGA
-GGCAACAACCTGGCAGCCGAACTAGAGGCCAACCTTGGACTCATTGAGGAGATTTCAGGG
-TACCTGAAAATCCGCCGATCCTATGCCCTCGTGTCACTTTCCTTCTTCCGGAAGTTGCGT
-CTGATCCGAGGGGAGACGTTGGAAATTGGGAACTATTCTTTCTATGCCTTGGACAACCAG
-AACCTAAGGCAACTGTGGGACTGGAGCAAACACAACCTCACCATCACTCAGGGGAAACTC
-TTCTTCCATTATAATCCCAAACTCTGCTTGTCGGAAATTCACAAGATGGAGGAAGTTTCT
-GGAACCAAGGGGCGCCAGGAGAGAAATGATATTGCCCTGAAGACCAATGGGGACCAGGCG
-TCCTGTGAAAATGAGTTACTTAAATTTTCTTACATTCGGACATCTTATGACAAGATCTTG
-CTGAAGTGGGAGCCGTATTGGCCCCCCGACTTCCGAGACCTCCTGGGGTTCATGCTCTTC
-TACAAAGAGGCCCCTTATCAGAACGTGACGGAGTTTGACGGGCAGGATGCGTGTGGCTCC
-AACAGCTGGACGGTGGTGGACATTGACCCGCCTACGAGGTCCAATGACCCCAAGTCCCAG
-AACCATCCTGGGTGGCTGATGCGTGGTCTCAAGCCCTGGACCCAGTATGCCATCTTTGTC
-AAGACTTTGGTCACCTTTTCTGATGAACGACGCACCTATGGAGCCAAGAGTGACATCATC
-TACGTCCAGACAGATGCCACAAGTAAGCATGTC
-