changeset 5:733ca84b21ee draft default tip

"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/splitfasta commit 31945d5d8c5ebee64ebf29c6ea022fb831f47274"
author rnateam
date Mon, 21 Sep 2020 15:40:14 +0000
parents ae4d5733272f
children
files splitFasta.py splitFasta.xml split_fasta.py test-data/ID1.fasta test-data/ID1_result1.fasta test-data/ID2.fasta test-data/ID2_result1.fasta test-data/ID3.fasta test-data/ID3_result1.fasta test-data/part1.fasta test-data/part2.fasta test-data/part3.fasta test-data/part4.fasta test-data/sample1.fasta test-data/sample2.fasta test-data/test.fasta tool_dependencies.xml
diffstat 17 files changed, 2120 insertions(+), 51 deletions(-) [+]
line wrap: on
line diff
--- a/splitFasta.py	Fri Oct 16 16:13:34 2015 -0400
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,13 +0,0 @@
-#!/usr/bin/env python
-import os
-import sys
-from Bio import SeqIO
-
-if __name__ == "__main__":
-    inpath = sys.argv[1]
-    os.mkdir('splits')
-    with open(inpath, 'r') as handle:
-        for record in SeqIO.parse(handle, 'fasta'):
-            header = os.path.join('splits', record.id + '.fasta')
-            with open(header, 'w') as handle2:
-                SeqIO.write([record], handle2, 'fasta')
--- a/splitFasta.xml	Fri Oct 16 16:13:34 2015 -0400
+++ b/splitFasta.xml	Mon Sep 21 15:40:14 2020 +0000
@@ -1,35 +1,59 @@
-<tool id="rbc_splitfasta" name="Split Fasta" version="0.2.0">
+<tool id="rbc_splitfasta" name="Split Fasta" version="0.4.0">
     <description>files into a collection</description>
     <requirements>
-        <requirement type="package" version="1.65">biopython</requirement>
+        <requirement type="package" version="1.76">biopython</requirement>
     </requirements>
-    <stdio>
-        <exit_code range="1:" />
-    </stdio>
-    <command interpreter="python">
+    <command detect_errors="aggressive">
     <![CDATA[
-        splitFasta.py $inputFile
+        #if $splitmode.splitmode_select == "each":
+            python $__tool_directory__/split_fasta.py '$inputFile'
+        #else if $splitmode.splitmode_select == "chunks":
+            python $__tool_directory__/split_fasta.py '$inputFile' $splitmode.num_chunks
+        #end if
     ]]></command>
     <inputs>
         <param name="inputFile" type="data" format="fasta" label="Fasta file to split"/>
+        <conditional name="splitmode">
+            <param name="splitmode_select" type="select" label="Split mode">
+                <option value="each">Each sequence in its own dataset</option>
+                <option value="chunks">Split into a number of chunks</option>
+            </param>
+            <when value="chunks">
+                <param name="num_chunks" type="integer" value="10" label="Number of chunks to split into" />
+            </when>
+            <when value="each"/>
+        </conditional>
     </inputs>
     <outputs>
-        <collection name="splitted_fasta" type="list" label="Sequence collection in FASTA format">
+        <collection name="splitted_fasta" type="list" label="${tool.name} on ${on_string}">
             <discover_datasets pattern="(?P&lt;designation&gt;.*)" directory="splits" ext="fasta" visible="false"/>
         </collection>
     </outputs>
     <tests>
         <test>
-            <param name="inputFile" value="test.fasta" />
-            <output_collection name="splitted_fasta">
-                <element name="ID1.fasta" file="ID1_result1.fasta" ftype="fasta" />
-                <element name="ID2.fasta" file="ID2_result1.fasta" ftype="fasta" />
-                <element name="ID3.fasta" file="ID3_result1.fasta" ftype="fasta" />
+            <param name="inputFile" value="sample1.fasta" />
+            <param name="splitmode|splitmode_select" value="each" />
+            <output_collection name="splitted_fasta" count="3">
+                <element name="ID1" file="ID1.fasta" ftype="fasta" />
+                <element name="ID2" file="ID2.fasta" ftype="fasta" />
+                <element name="ID3" file="ID3.fasta" ftype="fasta" />
+            </output_collection>
+        </test>
+        <test>
+            <param name="inputFile" value="sample2.fasta" />
+            <param name="splitmode|splitmode_select" value="chunks" />
+            <param name="num_chunks" value="4" />
+            <output_collection name="splitted_fasta" count="4">
+                <element name="part1" file="part1.fasta" ftype="fasta" />
+                <element name="part2" file="part2.fasta" ftype="fasta" />
+                <element name="part3" file="part3.fasta" ftype="fasta" />
+                <element name="part4" file="part4.fasta" ftype="fasta" />
             </output_collection>
         </test>
     </tests>
     <help><![CDATA[
-        Takes an input file and writes each consecutive two lines to a separate file, in a dataset collection.
+        Takes an input FASTA file and writes entries (i.e. sequences) to separate datasets, which are organized in a dataset collection.
+        There are two modes: 1) each sequence is written to its own dataset, which is named after the ID of the sequence, or 2) the file is split into a given number of chunks, which are numbered (part1, part2, ...).
     ]]></help>
     <citations>
         <citation type="bibtex">
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/split_fasta.py	Mon Sep 21 15:40:14 2020 +0000
@@ -0,0 +1,50 @@
+#!/usr/bin/env python
+
+import os
+import sys
+from Bio import SeqIO
+
+num_chunks = 0
+if len(sys.argv) == 3:
+    num_chunks = int(sys.argv[2])
+    input_filename = sys.argv[1]
+elif len(sys.argv) == 2:
+    input_filename = sys.argv[1]
+else:
+    exit("Usage: split_fasta.py <input_filename> [<num_chunks>]")
+
+os.mkdir('splits')
+
+if num_chunks != 0:
+    # chunk mode: count the records first (one '>' header line per record) so
+    # the target number of records per chunk can be computed below
+    record_count = 0
+    with open(input_filename) as input_file:
+        for line in input_file:
+            if line.lstrip().startswith('>'):
+                record_count += 1
+
+    records_per_chunk = round(float(record_count) / num_chunks)
+
+count = 1
+with open(input_filename) as input_file:
+
+    chunk_record_count = 0  # NOTE: never read in this script; the loop checks len(records)
+    records = []
+    for record in SeqIO.parse(input_file, 'fasta'):
+        records.append(record)
+        if num_chunks == 0 or (count < num_chunks and
+           len(records) >= records_per_chunk):
+            if num_chunks == 0:
+                output_filename = os.path.join('splits', record.id)
+            else:
+                output_filename = os.path.join('splits', 'part{}'.format(count))
+            SeqIO.write(records, output_filename, 'fasta')
+            count += 1
+            records = []
+
+    if records:
+        # leftover records become the final chunk; in per-record mode
+        # `records` is emptied after every write, so this runs only for chunks
+        output_filename = os.path.join('splits', 'part{}'.format(count))
+        SeqIO.write(records, output_filename, 'fasta')
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/ID1.fasta	Mon Sep 21 15:40:14 2020 +0000
@@ -0,0 +1,3 @@
+>ID1
+MSNSEASSTCPIPSRSIHEKSWSPLPDSYSQTPGGTVFSTTPGGTRIIYDRKFLLECRNS
+PIARTPPCCLPDIPGVTRPSLQIIEQEEDSKDLSIDDSQFVIDI
--- a/test-data/ID1_result1.fasta	Fri Oct 16 16:13:34 2015 -0400
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,2 +0,0 @@
->ID1 desc
-GATACA
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/ID2.fasta	Mon Sep 21 15:40:14 2020 +0000
@@ -0,0 +1,3 @@
+>ID2
+MADVVLGVGTGVFIITLIWILTLALTIILSRATGPTKLGIIPVVLLALIITLVLVFFPRA
+AEVPAPQRAAQIVDMFFIGRYVLLSLVSLVFLAALFMLLPLHFLEPIYAKPLRTH
--- a/test-data/ID2_result1.fasta	Fri Oct 16 16:13:34 2015 -0400
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,2 +0,0 @@
->ID2 desc
-GATACAGATACAGATACAGATACAGATACA
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/ID3.fasta	Mon Sep 21 15:40:14 2020 +0000
@@ -0,0 +1,5 @@
+>ID3
+MAVDNFLFGQCILYFLAFLFGFIAVVPLSENGDDFQGKCLLFTEGIWQNENMTMGKQRFI
+VEEWGPESSCRFITFVGIVSLILSAVQAWRTFFFLCKGHDDSLFHSFLNLLLSLLVLFVV
+FVAGTISSVGFSIWCDSVTENGAMPSSCEDLQDTDLELGVENSSFYDQFAIAQFGLWSAW
+LCWLGLTVLAFLKVYHNHRQQELLESLVQEKELLLGHPLQRSSYVYNRNAMI
--- a/test-data/ID3_result1.fasta	Fri Oct 16 16:13:34 2015 -0400
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,3 +0,0 @@
->ID3 desc
-GATACAGATACAGATACAGATACAGATACAGATACAGATACAGATACAGATACAGATACA
-GATACA
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/part1.fasta	Mon Sep 21 15:40:14 2020 +0000
@@ -0,0 +1,182 @@
+>NP_001007355.1 gi|55925472|ref|NP_001007355.1| eukaryotic translation initiation factor 4E-binding protein 3 [Danio rerio]
+MSNSEASSTCPIPSRSIHEKSWSPLPDSYSQTPGGTVFSTTPGGTRIIYDRKFLLECRNS
+PIARTPPCCLPDIPGVTRPSLQIIEQEEDSKDLSIDDSQFVIDI
+>NP_956692.1 gi|41055339|ref|NP_956692.1| transmembrane protein 218 [Danio rerio]
+MADVVLGVGTGVFIITLIWILTLALTIILSRATGPTKLGIIPVVLLALIITLVLVFFPRA
+AEVPAPQRAAQIVDMFFIGRYVLLSLVSLVFLAALFMLLPLHFLEPIYAKPLRTH
+>NP_001003767.1 gi|57524633|ref|NP_001003767.1| transmembrane protein 179 [Danio rerio]
+MAVDNFLFGQCILYFLAFLFGFIAVVPLSENGDDFQGKCLLFTEGIWQNENMTMGKQRFI
+VEEWGPESSCRFITFVGIVSLILSAVQAWRTFFFLCKGHDDSLFHSFLNLLLSLLVLFVV
+FVAGTISSVGFSIWCDSVTENGAMPSSCEDLQDTDLELGVENSSFYDQFAIAQFGLWSAW
+LCWLGLTVLAFLKVYHNHRQQELLESLVQEKELLLGHPLQRSSYVYNRNAMI
+>NP_001002700.1 gi|50540464|ref|NP_001002700.1| fatty-acid amide hydrolase 2-A [Danio rerio]
+MALTRFERFLGRLLRAVVWILFAAFKLFAPQQRHGVSRLPPITNPLLLLSAMQLARKIRR
+KEVTSVEVVQAYIDRIQEVNPLINAMVKDRFSAALQEAAQVDKLIEEETGGEDVLEDRLP
+LLGVPITVKEAFALQGMPNSTGLLTRRDLVSGADAPSVALLKRAGAIPLGVTNCSELCMW
+LESHNHLYGITNNPYDFERIVGGSSGGEGSILGAGSSVIGIGSDIGGSIRIPCFFNGIFG
+HKPSVGIVNNEGQYPPASGQQMGFLCTGPMCRYAEDLIPMLSIMGGPNAEKLSLFTEVDL
+KKLRFFSVPHNGGSHLVSPVEPQLLHAQKMVVKRLEADLGVKVQELLIPQLKYSFQIWGT
+MMASPGKDGKPPTTFAELMSEGGKKVWPAWELFKWFLGFSSHTLAAIGLALVELFQSSHP
+SPFIMQQKESLQQELEELLGTDGVLLYPSHPLIAQKHHHPIFTPFNFSYTGIFNILGLPV
+TQCPLGLSAEGLPLGVQIVAGKLQDRLSLATALYLEKAFGGWREPGKTTIKP
+>NP_001003555.1 gi|57525887|ref|NP_001003555.1| centromere protein P [Danio rerio]
+MEQKYEEDIQKLQQEIEMLEAEQEETLRSIFVQHGDRLQQGVKSACEERGGGGAQQHTLS
+KLITEVRELEKDLRRQTEINGITLNECFVKTLHKSERKLIQQLRLAGHCGLLLFQVEFAV
+TEIQEDNVLHRRVTELNIVVDGVEFKDFSAFVSRVEDTKDLLLFFRTLRTFSERCEDRRQ
+TFQHFQEKYPDVVNLPEGCRSEIMIIRSPQLPGISMTLFWKIHVSKEGVVKPLLDLLLKM
+PDQALELDTKKVMEKASDYFQSLLQLLGVEASIEGLIRTVCS
+>NP_997599.1 gi|47058959|ref|NP_997599.1| protein dispatched homolog 2 [Danio rerio]
+MESGSISRQREDAEMPDSSTTEGPSLEAPQSEIPEVSLCPPDSDSTESQMCPVEIEENQT
+KSSSPFNSHSSTQLERQVSQGSAYHSPPHKKCPCCGHQQPSQSDVCPGQMNALHQADCAA
+SPVKTLYSCSPSRLPSCHTKMQCHWLHGSHDGSNHKPVQHHMVTVRNDGLHRIPRSYSQV
+IVEYPMTVLISCTLVLFACSLAGILTGPLPDFSDPLLGFEPRGTDISVRLATWTRLKQNT
+GPGKPLSPVPWQLTEKTTTGKDTIKSEPQFRERSRRMLHRDNAEHNFFCNAPGERYAQLV
+FRSGNSASLWSLKAIYSMCQMEQTQIRSGPQFDKLCQVKSEFYGSMVKNECCPSWSLGNY
+LAVLNNISSCFSLTSQQVSESLGLLRFCAPYYHDGSLIASCTERSKFGRCASVPHRCKLS
+SIFQILHYLVDKDFLGPQTVEYKVPSLKYSIVFLPVEKSDSLMNIYLDHLEGHKLTYNNT
+TITGMDLGIKQKLFKYYLARDSIYPVLAALALLITIGLYLKSLFIAAMSLVAVILSLSTS
+YFFYKVAFRLTFFPLLNLAAVFVLLGSCLNQALTFVDFWKLQLSHNPPAVPEKRMNRVLQ
+EMGYLIIVSGLTSSVTFYSGYISSITAVRCYAVYLGSASLINTLFALVWLPCTLILQERY
+AVLSSNTVGKVAWKPCCSKNAGGFWETSSRKRCLFTFRQKLRTLGRGFSDTSNLLFLKIL
+PCGVVKFRYIWICWFAVLAAGGTYISCVDPGMKLPTSDSRTTQLFRSSHPFERYDAEYRH
+QFMFERMKDGEDEPMMLTLIWGIVPSDNGDHFDPKSNGSLSVDPGFNMSSLQAQIWLRDL
+CGKIQNQTFYSPLSAEQDTAEDNVCFVEHLIHWVSIRRCSESEDAFSFCCNNIPFPYPPR
+VFEQCLSMMVAEQHAEGRLPSAGGLRFDSEGRIAALVVIFKTVQLYSFNYNRMSQFYQEI
+LSWFNREISKAPAGLQRGWFVSQLGLYDLQQCLSSETLEVAGFSVALTFALLLLTTWNIP
+LSVYVSIAVAGSVFATVGLLVLLEWQLNGVEALFISAAAGLSVDFVANYCISYSLAPHSD
+RLGRVAHSIKRMGCPVATGAGAYFCVGIIMLPATALLFRKLGIFLLLVKCVACGFATFFF
+QSLCCFFGPQNNCGRITLPCVTQQSTENILSSCSATEPGTNNPAANGAFGCGKGSRVRRS
+FNKENEGFLCPNQQHHRKRQPVGGREPEQNELQPLACQLSDSFENSTCTSKLSNRPSVLS
+DDIQFCGLSPKQDYDRVSIEADSTEMCSRHLKGCNPPPALQTSSPYKENMLRLPQDACKE
+KVLCKKCRGQSRGGLQLWNVSLSSSSSMDEIMITQTTDTVNERSLSMDDHIHKRLLSCQS
+QSSIEGLEESNDTCLTEVEAAIPQAGKIEDEFQPGHLNGKRDTLRLSLKETVYDLASPGS
+GRVRTAQSDVPVILPNSKPDMPDVWIKREGKGEGGS
+>NP_001013313.1 gi|61651744|ref|NP_001013313.1| coiled-coil domain-containing protein 115 [Danio rerio]
+MRVDENLRLDEQLLLFMEQLEALEEKRQRLNSLIEEGWFSIAKARYSMGNKQVSALQYAS
+EMQPLAHVETSLLEGGTAEFKCERSENKAEEQKTKTIEDIGAKETGLRRRVHTKQKEVKE
+GEQDTDEVKTKTDSPTPEHRNPLKWFGILVPQNLKQAQSAFKEVITLSVEIASLQSTILA
+TRKEMQVQMKEKQERTEKAQLEVKEE
+>NP_991238.1 gi|45387769|ref|NP_991238.1| pituitary homeobox 3 [Danio rerio]
+MDFNLLTDSEARSPALSLSDSGTPQHDPGCKGQDNSDTEKSHQNHTDESNPEDGSLKKKQ
+RRQRTHFTSQQLQELEATFQRNRYPDMSTREEIAVWTNLTEARVRVWFKNRRAKWRKRER
+NQQAELCKNGFGAQFNGLMQPYDDMYSGYSYNNWATKSLASSPLSAKSFPFFNSMNVSPL
+SSQPMFSPPSSIPSMNMASSMVPSAVAGVPGSGLNNLGNLNNLNSPTLNSAAVSAAACPY
+ATTAGPYMYRDTCNSSLASLRLKAKQHANFAYPAVQNPVSNLSPCQYAVDRPV
+>NP_001244093.1 gi|380503827|ref|NP_001244093.1| blood vessel epicardial substance isoform 2 [Danio rerio]
+MSNTTSALPSSVPAVSLDPNATLCQDWEQSHHLLFHLANLSLGLGFLIPTTLALHMIFLR
+LLLMTGCSLFIAWATLYRCTLDVMVWNVVFLLVNFMHFFFLLYKRRPIKIDRELKSVYKR
+MFEPLHVREALFQRLTGQFCTIQTLKKGQVYAAEDKTSVDERLSILLKGKMKVSYRGHFL
+HNIYTNAFIDSPEFRSTQMNRGERFQVTIAAEENCKLLCWSRERLTYFLESESFLNEVFR
+YLIGKDITNKLYSLNDPTLSDKAVKKMDRQPSLCSQLSMMQMRNSMASTSDTDDVLNQIL
+RGGSTGSSLQKNPLTKTSTTMKPIEEGLEDDVFESESPTTSQNVSKTTKKDI
+>NP_001013309.2 gi|157042782|ref|NP_001013309.2| tRNA 2'-phosphotransferase 1 [Danio rerio]
+MDCETRGRGRRGRGNRNEESRDVRLSKSLSYVLRHGASKMGLQMNSDGFVFVEELLAHQQ
+FRSFSVDDVERVVASNDKQRFKLCKHPEDDRLQIRANQGHSVQVTDLELREISQDDQDYP
+REAVHGSYMKHWPSIRSQGLSRMNRTHIHLAPGLPGEGRVISGMRQSCDLAVYIDVTKAM
+SDGIKFFWSENGVLLTPGDAAGILAPCYFSRAQRLKPLPCDIELH
+>NP_001001847.2 gi|380503821|ref|NP_001001847.2| blood vessel epicardial substance isoform 1 [Danio rerio]
+MSNTTSALPSSVPAVSLDPNATLCQDWEQSHHLLFHLANLSLGLGFLIPTTLALHMIFLR
+LLLMTGCSLFIAWATLYRCTLDVMVWNVVFLLVNFMHFFFLLYKRRPIKIDRELKSVYKR
+MFEPLHVREALFQRLTGQFCTIQTLKKGQVYAAEDKTSVDERLSILLKGKMKVSYRGHFL
+HNIYTNAFIDSPEFRSTQMNRGERFQVTIAAEENCKLLCWSRERLTYFLESESFLNEVFR
+YLIGKDITNKLYSLNDPTLSDKAVKKMDRQPSLCSQLSMMQMRNSMASTSDTDDVLNQIL
+RGGSTGSSLPVTSDRA
+>NP_001015061.1 gi|62632729|ref|NP_001015061.1| putative all-trans-retinol 13,14-reductase precursor [Danio rerio]
+MWFAVVAIFLALVAFLYRYVVGSGPNPFAIDTREPLKPMVFDRKLKNKVLKQGFLASRVP
+EDLDAVVVGSGIGGLAIAVLLAKVGKKVLVLEQHDRAGGCCHTFKEQGFEFDVGIHYIGE
+LSNHKPLRCIIDQMTNGQLQWDPLENPFDNVVIGPPENRRIYQIYSGRKRYMDELKKCFP
+GEEKAIDEYVRLCKEVGQGVWVMVLLKFLPTPIANFLVRTGLANRLTSFSRYASRSLTDV
+VNELTQNKDLRAVLSYIFGTYGKIPKEASFSMHSLIVNHYMNGAWYPKGGATEIAYHMIP
+IIEKAGGAVLVRAPVNRILLNDAKEAIGVSVLKGQEEVHVRAPIVISDAGIFNTYEYLLP
+KDVQTMPAIQKQLSMLQHGDSGLSIFIGLDGTKEELGLKADNYFIYPENNIDELLEDYRS
+GNREESAKKNPLIFVASPSAKDSTWPERTPGKSTLTVVSFANYEWFEEWKDDKVKNRSTD
+YKQLKELFINYILEAVTEIYPKIKDRIEYVDAGTPITNQHYIAAPRGEIYGADHGIPRFS
+AELNATIRAQTPIKNLYLTGQDLMLCGFAGALTGALTCGSVILNRNLHLEAFSLAKRVQN
+GNNKKKT
+>NP_001003580.1 gi|57525791|ref|NP_001003580.1| kelch-like protein 15 [Danio rerio]
+MSGDVEVYLSQVHDGSVSSGFRALYEERLLLDVTLLIEEHHFQAHKALLATQSDYFRVMF
+TADMRERDQDKIHMKGLTAAGFGHVLRFMYYGSLELSMLTVQEILQAAMYVQLTEAVEFC
+CSFLLAKICLENCAEVMRLLEDFSVGVEGVQEQLDAFLLENFVPLMARPDFLSYLSLEKL
+MAYLDSDQLSRYPEIELYEAVQAWLRHDRRRWRHTDAVVQNLRFCLMTPANIFEKVKTSE
+FYRYSRQLRLEVDQALSYFHQVNEQPLAETKSNRIRSVRPQTAVFRGMIGHSMVNSKILL
+LHRPKVWWELEGPQVPLRPDCLAIVNNFAFLLGGEELGPDGEFHASSKVYRYDPRQNSWL
+RMADMSVPRSEFAVGVIGKYIYAVAGRTRDETFYSTERYDIVEDKWEFVDPYPVNKYGHE
+GTVLNGKLYITGGITSSSTSKQVCVFDPGREGSSEHRTRRTPILTNCWENKSKMNYARCF
+HKMISHNGKLYVFGGVCVILRASFESQGCPSTEVYDPETDEWTILASMPIGRSGHGVAVL
+DKQIMVLGGLCYNGHYSDSILTFDPEENKWKEDEYPRMPCKLDGLQVCSLHFPEYVLEHV
+RRCS
+>XP_006779743.1 gi|583968567|ref|XP_006779743.1| PREDICTED: CCAAT/enhancer-binding protein alpha-like [Neolamprologus brichardi]
+MELSNLYEVAPRPLMNNLNQQPPSGYRDPADLGGEIGDNETSIDLSAYIDPSAFNDDFLA
+DLFHHSSRQDKLKMMNGEYDPVSCGPGPQQLYMSNYMESKMEPLYEHNPPRLRPVAIKQE
+PRDDEDMNPGMPPTYHHPHPHPHPQQYSQQQQMPHLQYQIAHCAQTTMHLQPGHPTPPPT
+PVPSPHQHQHSHPHSHQGGMKLLEQQRGCGKTKKHVDKNSPEYRLRRERNNVAVRKSRDK
+AKMRNMETQHKVVELTADNDRLRRRVEHLTRELDTLRGIFRQLPDGSFKPMGS
+>XP_006779744.1 gi|583968570|ref|XP_006779744.1| PREDICTED: ras-related protein Rab-8B-like, partial [Neolamprologus brichardi]
+SLSGIDFKIRTIELDGKKIKLQIWDTAGQERFRTITTAYYRGAMGIMLVYDITNEKSFDN
+IKNWIRNIEEHASADVEKMVLGNKCDMNDKRQVSKERGEKLAIDYGIKFLETSAKSSINV
+EEGFYTLARDIMARLNRKMNDNNPSGGGGPVKITEPRSKKSLFRCSLL
+>XP_006779746.1 gi|583968574|ref|XP_006779746.1| PREDICTED: calcium and integrin-binding family member 2-like [Neolamprologus brichardi]
+MGNKQTTFTEEQLEAYQDCTFFTRKEILRLHARYRELAPHLVPLDYTNNPDIKVPMTLIV
+TMPELKVQFYRYRIVQVLWQLSTESSRWGSGPDFNRDNFICKEDLEKTLNKLTKGELMPE
+EVTLVCDKAIEEADLDGDHKLSFADFENMISKAPDFLSNFHIRI
+>XP_006779747.1 gi|583968576|ref|XP_006779747.1| PREDICTED: corticosteroid 11-beta-dehydrogenase isozyme 2-like [Neolamprologus brichardi]
+MEDYTLPFWIYLVIVTVFIGGAMKKILASHLNTTSTVVAWLGATVLVERLWAFCLPAMLL
+LVLFGITFCIYYATKTSQPRAMLPAHGKAVIITGCDSGFGNATAKHLDSLGFEVFATVLD
+LNGDGAKELQRTCSHRLTLLQVDITQPQQVQQALLDTKAKLGLKGLWALVNNAGVCVNFG
+EVELSLMSNYRGCMEVNFFGTLSITKAFLPLLRQTKGRIVTISSPAGDQPFPCLAAYGAS
+KAALNLITETLRHELEPWGVQVSTILPSSYRTAQSTNSAYWEKQHKHLLQNLSPALLEDY
+GEEYMTETKDLFQTFAKHTTTNLQPVVDTIVQALLAPQPQPRYFAGAGLSLMYFLYAYFP
+YSMSNNFLKKKFLKKNVIPRALRKQSAFDLNLSLHNNNNEEKLQQM
+>XP_006779748.1 gi|583968578|ref|XP_006779748.1| PREDICTED: transient receptor potential cation channel subfamily M member 1-like [Neolamprologus brichardi]
+MYIRVSFDSKPDSLLHLMVKDWQLELPTLLISVHGGLQNFDLPPKLKQVFGKGLIKAAVT
+TGAWIFTGGVSTGVIRHVGDALKDHSSKSRGKVCAIGIAPWGIVENKEDLIGRDVTRPYQ
+TMSNPLSKLSVLNSSHSHYILADNGTCGKYGAEVRLRRQLEKHISLQKINTRLGQGVPVV
+CLIVEGGPNVISITLESLKEEPPVPVVVCDGSGRASDILSFAHRYCEEDG
+>XP_006779749.1 gi|583968580|ref|XP_006779749.1| PREDICTED: chymotrypsin B-like [Neolamprologus brichardi]
+MAFLWIVSCLAFVGAAYGCGTPAIPPRVTGYARIVNGEEAVPHSWPWQVSLQQTNGFHFC
+GGSLISEQWVVTAAHCNVRTYHNVIVGEHNKGYGSTENIQVLKPAKVFTHPSWNPQTINN
+DITLIKLASPARLGTNVSPVCLADTTDSFAAGMKCVTTGWGLTRYNAPSTPNNLQQAALP
+LLSNEECKKHWGSNISDVMICAGGAGATSCMGDSGGPLVCQKDNVWTLVGIVSWGSSRCS
+TSTPAVYARVTKLRGWVDQILASN
+>XP_006779750.1 gi|583968582|ref|XP_006779750.1| PREDICTED: agouti-related protein-like [Neolamprologus brichardi]
+MFGTVLLCCWSFGLLPLASSLVHGNLPLDEGPVAGRRTETFLSEIERSQVPDRMHEPALL
+PVDSVEDHFLMDTGSYDEDTSAALQLQGRAMRSPRRCIPHQQSCLGYPLPCCDPCDTCYC
+RFFNAICYCRRVGHVCPPRRT
+>XP_006779751.1 gi|583968584|ref|XP_006779751.1| PREDICTED: EMILIN-1-like [Neolamprologus brichardi]
+MAALPLLLLLVLWTCGNAKGAFPLRQSYNLYTNGHAHGARAASRHRNWCAFVVTKTVSCV
+VEDGVETYVKPDYHPCSWGSGQCSRVVVYRTYMRPRYKVAYKMVTEMDWKCCHGYSGADC
+NIGPVGGGGTQISTTRPQPGQGGGTTSGQGGGGHSYGGGSSGSGQSGGNADNEKMRQLEE
+KIRSLTKNLQDLQSTMSTMNERLQEEGGRNGFGERSSGGRNPADAAQPEIKETIHSIQTK
+LDQLDNRTQAHDKTLVSINNHLVNGKGNELEGGASGGSLSEGRLNSLKEEILSKLERRVS
+LSCSSCQAGVEDLRKQQQQDRERIRALEKQMNAMDVQYRQSLDGLRRDVVRSQGCCDIIS
+DLQDRVTDAERKISTASENFDILQNRLDREISGQGGTSENTGSRGQGLPVGGETGGHGRD
+AMITEEHLNNRLKDLERRVNSTMQKTEESCSYLENHVKDYFHRELDELRSVFLERFDDQA
+DRITDVELDVEQVKDSISDHDKRLSKLENTTSQMSWRLEKCGCVASEQGGGGEGRGRGDG
+GYGGGSWGAGGGGSTGEGKDGGNRGDGGGTWGAGGGGGGSTGGGGRWGGTGGGLPGTGGE
+KDNSTKKSLEWRVVANEDQIRHFNTQLKDLSMSGDSLYDKVLDLTDDVGKIKALTGDHGE
+HFNRIVTVVEMLGEDCELCGKVEKELQKMRNYSQNALSNIQNHINRIQNRMDSEGDSCFQ
+MCSVLQSEVSVLRDDVRRCTNQCKSNPDMTTGVDHARPGGTDDNSGPLDPAKPLDGHSVI
+EGINNNHLKTLQGELSNVILTFSSINDTLKGLEHTVQKHDSVITDLGNTKDKIISEIDKV
+QQELTEHIEDNRNRLDKMDRDIRRFESTVLEMGDCKRSGDGLEKRLSKLEGVCGRLDGVS
+DSILKIKEGLNKHVSSLWTCVSGLNDTVIRHGGLLDFIQDGQDDIHSRVKNLNSSLNQVS
+RDLQSFSEHDLTGPPGPQGPQGHPGERGFNGPPGLPGPPGFPGPRGEIGPHGPKGETGLP
+GADAQIPKLSFSAALTAPMDRAGTIVFDKVFVNEGNFYNPRTGIFTAPVDGNYYFSAVLT
+GHRNEKIEAVLSKSNYGMARVDSGGYQPEGLENNPVAEAKVNPGSLAVFSIILPLQTQDT
+VCIDLVMGKLAHSVEPLTVFNGMLLYENK
+>XP_006779752.1 gi|583968586|ref|XP_006779752.1| PREDICTED: zinc finger protein 507-like isoform X1 [Neolamprologus brichardi]
+MEEITNVITHSSAASSSSSTSGSHTRQTKEKQPSQGFQQKTADDSLIQVIKKLSKIVEKR
+PQRRCASGGQKRALQVGERGAEQGGGSICKKIKRNLKDEVGVERSTDDSSLPSPWSGDDN
+NNVTTAVAEVAANPNSSDLKRTVTCYQCSLCPHLSQTLPLLKEHLKQHNEQHSDLILMCS
+ECHFTSRDHEQLEAHVRMHFDNGDNQKRKYPVSEAKEEVLKNQDVDLTGDNCSAGTEVKK
+SSVSNAKELPQKKKWYSYEEYGLYRCLICSYVCSQQRMLKTHAWKHAGLVDCSYPIFEDE
+DGGSAKREVQAAPNNASAREEIVVLQDKSLQKLPTGFKLQLCMPVAVEDKQEVVNLQGSH
+LSESPKTEEEDEYPIKDMTSEEPAVEVQVTTEAETEVELGGHHESTSATDSLLSSAQKII
+NRSPNSAGHINVIVERLPSAEDSVMASNPLLLSPDVDGDKSLLEKKAEEQEHVEGVKDEV
+VLCYSPGNANKSQHLGADIKPSIAKSNDLPRDENVPPAGRKRTHSESLRLHSLAAEVLVA
+MPMRTPELPNSGAKVALKTVAAQAQSPQAGQKPTEGAAAGQKASDVGTAAAMLNCNEGRE
+ETLGSLGLGKGDDDGPAANGGISLSLLTVIERLRERSDQNTSDEDILKELQDNAQFQSGA
+GVVAANGAGSYVCSSVPGMDGLVGSPDSGLVDYIPGSDRPYRCRLCRYSSGNKGYIKQHL
+RVHRQREPYQCPICEHIASDSKDLENHMIHHCKSRMYQCKQCPDAFHYKSQLRNHEREHH
+SFSGDVEMLTPVAETAAAMEETERVTYEEGSPQKMFKCDVCNYTSSTYVGVRNHRRIHNS
+DKPYRCCSCDFATTNMNSLKSHMRRHPQEHQAVQLLEQYRCSLCGYVCSHPPSLKSHMWK
+HAGDQNYNYEQVNKAINEAISQSSR
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/part2.fasta	Mon Sep 21 15:40:14 2020 +0000
@@ -0,0 +1,235 @@
+>XP_006779753.1 gi|583968588|ref|XP_006779753.1| PREDICTED: zinc finger protein 507-like isoform X2 [Neolamprologus brichardi]
+MEEITNVITHSSAASSSSSTSGSHTRQTKEKQPSQGFQQKTADDSLIQVIKKLSKIVEKR
+PQRRCASGGQKRALQVGERGAEQGGGSICKKIKRNLKDEVGVERSTDDSSLPSPWSGDDN
+NNVTTAVAEVAANPNSSDLKRTVTCYQCSLCPHLSQTLPLLKEHLKQHNEQHSDLILMCS
+ECHFTSRDHEQLEAHVRMHFDNGDNQKRKYPVSEAKEEVLKNQDVDLTGDNCSAGTEVKK
+SSVSNAKELPQKKKWYSYEEYGLYRCLICSYVCSQQRMLKTHAWKHAGLVDCSYPIFEDE
+DGGSAKREVQAAPNNASAREEIVVLQDKSLQKLPTGFKLQLCMPVAVEDKQEVVNLQGSH
+LSESPKTEEEDEYPIKDMTSEEPAVEVQVTTEAETEVELGGHHESTSATDSLLSSAQKII
+NRSPNSAGHINVIVERLPSAEDSVMASNPLLLSPDVDGDKSLLEKKAEEQEHVEGVKDEV
+VLCYSPGNANKSQHLGADIKPSIAKSNDLPRDENVPPAGRKRTHSESLRLHSLAAEVLVA
+MPMRTPELPNSGAKVALKTVAAQAQSPQAGQKPTEGAAAGQKASDVGTAAAMLNCNEGRE
+ETLGSLGLGKGDDDGPAANGGISLSLLTVIERLRERSDQNTSDEDILKELQDNAQFQSGA
+GVVAANGAGSYVCSSVPGMDGLVGSPDSGLVDYIPGSDRPYRCRLCRYSSGNKGYIKQHL
+RVHRQREPYQCPICEHIASDSKDLENHMIHHCKSRMYQCKQCPDAFHYKSQLRNHEREHH
+SFSGDVEMLTPVAETAAAMEETERVTYEEGSPQKMFKCDVCNYTSSTYVGVRNHRRIHNS
+DKPYR
+>XP_006779754.1 gi|583968590|ref|XP_006779754.1| PREDICTED: probable C-mannosyltransferase DPY19L3-like isoform X1 [Neolamprologus brichardi]
+MTTLRQRKGSKGKEPSPAAELQSQQHNCCSEHHPEKILHGDWSWGAIIWTSVGWSVSVGL
+GLLCCIYVATLHENDLWFSNIKEVEREISFRTECGLYYSYYKQMLHAPSIQEGLKEMIHD
+NLTESKRTINLLQRMNIYQEVFLSVLYRLLPIQSYLEPVYFYIYTVFSLQAVYVIALYLT
+AWLLSGSWLAGALTGVWYILNRVDTTRVEFTISLRENWSLPFFALQVTAITCYLRPQLTT
+LQQKVMVWLMYVTTFCFCLTWQFNQFILLVQALVIYTLDCGDFLTTTQVTTLYLVQVSSL
+LSVWFLQFCNSMILGSLVLSFIVAALFIRHCQPGVKTGSLVVRLGKVLLHSALVLLLTVT
+INYLAKKALQLQSDEHIFKFIKSKFALGSTRDFDASLYLCEEAFGLLPLDTLERLAGTLL
+LYPYVLTLLLLCGMLVAAALQNLSRPNRGSTEEKKGAREGQVAAFRPDVAYNVLHTLFYG
+LLAFSTMRMKYIWTGHMCAVAAYGVCGTELWTVLLSALRCNTKLLLRLVRYVAPVVMIGF
+LYYKFWPKLMEELSELREFYDPDTVELMTWISTKTPKQAVFAGSMQLLAGIKLCTGRVLT
+NHPHYEDKDLRERTRQVYQVYARRSPEEVYDILKAIGADYVVLENSICYERRHRRGCRLR
+DLLDLANGHIMDGPGENDPDLVPATHPRFCDAIKTDAAYNALFTRTFQNKTFHVYRLKKK
+RKKNTKGSSEPSVTQ
+>XP_006779755.1 gi|583968592|ref|XP_006779755.1| PREDICTED: probable C-mannosyltransferase DPY19L3-like isoform X2 [Neolamprologus brichardi]
+MTTLRQRKGSKGKEPSPAAELQSQQHNCCSEHHPEKILHGDWSWGAIIWTSVGWSVSVGL
+GLLCCIYVATLHENDLWFSNIKEVEREISFRTECGLYYSYYKQMLHAPSIQEGLKEMIHD
+NLTESKRTINLLQRMNIYQEVFLSVLYRLLPIQSYLEPVYFYIYTVFSLQAVYVIALYLT
+AWLLSGSWLAGALTGVWYILNRVDTTRVEFTISLRENWSLPFFALQVTAITCYLRPQLTT
+LQQKVMVWLMYVTTFCFCLTWQFNQFILLVQALVIYTLDCGDFLTTTQVTTLYLVQVSSL
+LSVWFLQFCNSMILGSLVLSFIVAALFIRHCQPGVKTGSLVVRLGKVLLHSALVLLLTVT
+INYLAKKALQLQSDEHIFKFIKSKFALGSTRDFDASLYLCEEAFGLLPLDTLERLAGTLL
+LYPYVLTLLLLCGMLVAAALQNLRPNRGSTEEKKGAREGQVAAFRPDVAYNVLHTLFYGL
+LAFSTMRMKYIWTGHMCAVAAYGVCGTELWTVLLSALRCNTKLLLRLVRYVAPVVMIGFL
+YYKFWPKLMEELSELREFYDPDTVELMTWISTKTPKQAVFAGSMQLLAGIKLCTGRVLTN
+HPHYEDKDLRERTRQVYQVYARRSPEEVYDILKAIGADYVVLENSICYERRHRRGCRLRD
+LLDLANGHIMDGPGENDPDLVPATHPRFCDAIKTDAAYNALFTRTFQNKTFHVYRLKKKR
+KKNTKGSSEPSVTQ
+>XP_006779756.1 gi|583968594|ref|XP_006779756.1| PREDICTED: probable C-mannosyltransferase DPY19L3-like isoform X3 [Neolamprologus brichardi]
+MCRGLKEMIHDNLTESKRTINLLQRMNIYQEVFLSVLYRLLPIQSYLEPVYFYIYTVFSL
+QAVYVIALYLTAWLLSGSWLAGALTGVWYILNRVDTTRVEFTISLRENWSLPFFALQVTA
+ITCYLRPQLTTLQQKVMVWLMYVTTFCFCLTWQFNQFILLVQALVIYTLDCGDFLTTTQV
+TTLYLVQVSSLLSVWFLQFCNSMILGSLVLSFIVAALFIRHCQPGVKTGSLVVRLGKVLL
+HSALVLLLTVTINYLAKKALQLQSDEHIFKFIKSKFALGSTRDFDASLYLCEEAFGLLPL
+DTLERLAGTLLLYPYVLTLLLLCGMLVAAALQNLSRPNRGSTEEKKGAREGQVAAFRPDV
+AYNVLHTLFYGLLAFSTMRMKYIWTGHMCAVAAYGVCGTELWTVLLSALRCNTKLLLRLV
+RYVAPVVMIGFLYYKFWPKLMEELSELREFYDPDTVELMTWISTKTPKQAVFAGSMQLLA
+GIKLCTGRVLTNHPHYEDKDLRERTRQVYQVYARRSPEEVYDILKAIGADYVVLENSICY
+ERRHRRGCRLRDLLDLANGHIMDGPGENDPDLVPATHPRFCDAIKTDAAYNALFTRTFQN
+KTFHVYRLKKKRKKNTKGSSEPSVTQ
+>XP_006779757.1 gi|583968598|ref|XP_006779757.1| PREDICTED: MTSS1-like protein-like isoform X1 [Neolamprologus brichardi]
+MLGEITHLQAIIDDLTVLTTDPHKLPPASEQVIKDLKGSDYSWSYQTPPSSPSSSGSRKS
+SMCSSVNSTHSSASRSSGGGGSGGVGGGGSLPHSPTSSSSSSCRYRSSLPHQPPPPGGIA
+AHRLSSVSSHDSGFVSQDANIYSKPPSPMPSDITSQKSSSSASSEASETCQSVSECSSPT
+TFGSSFATFRPALFHSGSTRPLSVILPVPASPPYIRPPGSSSSSPTSKVPMWKDWSKAGQ
+YEQPVAAAAVQRRREPLDRLRESEASPGSQGYAGPSHPDDGQRARMTPATIAAKHGEEVS
+PAASDLAMVLTRGLSMEQQKSNRDSLQYSSGYSTETTTPSCSEDTIPSQGSDYDCYSVNG
+DAEGPDGQTEFDKSSTIPRHSNIAQNYRRMIQTKRPASTAGLPTGVLGPGAHGIPGQPGG
+AGGGGTGTPGTATIRRTPSTKPGVRRTLSSAGPIPIRPPIVPVKTPTVPGDSHSPGAGGG
+HAGGVPVRVGSEECVFFTGAEDSQGALDYVKASPKRLSLPNTAWGSGAALEVYAQQHGGL
+AIGTGSGTGSEEDQMIAANRHSLVEKIGELVASAHALGEGQFPFPALPDDPAPPPTGPTD
+TETGTEGAEGSGDMLTTIRRGVRLRKTVSNDRSAPRIL
+>XP_006779758.1 gi|583968600|ref|XP_006779758.1| PREDICTED: MTSS1-like protein-like isoform X2 [Neolamprologus brichardi]
+MLGEITHLQAIIDDLTVLTTDPHKLPPASEQVIKDLKGSDYSWSYQTPPSSPSSSGSRKS
+SMCSSLPHQPPPPGGIAAHRLSSVSSHDSGFVSQDANIYSKPPSPMPSDITSQKSSSSAS
+SEASETCQSVSECSSPTTFGSSFATFRPALFHSGSTRPLSVILPVPASPPYIRPPGSSSS
+SPTSKVPMWKDWSKAGQYEQPVAAAAVQRRREPLDRLRESEASPGSQGYAGPSHPDDGQR
+ARMTPATIAAKHGEEVSPAASDLAMVLTRGLSMEQQKSNRDSLQYSSGYSTETTTPSCSE
+DTIPSQGSDYDCYSVNGDAEGPDGQTEFDKSSTIPRHSNIAQNYRRMIQTKRPASTAGLP
+TGVLGPGAHGIPGQPGGAGGGGTGTPGTATIRRTPSTKPGVRRTLSSAGPIPIRPPIVPV
+KTPTVPGDSHSPGAGGGHAGGVPVRVGSEECVFFTGAEDSQGALDYVKASPKRLSLPNTA
+WGSGAALEVYAQQHGGLAIGTGSGTGSEEDQMIAANRHSLVEKIGELVASAHALGEGQFP
+FPALPDDPAPPPTGPTDTETGTEGAEGSGDMLTTIRRGVRLRKTVSNDRSAPRIL
+>XP_006779759.1 gi|583968603|ref|XP_006779759.1| PREDICTED: G-protein coupled receptor 64-like [Neolamprologus brichardi]
+MCFSPQIPDPSITKKDQEILTRITVIGCSISLFTLVIAILLFITNRKLRQDVSMKVHINL
+VIALMLLNLHFLPSQAVAAGSPSGLCLYMALLLHYSLLATFSWMALEGFHLYLLLVKVFN
+IYVKKYLLKLSVVGWGVPAMIVSVVVIIDRTFYGLAPLDTSHSSTAM
+>XP_006779760.1 gi|583968609|ref|XP_006779760.1| PREDICTED: probable RNA polymerase II nuclear localization protein SLC7A6OS-like [Neolamprologus brichardi]
+MDPNTTILRVKRKRGTDPADALLLACKRIRPETSQSSGETVPEPNEAEVENSVFKLVATV
+ATQEAPVQTQVRQALARPRTAHALRPSAASSQRILGDLRSTKWSTRREERYRILSSHRAG
+LSAPAEQQTPQMGASECVEETGKETDKCWGLGEIQVVDLIHEDGEDQDKPSGKILSSEPD
+EILCNNTKMLRERLSISGDRLGEEHREQDDGYVYDLYYQETVTPGWIQDILSVRAYADEG
+ELVPDLVVHEEEVYEDEDDENEEGNWRNDYPDEESDTDSDREERYGGYWEEEHSYSRRSW
+QRYQREVTHELGCRGDDDNGDDDDDDGDKYDSD
+>XP_006779761.1 gi|583968612|ref|XP_006779761.1| PREDICTED: Y+L amino acid transporter 2-like [Neolamprologus brichardi]
+MANREESKKMNGNSGDSSTLLETPKESMQLKKEISLLNGVSLIVGNMIGSGIFVSPKGVL
+IYSASYGLSLVIWAIGGLFSVIGALCYAELGTTITKSGASYAYILESFGGFIAFIRLWTS
+LLIIEPTSQAVIAITFANYLVQPLFPTCEPPYAASRLIAAACVCLLTFINSAYVKWGTRV
+QDIFTYAKVAALIVIIVTGIVKLCQGYTGNFESSFQGSSTDPGDIALALYSALFSYSGWD
+TLNFVTEEIKSPERNLPMAIAISMPIVTIIYILTNVAYYAVLDASAILASDAVAVTFADH
+TLGVMSWTIPIAVALSCYGGLNASIIAASRLFFVGSREGHLPDALSMIHIQRFTPIPALI
+FNCVMSLIYLTVEDVFQLINYYSFSYWFFMGLSIAGQIYLRLKEPDRPRPLKLSLLYPVV
+FCLCTIFLVAVPLYSDTVNSLIGIAIALSGVPVYFLGVYLPESKRPPVITKLLRSLTDFT
+QYTCFCVLTEMDKSQ
+>XP_006779762.1 gi|583968614|ref|XP_006779762.1| PREDICTED: G-protein coupled receptor 64-like [Neolamprologus brichardi]
+MGIEVLHTFWLVYMVFTPRLKPYIWNLVGFALPAVPVVILAPIGDIYGPIEVPPSEDPEN
+PYKMCWMDITENKGWLAFCFTNVMILALLVSSGLVMLFLVYRQIRTRDEWKQNRVAFLSI
+WGLSCLYGTTWGLAFLEFEPISTFILFITCILNSFQGFFLMLRFCMLDWMQKQAGGSGLG
+SSSTGSTRQHMLQAQERS
+>XP_006779763.1 gi|583968616|ref|XP_006779763.1| PREDICTED: synapse-associated protein 1-like [Neolamprologus brichardi]
+MLKGLGTWLGLEGPTVTETSVDKEKLNVEQEEKVVEAQTEVNKQQPADQDGTPEAEQENS
+DQSTGLGGYIFSFASSATKKISDSMVETAQTIKKTVEEGKIDGIIDKTFLGDFQKEQEKF
+VQEKKAKKSEAAVPPWVGYNEEETIQQQILALSADKRNFLRDPPAGVQFHFDMEQMYPLA
+AVMLEEDELLNRMRFDLVPKHVKEEMFWRNYFYRVSLIKQSAQLTALAAQQQRNDSVDKG
+ASVSPEDIVLTDNVRPKTPPVSISDIQKPTHEEDEEISTSPGVSEFVSDAFDSTAINQED
+LRKEMEQLVLDKKDSPSPDDESADWEKELQQELQEYEVVTESGNKDDQWDQEIEKMLQSD
+DS
+>XP_006779764.1 gi|583968618|ref|XP_006779764.1| PREDICTED: LOW QUALITY PROTEIN: probable phosphatase phospho2-like [Neolamprologus brichardi]
+MKILMVFDFDHTVVDANSDTWVVRCLPDKTLPGSVENSYRKGYWTEYMGRVLNYIGEQKV
+SPDRVRSVMETIPFTAGMTELLTFIAENKNAIDCIVISDSNTLFIEWILHAAGLQAAVDK
+VFTNPAKLNELGHVEVQCYHSHACDQCPVNLCKKKVLELYLSEQSDAGVEYEQIFYAGDG
+GNDLCPTSCLRGRDVVMPRKGYTLEKLLAKLEGQEGNFSVRAKNIAWSSGTDILRELKAS
+MQSXPWHMKYYKF
+>XP_006779765.1 gi|583968620|ref|XP_006779765.1| PREDICTED: cadherin-8-like isoform X1 [Neolamprologus brichardi]
+MPKRSEEMLTDLWLSLLLVWITCVLSVSMTPIIGQSKSTQTGGSAVVASGVGEGQRLLSR
+AKRGWVWNQMFVLEEFSGPDPILVGRLHTDKVENDTARYSLAGEGAGTIFAINEKTGDIH
+AMKRLDREEKAEYTLTAKVTNGITGQLLEPMTEFIIKVQDINDNAPKFTEGPYHAAVEEM
+SAVGTSVITITATDADDPVYGNSAKLVYSILEGQPYFSVDPNSATIRIALHGMDREMRED
+YQVVIQAKDMGGHMGGLSGTTTVSITLQDINDNPPKFSKSLYEFVIPEDLPLGKEGGKVK
+ANDRDIGENAKSTYSIIEGDDQGVFEIITNATTQEGILQLRKPLDYESKRNYTLKVEATN
+IRSEPRSNGPFKDTATVKIVVEDSDEPPVFSKPMYLLEVDENAPINKIIGTVTARDPDAT
+GSPIRYFIDRHTDLERQFNINVDNGRITLAKPLDRETDMWHNITVTATEVRNHSQISRAV
+VAIRVMDINDNAPEFATEYETFLCENGKPGQVIQTVSAVDKDDPIQGHYFDYRLVPEMLN
+NPNFTIKNNQDNSISVLAKHDTFRRQKQEMYFLPIIVTDNGNPPMSSTNTLTIRVCGCSK
+DGIVQSCNVEAYVLPIGLSMGALIAILACIILLLVIVVLFVTLRRHKNEPLIIKDDEDVR
+ENIIRYDDEGGGEEDTEAFDIATLQNPDGINGYLPRKDIKPDLQFMPRAGQHSGPNGVDV
+DEFINVRLHEADNDPTAPPYDSIQIYGYEGRGSIAGSLSSLETASSDSDQNYDYLREWGP
+RFRRLGELYSVGESDRET
+>XP_006779766.1 gi|583968622|ref|XP_006779766.1| PREDICTED: cadherin-8-like isoform X2 [Neolamprologus brichardi]
+MPKRSEEMLTDLWLSLLLVWITCVLSVSMTPIIGQSKSTQTGGSAVVASGVGEGQRLLSR
+AKRGWVWNQMFVLEEFSGPDPILVGRLHTDKVENDTARYSLAGEGAGTIFAINEKTGDIH
+AMKRLDREEKAEYTLTAKVTNGITGQLLEPMTEFIIKVQDINDNAPKFTEGPYHAAVEEM
+SAVGTSVITITATDADDPVYGNSAKLVYSILEGQPYFSVDPNSATIRIALHGMDREMRED
+YQVVIQAKDMGGHMGGLSGTTTVSITLQDINDNPPKFSKSLYEFVIPEDLPLGKEGGKVK
+ANDRDIGENAKSTYSIIEGDDQGVFEIITNATTQEGILQLRKPLDYESKRNYTLKVEATN
+IRSEPRSNGPFKDTATVKIVVEDSDEPPVFSKPMYLLEVDENAPINKIIGTVTARDPDAT
+GSPIRYFIDRHTDLERQFNINVDNGRITLAKPLDRETDMWHNITVTATEVRNHSQISRAV
+VAIRVMDINDNAPEFATEYETFLCENGKPGQVIQTVSAVDKDDPIQGHYFDYRLVPEMLN
+NPNFTIKNNQDNSISVLAKHDTFRRQKQEMYFLPIIVTDNGNPPMSSTNTLTIRVCGCSK
+DGIVQSCNVEAYVLPIGLSMGALIAILACIILLLVVLFVTLRRHKNEPLIIKDDEDVREN
+IIRYDDEGGGEEDTEAFDIATLQNPDGINGYLPRKDIKPDLQFMPRAGQHSGPNGVDVDE
+FINVRLHEADNDPTAPPYDSIQIYGYEGRGSIAGSLSSLETASSDSDQNYDYLREWGPRF
+RRLGELYSVGESDRET
+>XP_006779767.1 gi|583968626|ref|XP_006779767.1| PREDICTED: T-cell immunomodulatory protein-like [Neolamprologus brichardi]
+MIWTLKLITLAFLLLLGGQYNTFALQDVTADLFGPGNFGTVAAFGDFNSDKQTDIFTIKE
+QSDLVIFLADSKPPYFKPKVQAKNILGKDITSVVPGDYDGDSQMDVLLTAKNGPKTEVFI
+FWGHNQTLDIGGGIKLNYTFSDQPLVMDFNGDMIPDVFGVISSSSSVVCYLTKRTEVCSK
+ALSLTGNMRTPHSNAFIDLDRDFTADLFLTMNNDRMFETWLNKDGNFTKTDVMSKPDETT
+LIGQSSFVDFDGDGYQDHLLPACLDTSCQRSTIYLAKSGSRDSKWIPVLSDFKRKETIWG
+FVPDNLSQPPALHLGDYNLDGFPDALVVLQNKSGSGQQAFLLENVPCNSETCHSVGRMFH
+IHWDQSDLGAIKNAVRATFFDIYEDGILDMLVQSKAEGKQDLRIHALKNNFEADAYFVKV
+MVLSGLCSNDCPEGVKPFGVNQPGPYVMYTTVDSNGYLKNASAGQLSQSAYFSLQLPYTV
+LGLGRSANFLDHLFVGIPRQPGETEIRNKEWTAIIPNSQLIVMPFPHDTPRSWSAKLYLT
+PSNSVLLTAIALIGVCVFILVIIGILHWQEKKADDREKRQEAHRFHFDAM
+>XP_006779768.1 gi|583968628|ref|XP_006779768.1| PREDICTED: neuropilin and tolloid-like protein 2-like [Neolamprologus brichardi]
+MHRAWVLFFLIEEGFALAQRTKESPSDYGGQRPNQNDCGTWIRNINGGSFTSPNYPNPYP
+PNKECVYILEALPRQRIQLSFDKNYYIEPSFECRFDHIEIRDGPFGFSPLIDRFCGGKNP
+EIVTSTGRFMWVKFTSDEELEGLGFRIEYTFIADPDFHLHVGGLLNPIPECQFNVGGWDG
+IIRSSQVEEEKRVKPGDALDCIWTIKAPSQSKIYLRFIDYQMEHSNECKKNFVAVYDGSS
+AIENLKAKFCSTVANDVMLNNDMGVVRMWADEKSRLSRFRMLFTSFIDPPCNDNTFFCHS
+NMCINNSLVCNGVQNCVYPWDENHCKEKRSKGLFHQITKTHGTVIGVSSGIVLVLLIISI
+LVQMKQPRKKVVARRPGVFNKAGFQEVFDPPHYELFSLRDKEMSSDLADLSEELDSFHKM
+RRSSTMSRCVHEHHCGSQGSVATGGGSMKHSRTTLSSMELSYHNDFSKPPPMKTFNSTAS
+YKKSCYGYKQHSQTHDCDQQVIEDRVTEETTCEIYGRGATGVGGGAAGGGAMGGGGASGI
+AGGAIGGAVGITGGVAMGGGMGGGMSMAGAMSMAGPSGIAGGIGGMGGACGTLSVRGNSA
+RNSTTIVDPQQRSMSMDF
+>XP_006779769.1 gi|583968630|ref|XP_006779769.1| PREDICTED: dnaJ homolog subfamily A member 2-like [Neolamprologus brichardi]
+MSNVVDTKLYDILGVSPSATENELKKAYRKLAKEYHPDKNPNSGDKFKEISFAYEVLTNP
+EKKELYDRYGEQGLREGGGGGPGMDDIFSHIFGGGLFGFMGGQSSRSRNGGRRRGEDMVH
+PLKVSLEDLYNGKTTKLQLSKNVLCSTCNGQGGKTGAVQKCTACRGRGMRIMIRQLAPGM
+VQQMQSVCTDCNGEGEVISEKDRCKKCEGKKVVKEVKILEVHVDKGMKHGQKITFGGEAD
+QAPGVEPGDIVLVLQEKEHETYRRDGNDLFMNHKIGLVEALCGFQFMLKHLDGRQIVVKY
+PAGKVIEPGSVRMVRGEGMPQYRNPFEKGDLYIKFDVQFPDNNWISPEKLGELEDMLPSR
+SEPPIISGDTEEVDLQDYDVSQSSSSGNRREAYNDSSDEEGSHHGSGVQCAHQ
+>XP_006779770.1 gi|583968632|ref|XP_006779770.1| PREDICTED: low-density lipoprotein receptor-related protein 3-like [Neolamprologus brichardi]
+MGLTELPLLLPLLGLLWLRCALLCAGCSEQVEIHTERRGVIYSPSWPLNYPAGVNCSWHI
+QGGQGEVITISFRNFDLAESGKCTGDWLLLTPTWKRESRLCGSVLPQPFISTRGRVWLFF
+HSQANSSGQAQGFRLSYIRGHLGQSSCQSDEFLCGNGKCLPRSWKCNGQDECGDASDERS
+CLPTPTEAQPGLCPFGSLPCTEGQSTRCLPTALRCNGARDCHDGSDELGCPDTTCGKRLG
+NFYGSFASPDFFRANRSGDTELRCSWLLDTQDPKPIVLQLDLQLGPGDLLHVYDGLLQRA
+EHLLQVFSYHNNRRPALLESSRGQMSVLYMAQPHSPGHGFNATYQVKGYCFPGERPCGSD
+QGCYSERQRCDGYWHCPSGRDEEGCPMCPDGEFPCEGGTGMCYPASERCNNQKRCPDGSD
+EKNCYDCQPGNFHCGTNLCIFETWRCDGQEDCLDGSDERDCLAAVPRKVITAALIGSLVC
+SLLLVIALGCALKLHSLRNREYRAFETQMTRMEADFVQREAPPSYGQLIAQGLIPPVEDF
+PVYNPTQASVLQNLRLAMRRQIRRHSTRRSTSSSSRRRLGHLWNRLFRSGGRGRGHAPLL
+DPPGPTQITLGLHSYRTVGEQGPQSRAVPAGGSDVVGVDLPESPASPLSFHSVDSPEEEE
+DLSPVSRDGSRAAESSPPTPCQSDSSVQSGLPLSPQEASVPLCPPRASRKLVLELAVNLK
+GVSLRRYSPLGPLSPISPPVFPSSSQTPSTQPQPQGSEVTSPTEPLFSSVKPEDSDSQFT
+VNVPSRDETKPEARSSLCRFGRSISEEGGDLGRETLC
+>XP_006779771.1 gi|583968634|ref|XP_006779771.1| PREDICTED: LOW QUALITY PROTEIN: rhophilin-2-like [Neolamprologus brichardi]
+MTDALLSNGINDGGGDKNYFKKGCNPFAQTGRSKLQNTRASLNQQIIKQMRMRAGAENLL
+KATSNSKVKEMVLLELSYVNSNLQLLMSELEGLNSSVEVYQNNQSSTQRILVPVFLNETT
+VEFSILKIXSDFILEHYSEDGKTFEDEIADFMDLRQACRTPSRSEAGVELLGKYYSHLPL
+IESRFFSPTRQTGIFFTWYTAFLGLKYQQNHICLIXFCFLFFFLLLFSVKSLMIXITSTN
+CSFLALIRFQLVPTALSCPGVLNNLKETFTHTPSYDMSPAMLSMLIRLMLAQAQECLFEK
+IALPGIRNQFYSLMKVAQEAAKVSEIYDQVHQCMIQTPVKDNVPFFWSTMSQIKTNHYRS
+MAHYFVASALLDHQLGPGDDEDKQEKTLSQVYDSLPEGCTALDILKKKDERQRIGKAHIR
+RAIFGHEEALRIYGLCKNTNNLEVLQEILKASHQRSVNKHSENENEEEFADYMEAPKIIS
+KTEHKAEMEFPAAAKVKVIDFFQRLGPQSVFSAKQRWTAPRTIRVRSDDRDLGFTLKGDS
+PVQVVSLDPLCAAAADGLKEGDYIITVGDTECKWMSVSDVMRLLKDVDEEGIDIQVVSMM
+DNSTAMPTKSATFCGNLPKTYSMICLAYNEDDKNSKVRKVAKKSSFLSWGLKNKMKSAST
+LSLPTADKAGALPWNKPCPTFPSSSSYNNDSGLY
+>XP_006779772.1 gi|583968636|ref|XP_006779772.1| PREDICTED: E3 ubiquitin-protein ligase RNF182-like [Neolamprologus brichardi]
+MKDSAAETSGVEEGESHTLGQEHDLKMSCPQTEFEEKESPPPEELECKICYQRYNVHHRK
+PKILDCLHRVCARCLIKILDIADSAGCISCPFCRHQTEITEQEISALPDDVNIVSHLVMR
+DKSWNSDQNREVVLTPKSFSSSSPSHDSSNCLVITIMEVQRDSQHSPSQNGSSDVYAEQS
+LDSVSIGSNGPADQDALSKFCNHVPRILVWLLGFLYFGSLPLGIYLLVIQRVTLGIVCVS
+LVPSSLTVCLVYGFCQCLCQGMCDCSSRG
+>XP_006779773.1 gi|583968638|ref|XP_006779773.1| PREDICTED: centrosomal protein of 89 kDa-like [Neolamprologus brichardi]
+MLRFSFRREKDKEFKHIAHGLIPAASIAPKPAVPRTPPPRSPNPSPERPRSALAAAILSS
+SLTGQTWAIPPARLMSLSESGQSESFTSEPNISTALYTRDRWSEDLVSRPRLSSPDQSEG
+ELEDKEQEVVDEEDGEEHVYHTLDRRQNSSLTESVYALPLKAKSVFKSTTPLPTQTSGRR
+ESSPDFTEETSGQSPEPKEKKMSVRKTLENWKDDVPTTPTISTAGHPRQASQAKSPKDLR
+ELPPEPSNTYSELRKKVVRDRREKNTRMVDKEKLQEERLQRLEREISDSKAFSNQRSSAG
+SQAELQNLRQHAQELVDENDALKLTVHRLNVELSHYQARFRPLSKEEHSKVSGLPNTGSP
+PPWLVDMKYSSPLLLAYEDRMNEKDAILQTTEENMEKLHVQLEEVIKENEKLHDEITKTG
+AVNQKDCYQIQQQAVLVLQENQVLINQLEAQHAEAKDTHSRHNTEVAKVSKKMMLLEVEN
+QRLEGDLEESRRELQKNKRDLQVLQARLKDAVTWDEHCSIAGKLRRQLEQHESRSKDGID
+KLLLRVSNLQEENRILALDKAQLTAKTRAMEAELELSRQASRKAERRMSMLKQQKAECVL
+KEEKTRHYLGAVISVAEHISQERDRLLHMASSLQQEKQRFISRILSGTVRFGKLQEEVKV
+YRSQASTRLAALEEAVEGRTVSYQTEILHLQTLLRERQEAEEKLLQSKREIEEELEVVWE
+AATRENQQMRETLLDSKLTGDLHSWPAHAPDEITTSSQQQQHKHGLDFYC
+>XP_006779774.1 gi|583968640|ref|XP_006779774.1| PREDICTED: myocyte-specific enhancer factor 2A-like [Neolamprologus brichardi]
+MGRKKIQITRIVDERNRQVTFMKRKFGLMKKAYELSVLCDCEIALIIFNGSNKLFQYAST
+DMDKVLLKYTEYNEPHESRTNSDIVEALNKKEHRGCDSPDADASYVLTPNTEEKYKKINE
+EFDNMMKTHKISTGQQQQQHQQHFMHVAPGSMAYSHSGGGGATSQALAAATAALADGGIL
+PSPHSHLHRNINSSQRPPSAGGGLQGSSELALQNGSGPTVNGFGKIIPSKSPPPPPPHGN
+SMVPTSRKTDLRVVIPHSKGMMQTLNNQRMSSSQSSQPLSTPVVSITTPSLPHQSLVYAG
+IGSAYNDYSLNSGELSGFNSAAGPSLSSMAAWEQQQLSSMG
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/part3.fasta	Mon Sep 21 15:40:14 2020 +0000
@@ -0,0 +1,343 @@
+>XP_006779775.1 gi|583968642|ref|XP_006779775.1| PREDICTED: COUP transcription factor 2-like [Neolamprologus brichardi]
+MAMVAWRNTEAVGDSQGTLSSPVSQVAPLSLPGELTGHMNPAPSLEIPQTAAAPQGAPPP
+NPSGNTVATTTNNNNSTSSSSSSSSLSMDKQQSQQIECIVCGDKSSGKHYGQFTCEGCKS
+FFKRSVRRNLTYTCRANRNCPIDQHHRNQCQYCRLKKCLKVGMRREAVQRGRIPTQSYHG
+QFALTNGDPLQCHSYLSGYISLLLRAEPYPTSRFGSQCLQNNNILGIENICELAARMLFS
+AVEWARNIPFFPDLQVPDQVALLRLTWSELFVLNAAQCSMPVHAAPLLAAAGLHASPMSA
+DRVVAFMDHIRVFQEQVEKLKVLHVDSAEYSCIKAIVLFTTDACGLSDVAHVEGLQEKSQ
+CALEEYVRSQYPNQPNRFGKLLLRLPSLRSVSSSVIEQLFFVRLVGKTPIETLIRDMLLS
+GSSFNWPYMAIQ
+>XP_006779776.1 gi|583968644|ref|XP_006779776.1| PREDICTED: solute carrier organic anion transporter family member 3A1-like [Neolamprologus brichardi]
+MQVKNQICTERSSNDDPEQDDNQKKTSCFSNIKIFLVSECALMLAQGTVGAYLVSVLTTL
+ERRFNLQSADVGVIASSFEIGNLALILFVSYFGAKAHRPRLIGCGGIVMALGALLSALPE
+FLTHQYEYEAGDSWHAEDGRDVCSNISRSENRDSGFKCGNRANTNMMYLLLIGAQVLLGI
+GATPVQPLGVSYIDDHVHRKDSSLYIGILFSTLVFGPACGFILGSVCTKVYVDAVFIDTS
+TLDITPDDPRWIGAWWGGFLLCGALLFLSALFMFGFPQALDEQDMDSGAESEQAMLPSSL
+SLEFQGSKPNGAIHGFDINSGLSVCQHLRVIPRVTRHLLSNPVFSCITLAACMEIAVVAG
+FAAFLGKYLEQQFNLTTSSANQLLGMTAIPCACLGIFLGGLLVKKLNLSALGAVRMAMLV
+NLVSTACYVSFLFLGCDTGPVAGVTVAYGNETLQSWQQPESACISNCNCYTASVSPVCGS
+NGVTYLSACFAGCTKPNLTNCACISSNSEEAVALPGKCPSPGCQQAFLTFLCVICVCSMI
+GAMAQTPSVIILIRTVSPELKSYALGVLFLLLRLIGFIPPPLIFGMGIDSTCLFWSSVCG
+EKGACMLYDNVAYRHLYVSIAIVLKSSAFLLYTTTWQCLRKNYRKYIKNNEGYLTPTELF
+ASNVTLDNLGKDITQNPTNRTKFIYNLEDRETCDNMESVL
+>XP_006779777.1 gi|583968646|ref|XP_006779777.1| PREDICTED: gonadotropin-releasing hormone II receptor-like isoform X1 [Neolamprologus brichardi]
+MNGSSCCDPAAVMYQQRSGLDLNASCEWPDPHCNWTSVDGALQLPTFSTAAKIRVIVTFI
+LCGISTFCNLAVLWAANGHKRKSHVRVLIINLTAADLLVTFIVMPVDAVWNITVQWLAGD
+LACRFLMFLKLQAMYSCAFVTVVISLDRQSAILNPLGIAMVRKRNRVMLMVAWIMSALLS
+IPQMFIFHNVTITYPANFTQCTTRGSFVTHWQETAYNMFTFCCLFLLPLVIMIICYTRIF
+VQISKQMTKKNMPSNEPHLRCSKNNIPKARMRTLKMSIVIVICFIVCWTPYYLLGLWYWF
+FPDDLEGKVSHSLTHILFIFGLFNACLDPIIYGLFTIRFQKGLRNCYRKAAVMSSLETNA
+VIMESLKCTGSVLPSKRGMTSGEKDISSEQAEAKSTDNSV
+>XP_006779778.1 gi|583968648|ref|XP_006779778.1| PREDICTED: gonadotropin-releasing hormone II receptor-like isoform X2 [Neolamprologus brichardi]
+MNGSSCCDPAAVMYQQRSGLDLNASCEWPDPHCNWTSVDGALQLPTFSTAAKIRVIVTFI
+LCGISTFCNLAVLWAANGHKHAVWNITVQWLAGDLACRFLMFLKLQAMYSCAFVTVVISL
+DRQSAILNPLGIAMVRKRNRVMLMVAWIMSALLSIPQMFIFHNVTITYPANFTQCTTRGS
+FVTHWQETAYNMFTFCCLFLLPLVIMIICYTRIFVQISKQMTKKNMPSNEPHLRCSKNNI
+PKARMRTLKMSIVIVICFIVCWTPYYLLGLWYWFFPDDLEGKVSHSLTHILFIFGLFNAC
+LDPIIYGLFTIRFQKGLRNCYRKAAVMSSLETNAVIMESLKCTGSVLPSKRGMTSGEKDI
+SSEQAEAKSTDNSV
+>XP_006779779.1 gi|583968650|ref|XP_006779779.1| PREDICTED: lactoylglutathione lyase-like [Neolamprologus brichardi]
+MSDKGLSDEAVAAVCKDGDPITKDFMMQQTMLRVKDPNKSLDFYTRILGMTLLQKFDFPS
+MRFSLFFLGYEDKKEIPADVKEKTAWTFSRRATLELTHNWGSESDDSQSYHNGNSDPRGF
+GHIGIAVPDVYAACKLFEEQGVTFVKKPDDGKMKGLAFIQDPDGYWIEILSPNNMVSITS
+K
+>XP_006779780.1 gi|583968652|ref|XP_006779780.1| PREDICTED: bifunctional glutamate/proline--tRNA ligase-like isoform X1 [Neolamprologus brichardi]
+MALNLTINTSNPPLGALLTAEHVKSSVQVSVEEGKDTRLHISDSVQFSDDNSICRYLARV
+APALGLYGSNMMEQTEVDHWLEFSARSLCNQPDLTVALAELDKALSLRTFLVGHALTLAD
+LSVWAALKDHGEWPKQGKSFSHVSRWFFFLSSQVPFTAVGNKYASKKASMNKTKSEGKKA
+DVGKFVELPGAEMGKVVVRFPPEASGYLHIGHAKAALLNQHYQVTFKGKLIMRFDDTNPE
+KEKEDFEKVILEDVAMLQIHPDQFTYTSDHFPIIMKFAEKLLAEGKAYIDNTPPEQMKQE
+REQRVESTCRNNSVEQNMKMWSEMKAGTEYGQTCCMRAKIDMNSNNGCMRDPTLYRCKNA
+AHPRTGNTYNIYPTYDFACPIVDSLEGVTHALRTTEYHDRDEQFYWIINALGLRKPYVWE
+YARLNLNNTVLSKRKLTWFVDQGYVDGWDDPRFPTVRGVLRRGMTVEGLKQFIAAQGGSR
+SVVNMEWDKIWSFNKKLPVSCLKVIDPVAPRYTALSSSYVVPVSVPEATEEMKEIAKHPK
+NAEVGMKEVWFGPRVLIEGADAETFTEGETVTFINWGNLIITKINKGADGKVLSMKASLN
+LDNKDYKKTTKITWLAETNNSLPVPAICVNYQPLISKAVITKDDNFKDYINKHSKLEEKM
+LGDPCLKNLKKGDIIQLQRRGFYICDQPYEPLSPNSCKESPCVLIYIPDGHTKEMPTAGS
+KEKSKTQASDNTPASPAKAPKTSVPAPASAPAADLFSSIVAQGEAVRLLKAAKAPKDEVD
+KAVKQLLSLKEQFKQQTGVEYKPGMAPPASTPAPPTSSSDSTSCPYTRVVQQGELVRKLK
+AEQAPKDQIDAAVKQLLALKAEFKKLTGQDYKPGMATPAPSASSPVTATSSSSPPSSSSG
+LYEHVAQQGEVVRKLKSEKAPKDQVDAAVKQLLALKEEYKRITGQEYKPGATPPQKAPAP
+VQNGSTNDLYEKVAEQGELVRKLKAEKAPKDQVDAAVKQLLALKAEYKQNTGKDYKPGLQ
+APATSAQTQTQASSASTQSNSSPQAQELFSQVSQQGDLVRKLKSEKAPKDQVDEAVKTLL
+DLKSKYKTLTGQDYKPVAAAGGTGGEDKNRKEKENKSEKQGGGGGGKKGKGDKGGQSKES
+SGGAGGAGEGQGPKKQTRLGLEAKKEENLADWYSQVITKAEMIEYYDVSGCYVLRPWAFS
+IWESIKDFFDKEIKKLGVENCYFPMFVSQAALEKEKSHIADFAPEVAWVTRSGKTELAEP
+IAVRPTSETVMYPAYAKWVQSHRDLPIKLNQWCNVVGWEFKHPQPFLRTREFLWQEGHTA
+FATKEEAAEEVLQILDLYARVYEELMAIPVVKGRKTEKEKFAGGDYTTTVEAFISASGRA
+IQGATSHHLGQNFSKMFEIVFEDPKRPGEKQLAFQNSWGITTRTIGVLTMVHGDDMGLVL
+PPRVACLQVVIIPCGITATLPEQEKEVLLAQCTKYLKRLQEAGIRVKSDLRDNYSPGWKF
+NHWELKGVPIRLEVGPKDMQQKQCVAVRRDSGAKVTIAEAEVEKNLLNMLEDIQNSLFKK
+ASDDLKSHMVAADTMEQFQKELDQGKIVQIPFCGGIECEDWIKKTTAKDQDLEPGAPSMG
+AKSLCIPFTPLKTLQPGQKCVSGKEPAQYYTLFGRSY
+>XP_006779781.1 gi|583968654|ref|XP_006779781.1| PREDICTED: bifunctional glutamate/proline--tRNA ligase-like isoform X2 [Neolamprologus brichardi]
+MALNLTINTSNPPLGALLTAEHVKSSVQVSVEEGKDTRLHISDSVQFSDDNSICRYLARV
+APALGLYGSNMMEQTEVDHWLEFSARSLCNQPDLTVALAELDKALSLRTFLVGHALTLAD
+LSVWAALKDHGEWPKQGKSFSHVSRWFFFLSSQVPFTAVGNKYASKKASMNKTKSEGKKA
+DVGKFVELPGAEMGKVVVRFPPEASGYLHIGHAKAALLNQHYQVTFKGKLIMRFDDTNPE
+KEKEDFEKVILEDVAMLQIHPDQFTYTSDHFPIIMKFAEKLLAEGKAYIDNTPPEQMKQE
+REQRVESTCRNNSVEQNMKMWSEMKAGTEYGQTCCMRAKIDMNSNNGCMRDPTLYRCKNA
+AHPRTGNTYNIYPTYDFACPIVDSLEGVTHALRTTEYHDRDEQFYWIINALGLRKPYVWE
+YARLNLNNTVLSKRKLTWFVDQGYVDGWDDPRFPTVRGVLRRGMTVEGLKQFIAAQGGSR
+SVVNMEWDKIWSFNKKVIDPVAPRYTALSSSYVVPVSVPEATEEMKEIAKHPKNAEVGMK
+EVWFGPRVLIEGADAETFTEGETVTFINWGNLIITKINKGADGKVLSMKASLNLDNKDYK
+KTTKITWLAETNNSLPVPAICVNYQPLISKAVITKDDNFKDYINKHSKLEEKMLGDPCLK
+NLKKGDIIQLQRRGFYICDQPYEPLSPNSCKESPCVLIYIPDGHTKEMPTAGSKEKSKTQ
+ASDNTPASPAKAPKTSVPAPASAPAADLFSSIVAQGEAVRLLKAAKAPKDEVDKAVKQLL
+SLKEQFKQQTGVEYKPGMAPPASTPAPPTSSSDSTSCPYTRVVQQGELVRKLKAEQAPKD
+QIDAAVKQLLALKAEFKKLTGQDYKPGMATPAPSASSPVTATSSSSPPSSSSGLYEHVAQ
+QGEVVRKLKSEKAPKDQVDAAVKQLLALKEEYKRITGQEYKPGATPPQKAPAPVQNGSTN
+DLYEKVAEQGELVRKLKAEKAPKDQVDAAVKQLLALKAEYKQNTGKDYKPGLQAPATSAQ
+TQTQASSASTQSNSSPQAQELFSQVSQQGDLVRKLKSEKAPKDQVDEAVKTLLDLKSKYK
+TLTGQDYKPVAAAGGTGGEDKNRKEKENKSEKQGGGGGGKKGKGDKGGQSKESSGGAGGA
+GEGQGPKKQTRLGLEAKKEENLADWYSQVITKAEMIEYYDVSGCYVLRPWAFSIWESIKD
+FFDKEIKKLGVENCYFPMFVSQAALEKEKSHIADFAPEVAWVTRSGKTELAEPIAVRPTS
+ETVMYPAYAKWVQSHRDLPIKLNQWCNVVGWEFKHPQPFLRTREFLWQEGHTAFATKEEA
+AEEVLQILDLYARVYEELMAIPVVKGRKTEKEKFAGGDYTTTVEAFISASGRAIQGATSH
+HLGQNFSKMFEIVFEDPKRPGEKQLAFQNSWGITTRTIGVLTMVHGDDMGLVLPPRVACL
+QVVIIPCGITATLPEQEKEVLLAQCTKYLKRLQEAGIRVKSDLRDNYSPGWKFNHWELKG
+VPIRLEVGPKDMQQKQCVAVRRDSGAKVTIAEAEVEKNLLNMLEDIQNSLFKKASDDLKS
+HMVAADTMEQFQKELDQGKIVQIPFCGGIECEDWIKKTTAKDQDLEPGAPSMGAKSLCIP
+FTPLKTLQPGQKCVSGKEPAQYYTLFGRSY
+>XP_006779782.1 gi|583968656|ref|XP_006779782.1| PREDICTED: bifunctional glutamate/proline--tRNA ligase-like isoform X3 [Neolamprologus brichardi]
+MALNLTINTSNPPLGALLTAEHVKSSVQVSVEEGKDTRLHISDSVQFSDDNSICRYLARV
+APALGLYGSNMMEQTEVDHWLEFSARSLCNQPDLTVALAELDKALSLRTFLVGHALTLAD
+LSVWAALKDHGEWPKQGKSFSHVSRWFFFLSSQVPFTAVGNKYASKKASMNKTKSEGKKA
+DVGKFVELPGAEMGKVVVRFPPEASGYLHIGHAKAALLNQHYQVTFKGKLIMRFDDTNPE
+KEKEDFEKVILEDVAMLQIHPDQFTYTSDHFPIIMKFAEKLLAEGKAYIDNTPPEQMKQE
+REQRVESTCRNNSVEQNMKMWSEMKAGTEYGQTCCMRAKIDMNSNNGCMRDPTLYRCKNA
+AHPRTGNTYNIYPTYDFACPIVDSLEGVTHALRTTEYHDRDEQFYWIINALGLRKPYVWE
+YARLNLNNTVLSKRKLTWFVDQGYVDGWDDPRFPTVRGVLRRGMTVEGLKQFIAAQGGSR
+SVVNMEWDKIWSFNKKLPVSCLKVIDPVAPRYTALSSSYVVPVSVPEATEEMKEIAKHPK
+NAEVGMKEVWFGPRVLIEGADAETFTEGETVTFINWGNLIITKINKGADGKVLSMKASLN
+LDNKDYKKTTKITWLAETNNSLPVPAICVNYQPLISKAVITKDDNFKDYINKHSKLEEKM
+LGDPCLKNLKKGDIIQLQRRGFYICDQPYEPLSPNSCKESPCVLIYIPDGHTKEMPTAGS
+KEKSKTQASDNTPASPAKAPKTSVPAPASAPAADLFSSIVAQGEAVRLLKAAKAPKDEVD
+KAVKQLLSLKEQFKQQTGVEYKPGMAPPASTPAPPTSSSDSTSCPYTRVVQQGELVRKLK
+AEQAPKDQVDAAVKQLLALKEEYKRITGQEYKPGATPPQKAPAPVQNGSTNDLYEKVAEQ
+GELVRKLKAEKAPKDQVDAAVKQLLALKAEYKQNTGKDYKPGLQAPATSAQTQTQASSAS
+TQSNSSPQAQELFSQVSQQGDLVRKLKSEKAPKDQVDEAVKTLLDLKSKYKTLTGQDYKP
+VAAAGGTGGEDKNRKEKENKSEKQGGGGGGKKGKGDKGGQSKESSGGAGGAGEGQGPKKQ
+TRLGLEAKKEENLADWYSQVITKAEMIEYYDVSGCYVLRPWAFSIWESIKDFFDKEIKKL
+GVENCYFPMFVSQAALEKEKSHIADFAPEVAWVTRSGKTELAEPIAVRPTSETVMYPAYA
+KWVQSHRDLPIKLNQWCNVVGWEFKHPQPFLRTREFLWQEGHTAFATKEEAAEEVLQILD
+LYARVYEELMAIPVVKGRKTEKEKFAGGDYTTTVEAFISASGRAIQGATSHHLGQNFSKM
+FEIVFEDPKRPGEKQLAFQNSWGITTRTIGVLTMVHGDDMGLVLPPRVACLQVVIIPCGI
+TATLPEQEKEVLLAQCTKYLKRLQEAGIRVKSDLRDNYSPGWKFNHWELKGVPIRLEVGP
+KDMQQKQCVAVRRDSGAKVTIAEAEVEKNLLNMLEDIQNSLFKKASDDLKSHMVAADTME
+QFQKELDQGKIVQIPFCGGIECEDWIKKTTAKDQDLEPGAPSMGAKSLCIPFTPLKTLQP
+GQKCVSGKEPAQYYTLFGRSY
+>XP_006779783.1 gi|583968658|ref|XP_006779783.1| PREDICTED: bifunctional glutamate/proline--tRNA ligase-like isoform X4 [Neolamprologus brichardi]
+MALNLTINTSNPPLGALLTAEHVKSSVQVSVEEGKDTRLHISDSVQFSDDNSICRYLARV
+APALGLYGSNMMEQTEVDHWLEFSARSLCNQPDLTVALAELDKALSLRTFLVGHALTLAD
+LSVWAALKDHGEWPKQGKSFSHVSRWFFFLSSQVPFTAVGNKYASKKASMNKTKSEGKKA
+DVGKFVELPGAEMGKVVVRFPPEASGYLHIGHAKAALLNQHYQVTFKGKLIMRFDDTNPE
+KEKEDFEKVILEDVAMLQIHPDQFTYTSDHFPIIMKFAEKLLAEGKAYIDNTPPEQMKQE
+REQRVESTCRNNSVEQNMKMWSEMKAGTEYGQTCCMRAKIDMNSNNGCMRDPTLYRCKNA
+AHPRTGNTYNIYPTYDFACPIVDSLEGVTHALRTTEYHDRDEQFYWIINALGLRKPYVWE
+YARLNLNNTVLSKRKLTWFVDQGYVDGWDDPRFPTVRGVLRRGMTVEGLKQFIAAQGGSR
+SVVNMEWDKIWSFNKKVIDPVAPRYTALSSSYVVPVSVPEATEEMKEIAKHPKNAEVGMK
+EVWFGPRVLIEGADAETFTEGETVTFINWGNLIITKINKGADGKVLSMKASLNLDNKDYK
+KTTKITWLAETNNSLPVPAICVNYQPLISKAVITKDDNFKDYINKHSKLEEKMLGDPCLK
+NLKKGDIIQLQRRGFYICDQPYEPLSPNSCKESPCVLIYIPDGHTKEMPTAGSKEKSKTQ
+ASDNTPASPAKAPKTSVPAPASAPAADLFSSIVAQGEAVRLLKAAKAPKDEVDKAVKQLL
+SLKEQFKQQTGVEYKPGMAPPASTPAPPTSSSDSTSCPYTRVVQQGELVRKLKAEQAPKD
+QVDAAVKQLLALKEEYKRITGQEYKPGATPPQKAPAPVQNGSTNDLYEKVAEQGELVRKL
+KAEKAPKDQVDAAVKQLLALKAEYKQNTGKDYKPGLQAPATSAQTQTQASSASTQSNSSP
+QAQELFSQVSQQGDLVRKLKSEKAPKDQVDEAVKTLLDLKSKYKTLTGQDYKPVAAAGGT
+GGEDKNRKEKENKSEKQGGGGGGKKGKGDKGGQSKESSGGAGGAGEGQGPKKQTRLGLEA
+KKEENLADWYSQVITKAEMIEYYDVSGCYVLRPWAFSIWESIKDFFDKEIKKLGVENCYF
+PMFVSQAALEKEKSHIADFAPEVAWVTRSGKTELAEPIAVRPTSETVMYPAYAKWVQSHR
+DLPIKLNQWCNVVGWEFKHPQPFLRTREFLWQEGHTAFATKEEAAEEVLQILDLYARVYE
+ELMAIPVVKGRKTEKEKFAGGDYTTTVEAFISASGRAIQGATSHHLGQNFSKMFEIVFED
+PKRPGEKQLAFQNSWGITTRTIGVLTMVHGDDMGLVLPPRVACLQVVIIPCGITATLPEQ
+EKEVLLAQCTKYLKRLQEAGIRVKSDLRDNYSPGWKFNHWELKGVPIRLEVGPKDMQQKQ
+CVAVRRDSGAKVTIAEAEVEKNLLNMLEDIQNSLFKKASDDLKSHMVAADTMEQFQKELD
+QGKIVQIPFCGGIECEDWIKKTTAKDQDLEPGAPSMGAKSLCIPFTPLKTLQPGQKCVSG
+KEPAQYYTLFGRSY
+>XP_006779784.1 gi|583968660|ref|XP_006779784.1| PREDICTED: kinesin-like protein KIF13B-like isoform X1 [Neolamprologus brichardi]
+MGEPSLDDSNVKVAVRVRPMNRREKELNTKCVVEMVKNQTILHPAGGNLGKGDSRSQSKV
+FAYDYCFWSMDETDKEKFAGQEVVFQCLGESLLHNAFQGYNACIFAYGQTGSGKSYTMMG
+SVDQPGLIPRLCSALFERTQKEQREEESFTVEVSYMEIYNEKVRDLLDPKGGRQTLRVRE
+HKVLGPYVDGLSRLAVASYKDIESLMSEGNKSRTVAATNMNEESSRSHAVFNIILTHTLK
+DLKSGTSGEKVSRLSLVDLAGSERAAKTGAAGERLKEGSNINKSLTTLGLVISALAEQGT
+AKNKTKFVPYRDSVLTWLLKDCLGGNSRTAMVATVSPAADNYEETLSTLRYADRAKSIVN
+HAVVNEDPNARIIRELREEVEKLRVQLTQAESLKAPELKDRLEESEKLIQEMTVTWEEKL
+RKTEEIAQERQKQLESLGISLQSSGIKVGDDKSFLVNLNADPALNELLVYYLKEHTKVGS
+ADSQDIQLCGMGIQAEHCVIDITAEAAVILAPYRNARTCVNGSPVTSALQLHHGDRILWG
+NNHFFRINLPKRRSRAADDEEGEGGVMKNSGSSEQLDADGDTASEVSSEVSFSYEFAQTE
+VMMKALGSNDPMQAVLQSLERQHEEEKRSALERQRQMYEQELQQLRKKLNPERLSTGQSG
+GPTIGQQGPGQQSHYRSMERLSIGGMSHSSSAQSRLRQWSEDREAVLVRSLRRLREQIVR
+ANLLVQEACFIADELERHTEYRVTLQIPSDNLNANRKRDAVLSEPAIQVRRRGRGKQIWS
+LEKMENRLVDMRELYQEWQDYHLNNPDDQVMRSYFRRADPFFDEQENHSLIGVANVFLSC
+LFYDVKLQYAVPIINQKGEVAGRLHVEVVRVGGGLEDNMAGGDEPDNNQDIEVQDRKLVC
+MIKILQATGLPQYLSNFVFCQYSFWDQPEPIIVAPEVDTSSSSPSNKDPHCMVVFDSCKE
+LAVSVTEEFIEHLTEGAVAIEVYGHRQADAGRNPALWDLSIIQAKTRTLRDRWSEVTRKL
+ELWIQILEINENGDFVPVEVVPARDVRTGGIFQLRQGQSRRIQVDVRSVQDSGTMPLIAE
+IVLAVSVGCVEIRNTTANQEADEMDSYQERDLERLRRQWLGALTKRQEYLDQHLQSLVSK
+AEKTEDDMEREAQLLEWRLTLTEERNAVMVPSAGSGIPGAPAEWVPLPGMETHIPVLFLN
+LKPDDLSSQDQFEVPEAGGWDAILNGEDEDDFFDLQIVRHYDGEVKAEASWDSTVHECPQ
+LSRGGSYPEQRVYLTIRVVVQLSHPADMQLVLRKRICVNVNPGRQGFAHNFLRRMSTRST
+VPGCGVTFEVVSNIPGDAPGSEDREMLARLAASAHNSQSGDDEAAIEKYLRSVLSLENIL
+TLDRLRQEVAVKEQLTSRGKSNRRSISSPSVNRLSGSRQDLSTTCLLDDKGRWESQQDIY
+MPSQFPRTLPRPASSPSTYSTSPSSSPTPFGTPPPQNQEPEQGRSGLAASYLSVKALVPQ
+MPKLLKSLFPVRDEKKELRPSPQNQQQHVPRIVTSSGGDDNKGKTETTAILRPPAKDRRA
+ELPEVSPLPVHDPHDTTPLSPLSQSSSGYFSASVSTATLCDVLQPSSSSSSLLAAETTLP
+TNPQQQGADRNDIVTSPSQFGAKVSAVASPASHNSANHNSITSDVSSEQKLINSGGSEGF
+ERLEIFVEDDERGGEDVLPDWLTEGAYVTVGNNKAGTVRYIGVTQFAEGVWVGVELDTPV
+GKNDGSVGGQRYFHCKPGYGVLVRPNRLSSRERTNRQTGEFTPSAHVPILRGEAIVARRG
+ENRKSWSS
+>XP_006779785.1 gi|583968662|ref|XP_006779785.1| PREDICTED: kinesin-like protein KIF13B-like isoform X2 [Neolamprologus brichardi]
+MGEPSLDDSNVKVAVRVRPMNRREKELNTKCVVEMVKNQTILHPAGGNLGKGDSRSQSKV
+FAYDYCFWSMDETDKEKFAGQEVVFQCLGESLLHNAFQGYNACIFAYGQTGSGKSYTMMG
+SVDQPGLIPRLCSALFERTQKEQREEESFTVEVSYMEIYNEKVRDLLDPKGGRQTLRVRE
+HKVLGPYVDGLSRLAVASYKDIESLMSEGNKSRTVAATNMNEESSRSHAVFNIILTHTLK
+DLKSGTSGEKVSRLSLVDLAGSERAAKTGAAGERLKEGSNINKSLTTLGLVISALAEQGT
+AKNKTKFVPYRDSVLTWLLKDCLGGNSRTAMVATVSPAADNYEETLSTLRYADRAKSIVN
+HAVVNEDPNARIIRELREEVEKLRVQLTQAESLKAPELKDRLEESEKLIQEMTVTWEEKL
+RKTEEIAQERQKQLESLGISLQSSGIKVGDDKSFLVNLNADPALNELLVYYLKEHTKVGS
+ADSQDIQLCGMGIQAEHCVIDITAEAAVILAPYRNARTCVNGSPVTSALQLHHGDRILWG
+NNHFFRINLPKRRSRAADDEEGEGGVMKNSGSSEQLDADGDTASEVSSEVSFSYEFAQTE
+VMMKALGSNDPMQAVLQSLERQHEEEKRSALERQRQMYEQELQQLRKKLNPERLSTGQSG
+GPTIGQQGPGQQSHYRSMERLSIGGMSHSSSAQSRLRQWSEDREAVLVRSLRRLREQIVR
+ANLLVQEACFIADELERHTEYRVTLQIPSDNLNANRKRDAVLSEPAIQVRRRGRGKQIWS
+LEKMENRLVDMRELYQEWQDYHLNNPDDQVMRSYFRRADPFFDEQENHSLIGVANVFLSC
+LFYDVKLQYAVPIINQKGEVAGRLHVEVVRVGGGLEDNMAGGDEPDNNQDIEVQDRKLVC
+MIKILQATGLPQYLSNFVFCQYSFWDQPEPIIVAPEVDTSSSSPSNKDPHCMVVFDSCKE
+LAVSVTEEFIEHLTEGAVAIEVYGHRQADAGRNPALWDLSIIQAKTRTLRDRWSEVTRKL
+ELWIQILEINENGDFVPVEVVPARDVRTGGIFQLRQGQSRRIQVDVRSVQDSGTMPLIAE
+IVLAVSVGCVEIRNTTANQEADEMDSYQERDLERLRRQWLGALTKRQEYLDQHLQSLVSK
+AEKTEDDMEREAQLLEWRLTLTEERNAVMVPSAGSGIPGAPAEWVPLPGMETHIPVLFLN
+LKPDDLSSQDQFEVPEAGGWDAILNGEDEDDFFDLQIVRHYDGEVKAEASWDSTVHECPQ
+LSRGGSYPEQRVYLTIRVVVQLSHPADMQLVLRKRICVNVNPGRQGFAHNFLRRMSTRST
+VPGCGVTFEVVSNIPGDAPGSEDREMLARLAASAHNSQSGDDEAAIEKYLRSVLSLENIL
+TLDRLRQEVAVKEQLTSRGKSNRRSISSPSVNRLSGSRQDLSTTCLLDDKGRWESQQDIY
+MPSQFPRTLPRPASSPSTYSTSPSSSPTPFGTPPPQNQEPEQGRSGLAASYLSVKALVPQ
+MPKLLKSLFPVRDEKKELRPSPQNQQHVPRIVTSSGGDDNKGKTETTAILRPPAKDRRAE
+LPEVSPLPVHDPHDTTPLSPLSQSSSGYFSASVSTATLCDVLQPSSSSSSLLAAETTLPT
+NPQQQGADRNDIVTSPSQFGAKVSAVASPASHNSANHNSITSDVSSEQKLINSGGSEGFE
+RLEIFVEDDERGGEDVLPDWLTEGAYVTVGNNKAGTVRYIGVTQFAEGVWVGVELDTPVG
+KNDGSVGGQRYFHCKPGYGVLVRPNRLSSRERTNRQTGEFTPSAHVPILRGEAIVARRGE
+NRKSWSS
+>XP_006779786.1 gi|583968664|ref|XP_006779786.1| PREDICTED: kinesin-like protein KIF13B-like isoform X3 [Neolamprologus brichardi]
+MGEPSLDDSNVKVAVRVRPMNRREKELNTKCVVEMVKNQTILHPAGGNLGKGDSRSQSKV
+FAYDYCFWSMDETDKEKFAGQEVVFQCLGESLLHNAFQGYNACIFAYGQTGSGKSYTMMG
+SVDQPGLIPRLCSALFERTQKEQREEESFTVEVSYMEIYNEKVRDLLDPKGGRQTLRVRE
+HKVLGPYVDGLSRLAVASYKDIESLMSEGNKSRTVAATNMNEESSRSHAVFNIILTHTLK
+DLKSGTSGEKVSRLSLVDLAGSERAAKTGAAGERLKEGSNINKSLTTLGLVISALAEQGT
+AKNKTKFVPYRDSVLTWLLKDCLGGNSRTAMVATVSPAADNYEETLSTLRYADRAKSIVN
+HAVVNEDPNARIIRELREEVEKLRVQLTQAESLKAPELKDRLEESEKLIQEMTVTWEEKL
+RKTEEIAQERQKQLESLGISLQSSGIKVGDDKSFLVNLNADPALNELLVYYLKEHTKVGS
+ADSQDIQLCGMGIQAEHCVIDITAEAAVILAPYRNARTCVNGSPVTSALQLHHGDRILWG
+NNHFFRINLPKRRSRAADDEEGEGGVMKNSGSSEQLDADGDTASEVSSEVSFSYEFAQTE
+VMMKALGSNDPMQAVLQSLERQHEEEKRSALERQRQMYEQELQQLRKKLNPERLSTGQSG
+GPTIGQQGPGQQSHYRSMERLSIGGMSHSSSAQSRLRQWSEDREAVLVRSLRRLREQIVR
+ANLLVQEACFIADELERHTEYRVTLQIPSDNLNANRKRDAVLSEPAIQVRRRGRGKQIWS
+LEKMENRLVDMRELYQEWQDYHLNNPDDQVMRSYFRRADPFFDEQENHSLIGVANVFLSC
+LFYDVKLQYAVPIINQKGEVAGRLHVEVVRVGGGLEDNMAGGDEPDNNQDIEVQDRKLVC
+MIKILQATGLPQYLSNFVFCQYSFWDQPEPIIVAPEVDTSSSSPSNKDPHCMVVFDSCKE
+LAVSVTEEFIEHLTEGAVAIEVYGHRQADAGRNPALWDLSIIQAKTRTLRDRWSEVTRKL
+ELWIQILEINENGDFVPVEVVPARDVRTGGIFQLRQGQSRRIQVDVRSVQDSGTMPLIAE
+IVLAVSVGCVEIRNTTANQEADEMDSYQERDLERLRRQWLGALTKRQEYLDQHLQSLVSK
+AEKTEDDMEREAQLLEWRLTLTEERNAVMVPSAGSGIPGAPAEWVPLPGMETHIPVLFLN
+LKPDDLSSQDQFEVPEAGGWDAILNGEDEDDFFDLQIVRHYDGEVKAEASWDSTVHECPQ
+LSRGGSYPEQRVYLTIRVVVQLSHPADMQLVLRKRICVNVNPGRQGFAHNFLRRMSTRST
+VPGCGVTFEVVSNIPGDAPGSEDREMLARLAASAHNSQSGDDEAAIEKYLRSVLSLENIL
+TLDRLRQEVAVKEQLTSRGKSNRRSISSPSVNRLSGSRQDLSTTCLLDDKGRWESQQDIY
+MPSQFPRTLPRPASSPSTYSTSPSSSPTPFGTPPPQNQEPEQVKALVPQMPKLLKSLFPV
+RDEKKELRPSPQNQQQHVPRIVTSSGGDDNKGKTETTAILRPPAKDRRAELPEVSPLPVH
+DPHDTTPLSPLSQSSSGYFSASVSTATLCDVLQPSSSSSSLLAAETTLPTNPQQQGADRN
+DIVTSPSQFGAKVSAVASPASHNSANHNSITSDVSSEQKLINSGGSEGFERLEIFVEDDE
+RGGEDVLPDWLTEGAYVTVGNNKAGTVRYIGVTQFAEGVWVGVELDTPVGKNDGSVGGQR
+YFHCKPGYGVLVRPNRLSSRERTNRQTGEFTPSAHVPILRGEAIVARRGENRKSWSS
+>XP_006779787.1 gi|583968666|ref|XP_006779787.1| PREDICTED: prepronociceptin-like [Neolamprologus brichardi]
+MKTVVALLLLCLCDPGQSDCQADCLSCNNILPKQLSFNTMVCFIECESSVSPSSSWDLCH
+EALLSQILSPSGSVWKRSQEEVEALFPGEDEQMKGSLFLPIALQRVDHVTHGLDTEERDL
+GGKGNHLNAAYNSQNAMSLEDEYAEEEEGQEGGDPDVAAGQGDVALISKRFGGFVKGRHG
+HRRLMSPGRSYQKRYGGFVGIRKSARKWNNQKRFSEFLKQYLGMSTRATEFNSVSEDLAQ
+QNEV
+>XP_006779792.1 gi|583968676|ref|XP_006779792.1| PREDICTED: NT-3 growth factor receptor-like isoform X1 [Neolamprologus brichardi]
+MDLWFHSIRICWWRVLFLMSIFQDYLSSMLDCPPTCSCSQTEIFCNKSDNGRFFPLLALQ
+DTGSNGTSVDIAELFKNITSIHIENWTGLQTLRDVDMELYTGLQKLTIMNCNLKSIQPRA
+FAQNPHLSTINLSKNPLTTLSWQLFQHLQLQELRLDGVVFDCGCDIRWIQLWHQRGEAKL
+NTQQLYCRNGATKIRLENMYIHNCDLPEISVSHSSVLVMEGDNVTVSCNGSGSPLPEVDW
+TVSGLHSINTHLSNVYWPNIHSINLTLFNISRDDNNFQLTCIAENVVGMTNSSIQLNVQF
+PPVILRLAEPEQRLDTCIEFTVRGYPQPQLRWFHKQKEIIKNDYIRTEMDFYQDYLEGCL
+TFQNPTHINNGNYTLEASNALGTVTKTVYGHFLENPDEPDPVEEVTPPHPRPPDEDTFGV
+SIAVGLAGFACVLLLVLFVLINKYGRRSKFGMKGPVAVISGEEDSASPLHHVNHGIITPC
+TLDASPDAVVIGMTRIPVVENPQYFRHGHNCNKPATLVQHIKRRDIILKRELGEGAFGKV
+FLAECYNLSPTKDKMLVAVKTLKDPNLSARKDFQREAELLTNLQHDHIVKFYGVCVDGDP
+LIMVFEYMKHGDLNKFLRAHGPDAMILVDGQPLQSNGELGLSQMLHIATQIASGMVYLAS
+QHFVHRDLATRNCLVGNGLLVKIGDFGMSRDIYSSDYYRVGGHTMLPIRWMPPESIMYRK
+FSTESDVWSFGVILWEIFTYGKQPWFQLGNNEVIECITQGRVLERPRICPKEVYDIMLGC
+WQREPQQRLNIKDIQKVLFAMGKATPVYLDILG
+>XP_006779793.1 gi|583968679|ref|XP_006779793.1| PREDICTED: NT-3 growth factor receptor-like isoform X2 [Neolamprologus brichardi]
+MDLWFHSIRICWWRVLFLMSIFQDYLSSMLDCPPTCSCSQTEIFCNKSDNGRFFPLLALQ
+DTGSNGTSVDIAELFKNITSIHIENWTGLQTLRDVDMELYTGLQKLTIMNCNLKSIQPRA
+FAQNPHLSTINLSKNPLTTLSWQLFQHLQLQELRLDGVVFDCGCDIRWIQLWHQRGEAKL
+NTQQLYCRNGATKIRLENMYIHNCDLPEISVSHSSVLVMEGDNVTVSCNGSGSPLPEVDW
+TVSGLHSINTHLSNVYWPNIHSINLTLFNISRDDNNFQLTCIAENVVGMTNSSIQLNVQF
+PPVILRLAEPEQRLDTCIEFTVRGYPQPQLRWFHKQKEIIKNDYIRTEMDFYQDYLEGCL
+TFQNPTHINNGNYTLEASNALGTVTKTVYGHFLENPDEPVTPPHPRPPDEDTFGVSIAVG
+LAGFACVLLLVLFVLINKYGRRSKFGMKGPVAVISGEEDSASPLHHVNHGIITPCTLDAS
+PDAVVIGMTRIPVVENPQYFRHGHNCNKPATLVQHIKRRDIILKRELGEGAFGKVFLAEC
+YNLSPTKDKMLVAVKTLKDPNLSARKDFQREAELLTNLQHDHIVKFYGVCVDGDPLIMVF
+EYMKHGDLNKFLRAHGPDAMILVDGQPLQSNGELGLSQMLHIATQIASGMVYLASQHFVH
+RDLATRNCLVGNGLLVKIGDFGMSRDIYSSDYYRVGGHTMLPIRWMPPESIMYRKFSTES
+DVWSFGVILWEIFTYGKQPWFQLGNNEVIECITQGRVLERPRICPKEVYDIMLGCWQREP
+QQRLNIKDIQKVLFAMGKATPVYLDILG
+>XP_006779794.1 gi|583968681|ref|XP_006779794.1| PREDICTED: synaptic vesicle glycoprotein 2B-like [Neolamprologus brichardi]
+MDDPYRNNVNQQMTEGGDYTYTQDGGGQDGYPYQTDYPPQDEDAASDATEGADEDDQMYE
+GEYQGIPHPDEIKEARRAARVEARRKARMAAQQEEEEENLPEQYETIMEDCGHGRFQWML
+FFVLGLALMADGVDGFVVGFVLPSAEKDMCISNADKGLLGLLVYVAMMVGALVWGGLCDK
+MGRRKCLIYVLTIDLVFSFLSCFAQGYGFFLFLRFCSGFGIGGSIPIVYTYFTEFLQMDK
+RGEHLSWLCMFWMFGGLYASFTAWGIIPHYGWGFAIGTHIQMHSWRLFILVCLFPALAAL
+IGLVFMPESPRFLLENARHDEAWMILRQVHDTNWKAKGEPERVFTVTNIKTPQTQDDEFI
+EIQSETGTAFQRWTVRKMTMLQQVMANIMSLSAPELRLQGLLLVIVWFCLAFSYHGLGVW
+FPDMIKYMQYEEYESKVRIFHRERVERFHFNFSLVNQIHREGEYIHDKFANIEIKSVKFE
+SSLFENCYFEDVKSTNTFFENCTIKNTVFYNTDLWQDKFKNCRMENATFLHPKKGCHLNF
+QEENDIVIYMVSFLGSLAVLPGNIISALFMDKIGRIRIIGGSMLASSACTFLLLLSFSQG
+AVICWQCLFYGVSVAAWNGLEVISVELYPSSKRGTAFGILNGICKFAAIIASSIFAAFIG
+ITKIIPIFLAFAALVCGGMVALKLPETREKILS
+>XP_006779795.1 gi|583968683|ref|XP_006779795.1| PREDICTED: AP-3 complex subunit sigma-2-like [Neolamprologus brichardi]
+MIKAILIFNNHGKPRLIRFYQYFAEDMQQQIIRETFHLVSKRDDNVCNFLEGGSLIGGSD
+YKLIYRHYATLYFVFCVDSSESELGILDLIQVFVETLDKCFENVCELDLIFHMDKVHYIL
+QEVVMGGMVLETNMNEIVAQVEVQNRMEKSEGGLSAAPARAVSAVKNMNLPEIPRNINIG
+DINIKVPSLSPF
+>XP_006779796.1 gi|583968685|ref|XP_006779796.1| PREDICTED: synaptosomal-associated protein 25-B-like isoform X1 [Neolamprologus brichardi]
+MADESDMRNELADLQTRADQIADESLESTRRMLALVEESKDAGIRTLVMLDEQGEQLERI
+EEGMDQINKDMKDAEKNLNNLGQFCGLCSCPCNKIKGGGQAWGGNQDGVVNSQPGARVVD
+EREQMAISGGFIRRVTNDARENEMDENLEQVGGIIGNLRHMALDMGQEIDTQNRQIDRIM
+DKADSNKTRIDEANQRATKMLGSG
+>XP_006779797.1 gi|583968687|ref|XP_006779797.1| PREDICTED: synaptosomal-associated protein 25-B-like isoform X2 [Neolamprologus brichardi]
+MADESDMRNELADLQTRADQIADESLESTRRMLALVEESKDAGIRTLVMLDEQGEQLDRV
+EEGMNKVNADLKEAEKDLKDIGQCCGLICPCIKKIKGGGQAWGGNQDGVVNSQPGARVVD
+EREQMAISGGFIRRVTNDARENEMDENLEQVGGIIGNLRHMALDMGQEIDTQNRQIDRIM
+DKADSNKTRIDEANQRATKMLGSG
+>XP_006779798.1 gi|583968689|ref|XP_006779798.1| PREDICTED: protein FAM219B-like [Neolamprologus brichardi]
+MMNDILEEPEKDSLLEAQQDSQGLSGPSSGTRPKSIDGGIRPVEKRGPYIMSRAPAIHLK
+LQKHREMARKALKKKALSPGPPVTHQPRQGAKRMVKYNKGYAALSQHAEDTLVAIDSDSD
+EEIDFEQYSSGYSSAEIHPDLSKQLLQDGYRLDEIPDDEDLDLIPPKAMGSSVCCCSEGP
+SCPIQ
+>XP_006779799.1 gi|583968691|ref|XP_006779799.1| PREDICTED: semaphorin-7A-like [Neolamprologus brichardi]
+MFLEIWKMRFSLVACLFFLHICCLAVGNDRSPRMIFTEKEAAMNRLDLLHGPPVRILLEE
+KPDTVLAVGKTYLNTYNIKNQNKNQTRMQLENCNRNCSYDITLAHLMEDAKKLFVCGTIH
+DETVCCNSNLTEQPPICKDIKDISSFNIKEGDLSALAESKQSTDLYITRSGSDESVGIHK
+FGKARVGPKNHHKEQHYVGLVLSKREEDPSQNRVYGFYREKTKDDGLFSEMWLPFVTQVC
+MTDVGGPKNNLQYTWTSQMNARLFCGDQERKQHFSELVDVSTVDADRWQYTKIYALFRNE
+WGMSAVCVYTIEDISKIFENSPFNGYTKKQMDRPRMCAPDSSKLSVDTLKNIDKTSEMEQ
+LVHPVGNPGLLFFNHRNYTHIQVDSKPNSRGGLEWLQFLTVNNGGIHKVLQNESHTFVIA
+EYQPFKQKAHVLSIILQSTFKKLYVNNGSQLVQLDVADCSQYGDTCQDCMLSRDPYCGWN
+GTQCIRETEGSWHDAATGNLSICNEHNASNYKGDPVPVPRYSKYFLQCPVSSRHAQYSWQ
+HDENSTACSSGKEQCLYLIDNMDSECKGTYKCISQEMGYSKVLVQYELQVENDAKTQPYK
+RLWPNKAEGRKTSPVIWVCLMMALIKSLSF
+>XP_006779800.1 gi|583968694|ref|XP_006779800.1| PREDICTED: cytochrome P450 1A1-like [Neolamprologus brichardi]
+MALMILPFIGALSVSHVLVAVTTACLVYMIIKNAQNKIPEGLQQLPGPKPFPIIGNVLEL
+GSRPYLSLTSMSKRYGDVFQIQIGMRPVVVLSGNETVRQALIKQGDEFAGRPDLYSFRYI
+NDGKSLSFSTDQAGIWRARRKLAYSALRSFSNLDSTTPEYSCALEEHISKETEYLIKELN
+TVMKTKGSFDPFRYVVVSVANVICGMCFGRRYDHHDDELVSLVNLSDDFVKVVGSGNPAD
+FIPLLQYLPSTKMKKFMSLNARFSKFVQKLVTEHYATFDKDNIRDITDSLIDHCEDRKLD
+ENANIQMSDEKIVGIVNDLFGAGFDTISTALSWSLMYFVAYPEIQNRLFEEIKEKVGLDR
+MPVFSDRNNLPLLEAYILELFRHSSYLPFTIPHCTTKDTSLNGYFIPKDTCVFINQWQIN
+HDPEMWEDPFSFKPERFLNADGTEVNKVEGEKVMTFGLGKRRCIGEVIARNEVFLFLAIL
+IQKLNFQALPGDQLDLTPEYGLTMKHKRYHLRATMRVRNEQ
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/part4.fasta	Mon Sep 21 15:40:14 2020 +0000
@@ -0,0 +1,245 @@
+>XP_006779801.1 gi|583968696|ref|XP_006779801.1| PREDICTED: enhancer of mRNA-decapping protein 3-like [Neolamprologus brichardi]
+MATDWVGSVVSIDCGATLGVYQGEVSSVDRVSQTISLKHPYHNGVKCPVPEVTFSAMDIK
+DLKFLDIQNKVNKTSAGKDTATEPSYISTGRHGQTNKTNHSLAISNSSGLSSNPRKGSSN
+SRGTTQSTPRRSNVRNGGAGGQRSKNDECFGDGTDENLDTDFDFEGNLALFDKAAVFSQI
+DGASSNSNKLQHHNTQAEQKTQSYRHDENILEVKPVTYRQITVPQHGGKEYCTDTGLVVP
+TVPYELHKQLLAAAERWGLSLERRLEAVGVCSSQMALTLLGGPNRLTPKNVHQRPTVVLL
+CGPHVQGAQGISCGRHLANHEVEVILFLPNFVKMQESVTSEVNLFSKTSGKQVSSVKDLP
+MSPVDLVINCLDCHENPLLKEQSWYQSVADWANKNRAPVLSIDPPVSEQPQSVDAKWTLS
+LGLPLPLADKDSRVYLCDIGLPKMVYQEVGINYHSPFGCKFVIPLHSV
+>XP_006779802.1 gi|583968698|ref|XP_006779802.1| PREDICTED: tyrosine-protein kinase CSK-like isoform X1 [Neolamprologus brichardi]
+MSGIHVPWSTGTECVAKYNFQTANEQDLPFCKGDVLTIIGVTRDPNWYRARNQVGREGTI
+PANYVQKREGVKSGGKLSLMPWFHGKITREQAERLLYPPETGLFLVRESTNYPGDYTLCV
+SCDGKVEHYRIIYHNGKLTIDEEEYFENLMQLVEHYTKDADGLCTRLIKPKLMEGTVAAQ
+DEFSRSGWALNRKELKLLQTIGKGEFGDVMVGDYRGTKVAVKCIKNDATAQAFIAEASVM
+TQLRHNNLVQLLGVIVEERGSLYIVTEYMAKGSLVDYLRSRGRTVLGGDCLLKFSLDVCE
+AMEYLEANNFVHRDLAARNVLVSDDNIAKVSDFGLTKEASSIQDTAKLPVKWTSPEALRE
+KRFSTKSDVWSYGILLWEIYSFGRVPYPRIPLKEVVPRVEKGYKMDAPDGCPAVVYDLMK
+QCWTLDPVMRPSFRMLREKLQHIRAKELYL
+>XP_006779803.1 gi|583968700|ref|XP_006779803.1| PREDICTED: tyrosine-protein kinase CSK-like isoform X2 [Neolamprologus brichardi]
+MSGIHVPWSTGTECVAKYNFQTANEQDLPFCKGDVLTIIGVTRDPNWYRARNQVGREGTI
+PANYVQKREGVKSGGKLSLMPWFHGKITREQAERLLYPPETGLFLVRESTNYPGDYTLCV
+SCDGKVEHYRIIYHNGKLTIDEEEYFENLMQLVEHYTKDADGLCTRLIKPKLMEGTVAAQ
+DEFSRSGWALNRKELKLLQTIGKGEFGDVMVGDYRGTKVAVKCIKNDATAQAFIAEASVM
+TQLRHNNLVQLLGVIVEERGSLYIVTEYMAKGSLVDYLRSRGRTVLGGDCLLKFSLDVCE
+AMEYLEANNFVHRDLAARNVLVSDDNIAKVSDFGLTKEASSIQDTAKLPVKWTSPEALRE
+KRFSTKSDVWSYGILLWEIYSFGRVPYPRIPLKEVVPRVEKGYKMDAPDGCPAVVYDLMK
+QCWTLDPVMRPSFRMLREKLQHIRAKELYL
+>XP_006779804.1 gi|583968702|ref|XP_006779804.1| PREDICTED: complexin-3-like [Neolamprologus brichardi]
+MAFMVKHVVGGQLKNLTGGLTEEKSEGEKSDAAAQGMTQEEFEQYQQQLEEEKKEREAHY
+AQKKAERATVRTHFREKYRLPKNEMDETQIQQAGDDVVLPTELAKMIAEDNEEETHKQSV
+LGQLSNIQNVDIDQLKDKAQATLEDLKKQTENCSLM
+>XP_006779805.1 gi|583968704|ref|XP_006779805.1| PREDICTED: growth arrest-specific protein 1-like [Neolamprologus brichardi]
+MKCWCSALALLPWVLVALDAQLICWQALLRCHDEPECELAYNQYMTACEGNIKGTRKQCP
+SHCISALIRLNHTRSGPDLETCDCAQDLDCLDAKRAIEPCLPRRHPKDAGGIGCMEARQR
+CEEDSNCHTSLTAYLSYCGQLFNGRKCSSKCKATIQQMLFIPNGMLLNRCICDGVERPFC
+EVVKENMSKLCSIGDHSVVSDPTKDYEDPYEDDYSKNDKEVDFSENSSASQSLSRGVLPL
+CLLTARILY
+>XP_006779806.1 gi|583968706|ref|XP_006779806.1| PREDICTED: serine/threonine-protein kinase ULK3-like [Neolamprologus brichardi]
+MASTSSFAPPKLSDFILTERLGSGTYATVYKAYRKGNSREVVAVKVVGKKTLNKASTENL
+LTEIEILKTVRHPHIVQLKDFQWDAENIYLILEWCSGGDLSRFIRSRRILPESVTRRFLQ
+QIACALQFLHERNISHLDLKPQNILLSGSILKLADFGFAQYMSPWDEQSVLRGSPLYMAP
+EMVCRRQYDSRVDLWSVGVILYEALFGRAPFASKSYAELEEKIRSNQPIELPPGARVSKD
+CRDLLLRLLERNPDARITFAEFFTHPFVDMEHMPSAESIVKAKKLVLQAIQKDQEGERSE
+ALSLYCSALEHFVPAIYYETNCQRKEALRQKVRQYVSRAEELKALVASDNRLSFEQARTS
+RDILREMSKDQPRLLAALEMASTAIAKEESGSDDLEALDMYQQCLGELLLGLAAEPQGRR
+RELLHSEIKSLMSRAEYLKKHIKMQETQRDVSLDRESLAESVRSSCCLQ
+>XP_006779807.1 gi|583968708|ref|XP_006779807.1| PREDICTED: TM2 domain-containing protein 3-like [Neolamprologus brichardi]
+MATVCQIWRPDRGRCLKSYGIIAVLFMDLMLQCVNGSLSTTNVETHYTRDGPFITSPVVP
+DASSVFPADEDTSKCPSGGLCHRLPAHCIQCDYHLKCTYGKPTLFTCRPKKGVHCIGESG
+HQQTNFSLNITCQFCWQLDPSQYRCTNSTNCMTVSCPRKRYNATCDVLDHVHCLGKRRFP
+KRLFCNWTGGYKWSTALALSITLGGFGADRFYLGQWREGLGKLFSFGGLGIWTLIDVLLI
+GVGYVGPVDGSLYI
+>XP_006779808.1 gi|583968710|ref|XP_006779808.1| PREDICTED: la-related protein 6-like [Neolamprologus brichardi]
+MYALVNAFMRCLSFLLPPSWLYVSFCLWVGNECEETLQRPNPRARFKSREPLTYEEVKAA
+AKAAAEAEAQGGSRPSVSPGPDCVSLAATSPAAPKGPSSGLIWIGGLWRAVERVFGAPWV
+LLRHHLCPKRRRAALGAPYPVCAFELGKIKSFQRGAAAAAAAAKIVDVKGPGETTFTYSK
+NMSGSVGVPSVNSTECASDASAEQGIDEVITVDQLSQEMGTVTITVAIQAAEDEEPEEVT
+SNNADFLGGSCSEDEIGRHDKSSGAGTSGGELEEESWQPPDPELIQKLVTQIEYYLSDEN
+LEHDAFLLKHVRRNKLGFVSVKLLTSFKKVKHLTRDWRTTAYALRHSKILELNDEGRKVR
+RKSAVPVFASESLPSRMLLLSDLQRWPELAALTKDNGSAEGGATQQEQLMKLLLKAFGTY
+GAIASVRVLKPGKDLPADLKRLSGRYAQLGTEECAIVEFEEVEAAVKANEAAGSENGGPN
+LLGLKVVLIGTKPPKKKVPKERPREEGGMRKSRSLNSRVRELQYHGDDSACSSSETESTP
+TSPRLARKSQSCNKLSPTTAGISFQNNHLSPSMSPRNSPWSSPRASPCSQRKSPHSHKSP
+LAVEGRLSPEAGRRWADYSSDSSLTPSGSPWVQRRKQVASQESSPVGSPMLGRKIQNADG
+LPPGVMRLPRGPDGTRGFHCVAIERGKTAATQT
+>XP_006779809.1 gi|583968712|ref|XP_006779809.1| PREDICTED: leucine-rich repeat-containing protein 49-like isoform X1 [Neolamprologus brichardi]
+MEEDLAEGKITRSHKQNTSEKWMFLTPMINSCKLHLTTVKSLVPARAQAMSDSQDHVKET
+FNYSDLENSLHAGIQKRVVQELFESDKCTYNQKAGAAVSNAAYKARHKARRQTQCTGETF
+GQNALKNAKPAGDFPGCNYSALPGFLSTQLPFTSSFQQIDLERQSLEECPQLDFVKELQF
+LNLQHNLITKIQHLSHLQQLVSLNLHDNHISDMAGIEVLRSLKILILGKNRIHEICCLDS
+LSKLNMLDLHDNQICRIENVSHLSELRVLNLAGNNILKMENLQGLDSLTELNLGQNCISV
+VTEVDRLPLLQRLFLSCNNITSFDQLACLGESCSLSELTLDGNPVALETWYKQAVLRCVL
+HLRQLDMKRITDEDRRMAGVQARKEEEKKKESHKQTIHKEKRRLAIRNAAQQWEGVRACL
+ELPSTNGAKEEVSPENSPAHSPAQTNGLTQEPSPDEPRRVSPGSGPERPSGGTEIRLQTN
+SRPNSPRDPKLVEAGSGSVQSLSLSDSHLAELDGDTLRLFGLGALEALERGWGVQTAGAV
+TVITFRYINFDAIVPTLPRIRVKFPNLSHMIFLETNISRLPQLAALAQVRRLDQLTIHPD
+GNPVVSLTLWRSFVIYRLHHFNLQRINGQEVTMNDVIAAERVFGTLGHIAATETPRCRLL
+LLLEESRKRQLQFLLEGRGRRAGLSPEELRDNGKLLGEGLSRALFNYPSRDCSAESPEEG
+SVESSERATMVEQYLQELVQSASDTNLKGEALHKLWPSMFAEMVRDCVLEMRDRAAFRQA
+SLAKLSETK
+>XP_006779810.1 gi|583968715|ref|XP_006779810.1| PREDICTED: leucine-rich repeat-containing protein 49-like isoform X2 [Neolamprologus brichardi]
+MEEDLAEGKITRSHKQNTSEKWMFLTPMINSCKLHLTTVKSLVPARAQAMSDSQDHVKET
+FNYSDLENSLHAGIQKRVVQELFESDKCTYNQKAGAAVSNAAYKARHKARRQTQCTGETF
+GQNALKNAKPAGDFPGCNYSALPGFLSTQLPFTSSFQQIDLERQSLEECPQLDFVKELQF
+LNLQHNLITKIQHLSHLQQLVSLNLHDNHISDMAGIEVLRSLKILILGKNRIHEICCLDS
+LSKLNMLDLHDNQICRIENVSHLSELRVLNLAGNNILKMENLQGLDSLTELNLGQNCISV
+VTEVDRLPLLQRLFLSCNNITSFDQLACLGESCSLSELTLDGNPVALETWYKQAVLRCVL
+HLRQLDMKRITDEDRRMAGVQARKEEEKKKESHKQTIHKEKRRLAIRNAAQQWEGVRACL
+ELPSTNGAKEEVSPENSPAHSPAQTNGLTQEPSPDEPRRVSPGSGPERPSGGTEIRLQTN
+SRPNSPRDPKLVEAGSGSVQSLSLSDSHLAELDGDTLRLFGLGALEALERGWGVQTAGAV
+TVITFRYINFDAIVPTLPRIRVKFPNLSHMIFLETNISRLPQLAALAQVRRLDQLTIHPD
+GNPVVSLTLWRSFVIYRLHHFNLQRINGQEVTMNDVIAAERVFGTLGHIAATETPRCRLL
+LLLEESRKRQLQFLLEGRGRRAGLSPEELRDNGKLLGEGLSRALFNYPSRDCSAESPEEG
+SVESSERATMVEQYLQELVQSASDTNLKGEALHKLWPSMFAEMVRDCVLEMRDRAAFRQA
+SLAKLSETK
+>XP_006779811.1 gi|583968717|ref|XP_006779811.1| PREDICTED: xaa-Pro dipeptidase-like [Neolamprologus brichardi]
+MAAAAQPVYWLGNDTLRVSAALFAENRRRLCQGLKAKDGVVPKSVVVLQGGEQTQRYCTD
+TDVLFRQESFFHWAFGVTEADCYGAIDVDSGKSILFVPKLPESYATWMGEIFPKEHFKEK
+YAVDEVHHTCDIANVLSNLKPAVLLTLRGQNTDSGSTCREASFDGISRFQVNNTLLHPVI
+VDCRVVKTDMELEVLRYTNRVSSEAHKMVMKHVKPGKKEYEMESLFQHYCYTKGGMRHTS
+YTCICGTGNNSSVLHYGHAGAPNDKTITDGDMCLFDMGGEYYCYSSDITCSFPANGKFTP
+DQRAIYEAVLKASRAVMAALRPGVKWTDMHRVADRVHLEELVKIGILHGSVEDMMKVHLG
+SVFMPHGLGHLLGIDVHDVGGYPEGIERIDEPGLKSLRMGRLVQERMVLTVEPGIYFINH
+LLNQALANPAQSCFIDNQVLARFRGFGGVRIEDDIAVTADGIELMTCVPRTVEEIEAFMA
+DSTKPFSPVV
+>XP_006779812.1 gi|583968719|ref|XP_006779812.1| PREDICTED: carbohydrate sulfotransferase 8-like isoform X1 [Neolamprologus brichardi]
+MLWMKWKMVVDSLRGRRRRLPCSLWFVLLFAAGGLVLFIHQQALSEMVQQQGPENVTNKQ
+QLKVTALKTRQSISGVKLGSTPRQSRETLSTRDRERGKSDSFQDLQVTENILSSAIPPMQ
+FPHFEKSRKTASPGSQEQDIGSLHVTKRQRKLLKTSPPIRHTKNTISSSSSSSVSSSSSI
+SSSITSGFFSPESWQKLSGILEARQQLMKEICAKYKSSISKTITRHHVKSIFVEDKYKLL
+YCQVPKAGCSNWKRTLMVLAGKASNTQSIKHDTVHYGQHLKKLDSFDQQGIMHRLQTYTK
+VIFVREPLERMVSAYRDKFENPNNYYHSLFGKPIISKYRVNPSKAALKTGNGVTFKEFVQ
+YLLDVHRPVGMDIHWEQANQLCNPCLIDYDFIGKFENMEEESNFLLRLSGAPPNLTLPSF
+KDRNPSDKRTSMQITENYFSQVSALERQRVYDFYYMDYLMFNYSKPFKDLY
+>XP_006779813.1 gi|583968721|ref|XP_006779813.1| PREDICTED: carbohydrate sulfotransferase 8-like isoform X2 [Neolamprologus brichardi]
+MLWMKWKMVVDSLRGRRRRLPCSLWFVLLFAAGGLVLFIHQQALSEMVQQQGPGVKLGST
+PRQSRETLSTRDRERGKSDSFQDLQVTENILSSAIPPMQFPHFEKSRKTASPGSQEQDIG
+SLHVTKRQRKLLKTSPPIRHTKNTISSSSSSSVSSSSSISSSITSGFFSPESWQKLSGIL
+EARQQLMKEICAKYKSSISKTITRHHVKSIFVEDKYKLLYCQVPKAGCSNWKRTLMVLAG
+KASNTQSIKHDTVHYGQHLKKLDSFDQQGIMHRLQTYTKVIFVREPLERMVSAYRDKFEN
+PNNYYHSLFGKPIISKYRVNPSKAALKTGNGVTFKEFVQYLLDVHRPVGMDIHWEQANQL
+CNPCLIDYDFIGKFENMEEESNFLLRLSGAPPNLTLPSFKDRNPSDKRTSMQITENYFSQ
+VSALERQRVYDFYYMDYLMFNYSKPFKDLY
+>XP_006779814.1 gi|583968723|ref|XP_006779814.1| PREDICTED: BTB/POZ domain-containing protein kctd15-like isoform X1 [Neolamprologus brichardi]
+MFETEGRSMSRLSLTRSPVSPLAAQGIPLPAQLTKANAPVHIDVGGHMYTSSLATLTKYP
+DSRISRLFNGTEPIVLDSLKQHYFIDRDGEIFRYILSFLRTSKLLLPDDFKDFHLLYEEA
+RYYQLTPMIKELERWKQEREQRRMAQPCDCLVVRVTPDLGERIALSGEKVLIEEIFPETG
+DVMCNSVNAGWNQDPTHVIRFPLNGYCRLNSVQVLERLFQKGFSVAASCGGGVDSSQFSE
+YVLCREDRRSLSINTPIRIKQEPLD
+>XP_006779815.1 gi|583968725|ref|XP_006779815.1| PREDICTED: BTB/POZ domain-containing protein kctd15-like isoform X2 [Neolamprologus brichardi]
+MFKEGRSMSRLSLTRSPVSPLAAQGIPLPAQLTKANAPVHIDVGGHMYTSSLATLTKYPD
+SRISRLFNGTEPIVLDSLKQHYFIDRDGEIFRYILSFLRTSKLLLPDDFKDFHLLYEEAR
+YYQLTPMIKELERWKQEREQRRMAQPCDCLVVRVTPDLGERIALSGEKVLIEEIFPETGD
+VMCNSVNAGWNQDPTHVIRFPLNGYCRLNSVQVLERLFQKGFSVAASCGGGVDSSQFSEY
+VLCREDRRSLSINTPIRIKQEPLD
+>XP_006779816.1 gi|583968727|ref|XP_006779816.1| PREDICTED: transcription initiation factor TFIID subunit 4-like isoform X1 [Neolamprologus brichardi]
+MAGASDPLEDMLFSEVDEKAVSDLVGSLESQLAGQSNPAGKADENGGAGSVAPANHHLGK
+TLPAPVSTTTLEQQQQQQGRRNKTEMRQEINSKDVSPDKTVTSPSPGCSPSFGEPSTTSG
+ACVSATSSGSQSHGASITTLTASGVSTLASLPPASISTTISSQGSKVTVGTGETSTGATP
+PRKRITTPRRSASARIKSLNGAAVTTRRNSNTAVVDSVSQVDTSASTPNSGRPVTTSINT
+STFTLSNASLPVGQSAIALDRGTPTIALHRLPSHIVASIAQNGNGTSVSALVQQGARIGP
+VTSLASPGNQTKMVTDTGASKTDDCQSKIVMLTQSSVVNSVVNTVSTSSPPLPPPPPSST
+SSSIVTPPTTTTAAATTTITITQPLNSITPAACVTGMATSSVCGAGQTTSVTTTITMVRP
+TAPSPTPAVATSAQSQPRPGLTAPQRIVTPQLIVRPPQQQTTIQLPPGFTIPQGMVLVRT
+ELGQLVMVPQQALAQAQAQAQAQAQAQAQNNISPRPATPTTGTSFRVTSPQQSPVTSQTS
+RQCPLTPAKMAPSPSPTPSSPALQTSSSSSSSSSSSCPALRPKGPVAPVVAVTAPQQTPV
+VLPPQAPAQPAPQPVQPAQPGIATASGGSVASQEMQENVKKCKNFLATLIKLASHNSPSP
+ETSKNVKALVQDLLDAKIEPEEFTSRLQTELKSSPQPYLVPFLKKSLPALRLSLLNSQQS
+LTQPPQQGLKPAPCGTPPAIVAGPAVRIRHPNSVSTTTGASALPAGTLGHAAAMGVKTGG
+AVGGQVRMPVVITQSIRAQGTMGKGAIIQAGKSPMGLPVQITGNQKNKLNDPGGGTFRDD
+DDINDVASMAGVNLNEESARILATNSDLVGTQIRSCKDEAFLHPGLLHRRIQETAKKFGI
+TEVPMETVTFISHATQSRLRTVVEKVSTIAQHRLDSCKDDECYEQSADVRSQLRFFEQLE
+RIEKQRKDEQEREILLKAAKSRSRQEDPEQARLKQKAKEMQQQELAQMRQRDANLTALAA
+IGPRKKRKVDSPGATPSGTEVSGSTAGSPASSSAPSTSSRQYTRQRITRVNLRDLIFYME
+QERETAHSLLLYRALLK
+>XP_006779817.1 gi|583968729|ref|XP_006779817.1| PREDICTED: transcription initiation factor TFIID subunit 4-like isoform X2 [Neolamprologus brichardi]
+MAGASDPLEDMLFSEVDEKAVSDLVGSLESQLAGQSNPAGKADENGGAGSVAPANHHLGK
+TLPAPVSTTTLEQQQQQQGRRNKTEMRQEINSKDVSPDKTVTSPSPGCSPSFGEPSTTSG
+ACVSATSSGSQSHGASITTLTASGVSTLASLPPASISTTISSQGSKVTVGTGETSTGATP
+PRKRITTPRRSASARIKSLNGAAVTTRRNSNTAVVDSVSQVDTSASTPNSGRPVTTSINT
+STFTLSNASLPVGQSAIALDRGTPTIALHRLPSHIVASIAQNGNGTSVSALVQQGARIGP
+VTSLASPGNQTKMVTDTGASKTDDCQSKIVMLTQSSVVNSVVNTVSTSSPPLPPPPPSST
+SSSIVTPPTTTTAAATTTITITQPLNSITPAACVTGMATSSVCGAGQTTSVTTTITMVRP
+TAPSPTPAVATSAQSQPRPGLTAPQRIVTPQLIVRPPQQQTTIQLPPGFTIPQGMVLVRT
+ELGQLVMVPQQALAQAQAQAQAQAQAQAQNNISPRPATPTTGTSFRVTSPQKGPVAPVVA
+VTAPQQTPVVLPPQAPAQPAPQPVQPAQPGIATASGGSVASQEMQENVKKCKNFLATLIK
+LASHNSPSPETSKNVKALVQDLLDAKIEPEEFTSRLQTELKSSPQPYLVPFLKKSLPALR
+LSLLNSQQSLTQPPQQGLKPAPCGTPPAIVAGPAVRIRHPNSVSTTTGASALPAGTLGHA
+AAMGVKTGGAVGGQVRMPVVITQSIRAQGTMGKGAIIQAGKSPMGLPVQITGNQKNKLND
+PGGGTFRDDDDINDVASMAGVNLNEESARILATNSDLVGTQIRSCKDEAFLHPGLLHRRI
+QETAKKFGITEVPMETVTFISHATQSRLRTVVEKVSTIAQHRLDSCKDDECYEQSADVRS
+QLRFFEQLERIEKQRKDEQEREILLKAAKSRSRQEDPEQARLKQKAKEMQQQELAQMRQR
+DANLTALAAIGPRKKRKVDSPGATPSGTEVSGSTAGSPASSSAPSTSSRQYTRQRITRVN
+LRDLIFYMEQERETAHSLLLYRALLK
+>XP_006779818.1 gi|583968731|ref|XP_006779818.1| PREDICTED: protein LSM14 homolog A-like [Neolamprologus brichardi]
+MSGGGTPYLGSKISLISKAEIRYEGILYTIDTENSTVALAKVRSFGTEDRPTDRPIPPRD
+EVFEYIIFRGSDIKDLTVCEPPKATSALPQDPAIVQSSIGSSSAAAPPSFQAPGSYAPFS
+RAPAPSYSQFGVATIGSQQFGSTGAVGRTSPQLDSRRKSPTLEQAVQAPPSSAQAPPAPV
+GQRSQTGAAASRTTTTGIQKPPDLLEQRKVPEVPKVAQPDNEQGAVENRDPNKRQGAGVQ
+SSNRRGRGRGNRSRGKVNVRRDGTVKFDEDFDFETANAQFHKDEIDKELQNKLKLKDDKT
+EKALNGEESEHPANEGAAEEEEAVINTCYYDKSKSFFDNLSCDDTRDRRPTWAEERRMNA
+ETFGLPLRHNRGRGGFRGRGFMGPRGGRGRPVSRGSFGPPRGAPPGFRGGFRGGRGGRDF
+SDFEYRKENKVAA
+>XP_006779819.1 gi|583968733|ref|XP_006779819.1| PREDICTED: SS18-like protein 2-like [Neolamprologus brichardi]
+MSIVFVPKKLRGKATVNQETIQRLLDENDQLIRCITEYMQKGRAVECVQYQQILHRNIVY
+LATIADASPDSAASTSNCTSNDTSASAAAVNGHTEGS
+>XP_006779820.1 gi|583968735|ref|XP_006779820.1| PREDICTED: uncharacterized protein KIAA0355-like [Neolamprologus brichardi]
+MYCCSAQESKMDYKRRFLLGGSKQKVQQHQQYQMPELSRTLSASLASSCSASSPMGTGVG
+MSGSCHPPPSGTSTAVADIQQGISKYLDALNVFCRASAFLTDLFSSVFRNSHYSKAAMQL
+KDVQEHVMEAASRLTAAIKPEIAKMLMELSAGAANFKDQNDFSLQDVEVLGRCFLTVMQV
+HFQFLSQALQKVQPVAQSCLAEALAQAQERCANARSQSSDLGPLTELEEASRSWKGAAEA
+TARLRERGRDGCLAGIQVQQLFCSNNTTIPEHQLKELNMKIDSALQAYKAALESLGHSEY
+ALKAGFHLNPKAVEAALQGCCSEAEAQQAGRMQTTSQPIQCELPTIPVQIGSHFLKGVSF
+NESAAENLKLKTHTMLQLIKEALGQNGVTPRDDSPVTEVLNQVCPSSWRGACKTAVQLLF
+AQAGLVVVDTAQIENKEAYAPQITLEGSKVVVQVPSTWCLKEDPATMSLLQRSLDPEKTL
+GLVDVLYTAVFDINRWKERKEQALPTIQIQLQRESPDYGIPTDLPPGTSSKTSSGLPKTI
+SKLTSKFTKKVSSSSNSGGSFSIPSTPSRSMLTTSNSEDKAKGLGHSDGRLQSILQMGSL
+PCTSDSTQQNQLANGSVSEDQGMNLPTDQEMQDVIDFLSGFNMGKSQQASPLVKRRNSVA
+SANPAELKPPSGPSQATSSISHSALQPPAQTLPQPQPQPQPSQPVQKQQPQPNPQPPPPQ
+QQQPQQQQQPPPPPPQQPSPQAQHLYYQHLLQPITQQQAPPPQLPPQQTPPQVLPQQRVA
+SKWLGTSGQQPPPQGPPAGLSPLGPIGQWASSGLPDLSSDLYSLGLVSTYMDSVVSEMLG
+QKPQGPRNNTWPNRDQSEGVFGVLGDTLPFDPAVGSDPEFARYVAGVSQAMQQKRQVQHI
+RRPSNTRSNWPMPDEQHRTWSHPEYFNEGDAVNSGWSANQGDSASSSDETSSANGDSLFS
+MFSGPDLVAAVKQRRKHSCGEPEVCTLPSPPLHHIGDDSQDSKTKTWPPKAPWQHSTHTN
+TMPNPSSSLYQMNIPPSSQWGDSMPMLQSPVWSTASDCPPSTGISSGFPFTQQQQQQQQQ
+QHKPMTKGFKSFPVKHEHRPSYLHQY
+>XP_006779821.1 gi|583968737|ref|XP_006779821.1| PREDICTED: glucose-6-phosphate isomerase-like [Neolamprologus brichardi]
+MGLTQDPNFQKLQEWYTAHALGLNMRHMFEADKERFNKLSLTLKTEDGDILLDYSKNLIT
+EDVMKMLVDLAKSRGIEAAREKMFTGEKINFTEGRAVLHVALRNRSNTPIMVDGKDVMPD
+VNKVLEKMKGFCHKVRSGEWKGYTGKAITDVVNVGIGGSDLGPLMVTEALKPYSKDGPRV
+WFVSNIDGTHIAKTLAQLNPETTLFIIASKTFTTQETITNAESAKAWFLEHAKDKAAVAK
+HFVALSTNGPKVKDFGIDTENMFEFWDWVGGRFSLWSAIGMAIALHIGFDNFEKLLSGAH
+WMDKHFRTAPLDKNAPILLALLGIWYINFFHAETQAMLPYDQYMHRFTAYFQQGDMESNG
+KYITNHGTRVNYHTGPIVWGEPGTNGQHAFYQLIHQGTRMVPCDFLIPAQSQHPIRDNLH
+HKVSLMLERYLSKXXALMKGKTTEEAKKELEASGLSGEALEKILPHKVRRIKRNDLIKDN
+EPAALLMARNSNKLKPKLKRRAPCRVAFTKRDSPSKNSVNRC
+>XP_006779822.1 gi|583968739|ref|XP_006779822.1| PREDICTED: Wilms tumor protein 1-interacting protein homolog [Neolamprologus brichardi]
+MEHYQEDLGLRATKLMEDLSLYDAYQDGMYDARRDLVINPDLDFSAPALVEHKAKPMNGT
+SVLHQQHHTVENFSSGNKVYNAAPVRPVNCNRTVPVDFCAPQRDAVYNEDGCCTKSEVAL
+PCYTGTSERHRRYSLEVQGHRYSTGSTFDGVPLNKPVAVPGNRCNSVCIASSHDGRYNAT
+SPRSSLASSLSSQEQSKHASPRSSISSPRTSLVVPGQERYTSPRSSLVHCEGNSVLSPRS
+SYASTASDTSKHSSPRASLNSCDCCSKPNSNRTSGISMGYDQRHTSPRSSTASQYSFTTS
+PRSSYSDSRYGPVVNQDLEGVLHSAPLASPRSSICSQDGSARPGASANCVVSPRSSISSH
+SSRSSRSSRGSMSTYPDLQLPSPRSSMLGTSLHEDTLLQEFGDSNGVQNRIHLQGLSAVP
+EPQQQSGQTGGTADIPSGSPSSYSYVMPSKTASSGQRFKLPYQVTPSRESGPSQAEKRLE
+ALTLELEKELEMHMKKEYFGICVKCGKGVYGASQACQAMGNLYHTNCFTCCSCGRRLRGK
+AFYNVNGKVYCEEDFLYSGFQQTAEKCFVCGHLIMEMILQALGKSYHPGCFRCVVCKEGL
+DGVPFTVDVENNIYCVKDYHTVFAPKCASCNQPILPAQGSEETIRVVSMDKDYHVECYHC
+EDCGLQLNDEERHRCYPLEGHLLCHDCHILRLQSQVPAHAPPSYPLHVTEL
+>XP_006779823.1 gi|583968741|ref|XP_006779823.1| PREDICTED: short-chain dehydrogenase/reductase family 42E member 1-like isoform X1 [Neolamprologus brichardi]
+MGTASKETFLITGGSGYFGNRLALSLLKKGAKVILFDIIPPSQELPEDVVFVQGDIREYP
+DVEKAVTGVDCVFHIASYGMSGREQLNRQLIEAVNVQGTQNILKACVEHGVSRLIYTSTF
+NVVFGGQVIENGDESLPYLPLHLHPDHYSRTKSLADMAVLKANGTVLKGCSGLLSTCALR
+PAGIYGPGEQRHLPRIVDYIEKGIFRFVYGKPSSLVEFVHVDNLVSAHVLAAEALTPEKQ
+HRAAGQAYFISDGRPVNNFEFFRPLVEGLGYRFPTLRLPISLIYFFAFLTEMIHCLIGPF
+YNFQPLLTRTEVYKTGVTHYFSMAKAKAELGYEPREYNLDEVVQWFRSRGHGKKCHRSFL
+SRLLLNVLFVSALVAVSLSFLPVVGS
+>XP_006779824.1 gi|583968743|ref|XP_006779824.1| PREDICTED: short-chain dehydrogenase/reductase family 42E member 1-like isoform X2 [Neolamprologus brichardi]
+MGTASKETFLITGGSGYFGNRLALSLLKKGAKVILFDIIPPSQELPEDVVFVQGDIREYP
+DVEKAVTGVDCVFHIASYGMSGREQLNRQLIEAVNVQGTQNILKACVEHGVSRLIYTSTF
+NVVFGGQVIENGDESLPYLPLHLHPDHYSRTKSLADMAVLKANGTVLKGCSGLLSTCALR
+PAGIYGPGEQRHLPRIVDYIEKGIFRFVYGKPSSLVEFVHVDNLVSAHVLAAEALTPEKQ
+HRAAGQAYFISDGRPVNNFEFFRPLVEGLGYRFPTLRLPISLIYFFAFLTEMIHCLIGPF
+YNFQPLLTRTEVYKTGVTHYFSMAKAKAELGYEPREYNLDEVVQWFRSRGHGKKCHRSFL
+SRLLLNVLFVSALVAVSLSFLPVVGS
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/sample1.fasta	Mon Sep 21 15:40:14 2020 +0000
@@ -0,0 +1,11 @@
+>ID1
+MSNSEASSTCPIPSRSIHEKSWSPLPDSYSQTPGGTVFSTTPGGTRIIYDRKFLLECRNS
+PIARTPPCCLPDIPGVTRPSLQIIEQEEDSKDLSIDDSQFVIDI
+>ID2
+MADVVLGVGTGVFIITLIWILTLALTIILSRATGPTKLGIIPVVLLALIITLVLVFFPRA
+AEVPAPQRAAQIVDMFFIGRYVLLSLVSLVFLAALFMLLPLHFLEPIYAKPLRTH
+>ID3
+MAVDNFLFGQCILYFLAFLFGFIAVVPLSENGDDFQGKCLLFTEGIWQNENMTMGKQRFI
+VEEWGPESSCRFITFVGIVSLILSAVQAWRTFFFLCKGHDDSLFHSFLNLLLSLLVLFVV
+FVAGTISSVGFSIWCDSVTENGAMPSSCEDLQDTDLELGVENSSFYDQFAIAQFGLWSAW
+LCWLGLTVLAFLKVYHNHRQQELLESLVQEKELLLGHPLQRSSYVYNRNAMI
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/sample2.fasta	Mon Sep 21 15:40:14 2020 +0000
@@ -0,0 +1,1005 @@
+>NP_001007355.1 gi|55925472|ref|NP_001007355.1| eukaryotic translation initiation factor 4E-binding protein 3 [Danio rerio]
+MSNSEASSTCPIPSRSIHEKSWSPLPDSYSQTPGGTVFSTTPGGTRIIYDRKFLLECRNS
+PIARTPPCCLPDIPGVTRPSLQIIEQEEDSKDLSIDDSQFVIDI
+>NP_956692.1 gi|41055339|ref|NP_956692.1| transmembrane protein 218 [Danio rerio]
+MADVVLGVGTGVFIITLIWILTLALTIILSRATGPTKLGIIPVVLLALIITLVLVFFPRA
+AEVPAPQRAAQIVDMFFIGRYVLLSLVSLVFLAALFMLLPLHFLEPIYAKPLRTH
+>NP_001003767.1 gi|57524633|ref|NP_001003767.1| transmembrane protein 179 [Danio rerio]
+MAVDNFLFGQCILYFLAFLFGFIAVVPLSENGDDFQGKCLLFTEGIWQNENMTMGKQRFI
+VEEWGPESSCRFITFVGIVSLILSAVQAWRTFFFLCKGHDDSLFHSFLNLLLSLLVLFVV
+FVAGTISSVGFSIWCDSVTENGAMPSSCEDLQDTDLELGVENSSFYDQFAIAQFGLWSAW
+LCWLGLTVLAFLKVYHNHRQQELLESLVQEKELLLGHPLQRSSYVYNRNAMI
+>NP_001002700.1 gi|50540464|ref|NP_001002700.1| fatty-acid amide hydrolase 2-A [Danio rerio]
+MALTRFERFLGRLLRAVVWILFAAFKLFAPQQRHGVSRLPPITNPLLLLSAMQLARKIRR
+KEVTSVEVVQAYIDRIQEVNPLINAMVKDRFSAALQEAAQVDKLIEEETGGEDVLEDRLP
+LLGVPITVKEAFALQGMPNSTGLLTRRDLVSGADAPSVALLKRAGAIPLGVTNCSELCMW
+LESHNHLYGITNNPYDFERIVGGSSGGEGSILGAGSSVIGIGSDIGGSIRIPCFFNGIFG
+HKPSVGIVNNEGQYPPASGQQMGFLCTGPMCRYAEDLIPMLSIMGGPNAEKLSLFTEVDL
+KKLRFFSVPHNGGSHLVSPVEPQLLHAQKMVVKRLEADLGVKVQELLIPQLKYSFQIWGT
+MMASPGKDGKPPTTFAELMSEGGKKVWPAWELFKWFLGFSSHTLAAIGLALVELFQSSHP
+SPFIMQQKESLQQELEELLGTDGVLLYPSHPLIAQKHHHPIFTPFNFSYTGIFNILGLPV
+TQCPLGLSAEGLPLGVQIVAGKLQDRLSLATALYLEKAFGGWREPGKTTIKP
+>NP_001003555.1 gi|57525887|ref|NP_001003555.1| centromere protein P [Danio rerio]
+MEQKYEEDIQKLQQEIEMLEAEQEETLRSIFVQHGDRLQQGVKSACEERGGGGAQQHTLS
+KLITEVRELEKDLRRQTEINGITLNECFVKTLHKSERKLIQQLRLAGHCGLLLFQVEFAV
+TEIQEDNVLHRRVTELNIVVDGVEFKDFSAFVSRVEDTKDLLLFFRTLRTFSERCEDRRQ
+TFQHFQEKYPDVVNLPEGCRSEIMIIRSPQLPGISMTLFWKIHVSKEGVVKPLLDLLLKM
+PDQALELDTKKVMEKASDYFQSLLQLLGVEASIEGLIRTVCS
+>NP_997599.1 gi|47058959|ref|NP_997599.1| protein dispatched homolog 2 [Danio rerio]
+MESGSISRQREDAEMPDSSTTEGPSLEAPQSEIPEVSLCPPDSDSTESQMCPVEIEENQT
+KSSSPFNSHSSTQLERQVSQGSAYHSPPHKKCPCCGHQQPSQSDVCPGQMNALHQADCAA
+SPVKTLYSCSPSRLPSCHTKMQCHWLHGSHDGSNHKPVQHHMVTVRNDGLHRIPRSYSQV
+IVEYPMTVLISCTLVLFACSLAGILTGPLPDFSDPLLGFEPRGTDISVRLATWTRLKQNT
+GPGKPLSPVPWQLTEKTTTGKDTIKSEPQFRERSRRMLHRDNAEHNFFCNAPGERYAQLV
+FRSGNSASLWSLKAIYSMCQMEQTQIRSGPQFDKLCQVKSEFYGSMVKNECCPSWSLGNY
+LAVLNNISSCFSLTSQQVSESLGLLRFCAPYYHDGSLIASCTERSKFGRCASVPHRCKLS
+SIFQILHYLVDKDFLGPQTVEYKVPSLKYSIVFLPVEKSDSLMNIYLDHLEGHKLTYNNT
+TITGMDLGIKQKLFKYYLARDSIYPVLAALALLITIGLYLKSLFIAAMSLVAVILSLSTS
+YFFYKVAFRLTFFPLLNLAAVFVLLGSCLNQALTFVDFWKLQLSHNPPAVPEKRMNRVLQ
+EMGYLIIVSGLTSSVTFYSGYISSITAVRCYAVYLGSASLINTLFALVWLPCTLILQERY
+AVLSSNTVGKVAWKPCCSKNAGGFWETSSRKRCLFTFRQKLRTLGRGFSDTSNLLFLKIL
+PCGVVKFRYIWICWFAVLAAGGTYISCVDPGMKLPTSDSRTTQLFRSSHPFERYDAEYRH
+QFMFERMKDGEDEPMMLTLIWGIVPSDNGDHFDPKSNGSLSVDPGFNMSSLQAQIWLRDL
+CGKIQNQTFYSPLSAEQDTAEDNVCFVEHLIHWVSIRRCSESEDAFSFCCNNIPFPYPPR
+VFEQCLSMMVAEQHAEGRLPSAGGLRFDSEGRIAALVVIFKTVQLYSFNYNRMSQFYQEI
+LSWFNREISKAPAGLQRGWFVSQLGLYDLQQCLSSETLEVAGFSVALTFALLLLTTWNIP
+LSVYVSIAVAGSVFATVGLLVLLEWQLNGVEALFISAAAGLSVDFVANYCISYSLAPHSD
+RLGRVAHSIKRMGCPVATGAGAYFCVGIIMLPATALLFRKLGIFLLLVKCVACGFATFFF
+QSLCCFFGPQNNCGRITLPCVTQQSTENILSSCSATEPGTNNPAANGAFGCGKGSRVRRS
+FNKENEGFLCPNQQHHRKRQPVGGREPEQNELQPLACQLSDSFENSTCTSKLSNRPSVLS
+DDIQFCGLSPKQDYDRVSIEADSTEMCSRHLKGCNPPPALQTSSPYKENMLRLPQDACKE
+KVLCKKCRGQSRGGLQLWNVSLSSSSSMDEIMITQTTDTVNERSLSMDDHIHKRLLSCQS
+QSSIEGLEESNDTCLTEVEAAIPQAGKIEDEFQPGHLNGKRDTLRLSLKETVYDLASPGS
+GRVRTAQSDVPVILPNSKPDMPDVWIKREGKGEGGS
+>NP_001013313.1 gi|61651744|ref|NP_001013313.1| coiled-coil domain-containing protein 115 [Danio rerio]
+MRVDENLRLDEQLLLFMEQLEALEEKRQRLNSLIEEGWFSIAKARYSMGNKQVSALQYAS
+EMQPLAHVETSLLEGGTAEFKCERSENKAEEQKTKTIEDIGAKETGLRRRVHTKQKEVKE
+GEQDTDEVKTKTDSPTPEHRNPLKWFGILVPQNLKQAQSAFKEVITLSVEIASLQSTILA
+TRKEMQVQMKEKQERTEKAQLEVKEE
+>NP_991238.1 gi|45387769|ref|NP_991238.1| pituitary homeobox 3 [Danio rerio]
+MDFNLLTDSEARSPALSLSDSGTPQHDPGCKGQDNSDTEKSHQNHTDESNPEDGSLKKKQ
+RRQRTHFTSQQLQELEATFQRNRYPDMSTREEIAVWTNLTEARVRVWFKNRRAKWRKRER
+NQQAELCKNGFGAQFNGLMQPYDDMYSGYSYNNWATKSLASSPLSAKSFPFFNSMNVSPL
+SSQPMFSPPSSIPSMNMASSMVPSAVAGVPGSGLNNLGNLNNLNSPTLNSAAVSAAACPY
+ATTAGPYMYRDTCNSSLASLRLKAKQHANFAYPAVQNPVSNLSPCQYAVDRPV
+>NP_001244093.1 gi|380503827|ref|NP_001244093.1| blood vessel epicardial substance isoform 2 [Danio rerio]
+MSNTTSALPSSVPAVSLDPNATLCQDWEQSHHLLFHLANLSLGLGFLIPTTLALHMIFLR
+LLLMTGCSLFIAWATLYRCTLDVMVWNVVFLLVNFMHFFFLLYKRRPIKIDRELKSVYKR
+MFEPLHVREALFQRLTGQFCTIQTLKKGQVYAAEDKTSVDERLSILLKGKMKVSYRGHFL
+HNIYTNAFIDSPEFRSTQMNRGERFQVTIAAEENCKLLCWSRERLTYFLESESFLNEVFR
+YLIGKDITNKLYSLNDPTLSDKAVKKMDRQPSLCSQLSMMQMRNSMASTSDTDDVLNQIL
+RGGSTGSSLQKNPLTKTSTTMKPIEEGLEDDVFESESPTTSQNVSKTTKKDI
+>NP_001013309.2 gi|157042782|ref|NP_001013309.2| tRNA 2'-phosphotransferase 1 [Danio rerio]
+MDCETRGRGRRGRGNRNEESRDVRLSKSLSYVLRHGASKMGLQMNSDGFVFVEELLAHQQ
+FRSFSVDDVERVVASNDKQRFKLCKHPEDDRLQIRANQGHSVQVTDLELREISQDDQDYP
+REAVHGSYMKHWPSIRSQGLSRMNRTHIHLAPGLPGEGRVISGMRQSCDLAVYIDVTKAM
+SDGIKFFWSENGVLLTPGDAAGILAPCYFSRAQRLKPLPCDIELH
+>NP_001001847.2 gi|380503821|ref|NP_001001847.2| blood vessel epicardial substance isoform 1 [Danio rerio]
+MSNTTSALPSSVPAVSLDPNATLCQDWEQSHHLLFHLANLSLGLGFLIPTTLALHMIFLR
+LLLMTGCSLFIAWATLYRCTLDVMVWNVVFLLVNFMHFFFLLYKRRPIKIDRELKSVYKR
+MFEPLHVREALFQRLTGQFCTIQTLKKGQVYAAEDKTSVDERLSILLKGKMKVSYRGHFL
+HNIYTNAFIDSPEFRSTQMNRGERFQVTIAAEENCKLLCWSRERLTYFLESESFLNEVFR
+YLIGKDITNKLYSLNDPTLSDKAVKKMDRQPSLCSQLSMMQMRNSMASTSDTDDVLNQIL
+RGGSTGSSLPVTSDRA
+>NP_001015061.1 gi|62632729|ref|NP_001015061.1| putative all-trans-retinol 13,14-reductase precursor [Danio rerio]
+MWFAVVAIFLALVAFLYRYVVGSGPNPFAIDTREPLKPMVFDRKLKNKVLKQGFLASRVP
+EDLDAVVVGSGIGGLAIAVLLAKVGKKVLVLEQHDRAGGCCHTFKEQGFEFDVGIHYIGE
+LSNHKPLRCIIDQMTNGQLQWDPLENPFDNVVIGPPENRRIYQIYSGRKRYMDELKKCFP
+GEEKAIDEYVRLCKEVGQGVWVMVLLKFLPTPIANFLVRTGLANRLTSFSRYASRSLTDV
+VNELTQNKDLRAVLSYIFGTYGKIPKEASFSMHSLIVNHYMNGAWYPKGGATEIAYHMIP
+IIEKAGGAVLVRAPVNRILLNDAKEAIGVSVLKGQEEVHVRAPIVISDAGIFNTYEYLLP
+KDVQTMPAIQKQLSMLQHGDSGLSIFIGLDGTKEELGLKADNYFIYPENNIDELLEDYRS
+GNREESAKKNPLIFVASPSAKDSTWPERTPGKSTLTVVSFANYEWFEEWKDDKVKNRSTD
+YKQLKELFINYILEAVTEIYPKIKDRIEYVDAGTPITNQHYIAAPRGEIYGADHGIPRFS
+AELNATIRAQTPIKNLYLTGQDLMLCGFAGALTGALTCGSVILNRNLHLEAFSLAKRVQN
+GNNKKKT
+>NP_001003580.1 gi|57525791|ref|NP_001003580.1| kelch-like protein 15 [Danio rerio]
+MSGDVEVYLSQVHDGSVSSGFRALYEERLLLDVTLLIEEHHFQAHKALLATQSDYFRVMF
+TADMRERDQDKIHMKGLTAAGFGHVLRFMYYGSLELSMLTVQEILQAAMYVQLTEAVEFC
+CSFLLAKICLENCAEVMRLLEDFSVGVEGVQEQLDAFLLENFVPLMARPDFLSYLSLEKL
+MAYLDSDQLSRYPEIELYEAVQAWLRHDRRRWRHTDAVVQNLRFCLMTPANIFEKVKTSE
+FYRYSRQLRLEVDQALSYFHQVNEQPLAETKSNRIRSVRPQTAVFRGMIGHSMVNSKILL
+LHRPKVWWELEGPQVPLRPDCLAIVNNFAFLLGGEELGPDGEFHASSKVYRYDPRQNSWL
+RMADMSVPRSEFAVGVIGKYIYAVAGRTRDETFYSTERYDIVEDKWEFVDPYPVNKYGHE
+GTVLNGKLYITGGITSSSTSKQVCVFDPGREGSSEHRTRRTPILTNCWENKSKMNYARCF
+HKMISHNGKLYVFGGVCVILRASFESQGCPSTEVYDPETDEWTILASMPIGRSGHGVAVL
+DKQIMVLGGLCYNGHYSDSILTFDPEENKWKEDEYPRMPCKLDGLQVCSLHFPEYVLEHV
+RRCS
+>XP_006779743.1 gi|583968567|ref|XP_006779743.1| PREDICTED: CCAAT/enhancer-binding protein alpha-like [Neolamprologus brichardi]
+MELSNLYEVAPRPLMNNLNQQPPSGYRDPADLGGEIGDNETSIDLSAYIDPSAFNDDFLA
+DLFHHSSRQDKLKMMNGEYDPVSCGPGPQQLYMSNYMESKMEPLYEHNPPRLRPVAIKQE
+PRDDEDMNPGMPPTYHHPHPHPHPQQYSQQQQMPHLQYQIAHCAQTTMHLQPGHPTPPPT
+PVPSPHQHQHSHPHSHQGGMKLLEQQRGCGKTKKHVDKNSPEYRLRRERNNVAVRKSRDK
+AKMRNMETQHKVVELTADNDRLRRRVEHLTRELDTLRGIFRQLPDGSFKPMGS
+>XP_006779744.1 gi|583968570|ref|XP_006779744.1| PREDICTED: ras-related protein Rab-8B-like, partial [Neolamprologus brichardi]
+SLSGIDFKIRTIELDGKKIKLQIWDTAGQERFRTITTAYYRGAMGIMLVYDITNEKSFDN
+IKNWIRNIEEHASADVEKMVLGNKCDMNDKRQVSKERGEKLAIDYGIKFLETSAKSSINV
+EEGFYTLARDIMARLNRKMNDNNPSGGGGPVKITEPRSKKSLFRCSLL
+>XP_006779746.1 gi|583968574|ref|XP_006779746.1| PREDICTED: calcium and integrin-binding family member 2-like [Neolamprologus brichardi]
+MGNKQTTFTEEQLEAYQDCTFFTRKEILRLHARYRELAPHLVPLDYTNNPDIKVPMTLIV
+TMPELKVQFYRYRIVQVLWQLSTESSRWGSGPDFNRDNFICKEDLEKTLNKLTKGELMPE
+EVTLVCDKAIEEADLDGDHKLSFADFENMISKAPDFLSNFHIRI
+>XP_006779747.1 gi|583968576|ref|XP_006779747.1| PREDICTED: corticosteroid 11-beta-dehydrogenase isozyme 2-like [Neolamprologus brichardi]
+MEDYTLPFWIYLVIVTVFIGGAMKKILASHLNTTSTVVAWLGATVLVERLWAFCLPAMLL
+LVLFGITFCIYYATKTSQPRAMLPAHGKAVIITGCDSGFGNATAKHLDSLGFEVFATVLD
+LNGDGAKELQRTCSHRLTLLQVDITQPQQVQQALLDTKAKLGLKGLWALVNNAGVCVNFG
+EVELSLMSNYRGCMEVNFFGTLSITKAFLPLLRQTKGRIVTISSPAGDQPFPCLAAYGAS
+KAALNLITETLRHELEPWGVQVSTILPSSYRTAQSTNSAYWEKQHKHLLQNLSPALLEDY
+GEEYMTETKDLFQTFAKHTTTNLQPVVDTIVQALLAPQPQPRYFAGAGLSLMYFLYAYFP
+YSMSNNFLKKKFLKKNVIPRALRKQSAFDLNLSLHNNNNEEKLQQM
+>XP_006779748.1 gi|583968578|ref|XP_006779748.1| PREDICTED: transient receptor potential cation channel subfamily M member 1-like [Neolamprologus brichardi]
+MYIRVSFDSKPDSLLHLMVKDWQLELPTLLISVHGGLQNFDLPPKLKQVFGKGLIKAAVT
+TGAWIFTGGVSTGVIRHVGDALKDHSSKSRGKVCAIGIAPWGIVENKEDLIGRDVTRPYQ
+TMSNPLSKLSVLNSSHSHYILADNGTCGKYGAEVRLRRQLEKHISLQKINTRLGQGVPVV
+CLIVEGGPNVISITLESLKEEPPVPVVVCDGSGRASDILSFAHRYCEEDG
+>XP_006779749.1 gi|583968580|ref|XP_006779749.1| PREDICTED: chymotrypsin B-like [Neolamprologus brichardi]
+MAFLWIVSCLAFVGAAYGCGTPAIPPRVTGYARIVNGEEAVPHSWPWQVSLQQTNGFHFC
+GGSLISEQWVVTAAHCNVRTYHNVIVGEHNKGYGSTENIQVLKPAKVFTHPSWNPQTINN
+DITLIKLASPARLGTNVSPVCLADTTDSFAAGMKCVTTGWGLTRYNAPSTPNNLQQAALP
+LLSNEECKKHWGSNISDVMICAGGAGATSCMGDSGGPLVCQKDNVWTLVGIVSWGSSRCS
+TSTPAVYARVTKLRGWVDQILASN
+>XP_006779750.1 gi|583968582|ref|XP_006779750.1| PREDICTED: agouti-related protein-like [Neolamprologus brichardi]
+MFGTVLLCCWSFGLLPLASSLVHGNLPLDEGPVAGRRTETFLSEIERSQVPDRMHEPALL
+PVDSVEDHFLMDTGSYDEDTSAALQLQGRAMRSPRRCIPHQQSCLGYPLPCCDPCDTCYC
+RFFNAICYCRRVGHVCPPRRT
+>XP_006779751.1 gi|583968584|ref|XP_006779751.1| PREDICTED: EMILIN-1-like [Neolamprologus brichardi]
+MAALPLLLLLVLWTCGNAKGAFPLRQSYNLYTNGHAHGARAASRHRNWCAFVVTKTVSCV
+VEDGVETYVKPDYHPCSWGSGQCSRVVVYRTYMRPRYKVAYKMVTEMDWKCCHGYSGADC
+NIGPVGGGGTQISTTRPQPGQGGGTTSGQGGGGHSYGGGSSGSGQSGGNADNEKMRQLEE
+KIRSLTKNLQDLQSTMSTMNERLQEEGGRNGFGERSSGGRNPADAAQPEIKETIHSIQTK
+LDQLDNRTQAHDKTLVSINNHLVNGKGNELEGGASGGSLSEGRLNSLKEEILSKLERRVS
+LSCSSCQAGVEDLRKQQQQDRERIRALEKQMNAMDVQYRQSLDGLRRDVVRSQGCCDIIS
+DLQDRVTDAERKISTASENFDILQNRLDREISGQGGTSENTGSRGQGLPVGGETGGHGRD
+AMITEEHLNNRLKDLERRVNSTMQKTEESCSYLENHVKDYFHRELDELRSVFLERFDDQA
+DRITDVELDVEQVKDSISDHDKRLSKLENTTSQMSWRLEKCGCVASEQGGGGEGRGRGDG
+GYGGGSWGAGGGGSTGEGKDGGNRGDGGGTWGAGGGGGGSTGGGGRWGGTGGGLPGTGGE
+KDNSTKKSLEWRVVANEDQIRHFNTQLKDLSMSGDSLYDKVLDLTDDVGKIKALTGDHGE
+HFNRIVTVVEMLGEDCELCGKVEKELQKMRNYSQNALSNIQNHINRIQNRMDSEGDSCFQ
+MCSVLQSEVSVLRDDVRRCTNQCKSNPDMTTGVDHARPGGTDDNSGPLDPAKPLDGHSVI
+EGINNNHLKTLQGELSNVILTFSSINDTLKGLEHTVQKHDSVITDLGNTKDKIISEIDKV
+QQELTEHIEDNRNRLDKMDRDIRRFESTVLEMGDCKRSGDGLEKRLSKLEGVCGRLDGVS
+DSILKIKEGLNKHVSSLWTCVSGLNDTVIRHGGLLDFIQDGQDDIHSRVKNLNSSLNQVS
+RDLQSFSEHDLTGPPGPQGPQGHPGERGFNGPPGLPGPPGFPGPRGEIGPHGPKGETGLP
+GADAQIPKLSFSAALTAPMDRAGTIVFDKVFVNEGNFYNPRTGIFTAPVDGNYYFSAVLT
+GHRNEKIEAVLSKSNYGMARVDSGGYQPEGLENNPVAEAKVNPGSLAVFSIILPLQTQDT
+VCIDLVMGKLAHSVEPLTVFNGMLLYENK
+>XP_006779752.1 gi|583968586|ref|XP_006779752.1| PREDICTED: zinc finger protein 507-like isoform X1 [Neolamprologus brichardi]
+MEEITNVITHSSAASSSSSTSGSHTRQTKEKQPSQGFQQKTADDSLIQVIKKLSKIVEKR
+PQRRCASGGQKRALQVGERGAEQGGGSICKKIKRNLKDEVGVERSTDDSSLPSPWSGDDN
+NNVTTAVAEVAANPNSSDLKRTVTCYQCSLCPHLSQTLPLLKEHLKQHNEQHSDLILMCS
+ECHFTSRDHEQLEAHVRMHFDNGDNQKRKYPVSEAKEEVLKNQDVDLTGDNCSAGTEVKK
+SSVSNAKELPQKKKWYSYEEYGLYRCLICSYVCSQQRMLKTHAWKHAGLVDCSYPIFEDE
+DGGSAKREVQAAPNNASAREEIVVLQDKSLQKLPTGFKLQLCMPVAVEDKQEVVNLQGSH
+LSESPKTEEEDEYPIKDMTSEEPAVEVQVTTEAETEVELGGHHESTSATDSLLSSAQKII
+NRSPNSAGHINVIVERLPSAEDSVMASNPLLLSPDVDGDKSLLEKKAEEQEHVEGVKDEV
+VLCYSPGNANKSQHLGADIKPSIAKSNDLPRDENVPPAGRKRTHSESLRLHSLAAEVLVA
+MPMRTPELPNSGAKVALKTVAAQAQSPQAGQKPTEGAAAGQKASDVGTAAAMLNCNEGRE
+ETLGSLGLGKGDDDGPAANGGISLSLLTVIERLRERSDQNTSDEDILKELQDNAQFQSGA
+GVVAANGAGSYVCSSVPGMDGLVGSPDSGLVDYIPGSDRPYRCRLCRYSSGNKGYIKQHL
+RVHRQREPYQCPICEHIASDSKDLENHMIHHCKSRMYQCKQCPDAFHYKSQLRNHEREHH
+SFSGDVEMLTPVAETAAAMEETERVTYEEGSPQKMFKCDVCNYTSSTYVGVRNHRRIHNS
+DKPYRCCSCDFATTNMNSLKSHMRRHPQEHQAVQLLEQYRCSLCGYVCSHPPSLKSHMWK
+HAGDQNYNYEQVNKAINEAISQSSR
+>XP_006779753.1 gi|583968588|ref|XP_006779753.1| PREDICTED: zinc finger protein 507-like isoform X2 [Neolamprologus brichardi]
+MEEITNVITHSSAASSSSSTSGSHTRQTKEKQPSQGFQQKTADDSLIQVIKKLSKIVEKR
+PQRRCASGGQKRALQVGERGAEQGGGSICKKIKRNLKDEVGVERSTDDSSLPSPWSGDDN
+NNVTTAVAEVAANPNSSDLKRTVTCYQCSLCPHLSQTLPLLKEHLKQHNEQHSDLILMCS
+ECHFTSRDHEQLEAHVRMHFDNGDNQKRKYPVSEAKEEVLKNQDVDLTGDNCSAGTEVKK
+SSVSNAKELPQKKKWYSYEEYGLYRCLICSYVCSQQRMLKTHAWKHAGLVDCSYPIFEDE
+DGGSAKREVQAAPNNASAREEIVVLQDKSLQKLPTGFKLQLCMPVAVEDKQEVVNLQGSH
+LSESPKTEEEDEYPIKDMTSEEPAVEVQVTTEAETEVELGGHHESTSATDSLLSSAQKII
+NRSPNSAGHINVIVERLPSAEDSVMASNPLLLSPDVDGDKSLLEKKAEEQEHVEGVKDEV
+VLCYSPGNANKSQHLGADIKPSIAKSNDLPRDENVPPAGRKRTHSESLRLHSLAAEVLVA
+MPMRTPELPNSGAKVALKTVAAQAQSPQAGQKPTEGAAAGQKASDVGTAAAMLNCNEGRE
+ETLGSLGLGKGDDDGPAANGGISLSLLTVIERLRERSDQNTSDEDILKELQDNAQFQSGA
+GVVAANGAGSYVCSSVPGMDGLVGSPDSGLVDYIPGSDRPYRCRLCRYSSGNKGYIKQHL
+RVHRQREPYQCPICEHIASDSKDLENHMIHHCKSRMYQCKQCPDAFHYKSQLRNHEREHH
+SFSGDVEMLTPVAETAAAMEETERVTYEEGSPQKMFKCDVCNYTSSTYVGVRNHRRIHNS
+DKPYR
+>XP_006779754.1 gi|583968590|ref|XP_006779754.1| PREDICTED: probable C-mannosyltransferase DPY19L3-like isoform X1 [Neolamprologus brichardi]
+MTTLRQRKGSKGKEPSPAAELQSQQHNCCSEHHPEKILHGDWSWGAIIWTSVGWSVSVGL
+GLLCCIYVATLHENDLWFSNIKEVEREISFRTECGLYYSYYKQMLHAPSIQEGLKEMIHD
+NLTESKRTINLLQRMNIYQEVFLSVLYRLLPIQSYLEPVYFYIYTVFSLQAVYVIALYLT
+AWLLSGSWLAGALTGVWYILNRVDTTRVEFTISLRENWSLPFFALQVTAITCYLRPQLTT
+LQQKVMVWLMYVTTFCFCLTWQFNQFILLVQALVIYTLDCGDFLTTTQVTTLYLVQVSSL
+LSVWFLQFCNSMILGSLVLSFIVAALFIRHCQPGVKTGSLVVRLGKVLLHSALVLLLTVT
+INYLAKKALQLQSDEHIFKFIKSKFALGSTRDFDASLYLCEEAFGLLPLDTLERLAGTLL
+LYPYVLTLLLLCGMLVAAALQNLSRPNRGSTEEKKGAREGQVAAFRPDVAYNVLHTLFYG
+LLAFSTMRMKYIWTGHMCAVAAYGVCGTELWTVLLSALRCNTKLLLRLVRYVAPVVMIGF
+LYYKFWPKLMEELSELREFYDPDTVELMTWISTKTPKQAVFAGSMQLLAGIKLCTGRVLT
+NHPHYEDKDLRERTRQVYQVYARRSPEEVYDILKAIGADYVVLENSICYERRHRRGCRLR
+DLLDLANGHIMDGPGENDPDLVPATHPRFCDAIKTDAAYNALFTRTFQNKTFHVYRLKKK
+RKKNTKGSSEPSVTQ
+>XP_006779755.1 gi|583968592|ref|XP_006779755.1| PREDICTED: probable C-mannosyltransferase DPY19L3-like isoform X2 [Neolamprologus brichardi]
+MTTLRQRKGSKGKEPSPAAELQSQQHNCCSEHHPEKILHGDWSWGAIIWTSVGWSVSVGL
+GLLCCIYVATLHENDLWFSNIKEVEREISFRTECGLYYSYYKQMLHAPSIQEGLKEMIHD
+NLTESKRTINLLQRMNIYQEVFLSVLYRLLPIQSYLEPVYFYIYTVFSLQAVYVIALYLT
+AWLLSGSWLAGALTGVWYILNRVDTTRVEFTISLRENWSLPFFALQVTAITCYLRPQLTT
+LQQKVMVWLMYVTTFCFCLTWQFNQFILLVQALVIYTLDCGDFLTTTQVTTLYLVQVSSL
+LSVWFLQFCNSMILGSLVLSFIVAALFIRHCQPGVKTGSLVVRLGKVLLHSALVLLLTVT
+INYLAKKALQLQSDEHIFKFIKSKFALGSTRDFDASLYLCEEAFGLLPLDTLERLAGTLL
+LYPYVLTLLLLCGMLVAAALQNLRPNRGSTEEKKGAREGQVAAFRPDVAYNVLHTLFYGL
+LAFSTMRMKYIWTGHMCAVAAYGVCGTELWTVLLSALRCNTKLLLRLVRYVAPVVMIGFL
+YYKFWPKLMEELSELREFYDPDTVELMTWISTKTPKQAVFAGSMQLLAGIKLCTGRVLTN
+HPHYEDKDLRERTRQVYQVYARRSPEEVYDILKAIGADYVVLENSICYERRHRRGCRLRD
+LLDLANGHIMDGPGENDPDLVPATHPRFCDAIKTDAAYNALFTRTFQNKTFHVYRLKKKR
+KKNTKGSSEPSVTQ
+>XP_006779756.1 gi|583968594|ref|XP_006779756.1| PREDICTED: probable C-mannosyltransferase DPY19L3-like isoform X3 [Neolamprologus brichardi]
+MCRGLKEMIHDNLTESKRTINLLQRMNIYQEVFLSVLYRLLPIQSYLEPVYFYIYTVFSL
+QAVYVIALYLTAWLLSGSWLAGALTGVWYILNRVDTTRVEFTISLRENWSLPFFALQVTA
+ITCYLRPQLTTLQQKVMVWLMYVTTFCFCLTWQFNQFILLVQALVIYTLDCGDFLTTTQV
+TTLYLVQVSSLLSVWFLQFCNSMILGSLVLSFIVAALFIRHCQPGVKTGSLVVRLGKVLL
+HSALVLLLTVTINYLAKKALQLQSDEHIFKFIKSKFALGSTRDFDASLYLCEEAFGLLPL
+DTLERLAGTLLLYPYVLTLLLLCGMLVAAALQNLSRPNRGSTEEKKGAREGQVAAFRPDV
+AYNVLHTLFYGLLAFSTMRMKYIWTGHMCAVAAYGVCGTELWTVLLSALRCNTKLLLRLV
+RYVAPVVMIGFLYYKFWPKLMEELSELREFYDPDTVELMTWISTKTPKQAVFAGSMQLLA
+GIKLCTGRVLTNHPHYEDKDLRERTRQVYQVYARRSPEEVYDILKAIGADYVVLENSICY
+ERRHRRGCRLRDLLDLANGHIMDGPGENDPDLVPATHPRFCDAIKTDAAYNALFTRTFQN
+KTFHVYRLKKKRKKNTKGSSEPSVTQ
+>XP_006779757.1 gi|583968598|ref|XP_006779757.1| PREDICTED: MTSS1-like protein-like isoform X1 [Neolamprologus brichardi]
+MLGEITHLQAIIDDLTVLTTDPHKLPPASEQVIKDLKGSDYSWSYQTPPSSPSSSGSRKS
+SMCSSVNSTHSSASRSSGGGGSGGVGGGGSLPHSPTSSSSSSCRYRSSLPHQPPPPGGIA
+AHRLSSVSSHDSGFVSQDANIYSKPPSPMPSDITSQKSSSSASSEASETCQSVSECSSPT
+TFGSSFATFRPALFHSGSTRPLSVILPVPASPPYIRPPGSSSSSPTSKVPMWKDWSKAGQ
+YEQPVAAAAVQRRREPLDRLRESEASPGSQGYAGPSHPDDGQRARMTPATIAAKHGEEVS
+PAASDLAMVLTRGLSMEQQKSNRDSLQYSSGYSTETTTPSCSEDTIPSQGSDYDCYSVNG
+DAEGPDGQTEFDKSSTIPRHSNIAQNYRRMIQTKRPASTAGLPTGVLGPGAHGIPGQPGG
+AGGGGTGTPGTATIRRTPSTKPGVRRTLSSAGPIPIRPPIVPVKTPTVPGDSHSPGAGGG
+HAGGVPVRVGSEECVFFTGAEDSQGALDYVKASPKRLSLPNTAWGSGAALEVYAQQHGGL
+AIGTGSGTGSEEDQMIAANRHSLVEKIGELVASAHALGEGQFPFPALPDDPAPPPTGPTD
+TETGTEGAEGSGDMLTTIRRGVRLRKTVSNDRSAPRIL
+>XP_006779758.1 gi|583968600|ref|XP_006779758.1| PREDICTED: MTSS1-like protein-like isoform X2 [Neolamprologus brichardi]
+MLGEITHLQAIIDDLTVLTTDPHKLPPASEQVIKDLKGSDYSWSYQTPPSSPSSSGSRKS
+SMCSSLPHQPPPPGGIAAHRLSSVSSHDSGFVSQDANIYSKPPSPMPSDITSQKSSSSAS
+SEASETCQSVSECSSPTTFGSSFATFRPALFHSGSTRPLSVILPVPASPPYIRPPGSSSS
+SPTSKVPMWKDWSKAGQYEQPVAAAAVQRRREPLDRLRESEASPGSQGYAGPSHPDDGQR
+ARMTPATIAAKHGEEVSPAASDLAMVLTRGLSMEQQKSNRDSLQYSSGYSTETTTPSCSE
+DTIPSQGSDYDCYSVNGDAEGPDGQTEFDKSSTIPRHSNIAQNYRRMIQTKRPASTAGLP
+TGVLGPGAHGIPGQPGGAGGGGTGTPGTATIRRTPSTKPGVRRTLSSAGPIPIRPPIVPV
+KTPTVPGDSHSPGAGGGHAGGVPVRVGSEECVFFTGAEDSQGALDYVKASPKRLSLPNTA
+WGSGAALEVYAQQHGGLAIGTGSGTGSEEDQMIAANRHSLVEKIGELVASAHALGEGQFP
+FPALPDDPAPPPTGPTDTETGTEGAEGSGDMLTTIRRGVRLRKTVSNDRSAPRIL
+>XP_006779759.1 gi|583968603|ref|XP_006779759.1| PREDICTED: G-protein coupled receptor 64-like [Neolamprologus brichardi]
+MCFSPQIPDPSITKKDQEILTRITVIGCSISLFTLVIAILLFITNRKLRQDVSMKVHINL
+VIALMLLNLHFLPSQAVAAGSPSGLCLYMALLLHYSLLATFSWMALEGFHLYLLLVKVFN
+IYVKKYLLKLSVVGWGVPAMIVSVVVIIDRTFYGLAPLDTSHSSTAM
+>XP_006779760.1 gi|583968609|ref|XP_006779760.1| PREDICTED: probable RNA polymerase II nuclear localization protein SLC7A6OS-like [Neolamprologus brichardi]
+MDPNTTILRVKRKRGTDPADALLLACKRIRPETSQSSGETVPEPNEAEVENSVFKLVATV
+ATQEAPVQTQVRQALARPRTAHALRPSAASSQRILGDLRSTKWSTRREERYRILSSHRAG
+LSAPAEQQTPQMGASECVEETGKETDKCWGLGEIQVVDLIHEDGEDQDKPSGKILSSEPD
+EILCNNTKMLRERLSISGDRLGEEHREQDDGYVYDLYYQETVTPGWIQDILSVRAYADEG
+ELVPDLVVHEEEVYEDEDDENEEGNWRNDYPDEESDTDSDREERYGGYWEEEHSYSRRSW
+QRYQREVTHELGCRGDDDNGDDDDDDGDKYDSD
+>XP_006779761.1 gi|583968612|ref|XP_006779761.1| PREDICTED: Y+L amino acid transporter 2-like [Neolamprologus brichardi]
+MANREESKKMNGNSGDSSTLLETPKESMQLKKEISLLNGVSLIVGNMIGSGIFVSPKGVL
+IYSASYGLSLVIWAIGGLFSVIGALCYAELGTTITKSGASYAYILESFGGFIAFIRLWTS
+LLIIEPTSQAVIAITFANYLVQPLFPTCEPPYAASRLIAAACVCLLTFINSAYVKWGTRV
+QDIFTYAKVAALIVIIVTGIVKLCQGYTGNFESSFQGSSTDPGDIALALYSALFSYSGWD
+TLNFVTEEIKSPERNLPMAIAISMPIVTIIYILTNVAYYAVLDASAILASDAVAVTFADH
+TLGVMSWTIPIAVALSCYGGLNASIIAASRLFFVGSREGHLPDALSMIHIQRFTPIPALI
+FNCVMSLIYLTVEDVFQLINYYSFSYWFFMGLSIAGQIYLRLKEPDRPRPLKLSLLYPVV
+FCLCTIFLVAVPLYSDTVNSLIGIAIALSGVPVYFLGVYLPESKRPPVITKLLRSLTDFT
+QYTCFCVLTEMDKSQ
+>XP_006779762.1 gi|583968614|ref|XP_006779762.1| PREDICTED: G-protein coupled receptor 64-like [Neolamprologus brichardi]
+MGIEVLHTFWLVYMVFTPRLKPYIWNLVGFALPAVPVVILAPIGDIYGPIEVPPSEDPEN
+PYKMCWMDITENKGWLAFCFTNVMILALLVSSGLVMLFLVYRQIRTRDEWKQNRVAFLSI
+WGLSCLYGTTWGLAFLEFEPISTFILFITCILNSFQGFFLMLRFCMLDWMQKQAGGSGLG
+SSSTGSTRQHMLQAQERS
+>XP_006779763.1 gi|583968616|ref|XP_006779763.1| PREDICTED: synapse-associated protein 1-like [Neolamprologus brichardi]
+MLKGLGTWLGLEGPTVTETSVDKEKLNVEQEEKVVEAQTEVNKQQPADQDGTPEAEQENS
+DQSTGLGGYIFSFASSATKKISDSMVETAQTIKKTVEEGKIDGIIDKTFLGDFQKEQEKF
+VQEKKAKKSEAAVPPWVGYNEEETIQQQILALSADKRNFLRDPPAGVQFHFDMEQMYPLA
+AVMLEEDELLNRMRFDLVPKHVKEEMFWRNYFYRVSLIKQSAQLTALAAQQQRNDSVDKG
+ASVSPEDIVLTDNVRPKTPPVSISDIQKPTHEEDEEISTSPGVSEFVSDAFDSTAINQED
+LRKEMEQLVLDKKDSPSPDDESADWEKELQQELQEYEVVTESGNKDDQWDQEIEKMLQSD
+DS
+>XP_006779764.1 gi|583968618|ref|XP_006779764.1| PREDICTED: LOW QUALITY PROTEIN: probable phosphatase phospho2-like [Neolamprologus brichardi]
+MKILMVFDFDHTVVDANSDTWVVRCLPDKTLPGSVENSYRKGYWTEYMGRVLNYIGEQKV
+SPDRVRSVMETIPFTAGMTELLTFIAENKNAIDCIVISDSNTLFIEWILHAAGLQAAVDK
+VFTNPAKLNELGHVEVQCYHSHACDQCPVNLCKKKVLELYLSEQSDAGVEYEQIFYAGDG
+GNDLCPTSCLRGRDVVMPRKGYTLEKLLAKLEGQEGNFSVRAKNIAWSSGTDILRELKAS
+MQSXPWHMKYYKF
+>XP_006779765.1 gi|583968620|ref|XP_006779765.1| PREDICTED: cadherin-8-like isoform X1 [Neolamprologus brichardi]
+MPKRSEEMLTDLWLSLLLVWITCVLSVSMTPIIGQSKSTQTGGSAVVASGVGEGQRLLSR
+AKRGWVWNQMFVLEEFSGPDPILVGRLHTDKVENDTARYSLAGEGAGTIFAINEKTGDIH
+AMKRLDREEKAEYTLTAKVTNGITGQLLEPMTEFIIKVQDINDNAPKFTEGPYHAAVEEM
+SAVGTSVITITATDADDPVYGNSAKLVYSILEGQPYFSVDPNSATIRIALHGMDREMRED
+YQVVIQAKDMGGHMGGLSGTTTVSITLQDINDNPPKFSKSLYEFVIPEDLPLGKEGGKVK
+ANDRDIGENAKSTYSIIEGDDQGVFEIITNATTQEGILQLRKPLDYESKRNYTLKVEATN
+IRSEPRSNGPFKDTATVKIVVEDSDEPPVFSKPMYLLEVDENAPINKIIGTVTARDPDAT
+GSPIRYFIDRHTDLERQFNINVDNGRITLAKPLDRETDMWHNITVTATEVRNHSQISRAV
+VAIRVMDINDNAPEFATEYETFLCENGKPGQVIQTVSAVDKDDPIQGHYFDYRLVPEMLN
+NPNFTIKNNQDNSISVLAKHDTFRRQKQEMYFLPIIVTDNGNPPMSSTNTLTIRVCGCSK
+DGIVQSCNVEAYVLPIGLSMGALIAILACIILLLVIVVLFVTLRRHKNEPLIIKDDEDVR
+ENIIRYDDEGGGEEDTEAFDIATLQNPDGINGYLPRKDIKPDLQFMPRAGQHSGPNGVDV
+DEFINVRLHEADNDPTAPPYDSIQIYGYEGRGSIAGSLSSLETASSDSDQNYDYLREWGP
+RFRRLGELYSVGESDRET
+>XP_006779766.1 gi|583968622|ref|XP_006779766.1| PREDICTED: cadherin-8-like isoform X2 [Neolamprologus brichardi]
+MPKRSEEMLTDLWLSLLLVWITCVLSVSMTPIIGQSKSTQTGGSAVVASGVGEGQRLLSR
+AKRGWVWNQMFVLEEFSGPDPILVGRLHTDKVENDTARYSLAGEGAGTIFAINEKTGDIH
+AMKRLDREEKAEYTLTAKVTNGITGQLLEPMTEFIIKVQDINDNAPKFTEGPYHAAVEEM
+SAVGTSVITITATDADDPVYGNSAKLVYSILEGQPYFSVDPNSATIRIALHGMDREMRED
+YQVVIQAKDMGGHMGGLSGTTTVSITLQDINDNPPKFSKSLYEFVIPEDLPLGKEGGKVK
+ANDRDIGENAKSTYSIIEGDDQGVFEIITNATTQEGILQLRKPLDYESKRNYTLKVEATN
+IRSEPRSNGPFKDTATVKIVVEDSDEPPVFSKPMYLLEVDENAPINKIIGTVTARDPDAT
+GSPIRYFIDRHTDLERQFNINVDNGRITLAKPLDRETDMWHNITVTATEVRNHSQISRAV
+VAIRVMDINDNAPEFATEYETFLCENGKPGQVIQTVSAVDKDDPIQGHYFDYRLVPEMLN
+NPNFTIKNNQDNSISVLAKHDTFRRQKQEMYFLPIIVTDNGNPPMSSTNTLTIRVCGCSK
+DGIVQSCNVEAYVLPIGLSMGALIAILACIILLLVVLFVTLRRHKNEPLIIKDDEDVREN
+IIRYDDEGGGEEDTEAFDIATLQNPDGINGYLPRKDIKPDLQFMPRAGQHSGPNGVDVDE
+FINVRLHEADNDPTAPPYDSIQIYGYEGRGSIAGSLSSLETASSDSDQNYDYLREWGPRF
+RRLGELYSVGESDRET
+>XP_006779767.1 gi|583968626|ref|XP_006779767.1| PREDICTED: T-cell immunomodulatory protein-like [Neolamprologus brichardi]
+MIWTLKLITLAFLLLLGGQYNTFALQDVTADLFGPGNFGTVAAFGDFNSDKQTDIFTIKE
+QSDLVIFLADSKPPYFKPKVQAKNILGKDITSVVPGDYDGDSQMDVLLTAKNGPKTEVFI
+FWGHNQTLDIGGGIKLNYTFSDQPLVMDFNGDMIPDVFGVISSSSSVVCYLTKRTEVCSK
+ALSLTGNMRTPHSNAFIDLDRDFTADLFLTMNNDRMFETWLNKDGNFTKTDVMSKPDETT
+LIGQSSFVDFDGDGYQDHLLPACLDTSCQRSTIYLAKSGSRDSKWIPVLSDFKRKETIWG
+FVPDNLSQPPALHLGDYNLDGFPDALVVLQNKSGSGQQAFLLENVPCNSETCHSVGRMFH
+IHWDQSDLGAIKNAVRATFFDIYEDGILDMLVQSKAEGKQDLRIHALKNNFEADAYFVKV
+MVLSGLCSNDCPEGVKPFGVNQPGPYVMYTTVDSNGYLKNASAGQLSQSAYFSLQLPYTV
+LGLGRSANFLDHLFVGIPRQPGETEIRNKEWTAIIPNSQLIVMPFPHDTPRSWSAKLYLT
+PSNSVLLTAIALIGVCVFILVIIGILHWQEKKADDREKRQEAHRFHFDAM
+>XP_006779768.1 gi|583968628|ref|XP_006779768.1| PREDICTED: neuropilin and tolloid-like protein 2-like [Neolamprologus brichardi]
+MHRAWVLFFLIEEGFALAQRTKESPSDYGGQRPNQNDCGTWIRNINGGSFTSPNYPNPYP
+PNKECVYILEALPRQRIQLSFDKNYYIEPSFECRFDHIEIRDGPFGFSPLIDRFCGGKNP
+EIVTSTGRFMWVKFTSDEELEGLGFRIEYTFIADPDFHLHVGGLLNPIPECQFNVGGWDG
+IIRSSQVEEEKRVKPGDALDCIWTIKAPSQSKIYLRFIDYQMEHSNECKKNFVAVYDGSS
+AIENLKAKFCSTVANDVMLNNDMGVVRMWADEKSRLSRFRMLFTSFIDPPCNDNTFFCHS
+NMCINNSLVCNGVQNCVYPWDENHCKEKRSKGLFHQITKTHGTVIGVSSGIVLVLLIISI
+LVQMKQPRKKVVARRPGVFNKAGFQEVFDPPHYELFSLRDKEMSSDLADLSEELDSFHKM
+RRSSTMSRCVHEHHCGSQGSVATGGGSMKHSRTTLSSMELSYHNDFSKPPPMKTFNSTAS
+YKKSCYGYKQHSQTHDCDQQVIEDRVTEETTCEIYGRGATGVGGGAAGGGAMGGGGASGI
+AGGAIGGAVGITGGVAMGGGMGGGMSMAGAMSMAGPSGIAGGIGGMGGACGTLSVRGNSA
+RNSTTIVDPQQRSMSMDF
+>XP_006779769.1 gi|583968630|ref|XP_006779769.1| PREDICTED: dnaJ homolog subfamily A member 2-like [Neolamprologus brichardi]
+MSNVVDTKLYDILGVSPSATENELKKAYRKLAKEYHPDKNPNSGDKFKEISFAYEVLTNP
+EKKELYDRYGEQGLREGGGGGPGMDDIFSHIFGGGLFGFMGGQSSRSRNGGRRRGEDMVH
+PLKVSLEDLYNGKTTKLQLSKNVLCSTCNGQGGKTGAVQKCTACRGRGMRIMIRQLAPGM
+VQQMQSVCTDCNGEGEVISEKDRCKKCEGKKVVKEVKILEVHVDKGMKHGQKITFGGEAD
+QAPGVEPGDIVLVLQEKEHETYRRDGNDLFMNHKIGLVEALCGFQFMLKHLDGRQIVVKY
+PAGKVIEPGSVRMVRGEGMPQYRNPFEKGDLYIKFDVQFPDNNWISPEKLGELEDMLPSR
+SEPPIISGDTEEVDLQDYDVSQSSSSGNRREAYNDSSDEEGSHHGSGVQCAHQ
+>XP_006779770.1 gi|583968632|ref|XP_006779770.1| PREDICTED: low-density lipoprotein receptor-related protein 3-like [Neolamprologus brichardi]
+MGLTELPLLLPLLGLLWLRCALLCAGCSEQVEIHTERRGVIYSPSWPLNYPAGVNCSWHI
+QGGQGEVITISFRNFDLAESGKCTGDWLLLTPTWKRESRLCGSVLPQPFISTRGRVWLFF
+HSQANSSGQAQGFRLSYIRGHLGQSSCQSDEFLCGNGKCLPRSWKCNGQDECGDASDERS
+CLPTPTEAQPGLCPFGSLPCTEGQSTRCLPTALRCNGARDCHDGSDELGCPDTTCGKRLG
+NFYGSFASPDFFRANRSGDTELRCSWLLDTQDPKPIVLQLDLQLGPGDLLHVYDGLLQRA
+EHLLQVFSYHNNRRPALLESSRGQMSVLYMAQPHSPGHGFNATYQVKGYCFPGERPCGSD
+QGCYSERQRCDGYWHCPSGRDEEGCPMCPDGEFPCEGGTGMCYPASERCNNQKRCPDGSD
+EKNCYDCQPGNFHCGTNLCIFETWRCDGQEDCLDGSDERDCLAAVPRKVITAALIGSLVC
+SLLLVIALGCALKLHSLRNREYRAFETQMTRMEADFVQREAPPSYGQLIAQGLIPPVEDF
+PVYNPTQASVLQNLRLAMRRQIRRHSTRRSTSSSSRRRLGHLWNRLFRSGGRGRGHAPLL
+DPPGPTQITLGLHSYRTVGEQGPQSRAVPAGGSDVVGVDLPESPASPLSFHSVDSPEEEE
+DLSPVSRDGSRAAESSPPTPCQSDSSVQSGLPLSPQEASVPLCPPRASRKLVLELAVNLK
+GVSLRRYSPLGPLSPISPPVFPSSSQTPSTQPQPQGSEVTSPTEPLFSSVKPEDSDSQFT
+VNVPSRDETKPEARSSLCRFGRSISEEGGDLGRETLC
+>XP_006779771.1 gi|583968634|ref|XP_006779771.1| PREDICTED: LOW QUALITY PROTEIN: rhophilin-2-like [Neolamprologus brichardi]
+MTDALLSNGINDGGGDKNYFKKGCNPFAQTGRSKLQNTRASLNQQIIKQMRMRAGAENLL
+KATSNSKVKEMVLLELSYVNSNLQLLMSELEGLNSSVEVYQNNQSSTQRILVPVFLNETT
+VEFSILKIXSDFILEHYSEDGKTFEDEIADFMDLRQACRTPSRSEAGVELLGKYYSHLPL
+IESRFFSPTRQTGIFFTWYTAFLGLKYQQNHICLIXFCFLFFFLLLFSVKSLMIXITSTN
+CSFLALIRFQLVPTALSCPGVLNNLKETFTHTPSYDMSPAMLSMLIRLMLAQAQECLFEK
+IALPGIRNQFYSLMKVAQEAAKVSEIYDQVHQCMIQTPVKDNVPFFWSTMSQIKTNHYRS
+MAHYFVASALLDHQLGPGDDEDKQEKTLSQVYDSLPEGCTALDILKKKDERQRIGKAHIR
+RAIFGHEEALRIYGLCKNTNNLEVLQEILKASHQRSVNKHSENENEEEFADYMEAPKIIS
+KTEHKAEMEFPAAAKVKVIDFFQRLGPQSVFSAKQRWTAPRTIRVRSDDRDLGFTLKGDS
+PVQVVSLDPLCAAAADGLKEGDYIITVGDTECKWMSVSDVMRLLKDVDEEGIDIQVVSMM
+DNSTAMPTKSATFCGNLPKTYSMICLAYNEDDKNSKVRKVAKKSSFLSWGLKNKMKSAST
+LSLPTADKAGALPWNKPCPTFPSSSSYNNDSGLY
+>XP_006779772.1 gi|583968636|ref|XP_006779772.1| PREDICTED: E3 ubiquitin-protein ligase RNF182-like [Neolamprologus brichardi]
+MKDSAAETSGVEEGESHTLGQEHDLKMSCPQTEFEEKESPPPEELECKICYQRYNVHHRK
+PKILDCLHRVCARCLIKILDIADSAGCISCPFCRHQTEITEQEISALPDDVNIVSHLVMR
+DKSWNSDQNREVVLTPKSFSSSSPSHDSSNCLVITIMEVQRDSQHSPSQNGSSDVYAEQS
+LDSVSIGSNGPADQDALSKFCNHVPRILVWLLGFLYFGSLPLGIYLLVIQRVTLGIVCVS
+LVPSSLTVCLVYGFCQCLCQGMCDCSSRG
+>XP_006779773.1 gi|583968638|ref|XP_006779773.1| PREDICTED: centrosomal protein of 89 kDa-like [Neolamprologus brichardi]
+MLRFSFRREKDKEFKHIAHGLIPAASIAPKPAVPRTPPPRSPNPSPERPRSALAAAILSS
+SLTGQTWAIPPARLMSLSESGQSESFTSEPNISTALYTRDRWSEDLVSRPRLSSPDQSEG
+ELEDKEQEVVDEEDGEEHVYHTLDRRQNSSLTESVYALPLKAKSVFKSTTPLPTQTSGRR
+ESSPDFTEETSGQSPEPKEKKMSVRKTLENWKDDVPTTPTISTAGHPRQASQAKSPKDLR
+ELPPEPSNTYSELRKKVVRDRREKNTRMVDKEKLQEERLQRLEREISDSKAFSNQRSSAG
+SQAELQNLRQHAQELVDENDALKLTVHRLNVELSHYQARFRPLSKEEHSKVSGLPNTGSP
+PPWLVDMKYSSPLLLAYEDRMNEKDAILQTTEENMEKLHVQLEEVIKENEKLHDEITKTG
+AVNQKDCYQIQQQAVLVLQENQVLINQLEAQHAEAKDTHSRHNTEVAKVSKKMMLLEVEN
+QRLEGDLEESRRELQKNKRDLQVLQARLKDAVTWDEHCSIAGKLRRQLEQHESRSKDGID
+KLLLRVSNLQEENRILALDKAQLTAKTRAMEAELELSRQASRKAERRMSMLKQQKAECVL
+KEEKTRHYLGAVISVAEHISQERDRLLHMASSLQQEKQRFISRILSGTVRFGKLQEEVKV
+YRSQASTRLAALEEAVEGRTVSYQTEILHLQTLLRERQEAEEKLLQSKREIEEELEVVWE
+AATRENQQMRETLLDSKLTGDLHSWPAHAPDEITTSSQQQQHKHGLDFYC
+>XP_006779774.1 gi|583968640|ref|XP_006779774.1| PREDICTED: myocyte-specific enhancer factor 2A-like [Neolamprologus brichardi]
+MGRKKIQITRIVDERNRQVTFMKRKFGLMKKAYELSVLCDCEIALIIFNGSNKLFQYAST
+DMDKVLLKYTEYNEPHESRTNSDIVEALNKKEHRGCDSPDADASYVLTPNTEEKYKKINE
+EFDNMMKTHKISTGQQQQQHQQHFMHVAPGSMAYSHSGGGGATSQALAAATAALADGGIL
+PSPHSHLHRNINSSQRPPSAGGGLQGSSELALQNGSGPTVNGFGKIIPSKSPPPPPPHGN
+SMVPTSRKTDLRVVIPHSKGMMQTLNNQRMSSSQSSQPLSTPVVSITTPSLPHQSLVYAG
+IGSAYNDYSLNSGELSGFNSAAGPSLSSMAAWEQQQLSSMG
+>XP_006779775.1 gi|583968642|ref|XP_006779775.1| PREDICTED: COUP transcription factor 2-like [Neolamprologus brichardi]
+MAMVAWRNTEAVGDSQGTLSSPVSQVAPLSLPGELTGHMNPAPSLEIPQTAAAPQGAPPP
+NPSGNTVATTTNNNNSTSSSSSSSSLSMDKQQSQQIECIVCGDKSSGKHYGQFTCEGCKS
+FFKRSVRRNLTYTCRANRNCPIDQHHRNQCQYCRLKKCLKVGMRREAVQRGRIPTQSYHG
+QFALTNGDPLQCHSYLSGYISLLLRAEPYPTSRFGSQCLQNNNILGIENICELAARMLFS
+AVEWARNIPFFPDLQVPDQVALLRLTWSELFVLNAAQCSMPVHAAPLLAAAGLHASPMSA
+DRVVAFMDHIRVFQEQVEKLKVLHVDSAEYSCIKAIVLFTTDACGLSDVAHVEGLQEKSQ
+CALEEYVRSQYPNQPNRFGKLLLRLPSLRSVSSSVIEQLFFVRLVGKTPIETLIRDMLLS
+GSSFNWPYMAIQ
+>XP_006779776.1 gi|583968644|ref|XP_006779776.1| PREDICTED: solute carrier organic anion transporter family member 3A1-like [Neolamprologus brichardi]
+MQVKNQICTERSSNDDPEQDDNQKKTSCFSNIKIFLVSECALMLAQGTVGAYLVSVLTTL
+ERRFNLQSADVGVIASSFEIGNLALILFVSYFGAKAHRPRLIGCGGIVMALGALLSALPE
+FLTHQYEYEAGDSWHAEDGRDVCSNISRSENRDSGFKCGNRANTNMMYLLLIGAQVLLGI
+GATPVQPLGVSYIDDHVHRKDSSLYIGILFSTLVFGPACGFILGSVCTKVYVDAVFIDTS
+TLDITPDDPRWIGAWWGGFLLCGALLFLSALFMFGFPQALDEQDMDSGAESEQAMLPSSL
+SLEFQGSKPNGAIHGFDINSGLSVCQHLRVIPRVTRHLLSNPVFSCITLAACMEIAVVAG
+FAAFLGKYLEQQFNLTTSSANQLLGMTAIPCACLGIFLGGLLVKKLNLSALGAVRMAMLV
+NLVSTACYVSFLFLGCDTGPVAGVTVAYGNETLQSWQQPESACISNCNCYTASVSPVCGS
+NGVTYLSACFAGCTKPNLTNCACISSNSEEAVALPGKCPSPGCQQAFLTFLCVICVCSMI
+GAMAQTPSVIILIRTVSPELKSYALGVLFLLLRLIGFIPPPLIFGMGIDSTCLFWSSVCG
+EKGACMLYDNVAYRHLYVSIAIVLKSSAFLLYTTTWQCLRKNYRKYIKNNEGYLTPTELF
+ASNVTLDNLGKDITQNPTNRTKFIYNLEDRETCDNMESVL
+>XP_006779777.1 gi|583968646|ref|XP_006779777.1| PREDICTED: gonadotropin-releasing hormone II receptor-like isoform X1 [Neolamprologus brichardi]
+MNGSSCCDPAAVMYQQRSGLDLNASCEWPDPHCNWTSVDGALQLPTFSTAAKIRVIVTFI
+LCGISTFCNLAVLWAANGHKRKSHVRVLIINLTAADLLVTFIVMPVDAVWNITVQWLAGD
+LACRFLMFLKLQAMYSCAFVTVVISLDRQSAILNPLGIAMVRKRNRVMLMVAWIMSALLS
+IPQMFIFHNVTITYPANFTQCTTRGSFVTHWQETAYNMFTFCCLFLLPLVIMIICYTRIF
+VQISKQMTKKNMPSNEPHLRCSKNNIPKARMRTLKMSIVIVICFIVCWTPYYLLGLWYWF
+FPDDLEGKVSHSLTHILFIFGLFNACLDPIIYGLFTIRFQKGLRNCYRKAAVMSSLETNA
+VIMESLKCTGSVLPSKRGMTSGEKDISSEQAEAKSTDNSV
+>XP_006779778.1 gi|583968648|ref|XP_006779778.1| PREDICTED: gonadotropin-releasing hormone II receptor-like isoform X2 [Neolamprologus brichardi]
+MNGSSCCDPAAVMYQQRSGLDLNASCEWPDPHCNWTSVDGALQLPTFSTAAKIRVIVTFI
+LCGISTFCNLAVLWAANGHKHAVWNITVQWLAGDLACRFLMFLKLQAMYSCAFVTVVISL
+DRQSAILNPLGIAMVRKRNRVMLMVAWIMSALLSIPQMFIFHNVTITYPANFTQCTTRGS
+FVTHWQETAYNMFTFCCLFLLPLVIMIICYTRIFVQISKQMTKKNMPSNEPHLRCSKNNI
+PKARMRTLKMSIVIVICFIVCWTPYYLLGLWYWFFPDDLEGKVSHSLTHILFIFGLFNAC
+LDPIIYGLFTIRFQKGLRNCYRKAAVMSSLETNAVIMESLKCTGSVLPSKRGMTSGEKDI
+SSEQAEAKSTDNSV
+>XP_006779779.1 gi|583968650|ref|XP_006779779.1| PREDICTED: lactoylglutathione lyase-like [Neolamprologus brichardi]
+MSDKGLSDEAVAAVCKDGDPITKDFMMQQTMLRVKDPNKSLDFYTRILGMTLLQKFDFPS
+MRFSLFFLGYEDKKEIPADVKEKTAWTFSRRATLELTHNWGSESDDSQSYHNGNSDPRGF
+GHIGIAVPDVYAACKLFEEQGVTFVKKPDDGKMKGLAFIQDPDGYWIEILSPNNMVSITS
+K
+>XP_006779780.1 gi|583968652|ref|XP_006779780.1| PREDICTED: bifunctional glutamate/proline--tRNA ligase-like isoform X1 [Neolamprologus brichardi]
+MALNLTINTSNPPLGALLTAEHVKSSVQVSVEEGKDTRLHISDSVQFSDDNSICRYLARV
+APALGLYGSNMMEQTEVDHWLEFSARSLCNQPDLTVALAELDKALSLRTFLVGHALTLAD
+LSVWAALKDHGEWPKQGKSFSHVSRWFFFLSSQVPFTAVGNKYASKKASMNKTKSEGKKA
+DVGKFVELPGAEMGKVVVRFPPEASGYLHIGHAKAALLNQHYQVTFKGKLIMRFDDTNPE
+KEKEDFEKVILEDVAMLQIHPDQFTYTSDHFPIIMKFAEKLLAEGKAYIDNTPPEQMKQE
+REQRVESTCRNNSVEQNMKMWSEMKAGTEYGQTCCMRAKIDMNSNNGCMRDPTLYRCKNA
+AHPRTGNTYNIYPTYDFACPIVDSLEGVTHALRTTEYHDRDEQFYWIINALGLRKPYVWE
+YARLNLNNTVLSKRKLTWFVDQGYVDGWDDPRFPTVRGVLRRGMTVEGLKQFIAAQGGSR
+SVVNMEWDKIWSFNKKLPVSCLKVIDPVAPRYTALSSSYVVPVSVPEATEEMKEIAKHPK
+NAEVGMKEVWFGPRVLIEGADAETFTEGETVTFINWGNLIITKINKGADGKVLSMKASLN
+LDNKDYKKTTKITWLAETNNSLPVPAICVNYQPLISKAVITKDDNFKDYINKHSKLEEKM
+LGDPCLKNLKKGDIIQLQRRGFYICDQPYEPLSPNSCKESPCVLIYIPDGHTKEMPTAGS
+KEKSKTQASDNTPASPAKAPKTSVPAPASAPAADLFSSIVAQGEAVRLLKAAKAPKDEVD
+KAVKQLLSLKEQFKQQTGVEYKPGMAPPASTPAPPTSSSDSTSCPYTRVVQQGELVRKLK
+AEQAPKDQIDAAVKQLLALKAEFKKLTGQDYKPGMATPAPSASSPVTATSSSSPPSSSSG
+LYEHVAQQGEVVRKLKSEKAPKDQVDAAVKQLLALKEEYKRITGQEYKPGATPPQKAPAP
+VQNGSTNDLYEKVAEQGELVRKLKAEKAPKDQVDAAVKQLLALKAEYKQNTGKDYKPGLQ
+APATSAQTQTQASSASTQSNSSPQAQELFSQVSQQGDLVRKLKSEKAPKDQVDEAVKTLL
+DLKSKYKTLTGQDYKPVAAAGGTGGEDKNRKEKENKSEKQGGGGGGKKGKGDKGGQSKES
+SGGAGGAGEGQGPKKQTRLGLEAKKEENLADWYSQVITKAEMIEYYDVSGCYVLRPWAFS
+IWESIKDFFDKEIKKLGVENCYFPMFVSQAALEKEKSHIADFAPEVAWVTRSGKTELAEP
+IAVRPTSETVMYPAYAKWVQSHRDLPIKLNQWCNVVGWEFKHPQPFLRTREFLWQEGHTA
+FATKEEAAEEVLQILDLYARVYEELMAIPVVKGRKTEKEKFAGGDYTTTVEAFISASGRA
+IQGATSHHLGQNFSKMFEIVFEDPKRPGEKQLAFQNSWGITTRTIGVLTMVHGDDMGLVL
+PPRVACLQVVIIPCGITATLPEQEKEVLLAQCTKYLKRLQEAGIRVKSDLRDNYSPGWKF
+NHWELKGVPIRLEVGPKDMQQKQCVAVRRDSGAKVTIAEAEVEKNLLNMLEDIQNSLFKK
+ASDDLKSHMVAADTMEQFQKELDQGKIVQIPFCGGIECEDWIKKTTAKDQDLEPGAPSMG
+AKSLCIPFTPLKTLQPGQKCVSGKEPAQYYTLFGRSY
+>XP_006779781.1 gi|583968654|ref|XP_006779781.1| PREDICTED: bifunctional glutamate/proline--tRNA ligase-like isoform X2 [Neolamprologus brichardi]
+MALNLTINTSNPPLGALLTAEHVKSSVQVSVEEGKDTRLHISDSVQFSDDNSICRYLARV
+APALGLYGSNMMEQTEVDHWLEFSARSLCNQPDLTVALAELDKALSLRTFLVGHALTLAD
+LSVWAALKDHGEWPKQGKSFSHVSRWFFFLSSQVPFTAVGNKYASKKASMNKTKSEGKKA
+DVGKFVELPGAEMGKVVVRFPPEASGYLHIGHAKAALLNQHYQVTFKGKLIMRFDDTNPE
+KEKEDFEKVILEDVAMLQIHPDQFTYTSDHFPIIMKFAEKLLAEGKAYIDNTPPEQMKQE
+REQRVESTCRNNSVEQNMKMWSEMKAGTEYGQTCCMRAKIDMNSNNGCMRDPTLYRCKNA
+AHPRTGNTYNIYPTYDFACPIVDSLEGVTHALRTTEYHDRDEQFYWIINALGLRKPYVWE
+YARLNLNNTVLSKRKLTWFVDQGYVDGWDDPRFPTVRGVLRRGMTVEGLKQFIAAQGGSR
+SVVNMEWDKIWSFNKKVIDPVAPRYTALSSSYVVPVSVPEATEEMKEIAKHPKNAEVGMK
+EVWFGPRVLIEGADAETFTEGETVTFINWGNLIITKINKGADGKVLSMKASLNLDNKDYK
+KTTKITWLAETNNSLPVPAICVNYQPLISKAVITKDDNFKDYINKHSKLEEKMLGDPCLK
+NLKKGDIIQLQRRGFYICDQPYEPLSPNSCKESPCVLIYIPDGHTKEMPTAGSKEKSKTQ
+ASDNTPASPAKAPKTSVPAPASAPAADLFSSIVAQGEAVRLLKAAKAPKDEVDKAVKQLL
+SLKEQFKQQTGVEYKPGMAPPASTPAPPTSSSDSTSCPYTRVVQQGELVRKLKAEQAPKD
+QIDAAVKQLLALKAEFKKLTGQDYKPGMATPAPSASSPVTATSSSSPPSSSSGLYEHVAQ
+QGEVVRKLKSEKAPKDQVDAAVKQLLALKEEYKRITGQEYKPGATPPQKAPAPVQNGSTN
+DLYEKVAEQGELVRKLKAEKAPKDQVDAAVKQLLALKAEYKQNTGKDYKPGLQAPATSAQ
+TQTQASSASTQSNSSPQAQELFSQVSQQGDLVRKLKSEKAPKDQVDEAVKTLLDLKSKYK
+TLTGQDYKPVAAAGGTGGEDKNRKEKENKSEKQGGGGGGKKGKGDKGGQSKESSGGAGGA
+GEGQGPKKQTRLGLEAKKEENLADWYSQVITKAEMIEYYDVSGCYVLRPWAFSIWESIKD
+FFDKEIKKLGVENCYFPMFVSQAALEKEKSHIADFAPEVAWVTRSGKTELAEPIAVRPTS
+ETVMYPAYAKWVQSHRDLPIKLNQWCNVVGWEFKHPQPFLRTREFLWQEGHTAFATKEEA
+AEEVLQILDLYARVYEELMAIPVVKGRKTEKEKFAGGDYTTTVEAFISASGRAIQGATSH
+HLGQNFSKMFEIVFEDPKRPGEKQLAFQNSWGITTRTIGVLTMVHGDDMGLVLPPRVACL
+QVVIIPCGITATLPEQEKEVLLAQCTKYLKRLQEAGIRVKSDLRDNYSPGWKFNHWELKG
+VPIRLEVGPKDMQQKQCVAVRRDSGAKVTIAEAEVEKNLLNMLEDIQNSLFKKASDDLKS
+HMVAADTMEQFQKELDQGKIVQIPFCGGIECEDWIKKTTAKDQDLEPGAPSMGAKSLCIP
+FTPLKTLQPGQKCVSGKEPAQYYTLFGRSY
+>XP_006779782.1 gi|583968656|ref|XP_006779782.1| PREDICTED: bifunctional glutamate/proline--tRNA ligase-like isoform X3 [Neolamprologus brichardi]
+MALNLTINTSNPPLGALLTAEHVKSSVQVSVEEGKDTRLHISDSVQFSDDNSICRYLARV
+APALGLYGSNMMEQTEVDHWLEFSARSLCNQPDLTVALAELDKALSLRTFLVGHALTLAD
+LSVWAALKDHGEWPKQGKSFSHVSRWFFFLSSQVPFTAVGNKYASKKASMNKTKSEGKKA
+DVGKFVELPGAEMGKVVVRFPPEASGYLHIGHAKAALLNQHYQVTFKGKLIMRFDDTNPE
+KEKEDFEKVILEDVAMLQIHPDQFTYTSDHFPIIMKFAEKLLAEGKAYIDNTPPEQMKQE
+REQRVESTCRNNSVEQNMKMWSEMKAGTEYGQTCCMRAKIDMNSNNGCMRDPTLYRCKNA
+AHPRTGNTYNIYPTYDFACPIVDSLEGVTHALRTTEYHDRDEQFYWIINALGLRKPYVWE
+YARLNLNNTVLSKRKLTWFVDQGYVDGWDDPRFPTVRGVLRRGMTVEGLKQFIAAQGGSR
+SVVNMEWDKIWSFNKKLPVSCLKVIDPVAPRYTALSSSYVVPVSVPEATEEMKEIAKHPK
+NAEVGMKEVWFGPRVLIEGADAETFTEGETVTFINWGNLIITKINKGADGKVLSMKASLN
+LDNKDYKKTTKITWLAETNNSLPVPAICVNYQPLISKAVITKDDNFKDYINKHSKLEEKM
+LGDPCLKNLKKGDIIQLQRRGFYICDQPYEPLSPNSCKESPCVLIYIPDGHTKEMPTAGS
+KEKSKTQASDNTPASPAKAPKTSVPAPASAPAADLFSSIVAQGEAVRLLKAAKAPKDEVD
+KAVKQLLSLKEQFKQQTGVEYKPGMAPPASTPAPPTSSSDSTSCPYTRVVQQGELVRKLK
+AEQAPKDQVDAAVKQLLALKEEYKRITGQEYKPGATPPQKAPAPVQNGSTNDLYEKVAEQ
+GELVRKLKAEKAPKDQVDAAVKQLLALKAEYKQNTGKDYKPGLQAPATSAQTQTQASSAS
+TQSNSSPQAQELFSQVSQQGDLVRKLKSEKAPKDQVDEAVKTLLDLKSKYKTLTGQDYKP
+VAAAGGTGGEDKNRKEKENKSEKQGGGGGGKKGKGDKGGQSKESSGGAGGAGEGQGPKKQ
+TRLGLEAKKEENLADWYSQVITKAEMIEYYDVSGCYVLRPWAFSIWESIKDFFDKEIKKL
+GVENCYFPMFVSQAALEKEKSHIADFAPEVAWVTRSGKTELAEPIAVRPTSETVMYPAYA
+KWVQSHRDLPIKLNQWCNVVGWEFKHPQPFLRTREFLWQEGHTAFATKEEAAEEVLQILD
+LYARVYEELMAIPVVKGRKTEKEKFAGGDYTTTVEAFISASGRAIQGATSHHLGQNFSKM
+FEIVFEDPKRPGEKQLAFQNSWGITTRTIGVLTMVHGDDMGLVLPPRVACLQVVIIPCGI
+TATLPEQEKEVLLAQCTKYLKRLQEAGIRVKSDLRDNYSPGWKFNHWELKGVPIRLEVGP
+KDMQQKQCVAVRRDSGAKVTIAEAEVEKNLLNMLEDIQNSLFKKASDDLKSHMVAADTME
+QFQKELDQGKIVQIPFCGGIECEDWIKKTTAKDQDLEPGAPSMGAKSLCIPFTPLKTLQP
+GQKCVSGKEPAQYYTLFGRSY
+>XP_006779783.1 gi|583968658|ref|XP_006779783.1| PREDICTED: bifunctional glutamate/proline--tRNA ligase-like isoform X4 [Neolamprologus brichardi]
+MALNLTINTSNPPLGALLTAEHVKSSVQVSVEEGKDTRLHISDSVQFSDDNSICRYLARV
+APALGLYGSNMMEQTEVDHWLEFSARSLCNQPDLTVALAELDKALSLRTFLVGHALTLAD
+LSVWAALKDHGEWPKQGKSFSHVSRWFFFLSSQVPFTAVGNKYASKKASMNKTKSEGKKA
+DVGKFVELPGAEMGKVVVRFPPEASGYLHIGHAKAALLNQHYQVTFKGKLIMRFDDTNPE
+KEKEDFEKVILEDVAMLQIHPDQFTYTSDHFPIIMKFAEKLLAEGKAYIDNTPPEQMKQE
+REQRVESTCRNNSVEQNMKMWSEMKAGTEYGQTCCMRAKIDMNSNNGCMRDPTLYRCKNA
+AHPRTGNTYNIYPTYDFACPIVDSLEGVTHALRTTEYHDRDEQFYWIINALGLRKPYVWE
+YARLNLNNTVLSKRKLTWFVDQGYVDGWDDPRFPTVRGVLRRGMTVEGLKQFIAAQGGSR
+SVVNMEWDKIWSFNKKVIDPVAPRYTALSSSYVVPVSVPEATEEMKEIAKHPKNAEVGMK
+EVWFGPRVLIEGADAETFTEGETVTFINWGNLIITKINKGADGKVLSMKASLNLDNKDYK
+KTTKITWLAETNNSLPVPAICVNYQPLISKAVITKDDNFKDYINKHSKLEEKMLGDPCLK
+NLKKGDIIQLQRRGFYICDQPYEPLSPNSCKESPCVLIYIPDGHTKEMPTAGSKEKSKTQ
+ASDNTPASPAKAPKTSVPAPASAPAADLFSSIVAQGEAVRLLKAAKAPKDEVDKAVKQLL
+SLKEQFKQQTGVEYKPGMAPPASTPAPPTSSSDSTSCPYTRVVQQGELVRKLKAEQAPKD
+QVDAAVKQLLALKEEYKRITGQEYKPGATPPQKAPAPVQNGSTNDLYEKVAEQGELVRKL
+KAEKAPKDQVDAAVKQLLALKAEYKQNTGKDYKPGLQAPATSAQTQTQASSASTQSNSSP
+QAQELFSQVSQQGDLVRKLKSEKAPKDQVDEAVKTLLDLKSKYKTLTGQDYKPVAAAGGT
+GGEDKNRKEKENKSEKQGGGGGGKKGKGDKGGQSKESSGGAGGAGEGQGPKKQTRLGLEA
+KKEENLADWYSQVITKAEMIEYYDVSGCYVLRPWAFSIWESIKDFFDKEIKKLGVENCYF
+PMFVSQAALEKEKSHIADFAPEVAWVTRSGKTELAEPIAVRPTSETVMYPAYAKWVQSHR
+DLPIKLNQWCNVVGWEFKHPQPFLRTREFLWQEGHTAFATKEEAAEEVLQILDLYARVYE
+ELMAIPVVKGRKTEKEKFAGGDYTTTVEAFISASGRAIQGATSHHLGQNFSKMFEIVFED
+PKRPGEKQLAFQNSWGITTRTIGVLTMVHGDDMGLVLPPRVACLQVVIIPCGITATLPEQ
+EKEVLLAQCTKYLKRLQEAGIRVKSDLRDNYSPGWKFNHWELKGVPIRLEVGPKDMQQKQ
+CVAVRRDSGAKVTIAEAEVEKNLLNMLEDIQNSLFKKASDDLKSHMVAADTMEQFQKELD
+QGKIVQIPFCGGIECEDWIKKTTAKDQDLEPGAPSMGAKSLCIPFTPLKTLQPGQKCVSG
+KEPAQYYTLFGRSY
+>XP_006779784.1 gi|583968660|ref|XP_006779784.1| PREDICTED: kinesin-like protein KIF13B-like isoform X1 [Neolamprologus brichardi]
+MGEPSLDDSNVKVAVRVRPMNRREKELNTKCVVEMVKNQTILHPAGGNLGKGDSRSQSKV
+FAYDYCFWSMDETDKEKFAGQEVVFQCLGESLLHNAFQGYNACIFAYGQTGSGKSYTMMG
+SVDQPGLIPRLCSALFERTQKEQREEESFTVEVSYMEIYNEKVRDLLDPKGGRQTLRVRE
+HKVLGPYVDGLSRLAVASYKDIESLMSEGNKSRTVAATNMNEESSRSHAVFNIILTHTLK
+DLKSGTSGEKVSRLSLVDLAGSERAAKTGAAGERLKEGSNINKSLTTLGLVISALAEQGT
+AKNKTKFVPYRDSVLTWLLKDCLGGNSRTAMVATVSPAADNYEETLSTLRYADRAKSIVN
+HAVVNEDPNARIIRELREEVEKLRVQLTQAESLKAPELKDRLEESEKLIQEMTVTWEEKL
+RKTEEIAQERQKQLESLGISLQSSGIKVGDDKSFLVNLNADPALNELLVYYLKEHTKVGS
+ADSQDIQLCGMGIQAEHCVIDITAEAAVILAPYRNARTCVNGSPVTSALQLHHGDRILWG
+NNHFFRINLPKRRSRAADDEEGEGGVMKNSGSSEQLDADGDTASEVSSEVSFSYEFAQTE
+VMMKALGSNDPMQAVLQSLERQHEEEKRSALERQRQMYEQELQQLRKKLNPERLSTGQSG
+GPTIGQQGPGQQSHYRSMERLSIGGMSHSSSAQSRLRQWSEDREAVLVRSLRRLREQIVR
+ANLLVQEACFIADELERHTEYRVTLQIPSDNLNANRKRDAVLSEPAIQVRRRGRGKQIWS
+LEKMENRLVDMRELYQEWQDYHLNNPDDQVMRSYFRRADPFFDEQENHSLIGVANVFLSC
+LFYDVKLQYAVPIINQKGEVAGRLHVEVVRVGGGLEDNMAGGDEPDNNQDIEVQDRKLVC
+MIKILQATGLPQYLSNFVFCQYSFWDQPEPIIVAPEVDTSSSSPSNKDPHCMVVFDSCKE
+LAVSVTEEFIEHLTEGAVAIEVYGHRQADAGRNPALWDLSIIQAKTRTLRDRWSEVTRKL
+ELWIQILEINENGDFVPVEVVPARDVRTGGIFQLRQGQSRRIQVDVRSVQDSGTMPLIAE
+IVLAVSVGCVEIRNTTANQEADEMDSYQERDLERLRRQWLGALTKRQEYLDQHLQSLVSK
+AEKTEDDMEREAQLLEWRLTLTEERNAVMVPSAGSGIPGAPAEWVPLPGMETHIPVLFLN
+LKPDDLSSQDQFEVPEAGGWDAILNGEDEDDFFDLQIVRHYDGEVKAEASWDSTVHECPQ
+LSRGGSYPEQRVYLTIRVVVQLSHPADMQLVLRKRICVNVNPGRQGFAHNFLRRMSTRST
+VPGCGVTFEVVSNIPGDAPGSEDREMLARLAASAHNSQSGDDEAAIEKYLRSVLSLENIL
+TLDRLRQEVAVKEQLTSRGKSNRRSISSPSVNRLSGSRQDLSTTCLLDDKGRWESQQDIY
+MPSQFPRTLPRPASSPSTYSTSPSSSPTPFGTPPPQNQEPEQGRSGLAASYLSVKALVPQ
+MPKLLKSLFPVRDEKKELRPSPQNQQQHVPRIVTSSGGDDNKGKTETTAILRPPAKDRRA
+ELPEVSPLPVHDPHDTTPLSPLSQSSSGYFSASVSTATLCDVLQPSSSSSSLLAAETTLP
+TNPQQQGADRNDIVTSPSQFGAKVSAVASPASHNSANHNSITSDVSSEQKLINSGGSEGF
+ERLEIFVEDDERGGEDVLPDWLTEGAYVTVGNNKAGTVRYIGVTQFAEGVWVGVELDTPV
+GKNDGSVGGQRYFHCKPGYGVLVRPNRLSSRERTNRQTGEFTPSAHVPILRGEAIVARRG
+ENRKSWSS
+>XP_006779785.1 gi|583968662|ref|XP_006779785.1| PREDICTED: kinesin-like protein KIF13B-like isoform X2 [Neolamprologus brichardi]
+MGEPSLDDSNVKVAVRVRPMNRREKELNTKCVVEMVKNQTILHPAGGNLGKGDSRSQSKV
+FAYDYCFWSMDETDKEKFAGQEVVFQCLGESLLHNAFQGYNACIFAYGQTGSGKSYTMMG
+SVDQPGLIPRLCSALFERTQKEQREEESFTVEVSYMEIYNEKVRDLLDPKGGRQTLRVRE
+HKVLGPYVDGLSRLAVASYKDIESLMSEGNKSRTVAATNMNEESSRSHAVFNIILTHTLK
+DLKSGTSGEKVSRLSLVDLAGSERAAKTGAAGERLKEGSNINKSLTTLGLVISALAEQGT
+AKNKTKFVPYRDSVLTWLLKDCLGGNSRTAMVATVSPAADNYEETLSTLRYADRAKSIVN
+HAVVNEDPNARIIRELREEVEKLRVQLTQAESLKAPELKDRLEESEKLIQEMTVTWEEKL
+RKTEEIAQERQKQLESLGISLQSSGIKVGDDKSFLVNLNADPALNELLVYYLKEHTKVGS
+ADSQDIQLCGMGIQAEHCVIDITAEAAVILAPYRNARTCVNGSPVTSALQLHHGDRILWG
+NNHFFRINLPKRRSRAADDEEGEGGVMKNSGSSEQLDADGDTASEVSSEVSFSYEFAQTE
+VMMKALGSNDPMQAVLQSLERQHEEEKRSALERQRQMYEQELQQLRKKLNPERLSTGQSG
+GPTIGQQGPGQQSHYRSMERLSIGGMSHSSSAQSRLRQWSEDREAVLVRSLRRLREQIVR
+ANLLVQEACFIADELERHTEYRVTLQIPSDNLNANRKRDAVLSEPAIQVRRRGRGKQIWS
+LEKMENRLVDMRELYQEWQDYHLNNPDDQVMRSYFRRADPFFDEQENHSLIGVANVFLSC
+LFYDVKLQYAVPIINQKGEVAGRLHVEVVRVGGGLEDNMAGGDEPDNNQDIEVQDRKLVC
+MIKILQATGLPQYLSNFVFCQYSFWDQPEPIIVAPEVDTSSSSPSNKDPHCMVVFDSCKE
+LAVSVTEEFIEHLTEGAVAIEVYGHRQADAGRNPALWDLSIIQAKTRTLRDRWSEVTRKL
+ELWIQILEINENGDFVPVEVVPARDVRTGGIFQLRQGQSRRIQVDVRSVQDSGTMPLIAE
+IVLAVSVGCVEIRNTTANQEADEMDSYQERDLERLRRQWLGALTKRQEYLDQHLQSLVSK
+AEKTEDDMEREAQLLEWRLTLTEERNAVMVPSAGSGIPGAPAEWVPLPGMETHIPVLFLN
+LKPDDLSSQDQFEVPEAGGWDAILNGEDEDDFFDLQIVRHYDGEVKAEASWDSTVHECPQ
+LSRGGSYPEQRVYLTIRVVVQLSHPADMQLVLRKRICVNVNPGRQGFAHNFLRRMSTRST
+VPGCGVTFEVVSNIPGDAPGSEDREMLARLAASAHNSQSGDDEAAIEKYLRSVLSLENIL
+TLDRLRQEVAVKEQLTSRGKSNRRSISSPSVNRLSGSRQDLSTTCLLDDKGRWESQQDIY
+MPSQFPRTLPRPASSPSTYSTSPSSSPTPFGTPPPQNQEPEQGRSGLAASYLSVKALVPQ
+MPKLLKSLFPVRDEKKELRPSPQNQQHVPRIVTSSGGDDNKGKTETTAILRPPAKDRRAE
+LPEVSPLPVHDPHDTTPLSPLSQSSSGYFSASVSTATLCDVLQPSSSSSSLLAAETTLPT
+NPQQQGADRNDIVTSPSQFGAKVSAVASPASHNSANHNSITSDVSSEQKLINSGGSEGFE
+RLEIFVEDDERGGEDVLPDWLTEGAYVTVGNNKAGTVRYIGVTQFAEGVWVGVELDTPVG
+KNDGSVGGQRYFHCKPGYGVLVRPNRLSSRERTNRQTGEFTPSAHVPILRGEAIVARRGE
+NRKSWSS
+>XP_006779786.1 gi|583968664|ref|XP_006779786.1| PREDICTED: kinesin-like protein KIF13B-like isoform X3 [Neolamprologus brichardi]
+MGEPSLDDSNVKVAVRVRPMNRREKELNTKCVVEMVKNQTILHPAGGNLGKGDSRSQSKV
+FAYDYCFWSMDETDKEKFAGQEVVFQCLGESLLHNAFQGYNACIFAYGQTGSGKSYTMMG
+SVDQPGLIPRLCSALFERTQKEQREEESFTVEVSYMEIYNEKVRDLLDPKGGRQTLRVRE
+HKVLGPYVDGLSRLAVASYKDIESLMSEGNKSRTVAATNMNEESSRSHAVFNIILTHTLK
+DLKSGTSGEKVSRLSLVDLAGSERAAKTGAAGERLKEGSNINKSLTTLGLVISALAEQGT
+AKNKTKFVPYRDSVLTWLLKDCLGGNSRTAMVATVSPAADNYEETLSTLRYADRAKSIVN
+HAVVNEDPNARIIRELREEVEKLRVQLTQAESLKAPELKDRLEESEKLIQEMTVTWEEKL
+RKTEEIAQERQKQLESLGISLQSSGIKVGDDKSFLVNLNADPALNELLVYYLKEHTKVGS
+ADSQDIQLCGMGIQAEHCVIDITAEAAVILAPYRNARTCVNGSPVTSALQLHHGDRILWG
+NNHFFRINLPKRRSRAADDEEGEGGVMKNSGSSEQLDADGDTASEVSSEVSFSYEFAQTE
+VMMKALGSNDPMQAVLQSLERQHEEEKRSALERQRQMYEQELQQLRKKLNPERLSTGQSG
+GPTIGQQGPGQQSHYRSMERLSIGGMSHSSSAQSRLRQWSEDREAVLVRSLRRLREQIVR
+ANLLVQEACFIADELERHTEYRVTLQIPSDNLNANRKRDAVLSEPAIQVRRRGRGKQIWS
+LEKMENRLVDMRELYQEWQDYHLNNPDDQVMRSYFRRADPFFDEQENHSLIGVANVFLSC
+LFYDVKLQYAVPIINQKGEVAGRLHVEVVRVGGGLEDNMAGGDEPDNNQDIEVQDRKLVC
+MIKILQATGLPQYLSNFVFCQYSFWDQPEPIIVAPEVDTSSSSPSNKDPHCMVVFDSCKE
+LAVSVTEEFIEHLTEGAVAIEVYGHRQADAGRNPALWDLSIIQAKTRTLRDRWSEVTRKL
+ELWIQILEINENGDFVPVEVVPARDVRTGGIFQLRQGQSRRIQVDVRSVQDSGTMPLIAE
+IVLAVSVGCVEIRNTTANQEADEMDSYQERDLERLRRQWLGALTKRQEYLDQHLQSLVSK
+AEKTEDDMEREAQLLEWRLTLTEERNAVMVPSAGSGIPGAPAEWVPLPGMETHIPVLFLN
+LKPDDLSSQDQFEVPEAGGWDAILNGEDEDDFFDLQIVRHYDGEVKAEASWDSTVHECPQ
+LSRGGSYPEQRVYLTIRVVVQLSHPADMQLVLRKRICVNVNPGRQGFAHNFLRRMSTRST
+VPGCGVTFEVVSNIPGDAPGSEDREMLARLAASAHNSQSGDDEAAIEKYLRSVLSLENIL
+TLDRLRQEVAVKEQLTSRGKSNRRSISSPSVNRLSGSRQDLSTTCLLDDKGRWESQQDIY
+MPSQFPRTLPRPASSPSTYSTSPSSSPTPFGTPPPQNQEPEQVKALVPQMPKLLKSLFPV
+RDEKKELRPSPQNQQQHVPRIVTSSGGDDNKGKTETTAILRPPAKDRRAELPEVSPLPVH
+DPHDTTPLSPLSQSSSGYFSASVSTATLCDVLQPSSSSSSLLAAETTLPTNPQQQGADRN
+DIVTSPSQFGAKVSAVASPASHNSANHNSITSDVSSEQKLINSGGSEGFERLEIFVEDDE
+RGGEDVLPDWLTEGAYVTVGNNKAGTVRYIGVTQFAEGVWVGVELDTPVGKNDGSVGGQR
+YFHCKPGYGVLVRPNRLSSRERTNRQTGEFTPSAHVPILRGEAIVARRGENRKSWSS
+>XP_006779787.1 gi|583968666|ref|XP_006779787.1| PREDICTED: prepronociceptin-like [Neolamprologus brichardi]
+MKTVVALLLLCLCDPGQSDCQADCLSCNNILPKQLSFNTMVCFIECESSVSPSSSWDLCH
+EALLSQILSPSGSVWKRSQEEVEALFPGEDEQMKGSLFLPIALQRVDHVTHGLDTEERDL
+GGKGNHLNAAYNSQNAMSLEDEYAEEEEGQEGGDPDVAAGQGDVALISKRFGGFVKGRHG
+HRRLMSPGRSYQKRYGGFVGIRKSARKWNNQKRFSEFLKQYLGMSTRATEFNSVSEDLAQ
+QNEV
+>XP_006779792.1 gi|583968676|ref|XP_006779792.1| PREDICTED: NT-3 growth factor receptor-like isoform X1 [Neolamprologus brichardi]
+MDLWFHSIRICWWRVLFLMSIFQDYLSSMLDCPPTCSCSQTEIFCNKSDNGRFFPLLALQ
+DTGSNGTSVDIAELFKNITSIHIENWTGLQTLRDVDMELYTGLQKLTIMNCNLKSIQPRA
+FAQNPHLSTINLSKNPLTTLSWQLFQHLQLQELRLDGVVFDCGCDIRWIQLWHQRGEAKL
+NTQQLYCRNGATKIRLENMYIHNCDLPEISVSHSSVLVMEGDNVTVSCNGSGSPLPEVDW
+TVSGLHSINTHLSNVYWPNIHSINLTLFNISRDDNNFQLTCIAENVVGMTNSSIQLNVQF
+PPVILRLAEPEQRLDTCIEFTVRGYPQPQLRWFHKQKEIIKNDYIRTEMDFYQDYLEGCL
+TFQNPTHINNGNYTLEASNALGTVTKTVYGHFLENPDEPDPVEEVTPPHPRPPDEDTFGV
+SIAVGLAGFACVLLLVLFVLINKYGRRSKFGMKGPVAVISGEEDSASPLHHVNHGIITPC
+TLDASPDAVVIGMTRIPVVENPQYFRHGHNCNKPATLVQHIKRRDIILKRELGEGAFGKV
+FLAECYNLSPTKDKMLVAVKTLKDPNLSARKDFQREAELLTNLQHDHIVKFYGVCVDGDP
+LIMVFEYMKHGDLNKFLRAHGPDAMILVDGQPLQSNGELGLSQMLHIATQIASGMVYLAS
+QHFVHRDLATRNCLVGNGLLVKIGDFGMSRDIYSSDYYRVGGHTMLPIRWMPPESIMYRK
+FSTESDVWSFGVILWEIFTYGKQPWFQLGNNEVIECITQGRVLERPRICPKEVYDIMLGC
+WQREPQQRLNIKDIQKVLFAMGKATPVYLDILG
+>XP_006779793.1 gi|583968679|ref|XP_006779793.1| PREDICTED: NT-3 growth factor receptor-like isoform X2 [Neolamprologus brichardi]
+MDLWFHSIRICWWRVLFLMSIFQDYLSSMLDCPPTCSCSQTEIFCNKSDNGRFFPLLALQ
+DTGSNGTSVDIAELFKNITSIHIENWTGLQTLRDVDMELYTGLQKLTIMNCNLKSIQPRA
+FAQNPHLSTINLSKNPLTTLSWQLFQHLQLQELRLDGVVFDCGCDIRWIQLWHQRGEAKL
+NTQQLYCRNGATKIRLENMYIHNCDLPEISVSHSSVLVMEGDNVTVSCNGSGSPLPEVDW
+TVSGLHSINTHLSNVYWPNIHSINLTLFNISRDDNNFQLTCIAENVVGMTNSSIQLNVQF
+PPVILRLAEPEQRLDTCIEFTVRGYPQPQLRWFHKQKEIIKNDYIRTEMDFYQDYLEGCL
+TFQNPTHINNGNYTLEASNALGTVTKTVYGHFLENPDEPVTPPHPRPPDEDTFGVSIAVG
+LAGFACVLLLVLFVLINKYGRRSKFGMKGPVAVISGEEDSASPLHHVNHGIITPCTLDAS
+PDAVVIGMTRIPVVENPQYFRHGHNCNKPATLVQHIKRRDIILKRELGEGAFGKVFLAEC
+YNLSPTKDKMLVAVKTLKDPNLSARKDFQREAELLTNLQHDHIVKFYGVCVDGDPLIMVF
+EYMKHGDLNKFLRAHGPDAMILVDGQPLQSNGELGLSQMLHIATQIASGMVYLASQHFVH
+RDLATRNCLVGNGLLVKIGDFGMSRDIYSSDYYRVGGHTMLPIRWMPPESIMYRKFSTES
+DVWSFGVILWEIFTYGKQPWFQLGNNEVIECITQGRVLERPRICPKEVYDIMLGCWQREP
+QQRLNIKDIQKVLFAMGKATPVYLDILG
+>XP_006779794.1 gi|583968681|ref|XP_006779794.1| PREDICTED: synaptic vesicle glycoprotein 2B-like [Neolamprologus brichardi]
+MDDPYRNNVNQQMTEGGDYTYTQDGGGQDGYPYQTDYPPQDEDAASDATEGADEDDQMYE
+GEYQGIPHPDEIKEARRAARVEARRKARMAAQQEEEEENLPEQYETIMEDCGHGRFQWML
+FFVLGLALMADGVDGFVVGFVLPSAEKDMCISNADKGLLGLLVYVAMMVGALVWGGLCDK
+MGRRKCLIYVLTIDLVFSFLSCFAQGYGFFLFLRFCSGFGIGGSIPIVYTYFTEFLQMDK
+RGEHLSWLCMFWMFGGLYASFTAWGIIPHYGWGFAIGTHIQMHSWRLFILVCLFPALAAL
+IGLVFMPESPRFLLENARHDEAWMILRQVHDTNWKAKGEPERVFTVTNIKTPQTQDDEFI
+EIQSETGTAFQRWTVRKMTMLQQVMANIMSLSAPELRLQGLLLVIVWFCLAFSYHGLGVW
+FPDMIKYMQYEEYESKVRIFHRERVERFHFNFSLVNQIHREGEYIHDKFANIEIKSVKFE
+SSLFENCYFEDVKSTNTFFENCTIKNTVFYNTDLWQDKFKNCRMENATFLHPKKGCHLNF
+QEENDIVIYMVSFLGSLAVLPGNIISALFMDKIGRIRIIGGSMLASSACTFLLLLSFSQG
+AVICWQCLFYGVSVAAWNGLEVISVELYPSSKRGTAFGILNGICKFAAIIASSIFAAFIG
+ITKIIPIFLAFAALVCGGMVALKLPETREKILS
+>XP_006779795.1 gi|583968683|ref|XP_006779795.1| PREDICTED: AP-3 complex subunit sigma-2-like [Neolamprologus brichardi]
+MIKAILIFNNHGKPRLIRFYQYFAEDMQQQIIRETFHLVSKRDDNVCNFLEGGSLIGGSD
+YKLIYRHYATLYFVFCVDSSESELGILDLIQVFVETLDKCFENVCELDLIFHMDKVHYIL
+QEVVMGGMVLETNMNEIVAQVEVQNRMEKSEGGLSAAPARAVSAVKNMNLPEIPRNINIG
+DINIKVPSLSPF
+>XP_006779796.1 gi|583968685|ref|XP_006779796.1| PREDICTED: synaptosomal-associated protein 25-B-like isoform X1 [Neolamprologus brichardi]
+MADESDMRNELADLQTRADQIADESLESTRRMLALVEESKDAGIRTLVMLDEQGEQLERI
+EEGMDQINKDMKDAEKNLNNLGQFCGLCSCPCNKIKGGGQAWGGNQDGVVNSQPGARVVD
+EREQMAISGGFIRRVTNDARENEMDENLEQVGGIIGNLRHMALDMGQEIDTQNRQIDRIM
+DKADSNKTRIDEANQRATKMLGSG
+>XP_006779797.1 gi|583968687|ref|XP_006779797.1| PREDICTED: synaptosomal-associated protein 25-B-like isoform X2 [Neolamprologus brichardi]
+MADESDMRNELADLQTRADQIADESLESTRRMLALVEESKDAGIRTLVMLDEQGEQLDRV
+EEGMNKVNADLKEAEKDLKDIGQCCGLICPCIKKIKGGGQAWGGNQDGVVNSQPGARVVD
+EREQMAISGGFIRRVTNDARENEMDENLEQVGGIIGNLRHMALDMGQEIDTQNRQIDRIM
+DKADSNKTRIDEANQRATKMLGSG
+>XP_006779798.1 gi|583968689|ref|XP_006779798.1| PREDICTED: protein FAM219B-like [Neolamprologus brichardi]
+MMNDILEEPEKDSLLEAQQDSQGLSGPSSGTRPKSIDGGIRPVEKRGPYIMSRAPAIHLK
+LQKHREMARKALKKKALSPGPPVTHQPRQGAKRMVKYNKGYAALSQHAEDTLVAIDSDSD
+EEIDFEQYSSGYSSAEIHPDLSKQLLQDGYRLDEIPDDEDLDLIPPKAMGSSVCCCSEGP
+SCPIQ
+>XP_006779799.1 gi|583968691|ref|XP_006779799.1| PREDICTED: semaphorin-7A-like [Neolamprologus brichardi]
+MFLEIWKMRFSLVACLFFLHICCLAVGNDRSPRMIFTEKEAAMNRLDLLHGPPVRILLEE
+KPDTVLAVGKTYLNTYNIKNQNKNQTRMQLENCNRNCSYDITLAHLMEDAKKLFVCGTIH
+DETVCCNSNLTEQPPICKDIKDISSFNIKEGDLSALAESKQSTDLYITRSGSDESVGIHK
+FGKARVGPKNHHKEQHYVGLVLSKREEDPSQNRVYGFYREKTKDDGLFSEMWLPFVTQVC
+MTDVGGPKNNLQYTWTSQMNARLFCGDQERKQHFSELVDVSTVDADRWQYTKIYALFRNE
+WGMSAVCVYTIEDISKIFENSPFNGYTKKQMDRPRMCAPDSSKLSVDTLKNIDKTSEMEQ
+LVHPVGNPGLLFFNHRNYTHIQVDSKPNSRGGLEWLQFLTVNNGGIHKVLQNESHTFVIA
+EYQPFKQKAHVLSIILQSTFKKLYVNNGSQLVQLDVADCSQYGDTCQDCMLSRDPYCGWN
+GTQCIRETEGSWHDAATGNLSICNEHNASNYKGDPVPVPRYSKYFLQCPVSSRHAQYSWQ
+HDENSTACSSGKEQCLYLIDNMDSECKGTYKCISQEMGYSKVLVQYELQVENDAKTQPYK
+RLWPNKAEGRKTSPVIWVCLMMALIKSLSF
+>XP_006779800.1 gi|583968694|ref|XP_006779800.1| PREDICTED: cytochrome P450 1A1-like [Neolamprologus brichardi]
+MALMILPFIGALSVSHVLVAVTTACLVYMIIKNAQNKIPEGLQQLPGPKPFPIIGNVLEL
+GSRPYLSLTSMSKRYGDVFQIQIGMRPVVVLSGNETVRQALIKQGDEFAGRPDLYSFRYI
+NDGKSLSFSTDQAGIWRARRKLAYSALRSFSNLDSTTPEYSCALEEHISKETEYLIKELN
+TVMKTKGSFDPFRYVVVSVANVICGMCFGRRYDHHDDELVSLVNLSDDFVKVVGSGNPAD
+FIPLLQYLPSTKMKKFMSLNARFSKFVQKLVTEHYATFDKDNIRDITDSLIDHCEDRKLD
+ENANIQMSDEKIVGIVNDLFGAGFDTISTALSWSLMYFVAYPEIQNRLFEEIKEKVGLDR
+MPVFSDRNNLPLLEAYILELFRHSSYLPFTIPHCTTKDTSLNGYFIPKDTCVFINQWQIN
+HDPEMWEDPFSFKPERFLNADGTEVNKVEGEKVMTFGLGKRRCIGEVIARNEVFLFLAIL
+IQKLNFQALPGDQLDLTPEYGLTMKHKRYHLRATMRVRNEQ
+>XP_006779801.1 gi|583968696|ref|XP_006779801.1| PREDICTED: enhancer of mRNA-decapping protein 3-like [Neolamprologus brichardi]
+MATDWVGSVVSIDCGATLGVYQGEVSSVDRVSQTISLKHPYHNGVKCPVPEVTFSAMDIK
+DLKFLDIQNKVNKTSAGKDTATEPSYISTGRHGQTNKTNHSLAISNSSGLSSNPRKGSSN
+SRGTTQSTPRRSNVRNGGAGGQRSKNDECFGDGTDENLDTDFDFEGNLALFDKAAVFSQI
+DGASSNSNKLQHHNTQAEQKTQSYRHDENILEVKPVTYRQITVPQHGGKEYCTDTGLVVP
+TVPYELHKQLLAAAERWGLSLERRLEAVGVCSSQMALTLLGGPNRLTPKNVHQRPTVVLL
+CGPHVQGAQGISCGRHLANHEVEVILFLPNFVKMQESVTSEVNLFSKTSGKQVSSVKDLP
+MSPVDLVINCLDCHENPLLKEQSWYQSVADWANKNRAPVLSIDPPVSEQPQSVDAKWTLS
+LGLPLPLADKDSRVYLCDIGLPKMVYQEVGINYHSPFGCKFVIPLHSV
+>XP_006779802.1 gi|583968698|ref|XP_006779802.1| PREDICTED: tyrosine-protein kinase CSK-like isoform X1 [Neolamprologus brichardi]
+MSGIHVPWSTGTECVAKYNFQTANEQDLPFCKGDVLTIIGVTRDPNWYRARNQVGREGTI
+PANYVQKREGVKSGGKLSLMPWFHGKITREQAERLLYPPETGLFLVRESTNYPGDYTLCV
+SCDGKVEHYRIIYHNGKLTIDEEEYFENLMQLVEHYTKDADGLCTRLIKPKLMEGTVAAQ
+DEFSRSGWALNRKELKLLQTIGKGEFGDVMVGDYRGTKVAVKCIKNDATAQAFIAEASVM
+TQLRHNNLVQLLGVIVEERGSLYIVTEYMAKGSLVDYLRSRGRTVLGGDCLLKFSLDVCE
+AMEYLEANNFVHRDLAARNVLVSDDNIAKVSDFGLTKEASSIQDTAKLPVKWTSPEALRE
+KRFSTKSDVWSYGILLWEIYSFGRVPYPRIPLKEVVPRVEKGYKMDAPDGCPAVVYDLMK
+QCWTLDPVMRPSFRMLREKLQHIRAKELYL
+>XP_006779803.1 gi|583968700|ref|XP_006779803.1| PREDICTED: tyrosine-protein kinase CSK-like isoform X2 [Neolamprologus brichardi]
+MSGIHVPWSTGTECVAKYNFQTANEQDLPFCKGDVLTIIGVTRDPNWYRARNQVGREGTI
+PANYVQKREGVKSGGKLSLMPWFHGKITREQAERLLYPPETGLFLVRESTNYPGDYTLCV
+SCDGKVEHYRIIYHNGKLTIDEEEYFENLMQLVEHYTKDADGLCTRLIKPKLMEGTVAAQ
+DEFSRSGWALNRKELKLLQTIGKGEFGDVMVGDYRGTKVAVKCIKNDATAQAFIAEASVM
+TQLRHNNLVQLLGVIVEERGSLYIVTEYMAKGSLVDYLRSRGRTVLGGDCLLKFSLDVCE
+AMEYLEANNFVHRDLAARNVLVSDDNIAKVSDFGLTKEASSIQDTAKLPVKWTSPEALRE
+KRFSTKSDVWSYGILLWEIYSFGRVPYPRIPLKEVVPRVEKGYKMDAPDGCPAVVYDLMK
+QCWTLDPVMRPSFRMLREKLQHIRAKELYL
+>XP_006779804.1 gi|583968702|ref|XP_006779804.1| PREDICTED: complexin-3-like [Neolamprologus brichardi]
+MAFMVKHVVGGQLKNLTGGLTEEKSEGEKSDAAAQGMTQEEFEQYQQQLEEEKKEREAHY
+AQKKAERATVRTHFREKYRLPKNEMDETQIQQAGDDVVLPTELAKMIAEDNEEETHKQSV
+LGQLSNIQNVDIDQLKDKAQATLEDLKKQTENCSLM
+>XP_006779805.1 gi|583968704|ref|XP_006779805.1| PREDICTED: growth arrest-specific protein 1-like [Neolamprologus brichardi]
+MKCWCSALALLPWVLVALDAQLICWQALLRCHDEPECELAYNQYMTACEGNIKGTRKQCP
+SHCISALIRLNHTRSGPDLETCDCAQDLDCLDAKRAIEPCLPRRHPKDAGGIGCMEARQR
+CEEDSNCHTSLTAYLSYCGQLFNGRKCSSKCKATIQQMLFIPNGMLLNRCICDGVERPFC
+EVVKENMSKLCSIGDHSVVSDPTKDYEDPYEDDYSKNDKEVDFSENSSASQSLSRGVLPL
+CLLTARILY
+>XP_006779806.1 gi|583968706|ref|XP_006779806.1| PREDICTED: serine/threonine-protein kinase ULK3-like [Neolamprologus brichardi]
+MASTSSFAPPKLSDFILTERLGSGTYATVYKAYRKGNSREVVAVKVVGKKTLNKASTENL
+LTEIEILKTVRHPHIVQLKDFQWDAENIYLILEWCSGGDLSRFIRSRRILPESVTRRFLQ
+QIACALQFLHERNISHLDLKPQNILLSGSILKLADFGFAQYMSPWDEQSVLRGSPLYMAP
+EMVCRRQYDSRVDLWSVGVILYEALFGRAPFASKSYAELEEKIRSNQPIELPPGARVSKD
+CRDLLLRLLERNPDARITFAEFFTHPFVDMEHMPSAESIVKAKKLVLQAIQKDQEGERSE
+ALSLYCSALEHFVPAIYYETNCQRKEALRQKVRQYVSRAEELKALVASDNRLSFEQARTS
+RDILREMSKDQPRLLAALEMASTAIAKEESGSDDLEALDMYQQCLGELLLGLAAEPQGRR
+RELLHSEIKSLMSRAEYLKKHIKMQETQRDVSLDRESLAESVRSSCCLQ
+>XP_006779807.1 gi|583968708|ref|XP_006779807.1| PREDICTED: TM2 domain-containing protein 3-like [Neolamprologus brichardi]
+MATVCQIWRPDRGRCLKSYGIIAVLFMDLMLQCVNGSLSTTNVETHYTRDGPFITSPVVP
+DASSVFPADEDTSKCPSGGLCHRLPAHCIQCDYHLKCTYGKPTLFTCRPKKGVHCIGESG
+HQQTNFSLNITCQFCWQLDPSQYRCTNSTNCMTVSCPRKRYNATCDVLDHVHCLGKRRFP
+KRLFCNWTGGYKWSTALALSITLGGFGADRFYLGQWREGLGKLFSFGGLGIWTLIDVLLI
+GVGYVGPVDGSLYI
+>XP_006779808.1 gi|583968710|ref|XP_006779808.1| PREDICTED: la-related protein 6-like [Neolamprologus brichardi]
+MYALVNAFMRCLSFLLPPSWLYVSFCLWVGNECEETLQRPNPRARFKSREPLTYEEVKAA
+AKAAAEAEAQGGSRPSVSPGPDCVSLAATSPAAPKGPSSGLIWIGGLWRAVERVFGAPWV
+LLRHHLCPKRRRAALGAPYPVCAFELGKIKSFQRGAAAAAAAAKIVDVKGPGETTFTYSK
+NMSGSVGVPSVNSTECASDASAEQGIDEVITVDQLSQEMGTVTITVAIQAAEDEEPEEVT
+SNNADFLGGSCSEDEIGRHDKSSGAGTSGGELEEESWQPPDPELIQKLVTQIEYYLSDEN
+LEHDAFLLKHVRRNKLGFVSVKLLTSFKKVKHLTRDWRTTAYALRHSKILELNDEGRKVR
+RKSAVPVFASESLPSRMLLLSDLQRWPELAALTKDNGSAEGGATQQEQLMKLLLKAFGTY
+GAIASVRVLKPGKDLPADLKRLSGRYAQLGTEECAIVEFEEVEAAVKANEAAGSENGGPN
+LLGLKVVLIGTKPPKKKVPKERPREEGGMRKSRSLNSRVRELQYHGDDSACSSSETESTP
+TSPRLARKSQSCNKLSPTTAGISFQNNHLSPSMSPRNSPWSSPRASPCSQRKSPHSHKSP
+LAVEGRLSPEAGRRWADYSSDSSLTPSGSPWVQRRKQVASQESSPVGSPMLGRKIQNADG
+LPPGVMRLPRGPDGTRGFHCVAIERGKTAATQT
+>XP_006779809.1 gi|583968712|ref|XP_006779809.1| PREDICTED: leucine-rich repeat-containing protein 49-like isoform X1 [Neolamprologus brichardi]
+MEEDLAEGKITRSHKQNTSEKWMFLTPMINSCKLHLTTVKSLVPARAQAMSDSQDHVKET
+FNYSDLENSLHAGIQKRVVQELFESDKCTYNQKAGAAVSNAAYKARHKARRQTQCTGETF
+GQNALKNAKPAGDFPGCNYSALPGFLSTQLPFTSSFQQIDLERQSLEECPQLDFVKELQF
+LNLQHNLITKIQHLSHLQQLVSLNLHDNHISDMAGIEVLRSLKILILGKNRIHEICCLDS
+LSKLNMLDLHDNQICRIENVSHLSELRVLNLAGNNILKMENLQGLDSLTELNLGQNCISV
+VTEVDRLPLLQRLFLSCNNITSFDQLACLGESCSLSELTLDGNPVALETWYKQAVLRCVL
+HLRQLDMKRITDEDRRMAGVQARKEEEKKKESHKQTIHKEKRRLAIRNAAQQWEGVRACL
+ELPSTNGAKEEVSPENSPAHSPAQTNGLTQEPSPDEPRRVSPGSGPERPSGGTEIRLQTN
+SRPNSPRDPKLVEAGSGSVQSLSLSDSHLAELDGDTLRLFGLGALEALERGWGVQTAGAV
+TVITFRYINFDAIVPTLPRIRVKFPNLSHMIFLETNISRLPQLAALAQVRRLDQLTIHPD
+GNPVVSLTLWRSFVIYRLHHFNLQRINGQEVTMNDVIAAERVFGTLGHIAATETPRCRLL
+LLLEESRKRQLQFLLEGRGRRAGLSPEELRDNGKLLGEGLSRALFNYPSRDCSAESPEEG
+SVESSERATMVEQYLQELVQSASDTNLKGEALHKLWPSMFAEMVRDCVLEMRDRAAFRQA
+SLAKLSETK
+>XP_006779810.1 gi|583968715|ref|XP_006779810.1| PREDICTED: leucine-rich repeat-containing protein 49-like isoform X2 [Neolamprologus brichardi]
+MEEDLAEGKITRSHKQNTSEKWMFLTPMINSCKLHLTTVKSLVPARAQAMSDSQDHVKET
+FNYSDLENSLHAGIQKRVVQELFESDKCTYNQKAGAAVSNAAYKARHKARRQTQCTGETF
+GQNALKNAKPAGDFPGCNYSALPGFLSTQLPFTSSFQQIDLERQSLEECPQLDFVKELQF
+LNLQHNLITKIQHLSHLQQLVSLNLHDNHISDMAGIEVLRSLKILILGKNRIHEICCLDS
+LSKLNMLDLHDNQICRIENVSHLSELRVLNLAGNNILKMENLQGLDSLTELNLGQNCISV
+VTEVDRLPLLQRLFLSCNNITSFDQLACLGESCSLSELTLDGNPVALETWYKQAVLRCVL
+HLRQLDMKRITDEDRRMAGVQARKEEEKKKESHKQTIHKEKRRLAIRNAAQQWEGVRACL
+ELPSTNGAKEEVSPENSPAHSPAQTNGLTQEPSPDEPRRVSPGSGPERPSGGTEIRLQTN
+SRPNSPRDPKLVEAGSGSVQSLSLSDSHLAELDGDTLRLFGLGALEALERGWGVQTAGAV
+TVITFRYINFDAIVPTLPRIRVKFPNLSHMIFLETNISRLPQLAALAQVRRLDQLTIHPD
+GNPVVSLTLWRSFVIYRLHHFNLQRINGQEVTMNDVIAAERVFGTLGHIAATETPRCRLL
+LLLEESRKRQLQFLLEGRGRRAGLSPEELRDNGKLLGEGLSRALFNYPSRDCSAESPEEG
+SVESSERATMVEQYLQELVQSASDTNLKGEALHKLWPSMFAEMVRDCVLEMRDRAAFRQA
+SLAKLSETK
+>XP_006779811.1 gi|583968717|ref|XP_006779811.1| PREDICTED: xaa-Pro dipeptidase-like [Neolamprologus brichardi]
+MAAAAQPVYWLGNDTLRVSAALFAENRRRLCQGLKAKDGVVPKSVVVLQGGEQTQRYCTD
+TDVLFRQESFFHWAFGVTEADCYGAIDVDSGKSILFVPKLPESYATWMGEIFPKEHFKEK
+YAVDEVHHTCDIANVLSNLKPAVLLTLRGQNTDSGSTCREASFDGISRFQVNNTLLHPVI
+VDCRVVKTDMELEVLRYTNRVSSEAHKMVMKHVKPGKKEYEMESLFQHYCYTKGGMRHTS
+YTCICGTGNNSSVLHYGHAGAPNDKTITDGDMCLFDMGGEYYCYSSDITCSFPANGKFTP
+DQRAIYEAVLKASRAVMAALRPGVKWTDMHRVADRVHLEELVKIGILHGSVEDMMKVHLG
+SVFMPHGLGHLLGIDVHDVGGYPEGIERIDEPGLKSLRMGRLVQERMVLTVEPGIYFINH
+LLNQALANPAQSCFIDNQVLARFRGFGGVRIEDDIAVTADGIELMTCVPRTVEEIEAFMA
+DSTKPFSPVV
+>XP_006779812.1 gi|583968719|ref|XP_006779812.1| PREDICTED: carbohydrate sulfotransferase 8-like isoform X1 [Neolamprologus brichardi]
+MLWMKWKMVVDSLRGRRRRLPCSLWFVLLFAAGGLVLFIHQQALSEMVQQQGPENVTNKQ
+QLKVTALKTRQSISGVKLGSTPRQSRETLSTRDRERGKSDSFQDLQVTENILSSAIPPMQ
+FPHFEKSRKTASPGSQEQDIGSLHVTKRQRKLLKTSPPIRHTKNTISSSSSSSVSSSSSI
+SSSITSGFFSPESWQKLSGILEARQQLMKEICAKYKSSISKTITRHHVKSIFVEDKYKLL
+YCQVPKAGCSNWKRTLMVLAGKASNTQSIKHDTVHYGQHLKKLDSFDQQGIMHRLQTYTK
+VIFVREPLERMVSAYRDKFENPNNYYHSLFGKPIISKYRVNPSKAALKTGNGVTFKEFVQ
+YLLDVHRPVGMDIHWEQANQLCNPCLIDYDFIGKFENMEEESNFLLRLSGAPPNLTLPSF
+KDRNPSDKRTSMQITENYFSQVSALERQRVYDFYYMDYLMFNYSKPFKDLY
+>XP_006779813.1 gi|583968721|ref|XP_006779813.1| PREDICTED: carbohydrate sulfotransferase 8-like isoform X2 [Neolamprologus brichardi]
+MLWMKWKMVVDSLRGRRRRLPCSLWFVLLFAAGGLVLFIHQQALSEMVQQQGPGVKLGST
+PRQSRETLSTRDRERGKSDSFQDLQVTENILSSAIPPMQFPHFEKSRKTASPGSQEQDIG
+SLHVTKRQRKLLKTSPPIRHTKNTISSSSSSSVSSSSSISSSITSGFFSPESWQKLSGIL
+EARQQLMKEICAKYKSSISKTITRHHVKSIFVEDKYKLLYCQVPKAGCSNWKRTLMVLAG
+KASNTQSIKHDTVHYGQHLKKLDSFDQQGIMHRLQTYTKVIFVREPLERMVSAYRDKFEN
+PNNYYHSLFGKPIISKYRVNPSKAALKTGNGVTFKEFVQYLLDVHRPVGMDIHWEQANQL
+CNPCLIDYDFIGKFENMEEESNFLLRLSGAPPNLTLPSFKDRNPSDKRTSMQITENYFSQ
+VSALERQRVYDFYYMDYLMFNYSKPFKDLY
+>XP_006779814.1 gi|583968723|ref|XP_006779814.1| PREDICTED: BTB/POZ domain-containing protein kctd15-like isoform X1 [Neolamprologus brichardi]
+MFETEGRSMSRLSLTRSPVSPLAAQGIPLPAQLTKANAPVHIDVGGHMYTSSLATLTKYP
+DSRISRLFNGTEPIVLDSLKQHYFIDRDGEIFRYILSFLRTSKLLLPDDFKDFHLLYEEA
+RYYQLTPMIKELERWKQEREQRRMAQPCDCLVVRVTPDLGERIALSGEKVLIEEIFPETG
+DVMCNSVNAGWNQDPTHVIRFPLNGYCRLNSVQVLERLFQKGFSVAASCGGGVDSSQFSE
+YVLCREDRRSLSINTPIRIKQEPLD
+>XP_006779815.1 gi|583968725|ref|XP_006779815.1| PREDICTED: BTB/POZ domain-containing protein kctd15-like isoform X2 [Neolamprologus brichardi]
+MFKEGRSMSRLSLTRSPVSPLAAQGIPLPAQLTKANAPVHIDVGGHMYTSSLATLTKYPD
+SRISRLFNGTEPIVLDSLKQHYFIDRDGEIFRYILSFLRTSKLLLPDDFKDFHLLYEEAR
+YYQLTPMIKELERWKQEREQRRMAQPCDCLVVRVTPDLGERIALSGEKVLIEEIFPETGD
+VMCNSVNAGWNQDPTHVIRFPLNGYCRLNSVQVLERLFQKGFSVAASCGGGVDSSQFSEY
+VLCREDRRSLSINTPIRIKQEPLD
+>XP_006779816.1 gi|583968727|ref|XP_006779816.1| PREDICTED: transcription initiation factor TFIID subunit 4-like isoform X1 [Neolamprologus brichardi]
+MAGASDPLEDMLFSEVDEKAVSDLVGSLESQLAGQSNPAGKADENGGAGSVAPANHHLGK
+TLPAPVSTTTLEQQQQQQGRRNKTEMRQEINSKDVSPDKTVTSPSPGCSPSFGEPSTTSG
+ACVSATSSGSQSHGASITTLTASGVSTLASLPPASISTTISSQGSKVTVGTGETSTGATP
+PRKRITTPRRSASARIKSLNGAAVTTRRNSNTAVVDSVSQVDTSASTPNSGRPVTTSINT
+STFTLSNASLPVGQSAIALDRGTPTIALHRLPSHIVASIAQNGNGTSVSALVQQGARIGP
+VTSLASPGNQTKMVTDTGASKTDDCQSKIVMLTQSSVVNSVVNTVSTSSPPLPPPPPSST
+SSSIVTPPTTTTAAATTTITITQPLNSITPAACVTGMATSSVCGAGQTTSVTTTITMVRP
+TAPSPTPAVATSAQSQPRPGLTAPQRIVTPQLIVRPPQQQTTIQLPPGFTIPQGMVLVRT
+ELGQLVMVPQQALAQAQAQAQAQAQAQAQNNISPRPATPTTGTSFRVTSPQQSPVTSQTS
+RQCPLTPAKMAPSPSPTPSSPALQTSSSSSSSSSSSCPALRPKGPVAPVVAVTAPQQTPV
+VLPPQAPAQPAPQPVQPAQPGIATASGGSVASQEMQENVKKCKNFLATLIKLASHNSPSP
+ETSKNVKALVQDLLDAKIEPEEFTSRLQTELKSSPQPYLVPFLKKSLPALRLSLLNSQQS
+LTQPPQQGLKPAPCGTPPAIVAGPAVRIRHPNSVSTTTGASALPAGTLGHAAAMGVKTGG
+AVGGQVRMPVVITQSIRAQGTMGKGAIIQAGKSPMGLPVQITGNQKNKLNDPGGGTFRDD
+DDINDVASMAGVNLNEESARILATNSDLVGTQIRSCKDEAFLHPGLLHRRIQETAKKFGI
+TEVPMETVTFISHATQSRLRTVVEKVSTIAQHRLDSCKDDECYEQSADVRSQLRFFEQLE
+RIEKQRKDEQEREILLKAAKSRSRQEDPEQARLKQKAKEMQQQELAQMRQRDANLTALAA
+IGPRKKRKVDSPGATPSGTEVSGSTAGSPASSSAPSTSSRQYTRQRITRVNLRDLIFYME
+QERETAHSLLLYRALLK
+>XP_006779817.1 gi|583968729|ref|XP_006779817.1| PREDICTED: transcription initiation factor TFIID subunit 4-like isoform X2 [Neolamprologus brichardi]
+MAGASDPLEDMLFSEVDEKAVSDLVGSLESQLAGQSNPAGKADENGGAGSVAPANHHLGK
+TLPAPVSTTTLEQQQQQQGRRNKTEMRQEINSKDVSPDKTVTSPSPGCSPSFGEPSTTSG
+ACVSATSSGSQSHGASITTLTASGVSTLASLPPASISTTISSQGSKVTVGTGETSTGATP
+PRKRITTPRRSASARIKSLNGAAVTTRRNSNTAVVDSVSQVDTSASTPNSGRPVTTSINT
+STFTLSNASLPVGQSAIALDRGTPTIALHRLPSHIVASIAQNGNGTSVSALVQQGARIGP
+VTSLASPGNQTKMVTDTGASKTDDCQSKIVMLTQSSVVNSVVNTVSTSSPPLPPPPPSST
+SSSIVTPPTTTTAAATTTITITQPLNSITPAACVTGMATSSVCGAGQTTSVTTTITMVRP
+TAPSPTPAVATSAQSQPRPGLTAPQRIVTPQLIVRPPQQQTTIQLPPGFTIPQGMVLVRT
+ELGQLVMVPQQALAQAQAQAQAQAQAQAQNNISPRPATPTTGTSFRVTSPQKGPVAPVVA
+VTAPQQTPVVLPPQAPAQPAPQPVQPAQPGIATASGGSVASQEMQENVKKCKNFLATLIK
+LASHNSPSPETSKNVKALVQDLLDAKIEPEEFTSRLQTELKSSPQPYLVPFLKKSLPALR
+LSLLNSQQSLTQPPQQGLKPAPCGTPPAIVAGPAVRIRHPNSVSTTTGASALPAGTLGHA
+AAMGVKTGGAVGGQVRMPVVITQSIRAQGTMGKGAIIQAGKSPMGLPVQITGNQKNKLND
+PGGGTFRDDDDINDVASMAGVNLNEESARILATNSDLVGTQIRSCKDEAFLHPGLLHRRI
+QETAKKFGITEVPMETVTFISHATQSRLRTVVEKVSTIAQHRLDSCKDDECYEQSADVRS
+QLRFFEQLERIEKQRKDEQEREILLKAAKSRSRQEDPEQARLKQKAKEMQQQELAQMRQR
+DANLTALAAIGPRKKRKVDSPGATPSGTEVSGSTAGSPASSSAPSTSSRQYTRQRITRVN
+LRDLIFYMEQERETAHSLLLYRALLK
+>XP_006779818.1 gi|583968731|ref|XP_006779818.1| PREDICTED: protein LSM14 homolog A-like [Neolamprologus brichardi]
+MSGGGTPYLGSKISLISKAEIRYEGILYTIDTENSTVALAKVRSFGTEDRPTDRPIPPRD
+EVFEYIIFRGSDIKDLTVCEPPKATSALPQDPAIVQSSIGSSSAAAPPSFQAPGSYAPFS
+RAPAPSYSQFGVATIGSQQFGSTGAVGRTSPQLDSRRKSPTLEQAVQAPPSSAQAPPAPV
+GQRSQTGAAASRTTTTGIQKPPDLLEQRKVPEVPKVAQPDNEQGAVENRDPNKRQGAGVQ
+SSNRRGRGRGNRSRGKVNVRRDGTVKFDEDFDFETANAQFHKDEIDKELQNKLKLKDDKT
+EKALNGEESEHPANEGAAEEEEAVINTCYYDKSKSFFDNLSCDDTRDRRPTWAEERRMNA
+ETFGLPLRHNRGRGGFRGRGFMGPRGGRGRPVSRGSFGPPRGAPPGFRGGFRGGRGGRDF
+SDFEYRKENKVAA
+>XP_006779819.1 gi|583968733|ref|XP_006779819.1| PREDICTED: SS18-like protein 2-like [Neolamprologus brichardi]
+MSIVFVPKKLRGKATVNQETIQRLLDENDQLIRCITEYMQKGRAVECVQYQQILHRNIVY
+LATIADASPDSAASTSNCTSNDTSASAAAVNGHTEGS
+>XP_006779820.1 gi|583968735|ref|XP_006779820.1| PREDICTED: uncharacterized protein KIAA0355-like [Neolamprologus brichardi]
+MYCCSAQESKMDYKRRFLLGGSKQKVQQHQQYQMPELSRTLSASLASSCSASSPMGTGVG
+MSGSCHPPPSGTSTAVADIQQGISKYLDALNVFCRASAFLTDLFSSVFRNSHYSKAAMQL
+KDVQEHVMEAASRLTAAIKPEIAKMLMELSAGAANFKDQNDFSLQDVEVLGRCFLTVMQV
+HFQFLSQALQKVQPVAQSCLAEALAQAQERCANARSQSSDLGPLTELEEASRSWKGAAEA
+TARLRERGRDGCLAGIQVQQLFCSNNTTIPEHQLKELNMKIDSALQAYKAALESLGHSEY
+ALKAGFHLNPKAVEAALQGCCSEAEAQQAGRMQTTSQPIQCELPTIPVQIGSHFLKGVSF
+NESAAENLKLKTHTMLQLIKEALGQNGVTPRDDSPVTEVLNQVCPSSWRGACKTAVQLLF
+AQAGLVVVDTAQIENKEAYAPQITLEGSKVVVQVPSTWCLKEDPATMSLLQRSLDPEKTL
+GLVDVLYTAVFDINRWKERKEQALPTIQIQLQRESPDYGIPTDLPPGTSSKTSSGLPKTI
+SKLTSKFTKKVSSSSNSGGSFSIPSTPSRSMLTTSNSEDKAKGLGHSDGRLQSILQMGSL
+PCTSDSTQQNQLANGSVSEDQGMNLPTDQEMQDVIDFLSGFNMGKSQQASPLVKRRNSVA
+SANPAELKPPSGPSQATSSISHSALQPPAQTLPQPQPQPQPSQPVQKQQPQPNPQPPPPQ
+QQQPQQQQQPPPPPPQQPSPQAQHLYYQHLLQPITQQQAPPPQLPPQQTPPQVLPQQRVA
+SKWLGTSGQQPPPQGPPAGLSPLGPIGQWASSGLPDLSSDLYSLGLVSTYMDSVVSEMLG
+QKPQGPRNNTWPNRDQSEGVFGVLGDTLPFDPAVGSDPEFARYVAGVSQAMQQKRQVQHI
+RRPSNTRSNWPMPDEQHRTWSHPEYFNEGDAVNSGWSANQGDSASSSDETSSANGDSLFS
+MFSGPDLVAAVKQRRKHSCGEPEVCTLPSPPLHHIGDDSQDSKTKTWPPKAPWQHSTHTN
+TMPNPSSSLYQMNIPPSSQWGDSMPMLQSPVWSTASDCPPSTGISSGFPFTQQQQQQQQQ
+QHKPMTKGFKSFPVKHEHRPSYLHQY
+>XP_006779821.1 gi|583968737|ref|XP_006779821.1| PREDICTED: glucose-6-phosphate isomerase-like [Neolamprologus brichardi]
+MGLTQDPNFQKLQEWYTAHALGLNMRHMFEADKERFNKLSLTLKTEDGDILLDYSKNLIT
+EDVMKMLVDLAKSRGIEAAREKMFTGEKINFTEGRAVLHVALRNRSNTPIMVDGKDVMPD
+VNKVLEKMKGFCHKVRSGEWKGYTGKAITDVVNVGIGGSDLGPLMVTEALKPYSKDGPRV
+WFVSNIDGTHIAKTLAQLNPETTLFIIASKTFTTQETITNAESAKAWFLEHAKDKAAVAK
+HFVALSTNGPKVKDFGIDTENMFEFWDWVGGRFSLWSAIGMAIALHIGFDNFEKLLSGAH
+WMDKHFRTAPLDKNAPILLALLGIWYINFFHAETQAMLPYDQYMHRFTAYFQQGDMESNG
+KYITNHGTRVNYHTGPIVWGEPGTNGQHAFYQLIHQGTRMVPCDFLIPAQSQHPIRDNLH
+HKVSLMLERYLSKXXALMKGKTTEEAKKELEASGLSGEALEKILPHKVRRIKRNDLIKDN
+EPAALLMARNSNKLKPKLKRRAPCRVAFTKRDSPSKNSVNRC
+>XP_006779822.1 gi|583968739|ref|XP_006779822.1| PREDICTED: Wilms tumor protein 1-interacting protein homolog [Neolamprologus brichardi]
+MEHYQEDLGLRATKLMEDLSLYDAYQDGMYDARRDLVINPDLDFSAPALVEHKAKPMNGT
+SVLHQQHHTVENFSSGNKVYNAAPVRPVNCNRTVPVDFCAPQRDAVYNEDGCCTKSEVAL
+PCYTGTSERHRRYSLEVQGHRYSTGSTFDGVPLNKPVAVPGNRCNSVCIASSHDGRYNAT
+SPRSSLASSLSSQEQSKHASPRSSISSPRTSLVVPGQERYTSPRSSLVHCEGNSVLSPRS
+SYASTASDTSKHSSPRASLNSCDCCSKPNSNRTSGISMGYDQRHTSPRSSTASQYSFTTS
+PRSSYSDSRYGPVVNQDLEGVLHSAPLASPRSSICSQDGSARPGASANCVVSPRSSISSH
+SSRSSRSSRGSMSTYPDLQLPSPRSSMLGTSLHEDTLLQEFGDSNGVQNRIHLQGLSAVP
+EPQQQSGQTGGTADIPSGSPSSYSYVMPSKTASSGQRFKLPYQVTPSRESGPSQAEKRLE
+ALTLELEKELEMHMKKEYFGICVKCGKGVYGASQACQAMGNLYHTNCFTCCSCGRRLRGK
+AFYNVNGKVYCEEDFLYSGFQQTAEKCFVCGHLIMEMILQALGKSYHPGCFRCVVCKEGL
+DGVPFTVDVENNIYCVKDYHTVFAPKCASCNQPILPAQGSEETIRVVSMDKDYHVECYHC
+EDCGLQLNDEERHRCYPLEGHLLCHDCHILRLQSQVPAHAPPSYPLHVTEL
+>XP_006779823.1 gi|583968741|ref|XP_006779823.1| PREDICTED: short-chain dehydrogenase/reductase family 42E member 1-like isoform X1 [Neolamprologus brichardi]
+MGTASKETFLITGGSGYFGNRLALSLLKKGAKVILFDIIPPSQELPEDVVFVQGDIREYP
+DVEKAVTGVDCVFHIASYGMSGREQLNRQLIEAVNVQGTQNILKACVEHGVSRLIYTSTF
+NVVFGGQVIENGDESLPYLPLHLHPDHYSRTKSLADMAVLKANGTVLKGCSGLLSTCALR
+PAGIYGPGEQRHLPRIVDYIEKGIFRFVYGKPSSLVEFVHVDNLVSAHVLAAEALTPEKQ
+HRAAGQAYFISDGRPVNNFEFFRPLVEGLGYRFPTLRLPISLIYFFAFLTEMIHCLIGPF
+YNFQPLLTRTEVYKTGVTHYFSMAKAKAELGYEPREYNLDEVVQWFRSRGHGKKCHRSFL
+SRLLLNVLFVSALVAVSLSFLPVVGS
+>XP_006779824.1 gi|583968743|ref|XP_006779824.1| PREDICTED: short-chain dehydrogenase/reductase family 42E member 1-like isoform X2 [Neolamprologus brichardi]
+MGTASKETFLITGGSGYFGNRLALSLLKKGAKVILFDIIPPSQELPEDVVFVQGDIREYP
+DVEKAVTGVDCVFHIASYGMSGREQLNRQLIEAVNVQGTQNILKACVEHGVSRLIYTSTF
+NVVFGGQVIENGDESLPYLPLHLHPDHYSRTKSLADMAVLKANGTVLKGCSGLLSTCALR
+PAGIYGPGEQRHLPRIVDYIEKGIFRFVYGKPSSLVEFVHVDNLVSAHVLAAEALTPEKQ
+HRAAGQAYFISDGRPVNNFEFFRPLVEGLGYRFPTLRLPISLIYFFAFLTEMIHCLIGPF
+YNFQPLLTRTEVYKTGVTHYFSMAKAKAELGYEPREYNLDEVVQWFRSRGHGKKCHRSFL
+SRLLLNVLFVSALVAVSLSFLPVVGS
--- a/test-data/test.fasta	Fri Oct 16 16:13:34 2015 -0400
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,11 +0,0 @@
->ID1 desc
-GATACA
-
-
->ID2 desc
-GATACAGATACA
-GATACAGA
-TACAGATACA
->ID3 desc
-GATACAGATACAGATACAGATACAGATACAGATACAGATACAGATACAGATACAGA
-TACAGATACA
--- a/tool_dependencies.xml	Fri Oct 16 16:13:34 2015 -0400
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,6 +0,0 @@
-<?xml version="1.0"?>
-<tool_dependency>
-    <package name="biopython" version="1.65">
-        <repository changeset_revision="dc595937617c" name="package_biopython_1_65" owner="biopython" toolshed="https://toolshed.g2.bx.psu.edu" />
-    </package>
-</tool_dependency>