changeset 18:0a507f4bd19a draft default tip

planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/mafft commit 3216eed8c66b2fff7c571ab27d3f1e6aaddc186f
author bgruening
date Mon, 14 Jul 2025 18:16:36 +0000
parents 1233363389c1
children
files macros.xml mafft.xml test-data/mafft_seed_out.aln test-data/seed.aln test-data/seed2.aln
diffstat 5 files changed, 1822 insertions(+), 1 deletions(-) [+]
line wrap: on
line diff
--- a/macros.xml	Wed Mar 05 16:46:36 2025 +0000
+++ b/macros.xml	Mon Jul 14 18:16:36 2025 +0000
@@ -1,6 +1,6 @@
 <macros>
     <token name="@TOOL_VERSION@">7.526</token>
-    <token name="@VERSION_SUFFIX@">1</token>
+    <token name="@VERSION_SUFFIX@">2</token>
     <token name="@PROFILE@">22.01</token>
     <!-- currently, the fasta3 executable is named according to its major version
     => needs updating together with the package requirement! -->
--- a/mafft.xml	Wed Mar 05 16:46:36 2025 +0000
+++ b/mafft.xml	Mon Jul 14 18:16:36 2025 +0000
@@ -105,6 +105,12 @@
     #end if
   #end if
 
+  #if $seed
+    #for $s in $seed:
+      --seed '$s'
+    #end for
+  #end if
+
   ## handle scoring matrix
   $datatype_selection.datatype
   $anysymbol
@@ -218,6 +224,7 @@
                 <expand macro="misc_scoring_scheme" />
             </when>
         </conditional>
+        <param argument="--seed" type="data" format="fasta" optional="true" multiple="true" label="Use a seed alignment?" help="The --seed option adds unaligned sequences to a highly reliable alignment (seed) consisting of a small number of sequences. Several seed alignments may be selected; each one is passed to MAFFT with its own --seed option. With this option, the aligned letters in the seed alignment are preserved, but gaps are not necessarily preserved. If the given alignment (including the gap pattern) has to be completely preserved, use mafft-add."/>
         <param argument="--anysymbol" type="boolean" truevalue="--anysymbol" falsevalue="" checked="False" label="Support unusual characters?" help="e.g., U as selenocysteine in protein sequence; i as inosine in nucleotide sequence" />
         <conditional name="flavour">
             <param name="type" type="select" label="MAFFT flavour" help="Run mafft with pre-defined input parameters. Specification of these parameters can be found in the help section. With 'Auto', the tool automatically selects an appropriate strategy from L-INS-i, FFT-NS-i and FFT-NS-2, according to data size from few to many respectively. Default setting: FFT-NS-2.">
@@ -487,6 +494,20 @@
                 <metadata name="sequences" value="39"/>
             </output>
         </test>
+        <!-- test with seed alignments: two seed files (seed.aln, seed2.aln) are supplied alongside sample_amino.fa with the mafft-linsi flavour, and the result is compared against mafft_seed_out.aln -->
+        <test expect_num_outputs="1">
+            <conditional name="input">
+                <param name="mapping" value="implicit"/>
+                <repeat name="batches">
+                    <param name="inputs" value="sample_amino.fa"/>
+                </repeat>
+            </conditional>
+            <conditional name="flavour">
+                <param name="type" value="mafft-linsi"/>
+            </conditional>
+            <param name="seed" value="seed.aln,seed2.aln"/>
+            <output name="outputAlignment" ftype="fasta" file="mafft_seed_out.aln"/>
+        </test>
     </tests>
     <help><![CDATA[
 **What it does**
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/mafft_seed_out.aln	Mon Jul 14 18:16:36 2025 +0000
@@ -0,0 +1,1368 @@
+>_seed_PINI_ARATH/9-617
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------HVMTAMVPLYVAMILA-
+YGSVKWWKIFTPDQCSGINRFVALFA-----------VPLLSFHFIAANNPYA-------
+---MNLRFLAADSLQKVIVLSLLFLWCKLSR---NGSLDWTITLFSLSTLPNTLVMGIPL
+LKGMYGN----------------------------------FSGDLMVQIVVLQCIIWYT
+LML------------------FLFEYRGAKLLISEQFP-DTAGSIVSIHVDSDIMSLDGR
+Q-PLETEAEIKEDGKLHVTVRRSNASRSDIYS-----RRSQGL-SATPRPSNLTNAEIYS
+LQSSRNPTPRGSSFNHTDFY---------------SMMASGGGRNSNFGPGEA-------
+--------VFGSKGPTPRPSNYEEDGGPAKPTAAGTAAGAGRFHYQSGGSGGGGGAHYPA
+PNPGMFSPNTGGGGGTAAKGNAPVVGGKRQDGN------GRDLHMFVWSSSASPVSDVFG
+GGGGNHHADYSTATNDHQKDVKISVPQGNSNDNQYVEREEFSFGNKDDDSKVLATDGGNN
+ISNKTTQAKVMPPTSVMTRLILIMVWRKLIRNPNSYSSLFGITWSLI-SFKWNIEMP---
+---ALIAKSISILSDAGLGMAMFSL--------GL-------------------------
+---FMALNPRIIACGNRRAAFA--------AAMRFVVGPAVMLVASYAVGLRGV--LLHV
+AIIQ------------AALPQGIVPFVFAKEYNVHPDILSTAVI----------------
+-FG-MLI-A-LPITL---------------------------------------------
+-------------------------------------------------------LYY
+>_seed_Q9FVF6_POPPZ/9-609
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------HVMTAMVPLYVAMILA-
+YGSVKWWKIFTPDQCSGINRFVALFA-----------VPLLSFHFISTNDPYN-------
+---MNLRFITADSLQKVIVLVVLALWTKLSK---RGCLEWTITLFSLSTLPNTLVMGIPL
+LKGMYGD----------------------------------YSGSLMVQVVVLQCIIWYT
+LML------------------FMFEYRGAKLLISEQFP-DTAGSIVSIHVDSDIMSLDGR
+Q-PLETEAAIKEDGKLHVTVRKSNASRSDIFS-----RRSQGLSSTTPRPSNLTNAEIYS
+LQSSRNPTPRGSSFNHTDFY---------------SMMA--AGRNSNFGASDVY------
+-------GLSASRGPTPRPSNFEEEHGGSNKPRFHHYHAPGGATHYPAPNPGMFSPTTAA
+SKGVSANANNAAAAAAKKPNGQAQQKAED-------------GRDLHMFVWSSSASPVSD
+VFGGHDYGAHDLKDVRVAVSPGKVEGQRENQEDYNLERDDFSFGNRGLDRERNSHEGEKG
+GFD--GKPKAMPPTSVMTRLILIMVWRKLIRNPNTYSSLIGLIWSLV-SFRWNVKMP---
+---LIIAKSISILSDAGLGMAMFSL--------GL-------------------------
+---FMALQPRIIACGNSIATFS--------MAVRFLTGPAIMAAASIAVGIRGT--LLHI
+AIVQ------------AALPQGIVPFVFAKEYNVHPEILSTGVI----------------
+-FG-MLI-A-LPITL---------------------------------------------
+-------------------------------------------------------VYY
+>_seed_B8AIF2_ORYSI/9-590
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------HVMTAMVPLYVAMILA-
+YGSVKWWRIFTPDQCSGINRFVALFA-----------VPLLSFHFISTNNPYT-------
+---MNLRFIAADTLQKLMVLAMLTAWSHLSR---RGSLEWTITLFSLSTLPNTLVMGIPL
+LKGMYGE----------------------------------FSGSLMVQIVVLQCIIWYT
+LML------------------FMFEYRGARMLITEQFP-DTAANIASIVVDPDVVSLDGR
+RDAIETETEVKEDGRIHVTVRRSNASRSDIYS-----RRSMGFSSTTPRPSNLTNAEIYS
+LQSSRNPTPRGSSFNHTDFY---------------SMV----GRSSNFGAADA-------
+--------FGVRTGATPRPSNYEDDASKPKYPLPASNAAPMAGHYPAPNPAVSSAPKGAK
+KAATNGQAKGEDLHMFVWSS-------------------------------SASPVSDVF
+GGGAPDYNDAAAVKSPRKMDGAKDREDYVERDDFSFGNRGVMDRDAEAGDEKAAAAAGAD
+PSKAMAAPTAMPPTSVMTRLILIMVWRKLIRNPNTYSSLIGLIWSLV-CFRWNFEMP---
+---AIVLKSISILSDAGLGMAMFSL--------GL-------------------------
+---FMALQPHIIACGNKVATYA--------MAVRFLAGPAVMAAASFAVGLRGT--LLHV
+AIVQ------------AALPQGIVPFVFAKEYSVHPSILSTAVI----------------
+-FG-MLI-A-LPITL---------------------------------------------
+-------------------------------------------------------VYY
+>_seed_PIN6_ARATH/9-565
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------TVMCAMAPLYFAMFVA-
+YGSVKWCKIFTPAQCSGINRFVSVFA-----------VPVLSFHFISQNNPYK-------
+---MDTMFILADTLSKIFVFVLLSLWAVFFK---AGGLDWLITLFSIATLPNTLVMGIPL
+LQAMYGD----------------------------------YTQTLMVQLVVLQCIIWYT
+LLL------------------FLFELRAARLLIRAEFPGQAAGSIAKIQVDDDVISLDGM
+D-PLRTETETDVNGRIRLRIRRSVSSVPDSVMSSSLC--------LTPRASNLSNAEIFS
+VN----------TPNNRFFHGGGGSGTLQFYNGSNEIMF-CNGDLGGFGFTRPGLGASPR
+RLSGYASSDAYSLQPTPRASNFNELDVNGNGTPVWMKSPAAGRIYRQSSPKMMWESGQRH
+AAK---------------------------------------------------------
+---------DINGSVPEKEISFRDALKAAPQATAAGGGASMEEGAAGKDTTPVA-AIG-K
+-QE-------MPSAIVMMRLILTVVGRKLSRNPNTYSSLLGLVWSLI-SFKWNIPMP---
+---NIVDFSIKIISDAGLGMAMFSL--------GL-------------------------
+---FMALQPKMIPCGAKKATMG--------MLIRFISGPLFMAGASLLVGLRGS--RLHA
+AIVQ------------AALPQGIVPFVFAREYNLHPDLLSTLVI----------------
+-FG-MIV-S-LPVTI---------------------------------------------
+-------------------------------------------------------LYY
+>_seed_YFDV_ECOLI/4-307
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------FFIGDLLPIIVIMLLG-
+YFSGRR-ETFSEDQARAFNKLVLNYA-----------LPAALFVSITRANREM-------
+---IFADTRLTLVSLVVIVGCFFFSWFGCYK-FFKRTHAEAAVCALIAGSPTIGFLGFAV
+LDPIYGD----------------------SV---------STGLVVAIISIIVNAITIPI
+GLY------------------LLNPSSGADGKK---------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------NSNLSALISAAKEPVVWAPVLATILVLV-GVKIP-------
+---AAWDPTFNLIAKANSGVAVFAA--------GL-------------------------
+---TLAAHKFEFSAEIAYN-----------TFLKLILMPLALLLVGMACHLNSE--HLQM
+MVLA------------GALPPAFSGIIIASRFNVYTRTGTASLA----------------
+-VS-VLG-F-VVTAP---------------------------------------------
+-------------------------------------------------------LWI
+>_seed_YWKB_BACSU/5-315
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------DILILLAPIFFVIVLG-
+WFAGHF-GSYDAKSAKGVSTLVTKYA-----------LPAHFIAGILTTSRSE-------
+---FLSQVPLMISLIIGIVGFYIIILLVCRF-IFKYDLTNSSVFSLNSAQPTFAFMGIPV
+LGSLFGA----------------------------------NEVAIPIAVTGIVVNAILD
+PLA------------------IIIATVGESSKKNEESGD---------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+----------------SFWKMTGKSILHGLCEPLAAAPLISMILVLVFNFTLP-------
+---ELGVKMLDQLGSTTSGVALFAV--------GV-------------------------
+---TVGIRKIKLSMPAIG-----------IALLKVAVQPALMFLIALAIGLPAD-QTTKA
+ILL-------------VAFPGSAVAAMIATRFEKQEEETATAFV----------------
+-VS-AIL-S-LISLP---------------------------------------------
+-------------------------------------------------------III
+>_seed_P71425_KLEPN/4-313
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------VIIHALAPIFVIMLLG-
+FWAGKA-GMVDNKNVSLLNIFVMDFA-----------LPATLFSATVQTPWAG-------
+---IVAQSPLVLVLTGAMWITYAAIYFLATS-VFKRTPQDGAVLTLTVALPNYAALGLPI
+LGSVLGE---------------------------------GASTSLSVAVSIACGSVLMT
+PFC------------------LLILEREKARAAGENSG----------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+----------------STLAMLPVLMWRSVKKPIVWGPLLGVVLSAI-GIKMP-------
+---DLLLASIKPLGLAATAAALFLT--------GV-------------------------
+---ILSARKLQLNALIAAS-----------TIVKLLVQPFIAWGLVMLLGLHGS-IAITA
+ILM-------------IALAAGFFGVVFGNRFGVQSPDAEAVLL----------------
+-LS-SVL-C-ILSLP---------------------------------------------
+-------------------------------------------------------LFI
+>_seed_Q98L58_RHILO/3-308
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------PLTETVLFVFSLVALG-
+YLAGLT-GYLRPASGEGISDFAVSVA-----------MPLLLFQTMVKADFHG-------
+-----VAPWPLWGAYFTAVAITWAAGHLVTTRIFGRDARAGVVGGVSSAYSNVVLLGAPF
+ILGIFGP-----------------------S---------GFEVLSLLVSVHLPVMMMAS
+IVL------------------FEMFGRGGGEHV---------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+----------------HPLRVLRSFLRRLFINPLIIGILLGLAWRLS-GVPLP-------
+---SLVMRLVDALANTAGPVALFAM--------GL-------------------------
+---SLRRFGVSGNVRPALA----------LSALKLFLMPALVLAFVLLLGLPPL--TAKV
+AVVV------------AALPSGINSYLIAVQFNTGQALASNQMT----------------
+-IA-TAC-A-AVTTA---------------------------------------------
+-------------------------------------------------------FWL
+>_seed_O67397_AQUAE/2-289
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------FIYEKVFFILLIIAFA-
+YTLKRG-GIFKEEHALPFINYVIYFA-----------LPFTIFKNLRF---LE-------
+---IGKEVLGVVLIAWGAIFLSILFAFLFGK-FLKLEEKTLRAFLLVSSFGNTAFMGYPF
+LYALEGN----------------------------------EGLKYAILYDQLGSFLMVI
+TLG---------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+----------------LFLAIGKFDLKELILFPPFIALVLSFLLHGV-RFP---------
+---QFFEHSVEIISGSLIPVILFSL--------GL-------------------------
+---RLNFTDMKSDYRTLFSA----------LFIKMFLVPLLILVFLKIFGLTSL--PYRV
+ALIE------------SAMPPMVFAGVLALKYELDFRLAFSAIT----------------
+-LG-IVI-S-LFTVP---------------------------------------------
+-------------------------------------------------------VFR
+>_seed_Q97M34_CLOAB/2-296
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------YVFEQIVILFLIMGIG-
+YYAAKS-KIIDDDTTSHLSNFIVSIT-----------LPLMILTSFNVEYSRK-------
+---TVITIINLLVFSVAAFIISIVIGKII---SFKFAMDKRDILMFMSIFSNCGFIGFPV
+LKVVYGN----------------------------------KGVLYTSIFNLVYNVFIWT
+IGI------------------VIINDKREKIDY---------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+--------------------------KKILFNHNIIAVIVGVFLMLL-SIKIP-------
+---YVMSSAFNLIGSMTAPLSMIVI--------GS-------------------------
+---ILA--------GVDFNDIFKDWSLYYIAILRLIIIPLIIYFALKPFQINKI--VIGV
+IIIC------------EAMPGGTLCPILAKSCNRNFKYASKIVL----------------
+-IT-TIL-S-MMTIP---------------------------------------------
+-------------------------------------------------------FMT
+>_seed_YB8B_YEAST/13-413
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------LVFESVLQVVIIALAG-
+FWSASS-GLLPKQSQKIISLLNVDLF-----------TPCLIFSKLAKSLSMA-------
+---KIFEIAIIPIFFGLTTGISFISGKIMSR-ILDLDKDETNFVVANSVFGNSNSLPVSL
+TLSLAYTLPNLTW-D-----QIPNDNRDNVA---------SRGILYLLIFQQIGQMLRWS
+WGY------------------NKLMKWSGENTQHMPPSQVQSLLERTPNIDNEELVNEEQ
+EEQELLEEENNRMNSSFLSSSSIGDKIWQKSCTVFER-----------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+--------------------------IRANLNPPLYSMIFAVVVAAI-GPLQRELFMEDG
+FINNTFAEAVTQLGSVSIPLILVVL--------GS-------------------------
+---NLYPSA-----EVFPKTVHHSKLLIGSIIGRMILPSCFLLPIIAIAV------KYIN
+VSILDDPIFLVVGFLLTVSPPAIQLTQITQLNEFFEAEMADILF----------------
+-WG-YAV-L-SLPVS---------------------------------------------
+-------------------------------------------------------IIV
+>_seed_YDQ4_SCHPO/18-440
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------PIIESDLEVIVIALGG-
+YVLAKK-GFLPRDAQKVISSLNVYFF-----------TPCLVFEKVGNGLNLK-------
+---MLIDLSLLPVFYVIISAASILISFLLAK-LFRLTPRQRNFATACITFQNSNSLPLAL
+VSSLATTVKDLLW-D-----KIPDDTPDKVA---------SRGIMYLLIFSQLGQALRWS
+YGY------------------RILLSPNQPEDPLPIGNRSWSHSDVNEEEIQNLLASSAN
+VDGVQNSVQANEGSTVQTDSSAISKNDNVQVETSNEEVGGFGAASSKISK----------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+----------------------FIVLLLDFFSPPLYSLFIALFIAVV-PPLQRFFFEEGS
+FVEGSITSGIRMAGQVAVPMILVVL--------GA-------------------------
+---SLATDISKTEPTQEVRKNNDTRVIIVCLLGRMVVVPLALLPAFSLLS------YFSE
+ISTVDDPVFVVVIFLLVGSPTAIQLTQICQLNGVFERECAKVLW----------------
+-WS-YAV-F-TPPNS---------------------------------------------
+-------------------------------------------------------LLL
+>_seed_PILS4_ARATH/9-407
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------ASSKPVVETLLITSVGF
+YLALDTVNLLGHDARKHLNNIVFYVF-----------SPSLIGSRLADSVTYE-------
+---SLVKMWFMPVNVLLTFMIGSLLGWIVIV-ITKPPSQLRGLIISCCASGNLGTMPLII
+IPAICKE-------K-----GGPFGDSESCE---------KYGMGYVTLSMT--AFFISV
+YKHDTNWYVSGGNGLLMDLYINLMR------VLSNSPVETHTHSIESNYDDSCKVQLISS
+K------------------------------------------EEEKEEDNHQVGRWEEV
+KQ----------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+----------------RVVSLSKKVNLGSIFAPATIAAIIALVIGLI-TPLRNLIIGTVA
+PF-RVIQDSLTLLGDGAIPAMTLIL--------GG-------------------------
+---NLLKGMRRSEVRSSEMKNSCIIGV---LVARYILLPVSGVLLVRGAY-------KLD
+LVTS-EPLYQFVLLLQYAVPPAMNLGTKTQLFGAGESECSVIML----------------
+-WT-YSL-A-AVSLT---------------------------------------------
+-------------------------------------------------------VWP
+>_seed_PILS5_ARATH/9-388
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------VASMPVIQVLFMSLVGA
+FMASDRCKLFPVEARNSMNKVVFVLF-----------APALMFANLAQTVTLE-------
+---DIISWWFMPVNMGLTFLIGGLLGWLVVK-ILKPPPYLEGLIVATCSAGNMGNLPIIL
+VPAICDE-------D-----KSPFGNRSVCR---------TVGLSYASFSMALGGFYIWT
+YTF------------------RLIKGSAMKVQAIEESEKIAIKSSNSDLEADHKTHLLGA
+P-----------------------------------------EDKENKVVKEKTGFWRKG
+VD----------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+----------------FLHEI-----LEELLAPPTLGAIIGFIFGAV-RWLRNLIIGDDA
+PL-RIVQSTAKLLGDGTIPCMTIIL--------GG-------------------------
+---NLIQG-----LRSSAVKPMVVLGI---VCVRYIAMPIIGIGIVLTAA-------NLG
+FLPA-DPLFQYVLMLQFTLPPAMNIGTMTQLYNVAQDECSVLML----------------
+-WT-YLV-A-ILALT---------------------------------------------
+-------------------------------------------------------VWS
+>_seed_PILS2_ARATH/18-441
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------SGVVPLLKLICLTVIGL
+LLAHPKTQLVPRATFRLLSKLVFALF-----------LPCLIFTELGESITLD-------
+---NIVQWWFIPVNVLLSAVVGSLIGYLVVL-ICRPPPEFNRFTIVMTAFGNTGNLLLAI
+VSSVCHT--------------KTNPFGPNCN---------SRGVSYVSFAQWVAVILVYT
+VVY------------------HMMEPPLEYYEVVEEEG-VEIEEINVENHDASRPLLVEA
+EWPGIEDKETEHCKTPFIARVFNSISSFSQTSFPEVDLGGEYGGESSSPRSIQCLAEPRV
+MR----------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+----------------RIRVVAEQTPVKHILQPPTIASLLAIIIGSV-PQLKSVVFGYDA
+PL-SFITDSLNIMGSAMVPSVMLVL--------GG-------------------------
+---MLSEGPNESTLGLRTTIGI--------SVARLLVLPLVGIGIVMSAD-------KLG
+LISSADPMFKFVLLLQYSTPSAILLGAIASLRGYAVREASALLF----------------
+-WQ-HIF-A-LLSLT---------------------------------------------
+-------------------------------------------------------FYI
+>_seed_PILS6_ARATH/30-423
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------IAVMPIAKVFTMCFLGL
+LMASKYVNILPPSGRKLLNGLVFSLL-----------LPCLIFSQLGQAVTLQ-------
+---KMLQWWFIPVNVVLGTISGSIIGFIVAS-IVRPPYPYFKFTIIQIGVGNIGNVPLVL
+LAALCRD-------T-----SNPFGDSEKCS---------IDGTAYISFGQWVGAIILYT
+YVY------------------QMFAPPPEGFDAEEENLALKTLPVDAAPEQVPLLTQNFP
+KDFSPTQDL--------------------------------LPVQSTEPRGRGVSRKGKI
+AQ----------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+----------------IFVFLYEKLKLKQIVQPAIVASILAMILGAI-PFTKKLIFTNGA
+PL-FFFTDSCMILGDAMIPCILLAL--------GG-------------------------
+---NLINGPGSSKLGFKTTAAI--------IIGRLVLVPPVGLGIVTVAD-------KLG
+FLPADDKMFRFVLLLQHTMPTSVLSGAVANLRGCG-RESAAVLF----------------
+-WV-HIF-A-IFSMA---------------------------------------------
+-------------------------------------------------------GWM
+>_seed_PIN4_ARATH/9-611
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------TVLTAVVPLYVAMILA-
+YGSVQWWKIFSPDQCSGINRFVAIFA-----------VPLLSFHFISTNDPYA-------
+---MNFRFVAADTLQKIIMLVLLALWANLTK---NGSLEWMITIFSLSTLPNTLVMGIPL
+LIAMYGT----------------------------------YAGSLMVQVVVLQCIIWYT
+LLL------------------FLFEYRGAKLLIMEQFP-ETGASIVSFKVESDVVSLDGH
+D-FLETDAEIGNDGKLHVTVRKSNASRRSLMM--------------TPRPSNLTGAEIYS
+LS----STPRGSNFNHSDFY---------------SVMGFPGGRLSNFGPADLY------
+-------SVQSSRGPTPRPSNFEENNAVKYGFYNNTNSSVPAAGSYPAPNPEFSTGTGVS
+TKPNKIPKENQQQLQEKDSKASHDAKELHMFVWSSSASPVSDVFGGGAGDNVATEQSEQG
+AKEIRMVVSDQPRKSNARGGGDDIGGLDSGEGEREIEKATAGLNKMGSNSTAELEAAG-G
+-DGGGNNGTHMPPTSVMTRLILIMVWRKLIRNPNTYSSLIGLIWALV-AYRWHVAMP---
+---KILQQSISILSDAGLGMAMFSL--------GL-------------------------
+---FMALQPKIIACGNSVATFA--------MAVRFITGPAIMAVAGIAIGLHGD--LLRI
+AIVQ------------AALPQGIVPFVFAKEYNVHPTILSTGVI----------------
+-FG-MLI-A-LPITL---------------------------------------------
+-------------------------------------------------------VYY
+>_seed_PIN7_ARATH/9-614
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------TVLTAVIPLYVAMILA-
+YGSVRWWKIFSPDQCSGINRFVAIFA-----------VPLLSFHFISSNNPYA-------
+---MNLRFIAADTLQKLIMLTLLIIWANFTR---SGSLEWSITIFSLSTLPNTLVMGIPL
+LIAMYGE----------------------------------YSGSLMVQIVVLQCIIWYT
+LLL------------------FLFEYRGAKILIMEQFP-ETGASIVSFKVESDVVSLDGH
+D-FLETDAQIGDDGKLHVTVRKSNASRRSFYG--------GGGTNMTPRPSNLTGAEIYS
+L----NTTPRGSNFNHSDFY---------------SMMGFPGGRLSNFGPADMY------
+-------SVQSSRGPTPRPSNFEESCAMASSPRFGYYPGGAPGSYPAPNPEFSTGNKTGS
+KAPKENHHHVGKSNSNDAKELHMFVWGSNGSPV-----SDRAGLQVDNGANEQVGKSDQG
+GAKEIRMLISDHTQNGENKAGPMNGDYGGEEESERVKEVPNGLHKLRCNSTAELNPKEAI
+ETGETVPVKHMPPASVMTRLILIMVWRKLIRNPNTYSSLIGLIWALV-AFRWDVAMP---
+---KIIQQSISILSDAGLGMAMFSL--------GL-------------------------
+---FMALQPKLIACGNSTATFA--------MAVRFFTGPAVMAVAAMAIGLRGD--LLRV
+AIVQ------------AALPQGIVPFVFAKEYNVHPAILSTGVI----------------
+-FG-MLI-A-LPITL---------------------------------------------
+-------------------------------------------------------VYY
+>_seed_PINI_ARATH/9-617
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------HVMTAMVPLYVAMILA-
+YGSVKWWKIFTPDQCSGINRFVALFA-----------VPLLSFHFIAANNPYA-------
+---MNLRFLAADSLQKVIVLSLLFLWCKLSR---NGSLDWTITLFSLSTLPNTLVMGIPL
+LKGMYGN----------------------------------FSGDLMVQIVVLQCIIWYT
+LML------------------FLFEYRGAKLLISEQFP-DTAGSIVSIHVDSDIMSLDGR
+Q-PLETEAEIKEDGKLHVTVRRSNASRSDIYS-----RRSQGL-SATPRPSNLTNAEIYS
+LQSSRNPTPRGSSFNHTDFY---------------SMMASGGGRNSNFGPGEA-------
+--------VFGSKGPTPRPSNYEEDGGPAKPTAAGTAAGAGRFHYQSGGSGGGGGAHYPA
+PNPGMFSPNTGGGGGTAAKGNAPVVGGKRQDGN------GRDLHMFVWSSSASPVSDVFG
+GGGGNHHADYSTATNDHQKDVKISVPQGNSNDNQYVEREEFSFGNKDDDSKVLATDGGNN
+ISNKTTQAKVMPPTSVMTRLILIMVWRKLIRNPNSYSSLFGITWSLI-SFKWNIEMP---
+---ALIAKSISILSDAGLGMAMFSL--------GL-------------------------
+---FMALNPRIIACGNRRAAFA--------AAMRFVVGPAVMLVASYAVGLRGV--LLHV
+AIIQ------------AALPQGIVPFVFAKEYNVHPDILSTAVI----------------
+-FG-MLI-A-LPITL---------------------------------------------
+-------------------------------------------------------LYY
+>_seed_Q9FVF6_POPPZ/9-609
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------HVMTAMVPLYVAMILA-
+YGSVKWWKIFTPDQCSGINRFVALFA-----------VPLLSFHFISTNDPYN-------
+---MNLRFITADSLQKVIVLVVLALWTKLSK---RGCLEWTITLFSLSTLPNTLVMGIPL
+LKGMYGD----------------------------------YSGSLMVQVVVLQCIIWYT
+LML------------------FMFEYRGAKLLISEQFP-DTAGSIVSIHVDSDIMSLDGR
+Q-PLETEAAIKEDGKLHVTVRKSNASRSDIFS-----RRSQGLSSTTPRPSNLTNAEIYS
+LQSSRNPTPRGSSFNHTDFY---------------SMMA--AGRNSNFGASDVY------
+-------GLSASRGPTPRPSNFEEEHGGSNKPRFHHYHAPGGATHYPAPNPGMFSPTTAA
+SKGVSANANNAAAAAAKKPNGQAQQKAED-------------GRDLHMFVWSSSASPVSD
+VFGGHDYGAHDLKDVRVAVSPGKVEGQRENQEDYNLERDDFSFGNRGLDRERNSHEGEKG
+GFD--GKPKAMPPTSVMTRLILIMVWRKLIRNPNTYSSLIGLIWSLV-SFRWNVKMP---
+---LIIAKSISILSDAGLGMAMFSL--------GL-------------------------
+---FMALQPRIIACGNSIATFS--------MAVRFLTGPAIMAAASIAVGIRGT--LLHI
+AIVQ------------AALPQGIVPFVFAKEYNVHPEILSTGVI----------------
+-FG-MLI-A-LPITL---------------------------------------------
+-------------------------------------------------------VYY
+>_seed_B8AIF2_ORYSI/9-590
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------HVMTAMVPLYVAMILA-
+YGSVKWWRIFTPDQCSGINRFVALFA-----------VPLLSFHFISTNNPYT-------
+---MNLRFIAADTLQKLMVLAMLTAWSHLSR---RGSLEWTITLFSLSTLPNTLVMGIPL
+LKGMYGE----------------------------------FSGSLMVQIVVLQCIIWYT
+LML------------------FMFEYRGARMLITEQFP-DTAANIASIVVDPDVVSLDGR
+RDAIETETEVKEDGRIHVTVRRSNASRSDIYS-----RRSMGFSSTTPRPSNLTNAEIYS
+LQSSRNPTPRGSSFNHTDFY---------------SMV----GRSSNFGAADA-------
+--------FGVRTGATPRPSNYEDDASKPKYPLPASNAAPMAGHYPAPNPAVSSAPKGAK
+KAATNGQAKGEDLHMFVWSS-------------------------------SASPVSDVF
+GGGAPDYNDAAAVKSPRKMDGAKDREDYVERDDFSFGNRGVMDRDAEAGDEKAAAAAGAD
+PSKAMAAPTAMPPTSVMTRLILIMVWRKLIRNPNTYSSLIGLIWSLV-CFRWNFEMP---
+---AIVLKSISILSDAGLGMAMFSL--------GL-------------------------
+---FMALQPHIIACGNKVATYA--------MAVRFLAGPAVMAAASFAVGLRGT--LLHV
+AIVQ------------AALPQGIVPFVFAKEYSVHPSILSTAVI----------------
+-FG-MLI-A-LPITL---------------------------------------------
+-------------------------------------------------------VYY
+>_seed_PIN6_ARATH/9-565
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------TVMCAMAPLYFAMFVA-
+YGSVKWCKIFTPAQCSGINRFVSVFA-----------VPVLSFHFISQNNPYK-------
+---MDTMFILADTLSKIFVFVLLSLWAVFFK---AGGLDWLITLFSIATLPNTLVMGIPL
+LQAMYGD----------------------------------YTQTLMVQLVVLQCIIWYT
+LLL------------------FLFELRAARLLIRAEFPGQAAGSIAKIQVDDDVISLDGM
+D-PLRTETETDVNGRIRLRIRRSVSSVPDSVMSSSLC--------LTPRASNLSNAEIFS
+VN----------TPNNRFFHGGGGSGTLQFYNGSNEIMF-CNGDLGGFGFTRPGLGASPR
+RLSGYASSDAYSLQPTPRASNFNELDVNGNGTPVWMKSPAAGRIYRQSSPKMMWESGQRH
+AAK---------------------------------------------------------
+---------DINGSVPEKEISFRDALKAAPQATAAGGGASMEEGAAGKDTTPVA-AIG-K
+-QE-------MPSAIVMMRLILTVVGRKLSRNPNTYSSLLGLVWSLI-SFKWNIPMP---
+---NIVDFSIKIISDAGLGMAMFSL--------GL-------------------------
+---FMALQPKMIPCGAKKATMG--------MLIRFISGPLFMAGASLLVGLRGS--RLHA
+AIVQ------------AALPQGIVPFVFAREYNLHPDLLSTLVI----------------
+-FG-MIV-S-LPVTI---------------------------------------------
+-------------------------------------------------------LYY
+>_seed_YFDV_ECOLI/4-307
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------FFIGDLLPIIVIMLLG-
+YFSGRR-ETFSEDQARAFNKLVLNYA-----------LPAALFVSITRANREM-------
+---IFADTRLTLVSLVVIVGCFFFSWFGCYK-FFKRTHAEAAVCALIAGSPTIGFLGFAV
+LDPIYGD----------------------SV---------STGLVVAIISIIVNAITIPI
+GLY------------------LLNPSSGADGKK---------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------NSNLSALISAAKEPVVWAPVLATILVLV-GVKIP-------
+---AAWDPTFNLIAKANSGVAVFAA--------GL-------------------------
+---TLAAHKFEFSAEIAYN-----------TFLKLILMPLALLLVGMACHLNSE--HLQM
+MVLA------------GALPPAFSGIIIASRFNVYTRTGTASLA----------------
+-VS-VLG-F-VVTAP---------------------------------------------
+-------------------------------------------------------LWI
+>_seed_YWKB_BACSU/5-315
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------DILILLAPIFFVIVLG-
+WFAGHF-GSYDAKSAKGVSTLVTKYA-----------LPAHFIAGILTTSRSE-------
+---FLSQVPLMISLIIGIVGFYIIILLVCRF-IFKYDLTNSSVFSLNSAQPTFAFMGIPV
+LGSLFGA----------------------------------NEVAIPIAVTGIVVNAILD
+PLA------------------IIIATVGESSKKNEESGD---------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+----------------SFWKMTGKSILHGLCEPLAAAPLISMILVLVFNFTLP-------
+---ELGVKMLDQLGSTTSGVALFAV--------GV-------------------------
+---TVGIRKIKLSMPAIG-----------IALLKVAVQPALMFLIALAIGLPAD-QTTKA
+ILL-------------VAFPGSAVAAMIATRFEKQEEETATAFV----------------
+-VS-AIL-S-LISLP---------------------------------------------
+-------------------------------------------------------III
+>_seed_P71425_KLEPN/4-313
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------VIIHALAPIFVIMLLG-
+FWAGKA-GMVDNKNVSLLNIFVMDFA-----------LPATLFSATVQTPWAG-------
+---IVAQSPLVLVLTGAMWITYAAIYFLATS-VFKRTPQDGAVLTLTVALPNYAALGLPI
+LGSVLGE---------------------------------GASTSLSVAVSIACGSVLMT
+PFC------------------LLILEREKARAAGENSG----------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+----------------STLAMLPVLMWRSVKKPIVWGPLLGVVLSAI-GIKMP-------
+---DLLLASIKPLGLAATAAALFLT--------GV-------------------------
+---ILSARKLQLNALIAAS-----------TIVKLLVQPFIAWGLVMLLGLHGS-IAITA
+ILM-------------IALAAGFFGVVFGNRFGVQSPDAEAVLL----------------
+-LS-SVL-C-ILSLP---------------------------------------------
+-------------------------------------------------------LFI
+>_seed_Q98L58_RHILO/3-308
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------PLTETVLFVFSLVALG-
+YLAGLT-GYLRPASGEGISDFAVSVA-----------MPLLLFQTMVKADFHG-------
+-----VAPWPLWGAYFTAVAITWAAGHLVTTRIFGRDARAGVVGGVSSAYSNVVLLGAPF
+ILGIFGP-----------------------S---------GFEVLSLLVSVHLPVMMMAS
+IVL------------------FEMFGRGGGEHV---------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+----------------HPLRVLRSFLRRLFINPLIIGILLGLAWRLS-GVPLP-------
+---SLVMRLVDALANTAGPVALFAM--------GL-------------------------
+---SLRRFGVSGNVRPALA----------LSALKLFLMPALVLAFVLLLGLPPL--TAKV
+AVVV------------AALPSGINSYLIAVQFNTGQALASNQMT----------------
+-IA-TAC-A-AVTTA---------------------------------------------
+-------------------------------------------------------FWL
+>_seed_O67397_AQUAE/2-289
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------FIYEKVFFILLIIAFA-
+YTLKRG-GIFKEEHALPFINYVIYFA-----------LPFTIFKNLRF---LE-------
+---IGKEVLGVVLIAWGAIFLSILFAFLFGK-FLKLEEKTLRAFLLVSSFGNTAFMGYPF
+LYALEGN----------------------------------EGLKYAILYDQLGSFLMVI
+TLG---------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+----------------LFLAIGKFDLKELILFPPFIALVLSFLLHGV-RFP---------
+---QFFEHSVEIISGSLIPVILFSL--------GL-------------------------
+---RLNFTDMKSDYRTLFSA----------LFIKMFLVPLLILVFLKIFGLTSL--PYRV
+ALIE------------SAMPPMVFAGVLALKYELDFRLAFSAIT----------------
+-LG-IVI-S-LFTVP---------------------------------------------
+-------------------------------------------------------VFR
+>_seed_Q97M34_CLOAB/2-296
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------YVFEQIVILFLIMGIG-
+YYAAKS-KIIDDDTTSHLSNFIVSIT-----------LPLMILTSFNVEYSRK-------
+---TVITIINLLVFSVAAFIISIVIGKII---SFKFAMDKRDILMFMSIFSNCGFIGFPV
+LKVVYGN----------------------------------KGVLYTSIFNLVYNVFIWT
+IGI------------------VIINDKREKIDY---------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+--------------------------KKILFNHNIIAVIVGVFLMLL-SIKIP-------
+---YVMSSAFNLIGSMTAPLSMIVI--------GS-------------------------
+---ILA--------GVDFNDIFKDWSLYYIAILRLIIIPLIIYFALKPFQINKI--VIGV
+IIIC------------EAMPGGTLCPILAKSCNRNFKYASKIVL----------------
+-IT-TIL-S-MMTIP---------------------------------------------
+-------------------------------------------------------FMT
+>_seed_YB8B_YEAST/13-413
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------LVFESVLQVVIIALAG-
+FWSASS-GLLPKQSQKIISLLNVDLF-----------TPCLIFSKLAKSLSMA-------
+---KIFEIAIIPIFFGLTTGISFISGKIMSR-ILDLDKDETNFVVANSVFGNSNSLPVSL
+TLSLAYTLPNLTW-D-----QIPNDNRDNVA---------SRGILYLLIFQQIGQMLRWS
+WGY------------------NKLMKWSGENTQHMPPSQVQSLLERTPNIDNEELVNEEQ
+EEQELLEEENNRMNSSFLSSSSIGDKIWQKSCTVFER-----------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+--------------------------IRANLNPPLYSMIFAVVVAAI-GPLQRELFMEDG
+FINNTFAEAVTQLGSVSIPLILVVL--------GS-------------------------
+---NLYPSA-----EVFPKTVHHSKLLIGSIIGRMILPSCFLLPIIAIAV------KYIN
+VSILDDPIFLVVGFLLTVSPPAIQLTQITQLNEFFEAEMADILF----------------
+-WG-YAV-L-SLPVS---------------------------------------------
+-------------------------------------------------------IIV
+>_seed_YDQ4_SCHPO/18-440
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------PIIESDLEVIVIALGG-
+YVLAKK-GFLPRDAQKVISSLNVYFF-----------TPCLVFEKVGNGLNLK-------
+---MLIDLSLLPVFYVIISAASILISFLLAK-LFRLTPRQRNFATACITFQNSNSLPLAL
+VSSLATTVKDLLW-D-----KIPDDTPDKVA---------SRGIMYLLIFSQLGQALRWS
+YGY------------------RILLSPNQPEDPLPIGNRSWSHSDVNEEEIQNLLASSAN
+VDGVQNSVQANEGSTVQTDSSAISKNDNVQVETSNEEVGGFGAASSKISK----------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+----------------------FIVLLLDFFSPPLYSLFIALFIAVV-PPLQRFFFEEGS
+FVEGSITSGIRMAGQVAVPMILVVL--------GA-------------------------
+---SLATDISKTEPTQEVRKNNDTRVIIVCLLGRMVVVPLALLPAFSLLS------YFSE
+ISTVDDPVFVVVIFLLVGSPTAIQLTQICQLNGVFERECAKVLW----------------
+-WS-YAV-F-TPPNS---------------------------------------------
+-------------------------------------------------------LLL
+>_seed_PILS4_ARATH/9-407
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------ASSKPVVETLLITSVGF
+YLALDTVNLLGHDARKHLNNIVFYVF-----------SPSLIGSRLADSVTYE-------
+---SLVKMWFMPVNVLLTFMIGSLLGWIVIV-ITKPPSQLRGLIISCCASGNLGTMPLII
+IPAICKE-------K-----GGPFGDSESCE---------KYGMGYVTLSMT--AFFISV
+YKHDTNWYVSGGNGLLMDLYINLMR------VLSNSPVETHTHSIESNYDDSCKVQLISS
+K------------------------------------------EEEKEEDNHQVGRWEEV
+KQ----------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+----------------RVVSLSKKVNLGSIFAPATIAAIIALVIGLI-TPLRNLIIGTVA
+PF-RVIQDSLTLLGDGAIPAMTLIL--------GG-------------------------
+---NLLKGMRRSEVRSSEMKNSCIIGV---LVARYILLPVSGVLLVRGAY-------KLD
+LVTS-EPLYQFVLLLQYAVPPAMNLGTKTQLFGAGESECSVIML----------------
+-WT-YSL-A-AVSLT---------------------------------------------
+-------------------------------------------------------VWP
+>_seed_PILS5_ARATH/9-388
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------VASMPVIQVLFMSLVGA
+FMASDRCKLFPVEARNSMNKVVFVLF-----------APALMFANLAQTVTLE-------
+---DIISWWFMPVNMGLTFLIGGLLGWLVVK-ILKPPPYLEGLIVATCSAGNMGNLPIIL
+VPAICDE-------D-----KSPFGNRSVCR---------TVGLSYASFSMALGGFYIWT
+YTF------------------RLIKGSAMKVQAIEESEKIAIKSSNSDLEADHKTHLLGA
+P-----------------------------------------EDKENKVVKEKTGFWRKG
+VD----------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+----------------FLHEI-----LEELLAPPTLGAIIGFIFGAV-RWLRNLIIGDDA
+PL-RIVQSTAKLLGDGTIPCMTIIL--------GG-------------------------
+---NLIQG-----LRSSAVKPMVVLGI---VCVRYIAMPIIGIGIVLTAA-------NLG
+FLPA-DPLFQYVLMLQFTLPPAMNIGTMTQLYNVAQDECSVLML----------------
+-WT-YLV-A-ILALT---------------------------------------------
+-------------------------------------------------------VWS
+>_seed_PILS2_ARATH/18-441
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------SGVVPLLKLICLTVIGL
+LLAHPKTQLVPRATFRLLSKLVFALF-----------LPCLIFTELGESITLD-------
+---NIVQWWFIPVNVLLSAVVGSLIGYLVVL-ICRPPPEFNRFTIVMTAFGNTGNLLLAI
+VSSVCHT--------------KTNPFGPNCN---------SRGVSYVSFAQWVAVILVYT
+VVY------------------HMMEPPLEYYEVVEEEG-VEIEEINVENHDASRPLLVEA
+EWPGIEDKETEHCKTPFIARVFNSISSFSQTSFPEVDLGGEYGGESSSPRSIQCLAEPRV
+MR----------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+----------------RIRVVAEQTPVKHILQPPTIASLLAIIIGSV-PQLKSVVFGYDA
+PL-SFITDSLNIMGSAMVPSVMLVL--------GG-------------------------
+---MLSEGPNESTLGLRTTIGI--------SVARLLVLPLVGIGIVMSAD-------KLG
+LISSADPMFKFVLLLQYSTPSAILLGAIASLRGYAVREASALLF----------------
+-WQ-HIF-A-LLSLT---------------------------------------------
+-------------------------------------------------------FYI
+>_seed_PILS6_ARATH/30-423
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------IAVMPIAKVFTMCFLGL
+LMASKYVNILPPSGRKLLNGLVFSLL-----------LPCLIFSQLGQAVTLQ-------
+---KMLQWWFIPVNVVLGTISGSIIGFIVAS-IVRPPYPYFKFTIIQIGVGNIGNVPLVL
+LAALCRD-------T-----SNPFGDSEKCS---------IDGTAYISFGQWVGAIILYT
+YVY------------------QMFAPPPEGFDAEEENLALKTLPVDAAPEQVPLLTQNFP
+KDFSPTQDL--------------------------------LPVQSTEPRGRGVSRKGKI
+AQ----------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+----------------IFVFLYEKLKLKQIVQPAIVASILAMILGAI-PFTKKLIFTNGA
+PL-FFFTDSCMILGDAMIPCILLAL--------GG-------------------------
+---NLINGPGSSKLGFKTTAAI--------IIGRLVLVPPVGLGIVTVAD-------KLG
+FLPADDKMFRFVLLLQHTMPTSVLSGAVANLRGCG-RESAAVLF----------------
+-WV-HIF-A-IFSMA---------------------------------------------
+-------------------------------------------------------GWM
+>_seed_PIN4_ARATH/9-611
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------TVLTAVVPLYVAMILA-
+YGSVQWWKIFSPDQCSGINRFVAIFA-----------VPLLSFHFISTNDPYA-------
+---MNFRFVAADTLQKIIMLVLLALWANLTK---NGSLEWMITIFSLSTLPNTLVMGIPL
+LIAMYGT----------------------------------YAGSLMVQVVVLQCIIWYT
+LLL------------------FLFEYRGAKLLIMEQFP-ETGASIVSFKVESDVVSLDGH
+D-FLETDAEIGNDGKLHVTVRKSNASRRSLMM--------------TPRPSNLTGAEIYS
+LS----STPRGSNFNHSDFY---------------SVMGFPGGRLSNFGPADLY------
+-------SVQSSRGPTPRPSNFEENNAVKYGFYNNTNSSVPAAGSYPAPNPEFSTGTGVS
+TKPNKIPKENQQQLQEKDSKASHDAKELHMFVWSSSASPVSDVFGGGAGDNVATEQSEQG
+AKEIRMVVSDQPRKSNARGGGDDIGGLDSGEGEREIEKATAGLNKMGSNSTAELEAAG-G
+-DGGGNNGTHMPPTSVMTRLILIMVWRKLIRNPNTYSSLIGLIWALV-AYRWHVAMP---
+---KILQQSISILSDAGLGMAMFSL--------GL-------------------------
+---FMALQPKIIACGNSVATFA--------MAVRFITGPAIMAVAGIAIGLHGD--LLRI
+AIVQ------------AALPQGIVPFVFAKEYNVHPTILSTGVI----------------
+-FG-MLI-A-LPITL---------------------------------------------
+-------------------------------------------------------VYY
+>_seed_PIN7_ARATH/9-614
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------------------TVLTAVIPLYVAMILA-
+YGSVRWWKIFSPDQCSGINRFVAIFA-----------VPLLSFHFISSNNPYA-------
+---MNLRFIAADTLQKLIMLTLLIIWANFTR---SGSLEWSITIFSLSTLPNTLVMGIPL
+LIAMYGE----------------------------------YSGSLMVQIVVLQCIIWYT
+LLL------------------FLFEYRGAKILIMEQFP-ETGASIVSFKVESDVVSLDGH
+D-FLETDAQIGDDGKLHVTVRKSNASRRSFYG--------GGGTNMTPRPSNLTGAEIYS
+L----NTTPRGSNFNHSDFY---------------SMMGFPGGRLSNFGPADMY------
+-------SVQSSRGPTPRPSNFEESCAMASSPRFGYYPGGAPGSYPAPNPEFSTGNKTGS
+KAPKENHHHVGKSNSNDAKELHMFVWGSNGSPV-----SDRAGLQVDNGANEQVGKSDQG
+GAKEIRMLISDHTQNGENKAGPMNGDYGGEEESERVKEVPNGLHKLRCNSTAELNPKEAI
+ETGETVPVKHMPPASVMTRLILIMVWRKLIRNPNTYSSLIGLIWALV-AFRWDVAMP---
+---KIIQQSISILSDAGLGMAMFSL--------GL-------------------------
+---FMALQPKLIACGNSTATFA--------MAVRFFTGPAVMAVAAMAIGLRGD--LLRV
+AIVQ------------AALPQGIVPFVFAKEYNVHPAILSTGVI----------------
+-FG-MLI-A-LPITL---------------------------------------------
+-------------------------------------------------------VYY
+>     1== M63632   1 Lampetra japonica rhodopsin <>[BBRC174,1125-1132'91]
+----------MN-------------------GTEGDNFYV---------------P----
+-------------------------FSNKTGLARSPYEYPQY------------------
+----------------YLAEPW-------------------KYSALAAYMFFLILVGFPV
+NFLTLFVTVQHKKLRTPLNYILLNLAMANLFMVLF-GFTVTMYTSMN-GYFV--FGPTMC
+SIEGFFATLGGEVALWSLVVLAIERYIVICKPMGNF-RFGNTHAIMGVAFTWIMALACAA
+P-PLVG------WSR-----YIPEGMQCSCGPDYYTLNPNFNNESYVVYMFVVHFLVPFV
+IIF--------------FCYGRLLCTVKEAAAAQQESA----------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---------STQKAEKEVTRMV----VLMVIGFLVCWVPYASVAFYIFTHQGS---DFGA
+TFMT--------LPAFFAKSSALYNPVIYILMNKQFRNCMITTL-----CC---GKNPLG
+DDE-SGA-S-TSK-TEVSSVS-TSPVSPA-------------------------------
+----------------------------------------------------------
+>     2== U22180   1 rat opsin <rod>[J.Mol.Neurosci.5(3),207-209'94]
+----------MN-------------------GTEGPNFYV---------------P----
+-------------------------FSNITGVVRSPFEQPQY------------------
+----------------YLAEPW-------------------QFSMLAAYMFLLIVLGFPI
+NFLTLYVTVQHKKLRTPLNYILLNLAVADLFMVFG-GFTTTLYTSLH-GYFV--FGPTGC
+NLEGFFATLGGEIGLWSLVVLAIERYVVVCKPMSNF-RFGENHAIMGVAFTWVMALACAA
+P-PLVG------WSR-----YIPEGMQCSCGIDYYTLKPEVNNESFVIYMFVVHFTIPMI
+VIF--------------FCYGQLVFTVKEAAAQQQESA----------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---------TTQKAEKEVTRMV----IIMVIFFLICWLPYASVAMYIFTHQGS---NFGP
+IFMT--------LPAFFAKTASIYNPIIYIMMNKQFRNCMLTSL-----CC---GKNPLG
+DDE-ASA-T-ASK-TETSQVA-PA------------------------------------
+----------------------------------------------------------
+>     3== M92038   1 chicken green sensitive cone opsin <retina>[PNAS89,5932-5936'9
+----------MN-------------------GTEGINFYV---------------P----
+-------------------------MSNKTGVVRSPFEYPQY------------------
+----------------YLAEPW-------------------KYRLVCCYIFFLISTGLPI
+NLLTLLVTFKHKKLRQPLNYILVNLAVADLFMACF-GFTVTFYTAWN-GYFV--FGPVGC
+AVEGFFATLGGQVALWSLVVLAIERYIVVCKPMGNF-RFSATHAMMGIAFTWVMAFSCAA
+P-PLFG------WSR-----YMPEGMQCSCGPDYYTHNPDYHNESYVLYMFVIHFIIPVV
+VIF--------------FSYGRLICKVREAAAQQQESA----------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---------TTQKAEKEVTRMV----ILMVLGFMLAWTPYAVVAFWIFTNKGA---DFTA
+TLMA--------VPAFFSKSSSLYNPIIYVLMNKQFRNCMITTI-----CC---GKNPFG
+DEDVSSTVS-QSK-TEVSSVS-SSQVSPA-------------------------------
+----------------------------------------------------------
+>     4=p A45229 opsin, green-sensitive (clone GFgr-1) - goldfish
+----------MN-------------------GTEGKNFYV---------------P----
+-------------------------MSNRTGLVRSPFEYPQY------------------
+----------------YLAEPW-------------------QFKILALYLFFLMSMGLPI
+NGLTLVVTAQHKKLRQPLNFILVNLAVAGTIMVCF-GFTVTFYTAIN-GYFV--LGPTGC
+AVEGFMATLGGEVALWSLVVLAIERYIVVCKPMGSF-KFSSSHAFAGIAFTWVMALACAA
+P-PLFG------WSR-----YIPEGMQCSCGPDYYTLNPDYNNESYVIYMFVCHFILPVA
+VIF--------------FTYGRLVCTVKAAAAQQQDSA----------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---------STQKAEREVTKMV----ILMVFGFLIAWTPYATVAAWIFFNKGA---DFSA
+KFMA--------IPAFFSKSSALYNPVIYVLLNKQFRNCMLTTI-----FC---GKNPLG
+DDE-SSTVS-TSK-TEVSSVS-PA------------------------------------
+----------------------------------------------------------
+>     5=p B45229 opsin, green-sensitive (clone GFgr-2) - goldfish
+----------MN-------------------GTEGNNFYV---------------P----
+-------------------------LSNRTGLVRSPFEYPQY------------------
+----------------YLAEPW-------------------QFKLLAVYMFFLICLGLPI
+NGLTLICTAQHKKLRQPLNFILVNLAVAGAIMVCF-GFTVTFYTAIN-GYFA--LGPTGC
+AVEGFMATLGGEVALWSLVVLAIERYIVVCKPMGSF-KFSSTHASAGIAFTWVMAMACAA
+P-PLVG------WSR-----YIPEGIQCSCGPDYYTLNPEYNNESYVLYMFICHFILPVT
+IIF--------------FTYGRLVCTVKAAAAQQQDSA----------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---------STQKAEREVTKMV----ILMVLGFLVAWTPYATVAAWIFFNKGA---AFSA
+QFMA--------IPAFFSKTSALYNPVIYVLLNKQFRSCMLTTL-----FC---GKNPLG
+DEE-SSTVS-TSK-TEVSSVS-PA------------------------------------
+----------------------------------------------------------
+>     6== L11864   1 Carassius auratus blue cone opsin <retina>[Biochemistry32,208-
+----------MKQVPE-----------------FHEDFYI---------------P----
+-----------------------IPLDINNLSAYSPFLVPQD------------------
+----------------HLGNQG-------------------IFMAMSVFMFFIFIGGASI
+NILTILCTIQFKKLRSHLNYILVNLSIANLFVAIF-GSPLSFYSFFN-RYFI--FGATAC
+KIEGFLATLGGMVGLWSLAVVAFERWLVICKPLGNF-TFKTPHAIAGCILPWISALAASL
+P-PLFG------WSR-----YIPEGLQCSCGPDWYTTNNKYNNESYVMFLFCFCFAVPFG
+TIV--------------FCYGQLLITLKLAAKAQADSA----------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---------STQKAEREVTKMV----VVMVLGFLVCWAPYASFSLWIVSHRGE---EFDL
+RMAT--------IPSCLSKASTVYNPVIYVLMNKQFRSCMMKMV-----C----GKN-IE
+EDE-AST-S-SQV-TQVSSVA-PEK-----------------------------------
+----------------------------------------------------------
+>     7== M13299   1 human BCP <>[Science232(4747),193-202'86]
+----------MRKMS-------------------EEEFYL--------------------
+---------------------------FKNISSVGPWDGPQY------------------
+----------------HIAPVW-------------------AFYLQAAFMGTVFLIGFPL
+NAMVLVATLRYKKLRQPLNYILVNVSFGGFLLCIF-SVFPVFVASCN-GYFV--FGRHVC
+ALEGFLGTVAGLVTGWSLAFLAFERYIVICKPFGNF-RFSSKHALTVVLATWTIGIGVSI
+P-PFFG------WSR-----FIPEGLQCSCGPDWYTVGTKYRSESYTWFLFIFCFIVPLS
+LIC--------------FSYTQLLRALKAVAAQQQESA----------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---------TTQKAEREVSRMV----VVMVGSFCVCYVPYAAFAMYMVNNRNH---GLDL
+RLVT--------IPSFFSKSACIYNPIIYCFMNKQFQACIMKMV-----C----GKA-MT
+DES-DTC-S-SQK-TEVSTVS-STQVGPN-------------------------------
+----------------------------------------------------------
+>     8=opsin, greensensitive  human (fragment) S07060
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+----------------------------DLAETVI-ASTISIVNQVS-GYFV--LGHPMC
+VLEGYTVSLCGITGLWSLAIISWERWLVVCKPFGNV-RFDAKLAIVGIAFSWIWAAVWTA
+P-PIFG------WSR-----YWPHGLKTSCGPDVFSGSSYPGVQSYMIVLMVTCCITPLS
+IIV--------------LCYLQVWLAIRAVAKQQKESE----------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---------STQKAEKEVTRMV----VVMVLAFC--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+----------------------------------------------------------
+>     9== K03494   1 human GCP <>[Science232(4747),193-202'86]
+----------MAQQWSLQRLAGRHPQDSYEDSTQSSIFTY--------------------
+---------------------------TNSNSTRGPFEGPNY------------------
+----------------HIAPRW-------------------VYHLTSVWMIFVVIASVFT
+NGLVLAATMKFKKLRHPLNWILVNLAVADLAETVI-ASTISVVNQVY-GYFV--LGHPMC
+VLEGYTVSLCGITGLWSLAIISWERWMVVCKPFGNV-RFDAKLAIVGIAFSWIWAAVWTA
+P-PIFG------WSR-----YWPHGLKTSCGPDVFSGSSYPGVQSYMIVLMVTCCITPLS
+IIV--------------LCYLQVWLAIRAVAKQQKESE----------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---------STQKAEKEVTRMV----VVMVLAFCFCWGPYAFFACFAAANPGY---PFHP
+LMAA--------LPAFFAKSATIYNPVIYVFMNRQFRNCILQLF----------GKK-VD
+DGS-ELS-S-ASK-TEVSSVS---SVSPA-------------------------------
+----------------------------------------------------------
+>    10== Z68193   1 human Red Opsin <>[]
+----------MAQQWSLQRLAGRHPQDSYEDSTQSSIFTY--------------------
+---------------------------TNSNSTRGPFEGPNY------------------
+----------------HIAPRW-------------------VYHLTSVWMIFVVTASVFT
+NGLVLAATMKFKKLRHPLNWILVNLAVADLAETVI-ASTISIVNQVS-GYFV--LGHPMC
+VLEGYTVSLCGITGLWSLAIISWERWLVVCKPFGNV-RFDAKLAIVGIAFSWIWSAVWTA
+P-PIFG------WSR-----YWPHGLKTSCGPDVFSGSSYPGVQSYMIVLMVTCCIIPLA
+IIM--------------LCYLQVWLAIRAVAKQQKESE----------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---------STQKAEKEVTRMV----VVMIFAYCVCWGPYTFFACFAAANPGY---AFHP
+LMAA--------LPAYFAKSATIYNPVIYVFMNRQFRNCILQLF----------GKK-VD
+DGS-ELS-S-ASK-TEVSSVS---SVSPA-------------------------------
+----------------------------------------------------------
+>    11== M92036   1 Gecko gecko P521 <retina>[PNAS89,6841-6845'92]
+----------MTEAWNVAVFAARRSRDD-DDTTRGSVFTY--------------------
+---------------------------TNTNNTRGPFEGPNY------------------
+----------------HIAPRW-------------------VYNLVSFFMIIVVIASCFT
+NGLVLVATAKFKKLRHPLNWILVNLAFVDLVETLV-ASTISVFNQIF-GYFI--LGHPLC
+VIEGYVVSSCGITGLWSLAIISWERWFVVCKPFGNI-KFDSKLAIIGIVFSWVWAWGWSA
+P-PIFG------WSR-----YWPHGLKTSCGPDVFSGSVELGCQSFMLTLMITCCFLPLF
+III--------------VCYLQVWMAIRAVAAQQKESE----------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---------STQKAEREVSRMV----VVMIVAFCICWGPYASFVSFAAANPGY---AFHP
+LAAA--------LPAYFAKSATIYNPVIYVFMNRQFRNCIMQLF----------GKK-VD
+DGS-EAS-T-TSR-TEVSSVS-NSSVAPA-------------------------------
+----------------------------------------------------------
+>    12== M62903   1 chicken visual pigment <>[BBRC173,1212-1217'90]
+----------MA-AWE-AAFAARRRHEE-EDTTRDSVFTY--------------------
+---------------------------TNSNNTRGPFEGPNY------------------
+----------------HIAPRW-------------------VYNLTSVWMIFVVAASVFT
+NGLVLVATWKFKKLRHPLNWILVNLAVADLGETVI-ASTISVINQIS-GYFI--LGHPMC
+VVEGYTVSACGITALWSLAIISWERWFVVCKPFGNI-KFDGKLAVAGILFSWLWSCAWTA
+P-PIFG------WSR-----YWPHGLKTSCGPDVFSGSSDPGVQSYMVVLMVTCCFFPLA
+III--------------LCYLQVWLAIRAVAAQQKESE----------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---------STQKAEKEVSRMV----VVMIVAYCFCWGPYTFFACFAAANPGY---AFHP
+LAAA--------LPAYFAKSATIYNPIIYVFMNRQFRNCILQLF----------GKK-VD
+DGS-EVS-T--SR-TEVSSVS-NSSVSPA-------------------------------
+----------------------------------------------------------
+>    13== S75720   1 chicken P-opsin <>[Science267(5203),1502-1506'95]
+---------------------------------MSSNSSQ--------------------
+---------------------------APPNGTPGPFDGPQW------------------
+---------------PYQAPQS-------------------TYVGVAVLMGTVVACASVV
+NGLVIVVSICYKKLRSPLNYILVNLAVADLLVTLC-GSSVSLSNNIN-GFFV--FGRRMC
+ELEGFMVSLTGIVGLWSLAILALERYVVVCKPLGDF-QFQRRHAVSGCAFTWGWALLWSA
+P-PLLG------WSS-----YVPEGLRTSCGPNWYTGGSN--NNSYILSLFVTCFVLPLS
+LIL--------------FSYTNLLLTLRAAAAQQKEAD----------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---------TTQRAEREVTRMV----IVMVMAFLLCWLPYSTFALVVATHKGI---IIQP
+VLAS--------LPSYFSKTATVYNPIIYVFMNKQFQSCLLEML-----CCGYQPQR-TG
+KAS-PGT-P-GPH-ADVTAAGLRNKVMPAH------------------------------
+-----------P---------------------------------------------V
+>    14== M17718   1 D.melanogaster Rh3 <>[J.Neurosci.7,1550-1557'87]
+----------MESGN------------------VSSSLF---------------------
+-------------------------------GNVSTALRPEA------------RLSA--
+-ETRLLGWNVPPEELRHIPEHWLTYP----------EPPESMNYLLGTLYIFFTLMSMLG
+NGLVIWVFSAAKSLRTPSNILVINLAFCDFMMMVK--TPIFIYNSFH-QGYA--LGHLGC
+QIFGIIGSYTGIAAGATNAFIAYDRFNVITRPMEG--KMTHGKAIAMIIFIYMYATPWVV
+A-CYTET-----WGR-----FVPEGYLTSCTFDYLTDN--FDTRLFVACIFFFSFVCPTT
+MIT--------------YYYSQIVGHVFSHEKALRDQAK---------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---KMNVESLRS------------------------------------------------
+-----NVDKNKETAEIRIAKAA----ITICFLFFCSWTPYGVMSLIGAFGDKT---LLTP
+GATM--------IPACACKMVACIDPFVYAISHPRYRMELQKRCPWL--ALNEKAPE---
+-SS-AVA-S-TSTTQEP-----QQTTAA--------------------------------
+----------------------------------------------------------
+>    15== X65879   1 Drosophila pseudoobscura Dpse\Rh3 <>[Genetics132(1),193-204'92
+----------MEYHN------------------VSSVL----------------------
+-------------------------------GNVSSVLRPDA------------RLSA--
+-ESRLLGWNVPPDELRHIPEHWLIYP----------EPPESMNYLLGTLYIFFTVISMIG
+NGLVMWVFSAAKSLRTPSNILVINLAFCDFMMMIK--TPIFIYNSFH-QGYA--LGHLGC
+QIFGVIGSYTGIAAGATNAFIAYDRYNVITRPMEG--KMTHGKAIAMIIFIYLYATPWVV
+A-CYTES-----WGR-----FVPEGYLTSCTFDYLTDN--FDTRLFVACIFFFSFVCPTT
+MIT--------------YYYSQIVGHVFSHEKALRDQAK---------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---KMNVDSLRS------------------------------------------------
+-----NVDKSKEAAEIRIAKAA----ITICFLFFASWTPYGVMSLIGAFGDKT---LLTP
+GATM--------IPACTCKMVACIDPFVYAISHPRYRMELQKRCPWL--AISEKAPE---
+-SR-AAI-S-TSTTQEQ-----QQTTAA--------------------------------
+----------------------------------------------------------
+>    16== M17730   1 D.melanogaster Rh4 opsin <>[J.Neurosci.7,1558-1566'87]
+----------MEPLC---------------------------------------------
+-------------------------------NASEPPLRPEA------------R-SSGN
+GDLQFLGWNVPPDQIQYIPEHWLTQL----------EPPASMHYMLGVFYIFLFCASTVG
+NGMVIWIFSTSKSLRTPSNMFVLNLAVFDLIMCLK--APIF--NSFH-RGFAIYLGNTWC
+QIFASIGSYSGIGAGMTNAAIGYDRYNVITKPMNR--NMTFTKAVIMNIIIWLYCTPWVV
+L-PLTQF-----WDR-----FVPEGYLTSCSFDYLSDN--FDTRLFVGTIFFFSFVCPTL
+MIL--------------YYYSQIVGHVFSHEKALREQAK---------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---KMNVESLRS------------------------------------------------
+-----NVDKSKETAEIRIAKAA----ITICFLFFVSWTPYGVMSLIGAFGDKS---LLTQ
+GATM--------IPACTCKLVACIDPFVYAISHPRYRLELQKRCPWL--GVNEKSGE---
+-IS-SAQ-S-TTTQEQQ-----QTTAA---------------------------------
+----------------------------------------------------------
+>    17== X65880   1 Drosophila pseudoobscura Dpse\Rh4 <>[Genetics132(1),193-204'92
+----------MDALC---------------------------------------------
+-------------------------------NASEPPLRPEA------------RMSSGS
+DELQFLGWNVPPDQIQYIPEHWLTQL----------EPPASMHYMLGVFYIFLFFASTLG
+NGMVIWIFSTSKSLRTPSNMFVLNLAVFDLIMCLK--APIFIYNSFH-RGFA--LGNTWC
+QIFASIGSYSGIGAGMTNAAIGYDRYNVITKPMNR--NMTFTKAVIMNIIIWLYCTPWVV
+L-PLTQF-----WDR-----FVPEGYLTSCSFDYLSDN--FDTRLFVGTIFLFSFVVPTL
+MIL--------------YYYSQIVGHVFNHEKALREQAK---------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---KMNVESLRS------------------------------------------------
+-----NVDKSKETAEIRIAKAA----ITICFLFFVSWTPYGVMSLIGAFGDKS---LLTP
+GATM--------IPACTCKLVACIEPFVYAISHPRYRMELQKRCPWL--GVNEKSGE---
+-AS-SAQ-S-TTTQEQT-----QQTSAA--------------------------------
+----------------------------------------------------------
+>    18== D50584   1 Hemigrapsus sanguineus opsin BcRh2 <compound eye>[J.Exp.Biol.1
+----------MTNAT-------------------GPQMAY--------------------
+-----------------------------YGAASMDFGYPE-------------GVSIVD
+--------FVRPEIKPYVHQHWYNYP----------PVNPMWHYLLGVIYLFLGTVSIFG
+NGLVIYLFNKSAALRTPANILVVNLALSDLIMLTT-NVPFFTYNCFSGGVWM--FSPQYC
+EIYACLGAITGVCSIWLLCMISFDRYNIICNGFNGP-KLTTGKAVVFALISWVIAIGCAL
+P-PFFG------WGN-----YILEGILDSCSYDYLTQD--FNTFSYNIFIFVFDYFLPAA
+IIV--------------FSYVFIVKAIFAHEAAMRAQAK---------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---KMNVSTLRS------------------------------------------------
+------NEADAQRAEIRIAKTA----LVNVSLWFICWTPYALISLKGVMGDTS---GITP
+LVST--------LPALLAKSCSCYNPFVYAISHPKYRLAITQHLPWF--CVHETETK-SN
+DDS-QSN-S-TVAQDKA-------------------------------------------
+----------------------------------------------------------
+>    19== D50583   1 Hemigrapsus sanguineus opsin BcRh1 <compound eye>[J.Exp.Biol.1
+----------MANVT-------------------GPQMAF--------------------
+-----------------------------YGSGAATFGYPE-------------GMTVAD
+--------FVPDRVKHMVLDHWYNYP----------PVNPMWHYLLGVVYLFLGVISIAG
+NGLVIYLYMKSQALKTPANMLIVNLALSDLIMLTT-NFPPFCYNCFSGGRWM--FSGTYC
+EIYAALGAITGVCSIWTLCMISFDRYNIICNGFNGP-KLTQGKATFMCGLAWVISVGWSL
+P-PFFG------WGS-----YTLEGILDSCSYDYFTRD--MNTITYNICIFIFDFFLPAS
+VIV--------------FSYVFIVKAIFAHEAAMRAQAK---------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---KMNVTNLRS------------------------------------------------
+------NEAETQRAEIRIAKTA----LVNVSLWFICWTPYAAITIQGLLGNAE---GITP
+LLTT--------LPALLAKSCSCYNPFVYAISHPKFRLAITQHLPWF--CVHEKDPN-DV
+EEN-QSS-N-TQTQEKS-------------------------------------------
+----------------------------------------------------------
+>    20== K02320   1 D.melanogaster opsin <>[Cell40,851-858'85]
+----------MESFA---------------------------------------------
+--------------------------------VAAAQLGPHFAPLS--------NGSVVD
+--------KVTPDMAHLISPYWNQFP----------AMDPIWAKILTAYMIMIGMISWCG
+NGVVIYIFATTKSLRTPANLLVINLAISDFGIMIT-NTPMMGINLYF-ETWV--LGPMMC
+DIYAGLGSAFGCSSIWSMCMISLDRYQVIVKGMAGR-PMTIPLALGKM------------
+--------------------YVPEGNLTSCGIDYLERD--WNPRSYLIFYSIFVYYIPLF
+LIC--------------YSYWFIIAAVSAHEKAMREQAK---------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---KMNVKSLRS------------------------------------------------
+------SEDAEKSAEGKLAKVA----LVTITLWFMAWTPYLVINCMGLFKF-E---GLTP
+LNTI--------WGACFAKSAACYNPIVYGISHPKYRLALKEKCPCC--VFGKVDDG-KS
+SDA-QSQ-A-TASEAES-----KA------------------------------------
+----------------------------------------------------------
+>    21== K02315   1 D.melanogaster ninaE <>[Cell40,839-850'85]
+----------MESFA---------------------------------------------
+--------------------------------VAAAQLGPHFAPLS--------NGSVVD
+--------KVTPDMAHLISPYWNQFP----------AMDPIWAKILTAYMIMIGMISWCG
+NGVVIYIFATTKSLRTPANLLVINLAISDFGIMIT-NTPMMGINLYF-ETWV--LGPMMC
+DIYAGLGSAFGCSSIWSMCMISLDRYQVIVKGMAGR-PMTIPLALGKIAYIWFMSSIWCL
+A-PAFG------WSR-----YVPEGNLTSCGIDYLERD--WNPRSYLIFYSIFVYYIPLF
+LIC--------------YSYWFIIAAVSAHEKAMREQAK---------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---KMNVKSLRS------------------------------------------------
+------SEDAEKSAEGKLAKVA----LVTITLWFMAWTPYLVINCMGLFKF-E---GLTP
+LNTI--------WGACFAKSAACYNPIVYGISHPKYRLALKEKCPCC--VFGKVDDG-KS
+SDA-QSQ-A-TASEAES-----KA------------------------------------
+----------------------------------------------------------
+>    22== X65877   1 Drosophila pseudoobscura Dpse\ninaE <>[Genetics132(1),193-204'
+----------MDSFA---------------------------------------------
+--------------------------------AVATQLGPQFAAPS--------NGSVVD
+--------KVTPDMAHLISPYWDQFP----------AMDPIWAKILTAYMIIIGMISWCG
+NGVVIYIFATTKSLRTPANLLVINLAISDFGIMIT-NTPMMGINLYF-ETWV--LGPMMC
+DIYAGLGSAFGCSSIWSMCMISLDRYQVIVKGMAGR-PMTIPLALGKIAYIWFMSTIWCC
+LAPVFG------WSR-----YVPEGNLTSCGIDYLERD--WNPRSYLIFYSIFVYYIPLF
+LIC--------------YSYWFIIAAVSAHEKAMREQAK---------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---KMNVKSLRS------------------------------------------------
+------SEDADKSAEGKLAKVA----LVTISLWFMAWTPYLVINCMGLFKF-E---GLTP
+LNTI--------WGACFAKSAACYNPIVYGISHPKYRLALKEKCPCC--VFGKVDDG-KS
+SEA-QSQ-A-TTSEAES-----KA------------------------------------
+----------------------------------------------------------
+>    23== M12896   1 D.melanogaster Rh2 <>[Cell44,705-710'86]
+----------MERSH---------------------------------------------
+---------------------------LPETPFDLAHSGPRFQAQSSG------NGSVLD
+--------NVLPDMAHLVNPYWSRFA----------PMDPMMSKILGLFTLAIMIISCCG
+NGVVVYIFGGTKSLRTPANLLVLNLAFSDFCMMAS-QSPVMIINFYY-ETWV--LGPLWC
+DIYAGCGSLFGCVSIWSMCMIAFDRYNVIVKGINGT-PMTIKTSIMKILFIWMMAVFWTV
+M-PLIG------WSA-----YVPEGNLTACSIDYMTRM--WNPRSYLITYSLFVYYTPLF
+LIC--------------YSYWFIIAAVAAHEKAMREQAK---------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---KMNVKSLRS------------------------------------------------
+------SEDCDKSAEGKLAKVA----LTTISLWFMAWTPYLVICYFGLFKI-D---GLTP
+LTTI--------WGATFAKTSAVYNPIVYGISHPKYRIVLKEKCPMC--VFGNTDEP-KP
+DAP-ASD-TETTSEADS-----KA------------------------------------
+----------------------------------------------------------
+>    24== X65878   1 Drosophila pseudoobscura Dpse\Rh2 <>[Genetics132(1),193-204'92
+----------MERSL---------------------------------------------
+---------------------------LPEPPLAMALLGPRFEAQTGG------NRSVLD
+--------NVLPDMAPLVNPHWSRFA----------PMDPTMSKILGLFTLVILIISCCG
+NGVVVYIFGGTKSLRTPANLLVLNLAFSDFCMMAS-QSPVMIINFYY-ETWV--LGPLWC
+DIYAACGSLFGCVSIWSMCMIAFDRYNVIVKGINGT-PMTIKTSIMKIAFIWMMAVFWTI
+M-PLIG------WSS-----YVPEGNLTACSIDYMTRQ--WNPRSYLITYSLFVYYTPLF
+MIC--------------YSYWFIIATVAAHEKAMRDQAK---------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---KMNVKSLRS------------------------------------------------
+------SEDCDKSAENKLAKVA----LTTISLWFMAWTPYLIICYFGLFKI-D---GLTP
+LTTI--------WGATFAKTSAVYNPIVYGISHPNDRLVLKEKCPMC--VCGTTDEP-KP
+DAP-PSD-TETTSEAES-----KD------------------------------------
+----------------------------------------------------------
+>    25== U26026   1 Apis mellifera long-wavelength rhodopsin <>[]
+----------M-------------------------------------------------
+----------------------------------IAVSGPSYEAFSYGGQARFNNQTVVD
+--------KVPPDMLHLIDANWYQYP----------PLNPMWHGILGFVIGMLGFVSAMG
+NGMVVYIFLSTKSLRTPSNLFVINLAISNFLMMFC-MSPPMVINCYY-ETWV--LGPLFC
+QIYAMLGSLFGCGSIWTMTMIAFDRYNVIVKGLSGK-PLSINGALIRIIAIWLFSLGWTI
+A-PMFG------WNR-----YVPEGNMTACGTDYFNRG--LLSASYLVCYGIWVYFVPLF
+LII--------------YSYWFIIQAVAAHEKNMREQAK---------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---KMNVASLRS------------------------------------------------
+------SENQNTSAECKLAKVA----LMTISLWFMAWTPYLVINFSGIFNL-V---KISP
+LFTI--------WGSLFAKANAVYNPIVYGISHPKYRAALFAKFPSL--AC-AAEPS-SD
+AVS-TTS-G-TTTVTDN-----EKSNA---------------------------------
+----------------------------------------------------------
+>    26== L03781   1 Limulus polyphemus opsin <>[PNAS90,6150-6154'93]
+----------MANQL---------------------------------------------
+---------------------------------SYSSLGWPYQP----------NASVVD
+--------TMPKEMLYMIHEHWYAFP----------PMNPLWYSILGVAMIILGIICVLG
+NGMVIYLMMTTKSLRTPTNLLVVNLAFSDFCMMAF-MMPTMTSNCFA-ETWI--LGPFMC
+EVYGMAGSLFGCASIWSMVMITLDRYNVIVRGMAAA-PLTHKKATLLLLFVWIWSGGWTI
+L-PFFG------WSR-----YVPEGNLTSCTVDYLTKD--WSSASYVVIYGLAVYFLPLI
+TMI--------------YCYFFIVHAVAEHEKQLREQAK---------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---KMNVASLRA------------------------------------------------
+-----NADQQKQSAECRLAKVA----MMTVGLWFMAWTPYLIISWAGVFSSGT---RLTP
+LATI--------WGSVFAKANSCYNPIVYGISHPRYKAALYQRFPSL--ACGSGESG-SD
+VKS-EAS-A-TTTMEEK-----PKIPEA--------------------------------
+----------------------------------------------------------
+>    27== X07797   1 Octopus dofleini rhodopsin <>[FEBS232(1),69-72'88]
+----------MVESTTL----------------VNQTWWY--------------------
+------------------------------------------------------NPTV--
+----------------DIHPHWAKFD----------PIPDAVYYSVGIFIGVVGIIGILG
+NGVVIYLFSKTKSLQTPANMFIINLAMSDLSFSAINGFPLKTISAFM-KKWI--FGKVAC
+QLYGLLGGIFGFMSINTMAMISIDRYNVIGRPMAASKKMSHRRAFLMIIFVWMWSIVWSV
+G-PVFN------WGA-----YVPEGILTSCSFDYLSTD--PSTRSFILCMYFCGFMLPII
+IIA--------------FCYFNIVMSVSNHEKEMAAMAK---------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---RLNAKELRK------------------------------------------------
+-------AQAGASAEMKLAKIS----MVIITQFMLSWSPYAIIALLAQFGPAE---WVTP
+YAAE--------LPVLFAKASAIHNPIVYSVSHPKFREAIQTTFPWLLTCCQFDEKE-CE
+DAN-DAE-E-EVVASER--GG-ESRDAAQMKEMMAMMQKMQAQQAAYQP---PPPPQGYP
+PQGYPPQGAYPPPQGYPPQGYPPQGYPPQGYPPQGAPPQVEAPQGAPPQGVDNQAYQA
+>    28== X70498   1 Todarodes pacificus rhodopsin <retina>[FEBS317(1-2),5-11'93]
+----------MGRDLR-----------------DNETWWY--------------------
+------------------------------------------------------NPSI--
+----------------VVHPHWREFD----------QVPDAVYYSLGIFIGICGIIGCGG
+NGIVIYLFTKTKSLQTPANMFIINLAFSDFTFSLVNGFPLMTISCFL-KKWI--FGFAAC
+KVYGFIGGIFGFMSIMTMAMISIDRYNVIGRPMAASKKMSHRRAFIMIIFVWLWSVLWAI
+G-PIFG------WGA-----YTLEGVLCNCSFDYISRD--STTRSNILCMFILGFFGPIL
+IIF--------------FCYFNIVMSVSNHEKEMAAMAK---------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---RLNAKELRK------------------------------------------------
+-------AQAGANAEMRLAKIS----IVIVSQFLLSWSPYAVVALLAQFGPLE---WVTP
+YAAQ--------LPVMFAKASAIHNPMIYSVSHPKFREAISQTFPWVLTCCQFDDKE-TE
+DDK-DAE-T-EIPAGESSDAA-PSADAAQMKEMMAMMQKMQQQQAAYPPQGYAPPPQGYP
+PQGYPPQGY--PPQGYPPQGYPP---PPQGAPPQGAPP------AAPPQGVDNQAYQA
+>    29== L21195   1 human serotonin 5-HT7 receptor protein <placenta and fetal bra
+M---------MDVNS------------------SGRPDLYGHLRSFLLPEVGRGLPDLSP
+DG------------GADPVAGSW---------------APHLLS----------EVTAS-
+-----------------PAPTWDAPPDNASGCGEQINYGRVEKVVIGSILTLITLLTIAG
+NCLVVISVCFVKKLRQPSNYLIVSLALADLSVAVA-VMPFVSVTDLIGGKWI--FGHFFC
+NVFIAMDVMCCTASIMTLCVISIDRYLGITRPLTYPVRQNGKCMAKMILSVWLLSASITL
+P-PLFG------WAQ-----NVNDDKVCLIS----------QDFGYTIYSTAVAFYIPMS
+VML--------------FMYYQIYKAARKSAAKHKFPGF---------------------
+------------------------------------------------------------
+--------PR----------------------VEPDSVIALNG-----------------
+------------------------------------------------------------
+-----------------------------------IV-----------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---KLQKE-------------------VEECA-NL-----------------SRLL----
+--KHERKNISIFKREQKAATTL----GIIVGAFTVCWLPFFLLSTARPFICGTSCSCIPL
+WVER--------TFLWLGYANSLINPFIYAFFNRDLRTTYRSLL-----QCQYRNINRKL
+SAA-GMH-E-ALKLAER-----PERPEFVL------------QNADYCR-----------
+-----KKGH--------------------------------------------DS---
+>    30== L15228   1 rat 5HT-7 serotonin receptor <>[JBC268,18200-18204'93]
+------------------------------------------------------------
+--------------------------------------MPHLLSGF-------LEVTAS-
+-----------------PAPTWDAPPDNVSGCGEQINYGRVEKVVIGSILTLITLLTIAG
+NCLVVISVSFVKKLRQPSNYLIVSLALADLSVAVA-VMPFVSVTDLIGGKWI--FGHFFC
+NVFIAMDVMCCTASIMTLCVISIDRYLGITRPLTYPVRQNGKCMAKMILSVWLLSASITL
+P-PLFG------WAQ-----NVNDDKVCLIS----------QDFGYTIYSTAVAFYIPMS
+VML--------------FMYYQIYKAARKSAAKHKFPGF---------------------
+------------------------------------------------------------
+--------PR----------------------VQPESVISLNG-----------------
+------------------------------------------------------------
+-----------------------------------VV-----------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---KLQKE-------------------VEECA-NL-----------------SRLL----
+--KHERKNISIFKREQKAATTL----GIIVGAFTVCWLPFFLLSTARPFICGTSCSCIPL
+WVER--------TCLWLGYANSLINPFIYAFFNRDLRPTSRSLL-----QCQYRNINRKL
+SAA-GMH-E-ALKLAER-----PERSEFVL------------QNSDHCG-----------
+-----KKGH--------------------------------------------DT---
+>    31=p A47425 serotonin receptor 5HT-7 - rat
+------------------------------------------------------------
+--------------------------------------MPHLLSGF-------LEVTAS-
+-----------------PAPTWDAPPDNVSGCGEQINYGRVEKVVIGSILTLITLLTIAG
+NCLVVISVSFVKKLRQPSNYLIVSLALADLSVAVA-VMPFVSVTDLIGGKWI--FGHFFC
+NVFIAMDVMCCTASIMTLCVISIDRYLGITRPLTYPVRQNGKCMAKMILSVWLLSASITL
+P-PLFG------WAQ-----NVNDDKVCLIS----------QDFGYTIYSTAVAFYIPMS
+VML--------------FMYYQIYKAARKSAAKHKFPGF---------------------
+------------------------------------------------------------
+--------PR----------------------VQPESVISLNG-----------------
+------------------------------------------------------------
+-----------------------------------VV-----------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---KLQKE-------------------VEECA-NL-----------------SRLL----
+--KHERKNISIFKREQKAATTL----GIIVGAFTVCWLPFFLLSTARPFICGTSCSCIPL
+WVER--------TCLWLGYANSLINPFIYAFFNRDLRTTYRSLL-----QCQYRNINRKL
+SAA-GMH-E-ALKLAER-----PERSEFVL------------QNSDHCG-----------
+-----KKGH--------------------------------------------DT---
+>    32== M83181   1 human serotonin receptor <>[JBC267(11),7553-7562'92]
+----------MDVLS---------------------------------------------
+-----------------------------PGQGNNTTSPPAPFETG-------GNTTGIS
+------------------------------------DVTVSYQVITSLLLGTLIFCAVLG
+NACVVAAIALERSLQNVANYLIGSLAVTDLMVSVL-VLPMAALYQVL-NKWT--LGQVTC
+DLFIALDVLCCTSSILHLCAIALDRYWAITDPIDYVNKRTPRRAAALISLTWLIGFLISI
+P-PMLG------WRTPE---DRSDPDACTIS----------KDHGYTIYSTFGAFYIPLL
+LML--------------VLYGRIFRAARFRIRKTVKKVE---------------------
+----------------------------------KTGADTRHGASPAPQPKK--------
+---------------------------------------SVNG-ESGSRNWRLGVESK--
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---AGGALCANGAVRQGDDGAALEVIEVHRVGNSKEHLPLPSEAGPTPCA--PASFERKN
+ERNAEAKRKMALARERKTVKTL----GIIMGTFILCWLPFFIVALVLPFCESS--CHMPT
+LLGA--------IINWLGYSNSLLNPVIYAYFNKDFQNAFKKII-----KCKFCRQ----
+------------------------------------------------------------
+----------------------------------------------------------
+>    33=p A35181 serotonin receptor class 1A - rat
+----------MDVFS---------------------------------------------
+-----------------------------FGQGNNTTASQEPFGTG-------GNVTSIS
+------------------------------------DVTFSYQVITSLLLGTLIFCAVLG
+NACVVAAIALERSLQNVANYLIGSLAVTDLMVSVL-VLPMAALYQVL-NKWT--LGQVTC
+DLFIALDVLCCTSSILHLCAIALDRYWAITDPIDYVNKRTPRRAAALISLTWLIGFLISI
+P-PMLG------WRTPE---DRSDPDACTIS----------KDHGYTIYSTFGAFYIPLL
+LML--------------VLYGRIFRAARFRIRKTVRKVE---------------------
+----------------------------------KKGAGTSLGTSSAPPPKK--------
+---------------------------------------SLNG-QPGSGDWRRCAENR--
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---AVGTPCTNGAVRQGDDEATLEVIEVHRVGNSKEHLPLPSESGSNSYA--PACLERKN
+ERNAEAKRKMALARERKTVKTL----GIIMGTFILCWLPFFIVALVLPFCESS--CHMPA
+LLGA--------IINWLGYSNSLLNPVIYAYFNKDFQNAFKKII-----KCKFCRR----
+------------------------------------------------------------
+----------------------------------------------------------
+>    34== L06803   1 Lymnaea stagnalis serotonin receptor <>[PNAS90,11-15'93]
+MANFTFGDLALDVARM-----------------GGLASTPSGLRS-----TGLTTPGLSP
+TGLVTSDFNDSYGLTGQFINGSHSSRSRDNASANDT------------------SATNM-
+-----------------TDDRYWSLT----------VYSHEHLVLTSVILGLFVLCCIIG
+NCFVIAAVMLERSLHNVANYLILSLAVADLMVAVL-VMPLSVVSEIS-KVWF--LHSEVC
+DMWISVDVLCCTASILHLVAIAMDRYWAVTS-IDYIRRRSARRILLMIMVVWIVALFISI
+P-PLFG------WRDPN--NDPDKTGTCIIS----------QDKGYTIFSTVGAFYLPML
+VMM--------------IIYIRIWLVARSRIRKDKFQMT-------KARLKTEETTLVAS
+P---------KTEYSVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKK--------
+--------NRAKKL------------------PENANGVNSNS-----------------
+--SS--------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------SERLK-------
+---QIQIETAEAFANGCAEEASIAML-ERQCNNGKKISSNDTPY----------------
+---SRTREKLELKRERKAARTL----AIITGAFLICWLPFFIIALIGPFVDPE---GIPP
+FARS--------FVLWLGYFNSLLNPIIYTIFSPEFRSAFQKIL-----FGKYRRGHR--
+------------------------------------------------------------
+----------------------------------------------------------
+>    35=p A47174 serotonin receptor, 5HTlym receptor - great pond snail
+MANFTFGDLALDVARM-----------------GGLASTPSGLRS-----TGLTTPGLSP
+TGLVTSDFNDSYGLTGQFINGSHSSRSRDNASANDT------------------SATNM-
+-----------------TDDRYWSLT----------VYSHEHLVLTSVILGLFVLCCIIG
+NCFVIAAVMLERSLHNVANYLILSLAVADLMVAVL-VMPLSVVSEIS-KVWF--LHSEVC
+DMWISVDVLCCTASILHLVAIAMDRYWAVTS-IDYIRRRSARRILLMIMVVWIVALFISI
+P-PLFG------WRDPN--NDPDKTGTCIIS----------QDKGYTIFSTVGAFYLPML
+VMM--------------IIYIRIWLVARSRIRKDKFQMT-------KARLKTEETTLVAS
+P---------KTEYSVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKK--------
+--------NRAKKL------------------PENANGVNSNS-----------------
+--SS--------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------SERLK-------
+---QIQIETAEAFANGCAEEASIAML-ERQCNNGKKISSNDTPY----------------
+---SRTREKLELKRERKAARTL----AIITGAFLICWLPFFIIALIGPFVDPE---GIPP
+FARS--------FVLWLGYFNSLLNPIIYTIFSPEFRSAFQKIL-----FGKYRRGHR--
+------------------------------------------------------------
+----------------------------------------------------------
+>    36== X95604   1 Bombyx mori serotonin receptor <antennae>[InsectBiochem.Mol.Bi
+----------MEGAE-------------------GQEEL--DWEA-----LYLRLP----
+---------------------------LQNCSWNSTGWEPNW------------NVTVV-
+-----------------PNTTWWQAS-----APFDTPAALVRAAAKAVVLGLLILATVVG
+NVFVIAAILLERHLRSAANNLILSLAVADLLVACL-VMPLGAVYEVV-QRWT--LGPELC
+DMWTSGDVLCCTASILHLVAIALDRYWAVTN-IDYIHASTAKRVGMMIACVWTVSFFVCI
+A-QLLG------WKDPDWNQRVSEDLRCVVS----------QDVGYQIFATASSFYVPVL
+IIL--------------ILYWRIYQTARKRIRRRRGATA---------------------
+----------------------------------------RGGVGPPPVPAG--------
+-----------------------------------GALVAGGG-----------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------SGGIAAAVVAVI-----GRPLP-------
+---TISETTTTGFTNVSSNNTSPE---KQSCANGLEADPPTTGYGAVAAAYYPSLV----
+--RRKPKEAADSKRERKAAKTL----AIITGAFVACWLPFFVLAILVPTCD----CEVSP
+VLTS--------LSLWLGYFNSTLNPVIYTVFSPEFRHAFQRLL-----CGRRVRRRRA-
+----------------------PQ------------------------------------
+----------------------------------------------------------
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/seed.aln	Mon Jul 14 18:16:36 2025 +0000
@@ -0,0 +1,216 @@
+>PINI_ARATH/9-617
+HVMTAMVPLYVAMILA-YGSVKWWKIFTPDQCSGINRFVALFAVPLLSFHFIAANNPYAMNLRFLAADSLQK
+VIVLSLLFLWCKLSR---NGSLDWTITLFSLSTLPNTLVMGIPLLKGMYGN-------------------FS
+GDLMVQIVVLQCIIWYTLML------------------FLFEYRGAKLLISEQFP-DTAGSIVSIHVDSDIM
+SLDGRQ-PLETEAEIKEDGKLHVTVRRSNASRSDIYS-----RRSQGL-SATPRPSNLTNAEIYSLQSSRNP
+TPRGSSFNHTDFY---------------SMMASGGGRNSNFGPGEA---------------VFGSKGPTPRP
+SNYEEDGGPAKPTAAGTAAGAGRFHYQSGGSGGGGGAHYPAPNPGMFSPNTGGGGGTAAKGNAPVVGGKRQD
+GN------GRDLHMFVWSSSASPVSDVFGGGGGNHHADYSTATNDHQKDVKISVPQGNSNDNQYVEREEFSF
+GNKDDDSKVLATDGGNNISNKTTQAKVMPPTSVMTRLILIMVWRKLIRNPNSYSSLFGITWSLI-SFKWNIE
+MP------------ALIAKSISILSDAGLGMAMFSLGLFMALNPRIIACGNRRAAFA--------AAMRFVV
+GPAVMLVASYAVGLRGV-LLHVAIIQ------------AALPQGIVPFVFAKEYNVHPDILSTAVIFGMLIA
+LPITLLYY
+>Q9FVF6_POPPZ/9-609
+HVMTAMVPLYVAMILA-YGSVKWWKIFTPDQCSGINRFVALFAVPLLSFHFISTNDPYNMNLRFITADSLQK
+VIVLVVLALWTKLSK---RGCLEWTITLFSLSTLPNTLVMGIPLLKGMYGD-------------------YS
+GSLMVQVVVLQCIIWYTLML------------------FMFEYRGAKLLISEQFP-DTAGSIVSIHVDSDIM
+SLDGRQ-PLETEAAIKEDGKLHVTVRKSNASRSDIFS-----RRSQGLSSTTPRPSNLTNAEIYSLQSSRNP
+TPRGSSFNHTDFY---------------SMMA--AGRNSNFGASDVY-------------GLSASRGPTPRP
+SNFEEEHGGSNKPRFHHYHAPGGATHYPAPNPGMFSPTTAASKGVSANANNAAAAAAKKPNGQAQQKAED--
+-----------GRDLHMFVWSSSASPVSDVFGGHDYGAHDLKDVRVAVSPGKVEGQRENQEDYNLERDDFSF
+GNRGLDRERNSHEGEKGGFD--GKPKAMPPTSVMTRLILIMVWRKLIRNPNTYSSLIGLIWSLV-SFRWNVK
+MP------------LIIAKSISILSDAGLGMAMFSLGLFMALQPRIIACGNSIATFS--------MAVRFLT
+GPAIMAAASIAVGIRGT-LLHIAIVQ------------AALPQGIVPFVFAKEYNVHPEILSTGVIFGMLIA
+LPITLVYY
+>B8AIF2_ORYSI/9-590
+HVMTAMVPLYVAMILA-YGSVKWWRIFTPDQCSGINRFVALFAVPLLSFHFISTNNPYTMNLRFIAADTLQK
+LMVLAMLTAWSHLSR---RGSLEWTITLFSLSTLPNTLVMGIPLLKGMYGE-------------------FS
+GSLMVQIVVLQCIIWYTLML------------------FMFEYRGARMLITEQFP-DTAANIASIVVDPDVV
+SLDGRRDAIETETEVKEDGRIHVTVRRSNASRSDIYS-----RRSMGFSSTTPRPSNLTNAEIYSLQSSRNP
+TPRGSSFNHTDFY---------------SMV----GRSSNFGAADA---------------FGVRTGATPRP
+SNYEDDASKPKYPLPASNAAPMAGHYPAPNPAVSSAPKGAKKAATNGQAKGEDLHMFVWSS-----------
+--------------------SASPVSDVFGGGAPDYNDAAAVKSPRKMDGAKDREDYVERDDFSFGNRGVMD
+RDAEAGDEKAAAAAGADPSKAMAAPTAMPPTSVMTRLILIMVWRKLIRNPNTYSSLIGLIWSLV-CFRWNFE
+MP------------AIVLKSISILSDAGLGMAMFSLGLFMALQPHIIACGNKVATYA--------MAVRFLA
+GPAVMAAASFAVGLRGT-LLHVAIVQ------------AALPQGIVPFVFAKEYSVHPSILSTAVIFGMLIA
+LPITLVYY
+>PIN6_ARATH/9-565
+TVMCAMAPLYFAMFVA-YGSVKWCKIFTPAQCSGINRFVSVFAVPVLSFHFISQNNPYKMDTMFILADTLSK
+IFVFVLLSLWAVFFK---AGGLDWLITLFSIATLPNTLVMGIPLLQAMYGD-------------------YT
+QTLMVQLVVLQCIIWYTLLL------------------FLFELRAARLLIRAEFPGQAAGSIAKIQVDDDVI
+SLDGMD-PLRTETETDVNGRIRLRIRRSVSSVPDSVMSSSLC--------LTPRASNLSNAEIFSVN-----
+-----TPNNRFFHGGGGSGTLQFYNGSNEIMF-CNGDLGGFGFTRPGLGASPRRLSGYASSDAYSLQPTPRA
+SNFNELDVNGNGTPVWMKSPAAGRIYRQSSPKMMWESGQRHAAK----------------------------
+--------------------------------------DINGSVPEKEISFRDALKAAPQATAAGGGASMEE
+GAAGKDTTPVA-AIG-K-QE-------MPSAIVMMRLILTVVGRKLSRNPNTYSSLLGLVWSLI-SFKWNIP
+MP------------NIVDFSIKIISDAGLGMAMFSLGLFMALQPKMIPCGAKKATMG--------MLIRFIS
+GPLFMAGASLLVGLRGS-RLHAAIVQ------------AALPQGIVPFVFAREYNLHPDLLSTLVIFGMIVS
+LPVTILYY
+>YFDV_ECOLI/4-307
+FFIGDLLPIIVIMLLG-YFSGRR-ETFSEDQARAFNKLVLNYALPAALFVSITRANREMIFADTRLTLVSLV
+VIVGCFFFSWFGCYK-FFKRTHAEAAVCALIAGSPTIGFLGFAVLDPIYGD----------------SVSTG
+LVVAIISIIVNAITIPIGLY------------------LLNPSSGADGKK----------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------NSNLSALISAAKEPVVWAPVLATILVLV-GVKIP--
+--------------AAWDPTFNLIAKANSGVAVFAAGLTLAAHKFEFSAEIAYN-----------TFLKLIL
+MPLALLLVGMACHLNSE-HLQMMVLA------------GALPPAFSGIIIASRFNVYTRTGTASLAVSVLGF
+VVTAPLWI
+>YWKB_BACSU/5-315
+DILILLAPIFFVIVLG-WFAGHF-GSYDAKSAKGVSTLVTKYALPAHFIAGILTTSRSEFLSQVPLMISLII
+GIVGFYIIILLVCRF-IFKYDLTNSSVFSLNSAQPTFAFMGIPVLGSLFGA-------------------NE
+VAIPIAVTGIVVNAILDPLA------------------IIIATVGESSKKNEESGD----------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+---------------------------------SFWKMTGKSILHGLCEPLAAAPLISMILVLVFNFTLP--
+--------------ELGVKMLDQLGSTTSGVALFAVGVTVGIRKIKLSMPAIG-----------IALLKVAV
+QPALMFLIALAIGLPADQTTKAILL-------------VAFPGSAVAAMIATRFEKQEEETATAFVVSAILS
+LISLPIII
+>P71425_KLEPN/4-313
+VIIHALAPIFVIMLLG-FWAGKA-GMVDNKNVSLLNIFVMDFALPATLFSATVQTPWAGIVAQSPLVLVLTG
+AMWITYAAIYFLATS-VFKRTPQDGAVLTLTVALPNYAALGLPILGSVLGE------------------GAS
+TSLSVAVSIACGSVLMTPFC------------------LLILEREKARAAGENSG-----------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+---------------------------------STLAMLPVLMWRSVKKPIVWGPLLGVVLSAI-GIKMP--
+--------------DLLLASIKPLGLAATAAALFLTGVILSARKLQLNALIAAS-----------TIVKLLV
+QPFIAWGLVMLLGLHGSIAITAILM-------------IALAAGFFGVVFGNRFGVQSPDAEAVLLLSSVLC
+ILSLPLFI
+>Q98L58_RHILO/3-308
+PLTETVLFVFSLVALG-YLAGLT-GYLRPASGEGISDFAVSVAMPLLLFQTMVKADFHG--VAPWPLWGAYF
+TAVAITWAAGHLVTTRIFGRDARAGVVGGVSSAYSNVVLLGAPFILGIFGP-----------------SGFE
+VLSLLVSVHLPVMMMASIVL------------------FEMFGRGGGEHV----------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+---------------------------------HPLRVLRSFLRRLFINPLIIGILLGLAWRLS-GVPLP--
+--------------SLVMRLVDALANTAGPVALFAMGLSLRRFGVSGNVRPALA----------LSALKLFL
+MPALVLAFVLLLGLPPL-TAKVAVVV------------AALPSGINSYLIAVQFNTGQALASNQMTIATACA
+AVTTAFWL
+>O67397_AQUAE/2-289
+FIYEKVFFILLIIAFA-YTLKRG-GIFKEEHALPFINYVIYFALPFTIFKNLRF---LEIGKEVLGVVLIAW
+GAIFLSILFAFLFGK-FLKLEEKTLRAFLLVSSFGNTAFMGYPFLYALEGN-------------------EG
+LKYAILYDQLGSFLMVITLG----------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+---------------------------------LFLAIGKFDLKELILFPPFIALVLSFLLHGV-RFP----
+--------------QFFEHSVEIISGSLIPVILFSLGLRLNFTDMKSDYRTLFSA----------LFIKMFL
+VPLLILVFLKIFGLTSL-PYRVALIE------------SAMPPMVFAGVLALKYELDFRLAFSAITLGIVIS
+LFTVPVFR
+>Q97M34_CLOAB/2-296
+YVFEQIVILFLIMGIG-YYAAKS-KIIDDDTTSHLSNFIVSITLPLMILTSFNVEYSRKTVITIINLLVFSV
+AAFIISIVIGKII---SFKFAMDKRDILMFMSIFSNCGFIGFPVLKVVYGN-------------------KG
+VLYTSIFNLVYNVFIWTIGI------------------VIINDKREKIDY----------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+-------------------------------------------KKILFNHNIIAVIVGVFLMLL-SIKIP--
+--------------YVMSSAFNLIGSMTAPLSMIVIGSILA--------GVDFNDIFKDWSLYYIAILRLII
+IPLIIYFALKPFQINKI-VIGVIIIC------------EAMPGGTLCPILAKSCNRNFKYASKIVLITTILS
+MMTIPFMT
+>YB8B_YEAST/13-413
+LVFESVLQVVIIALAG-FWSASS-GLLPKQSQKIISLLNVDLFTPCLIFSKLAKSLSMAKIFEIAIIPIFFG
+LTTGISFISGKIMSR-ILDLDKDETNFVVANSVFGNSNSLPVSLTLSLAYTLPNLTWDQIPNDNRDNVASRG
+ILYLLIFQQIGQMLRWSWGY------------------NKLMKWSGENTQHMPPSQVQSLLERTPNIDNEEL
+VNEEQEEQELLEEENNRMNSSFLSSSSIGDKIWQKSCTVFER------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+-------------------------------------------IRANLNPPLYSMIFAVVVAAI-GPLQREL
+F------MEDGFINNTFAEAVTQLGSVSIPLILVVLGSNLYPSA-----EVFPKTVHHSKLLIGSIIGRMIL
+PSCFLLPIIAIAV-----KYINVSILDDPIFLVVGFLLTVSPPAIQLTQITQLNEFFEAEMADILFWGYAVL
+SLPVSIIV
+>YDQ4_SCHPO/18-440
+PIIESDLEVIVIALGG-YVLAKK-GFLPRDAQKVISSLNVYFFTPCLVFEKVGNGLNLKMLIDLSLLPVFYV
+IISAASILISFLLAK-LFRLTPRQRNFATACITFQNSNSLPLALVSSLATTVKDLLWDKIPDDTPDKVASRG
+IMYLLIFSQLGQALRWSYGY------------------RILLSPNQPEDPLPIGNRSWSHSDVNEEEIQNLL
+ASSANVDGVQNSVQANEGSTVQTDSSAISKNDNVQVETSNEEVGGFGAASSKISK-----------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+---------------------------------------FIVLLLDFFSPPLYSLFIALFIAVV-PPLQRFF
+F------EEGSFVEGSITSGIRMAGQVAVPMILVVLGASLATDISKTEPTQEVRKNNDTRVIIVCLLGRMVV
+VPLALLPAFSLLS-----YFSEISTVDDPVFVVVIFLLVGSPTAIQLTQICQLNGVFERECAKVLWWSYAVF
+TPPNSLLL
+>PILS4_ARATH/9-407
+ASSKPVVETLLITSVGFYLALDTVNLLGHDARKHLNNIVFYVFSPSLIGSRLADSVTYESLVKMWFMPVNVL
+LTFMIGSLLGWIVIV-ITKPPSQLRGLIISCCASGNLGTMPLIIIPAICKE------KGGPFGDSESCEKYG
+MGYVTLSMT--AFFISVYKHDTNWYVSGGNGLLMDLYINLMR------VLSNSPVETHTHSIESNYDDSCKV
+QLISSK------------------------------------------EEEKEEDNHQVGRWEEVKQ-----
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+---------------------------------RVVSLSKKVNLGSIFAPATIAAIIALVIGLI-TPLRNLI
+IGTVAPF-------RVIQDSLTLLGDGAIPAMTLILGGNLLKGMRRSEVRSSEMKNSCIIGV---LVARYIL
+LPVSGVLLVRGAY------KLDLVTS-EPLYQFVLLLQYAVPPAMNLGTKTQLFGAGESECSVIMLWTYSLA
+AVSLTVWP
+>PILS5_ARATH/9-388
+VASMPVIQVLFMSLVGAFMASDRCKLFPVEARNSMNKVVFVLFAPALMFANLAQTVTLEDIISWWFMPVNMG
+LTFLIGGLLGWLVVK-ILKPPPYLEGLIVATCSAGNMGNLPIILVPAICDE------DKSPFGNRSVCRTVG
+LSYASFSMALGGFYIWTYTF------------------RLIKGSAMKVQAIEESEKIAIKSSNSDLEADHKT
+HLLGAP-----------------------------------------EDKENKVVKEKTGFWRKGVD-----
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+---------------------------------FLHEI-----LEELLAPPTLGAIIGFIFGAV-RWLRNLI
+IGDDAPL-------RIVQSTAKLLGDGTIPCMTIILGGNLIQG-----LRSSAVKPMVVLGI---VCVRYIA
+MPIIGIGIVLTAA------NLGFLPA-DPLFQYVLMLQFTLPPAMNIGTMTQLYNVAQDECSVLMLWTYLVA
+ILALTVWS
+>PILS2_ARATH/18-441
+SGVVPLLKLICLTVIGLLLAHPKTQLVPRATFRLLSKLVFALFLPCLIFTELGESITLDNIVQWWFIPVNVL
+LSAVVGSLIGYLVVL-ICRPPPEFNRFTIVMTAFGNTGNLLLAIVSSVCHT--------KTNPFGPNCNSRG
+VSYVSFAQWVAVILVYTVVY------------------HMMEPPLEYYEVVEEEG-VEIEEINVENHDASRP
+LLVEAEWPGIEDKETEHCKTPFIARVFNSISSFSQTSFPEVDLGGEYGGESSSPRSIQCLAEPRVMR-----
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+---------------------------------RIRVVAEQTPVKHILQPPTIASLLAIIIGSV-PQLKSVV
+FGYDAPL-------SFITDSLNIMGSAMVPSVMLVLGGMLSEGPNESTLGLRTTIGI--------SVARLLV
+LPLVGIGIVMSAD------KLGLISSADPMFKFVLLLQYSTPSAILLGAIASLRGYAVREASALLFWQHIFA
+LLSLTFYI
+>PILS6_ARATH/30-423
+IAVMPIAKVFTMCFLGLLMASKYVNILPPSGRKLLNGLVFSLLLPCLIFSQLGQAVTLQKMLQWWFIPVNVV
+LGTISGSIIGFIVAS-IVRPPYPYFKFTIIQIGVGNIGNVPLVLLAALCRD------TSNPFGDSEKCSIDG
+TAYISFGQWVGAIILYTYVY------------------QMFAPPPEGFDAEEENLALKTLPVDAAPEQVPLL
+TQNFPKDFSPTQDL--------------------------------LPVQSTEPRGRGVSRKGKIAQ-----
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+---------------------------------IFVFLYEKLKLKQIVQPAIVASILAMILGAI-PFTKKLI
+FTNGAPL-------FFFTDSCMILGDAMIPCILLALGGNLINGPGSSKLGFKTTAAI--------IIGRLVL
+VPPVGLGIVTVAD------KLGFLPADDKMFRFVLLLQHTMPTSVLSGAVANLRGCG-RESAAVLFWVHIFA
+IFSMAGWM
+>PIN4_ARATH/9-611
+TVLTAVVPLYVAMILA-YGSVQWWKIFSPDQCSGINRFVAIFAVPLLSFHFISTNDPYAMNFRFVAADTLQK
+IIMLVLLALWANLTK---NGSLEWMITIFSLSTLPNTLVMGIPLLIAMYGT-------------------YA
+GSLMVQVVVLQCIIWYTLLL------------------FLFEYRGAKLLIMEQFP-ETGASIVSFKVESDVV
+SLDGHD-FLETDAEIGNDGKLHVTVRKSNASRRSLMM--------------TPRPSNLTGAEIYSLS----S
+TPRGSNFNHSDFY---------------SVMGFPGGRLSNFGPADLY-------------SVQSSRGPTPRP
+SNFEENNAVKYGFYNNTNSSVPAAGSYPAPNPEFSTGTGVSTKPNKIPKENQQQLQEKDSKASHDAKELHMF
+VWSSSASPVSDVFGGGAGDNVATEQSEQGAKEIRMVVSDQPRKSNARGGGDDIGGLDSGEGEREIEKATAGL
+NKMGSNSTAELEAAG-G-DGGGNNGTHMPPTSVMTRLILIMVWRKLIRNPNTYSSLIGLIWALV-AYRWHVA
+MP------------KILQQSISILSDAGLGMAMFSLGLFMALQPKIIACGNSVATFA--------MAVRFIT
+GPAIMAVAGIAIGLHGD-LLRIAIVQ------------AALPQGIVPFVFAKEYNVHPTILSTGVIFGMLIA
+LPITLVYY
+>PIN7_ARATH/9-614
+TVLTAVIPLYVAMILA-YGSVRWWKIFSPDQCSGINRFVAIFAVPLLSFHFISSNNPYAMNLRFIAADTLQK
+LIMLTLLIIWANFTR---SGSLEWSITIFSLSTLPNTLVMGIPLLIAMYGE-------------------YS
+GSLMVQIVVLQCIIWYTLLL------------------FLFEYRGAKILIMEQFP-ETGASIVSFKVESDVV
+SLDGHD-FLETDAQIGDDGKLHVTVRKSNASRRSFYG--------GGGTNMTPRPSNLTGAEIYSL----NT
+TPRGSNFNHSDFY---------------SMMGFPGGRLSNFGPADMY-------------SVQSSRGPTPRP
+SNFEESCAMASSPRFGYYPGGAPGSYPAPNPEFSTGNKTGSKAPKENHHHVGKSNSNDAKELHMFVWGSNGS
+PV-----SDRAGLQVDNGANEQVGKSDQGGAKEIRMLISDHTQNGENKAGPMNGDYGGEEESERVKEVPNGL
+HKLRCNSTAELNPKEAIETGETVPVKHMPPASVMTRLILIMVWRKLIRNPNTYSSLIGLIWALV-AFRWDVA
+MP------------KIIQQSISILSDAGLGMAMFSLGLFMALQPKLIACGNSTATFA--------MAVRFFT
+GPAVMAVAAMAIGLRGD-LLRVAIVQ------------AALPQGIVPFVFAKEYNVHPAILSTGVIFGMLIA
+LPITLVYY
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/seed2.aln	Mon Jul 14 18:16:36 2025 +0000
@@ -0,0 +1,216 @@
+>PINI_ARATH/9-617
+HVMTAMVPLYVAMILA-YGSVKWWKIFTPDQCSGINRFVALFAVPLLSFHFIAANNPYAMNLRFLAADSLQK
+VIVLSLLFLWCKLSR---NGSLDWTITLFSLSTLPNTLVMGIPLLKGMYGN-------------------FS
+GDLMVQIVVLQCIIWYTLML------------------FLFEYRGAKLLISEQFP-DTAGSIVSIHVDSDIM
+SLDGRQ-PLETEAEIKEDGKLHVTVRRSNASRSDIYS-----RRSQGL-SATPRPSNLTNAEIYSLQSSRNP
+TPRGSSFNHTDFY---------------SMMASGGGRNSNFGPGEA---------------VFGSKGPTPRP
+SNYEEDGGPAKPTAAGTAAGAGRFHYQSGGSGGGGGAHYPAPNPGMFSPNTGGGGGTAAKGNAPVVGGKRQD
+GN------GRDLHMFVWSSSASPVSDVFGGGGGNHHADYSTATNDHQKDVKISVPQGNSNDNQYVEREEFSF
+GNKDDDSKVLATDGGNNISNKTTQAKVMPPTSVMTRLILIMVWRKLIRNPNSYSSLFGITWSLI-SFKWNIE
+MP------------ALIAKSISILSDAGLGMAMFSLGLFMALNPRIIACGNRRAAFA--------AAMRFVV
+GPAVMLVASYAVGLRGV-LLHVAIIQ------------AALPQGIVPFVFAKEYNVHPDILSTAVIFGMLIA
+LPITLLYY
+>Q9FVF6_POPPZ/9-609
+HVMTAMVPLYVAMILA-YGSVKWWKIFTPDQCSGINRFVALFAVPLLSFHFISTNDPYNMNLRFITADSLQK
+VIVLVVLALWTKLSK---RGCLEWTITLFSLSTLPNTLVMGIPLLKGMYGD-------------------YS
+GSLMVQVVVLQCIIWYTLML------------------FMFEYRGAKLLISEQFP-DTAGSIVSIHVDSDIM
+SLDGRQ-PLETEAAIKEDGKLHVTVRKSNASRSDIFS-----RRSQGLSSTTPRPSNLTNAEIYSLQSSRNP
+TPRGSSFNHTDFY---------------SMMA--AGRNSNFGASDVY-------------GLSASRGPTPRP
+SNFEEEHGGSNKPRFHHYHAPGGATHYPAPNPGMFSPTTAASKGVSANANNAAAAAAKKPNGQAQQKAED--
+-----------GRDLHMFVWSSSASPVSDVFGGHDYGAHDLKDVRVAVSPGKVEGQRENQEDYNLERDDFSF
+GNRGLDRERNSHEGEKGGFD--GKPKAMPPTSVMTRLILIMVWRKLIRNPNTYSSLIGLIWSLV-SFRWNVK
+MP------------LIIAKSISILSDAGLGMAMFSLGLFMALQPRIIACGNSIATFS--------MAVRFLT
+GPAIMAAASIAVGIRGT-LLHIAIVQ------------AALPQGIVPFVFAKEYNVHPEILSTGVIFGMLIA
+LPITLVYY
+>B8AIF2_ORYSI/9-590
+HVMTAMVPLYVAMILA-YGSVKWWRIFTPDQCSGINRFVALFAVPLLSFHFISTNNPYTMNLRFIAADTLQK
+LMVLAMLTAWSHLSR---RGSLEWTITLFSLSTLPNTLVMGIPLLKGMYGE-------------------FS
+GSLMVQIVVLQCIIWYTLML------------------FMFEYRGARMLITEQFP-DTAANIASIVVDPDVV
+SLDGRRDAIETETEVKEDGRIHVTVRRSNASRSDIYS-----RRSMGFSSTTPRPSNLTNAEIYSLQSSRNP
+TPRGSSFNHTDFY---------------SMV----GRSSNFGAADA---------------FGVRTGATPRP
+SNYEDDASKPKYPLPASNAAPMAGHYPAPNPAVSSAPKGAKKAATNGQAKGEDLHMFVWSS-----------
+--------------------SASPVSDVFGGGAPDYNDAAAVKSPRKMDGAKDREDYVERDDFSFGNRGVMD
+RDAEAGDEKAAAAAGADPSKAMAAPTAMPPTSVMTRLILIMVWRKLIRNPNTYSSLIGLIWSLV-CFRWNFE
+MP------------AIVLKSISILSDAGLGMAMFSLGLFMALQPHIIACGNKVATYA--------MAVRFLA
+GPAVMAAASFAVGLRGT-LLHVAIVQ------------AALPQGIVPFVFAKEYSVHPSILSTAVIFGMLIA
+LPITLVYY
+>PIN6_ARATH/9-565
+TVMCAMAPLYFAMFVA-YGSVKWCKIFTPAQCSGINRFVSVFAVPVLSFHFISQNNPYKMDTMFILADTLSK
+IFVFVLLSLWAVFFK---AGGLDWLITLFSIATLPNTLVMGIPLLQAMYGD-------------------YT
+QTLMVQLVVLQCIIWYTLLL------------------FLFELRAARLLIRAEFPGQAAGSIAKIQVDDDVI
+SLDGMD-PLRTETETDVNGRIRLRIRRSVSSVPDSVMSSSLC--------LTPRASNLSNAEIFSVN-----
+-----TPNNRFFHGGGGSGTLQFYNGSNEIMF-CNGDLGGFGFTRPGLGASPRRLSGYASSDAYSLQPTPRA
+SNFNELDVNGNGTPVWMKSPAAGRIYRQSSPKMMWESGQRHAAK----------------------------
+--------------------------------------DINGSVPEKEISFRDALKAAPQATAAGGGASMEE
+GAAGKDTTPVA-AIG-K-QE-------MPSAIVMMRLILTVVGRKLSRNPNTYSSLLGLVWSLI-SFKWNIP
+MP------------NIVDFSIKIISDAGLGMAMFSLGLFMALQPKMIPCGAKKATMG--------MLIRFIS
+GPLFMAGASLLVGLRGS-RLHAAIVQ------------AALPQGIVPFVFAREYNLHPDLLSTLVIFGMIVS
+LPVTILYY
+>YFDV_ECOLI/4-307
+FFIGDLLPIIVIMLLG-YFSGRR-ETFSEDQARAFNKLVLNYALPAALFVSITRANREMIFADTRLTLVSLV
+VIVGCFFFSWFGCYK-FFKRTHAEAAVCALIAGSPTIGFLGFAVLDPIYGD----------------SVSTG
+LVVAIISIIVNAITIPIGLY------------------LLNPSSGADGKK----------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------NSNLSALISAAKEPVVWAPVLATILVLV-GVKIP--
+--------------AAWDPTFNLIAKANSGVAVFAAGLTLAAHKFEFSAEIAYN-----------TFLKLIL
+MPLALLLVGMACHLNSE-HLQMMVLA------------GALPPAFSGIIIASRFNVYTRTGTASLAVSVLGF
+VVTAPLWI
+>YWKB_BACSU/5-315
+DILILLAPIFFVIVLG-WFAGHF-GSYDAKSAKGVSTLVTKYALPAHFIAGILTTSRSEFLSQVPLMISLII
+GIVGFYIIILLVCRF-IFKYDLTNSSVFSLNSAQPTFAFMGIPVLGSLFGA-------------------NE
+VAIPIAVTGIVVNAILDPLA------------------IIIATVGESSKKNEESGD----------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+---------------------------------SFWKMTGKSILHGLCEPLAAAPLISMILVLVFNFTLP--
+--------------ELGVKMLDQLGSTTSGVALFAVGVTVGIRKIKLSMPAIG-----------IALLKVAV
+QPALMFLIALAIGLPADQTTKAILL-------------VAFPGSAVAAMIATRFEKQEEETATAFVVSAILS
+LISLPIII
+>P71425_KLEPN/4-313
+VIIHALAPIFVIMLLG-FWAGKA-GMVDNKNVSLLNIFVMDFALPATLFSATVQTPWAGIVAQSPLVLVLTG
+AMWITYAAIYFLATS-VFKRTPQDGAVLTLTVALPNYAALGLPILGSVLGE------------------GAS
+TSLSVAVSIACGSVLMTPFC------------------LLILEREKARAAGENSG-----------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+---------------------------------STLAMLPVLMWRSVKKPIVWGPLLGVVLSAI-GIKMP--
+--------------DLLLASIKPLGLAATAAALFLTGVILSARKLQLNALIAAS-----------TIVKLLV
+QPFIAWGLVMLLGLHGSIAITAILM-------------IALAAGFFGVVFGNRFGVQSPDAEAVLLLSSVLC
+ILSLPLFI
+>Q98L58_RHILO/3-308
+PLTETVLFVFSLVALG-YLAGLT-GYLRPASGEGISDFAVSVAMPLLLFQTMVKADFHG--VAPWPLWGAYF
+TAVAITWAAGHLVTTRIFGRDARAGVVGGVSSAYSNVVLLGAPFILGIFGP-----------------SGFE
+VLSLLVSVHLPVMMMASIVL------------------FEMFGRGGGEHV----------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+---------------------------------HPLRVLRSFLRRLFINPLIIGILLGLAWRLS-GVPLP--
+--------------SLVMRLVDALANTAGPVALFAMGLSLRRFGVSGNVRPALA----------LSALKLFL
+MPALVLAFVLLLGLPPL-TAKVAVVV------------AALPSGINSYLIAVQFNTGQALASNQMTIATACA
+AVTTAFWL
+>O67397_AQUAE/2-289
+FIYEKVFFILLIIAFA-YTLKRG-GIFKEEHALPFINYVIYFALPFTIFKNLRF---LEIGKEVLGVVLIAW
+GAIFLSILFAFLFGK-FLKLEEKTLRAFLLVSSFGNTAFMGYPFLYALEGN-------------------EG
+LKYAILYDQLGSFLMVITLG----------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+---------------------------------LFLAIGKFDLKELILFPPFIALVLSFLLHGV-RFP----
+--------------QFFEHSVEIISGSLIPVILFSLGLRLNFTDMKSDYRTLFSA----------LFIKMFL
+VPLLILVFLKIFGLTSL-PYRVALIE------------SAMPPMVFAGVLALKYELDFRLAFSAITLGIVIS
+LFTVPVFR
+>Q97M34_CLOAB/2-296
+YVFEQIVILFLIMGIG-YYAAKS-KIIDDDTTSHLSNFIVSITLPLMILTSFNVEYSRKTVITIINLLVFSV
+AAFIISIVIGKII---SFKFAMDKRDILMFMSIFSNCGFIGFPVLKVVYGN-------------------KG
+VLYTSIFNLVYNVFIWTIGI------------------VIINDKREKIDY----------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+-------------------------------------------KKILFNHNIIAVIVGVFLMLL-SIKIP--
+--------------YVMSSAFNLIGSMTAPLSMIVIGSILA--------GVDFNDIFKDWSLYYIAILRLII
+IPLIIYFALKPFQINKI-VIGVIIIC------------EAMPGGTLCPILAKSCNRNFKYASKIVLITTILS
+MMTIPFMT
+>YB8B_YEAST/13-413
+LVFESVLQVVIIALAG-FWSASS-GLLPKQSQKIISLLNVDLFTPCLIFSKLAKSLSMAKIFEIAIIPIFFG
+LTTGISFISGKIMSR-ILDLDKDETNFVVANSVFGNSNSLPVSLTLSLAYTLPNLTWDQIPNDNRDNVASRG
+ILYLLIFQQIGQMLRWSWGY------------------NKLMKWSGENTQHMPPSQVQSLLERTPNIDNEEL
+VNEEQEEQELLEEENNRMNSSFLSSSSIGDKIWQKSCTVFER------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+-------------------------------------------IRANLNPPLYSMIFAVVVAAI-GPLQREL
+F------MEDGFINNTFAEAVTQLGSVSIPLILVVLGSNLYPSA-----EVFPKTVHHSKLLIGSIIGRMIL
+PSCFLLPIIAIAV-----KYINVSILDDPIFLVVGFLLTVSPPAIQLTQITQLNEFFEAEMADILFWGYAVL
+SLPVSIIV
+>YDQ4_SCHPO/18-440
+PIIESDLEVIVIALGG-YVLAKK-GFLPRDAQKVISSLNVYFFTPCLVFEKVGNGLNLKMLIDLSLLPVFYV
+IISAASILISFLLAK-LFRLTPRQRNFATACITFQNSNSLPLALVSSLATTVKDLLWDKIPDDTPDKVASRG
+IMYLLIFSQLGQALRWSYGY------------------RILLSPNQPEDPLPIGNRSWSHSDVNEEEIQNLL
+ASSANVDGVQNSVQANEGSTVQTDSSAISKNDNVQVETSNEEVGGFGAASSKISK-----------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+---------------------------------------FIVLLLDFFSPPLYSLFIALFIAVV-PPLQRFF
+F------EEGSFVEGSITSGIRMAGQVAVPMILVVLGASLATDISKTEPTQEVRKNNDTRVIIVCLLGRMVV
+VPLALLPAFSLLS-----YFSEISTVDDPVFVVVIFLLVGSPTAIQLTQICQLNGVFERECAKVLWWSYAVF
+TPPNSLLL
+>PILS4_ARATH/9-407
+ASSKPVVETLLITSVGFYLALDTVNLLGHDARKHLNNIVFYVFSPSLIGSRLADSVTYESLVKMWFMPVNVL
+LTFMIGSLLGWIVIV-ITKPPSQLRGLIISCCASGNLGTMPLIIIPAICKE------KGGPFGDSESCEKYG
+MGYVTLSMT--AFFISVYKHDTNWYVSGGNGLLMDLYINLMR------VLSNSPVETHTHSIESNYDDSCKV
+QLISSK------------------------------------------EEEKEEDNHQVGRWEEVKQ-----
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+---------------------------------RVVSLSKKVNLGSIFAPATIAAIIALVIGLI-TPLRNLI
+IGTVAPF-------RVIQDSLTLLGDGAIPAMTLILGGNLLKGMRRSEVRSSEMKNSCIIGV---LVARYIL
+LPVSGVLLVRGAY------KLDLVTS-EPLYQFVLLLQYAVPPAMNLGTKTQLFGAGESECSVIMLWTYSLA
+AVSLTVWP
+>PILS5_ARATH/9-388
+VASMPVIQVLFMSLVGAFMASDRCKLFPVEARNSMNKVVFVLFAPALMFANLAQTVTLEDIISWWFMPVNMG
+LTFLIGGLLGWLVVK-ILKPPPYLEGLIVATCSAGNMGNLPIILVPAICDE------DKSPFGNRSVCRTVG
+LSYASFSMALGGFYIWTYTF------------------RLIKGSAMKVQAIEESEKIAIKSSNSDLEADHKT
+HLLGAP-----------------------------------------EDKENKVVKEKTGFWRKGVD-----
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+---------------------------------FLHEI-----LEELLAPPTLGAIIGFIFGAV-RWLRNLI
+IGDDAPL-------RIVQSTAKLLGDGTIPCMTIILGGNLIQG-----LRSSAVKPMVVLGI---VCVRYIA
+MPIIGIGIVLTAA------NLGFLPA-DPLFQYVLMLQFTLPPAMNIGTMTQLYNVAQDECSVLMLWTYLVA
+ILALTVWS
+>PILS2_ARATH/18-441
+SGVVPLLKLICLTVIGLLLAHPKTQLVPRATFRLLSKLVFALFLPCLIFTELGESITLDNIVQWWFIPVNVL
+LSAVVGSLIGYLVVL-ICRPPPEFNRFTIVMTAFGNTGNLLLAIVSSVCHT--------KTNPFGPNCNSRG
+VSYVSFAQWVAVILVYTVVY------------------HMMEPPLEYYEVVEEEG-VEIEEINVENHDASRP
+LLVEAEWPGIEDKETEHCKTPFIARVFNSISSFSQTSFPEVDLGGEYGGESSSPRSIQCLAEPRVMR-----
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+---------------------------------RIRVVAEQTPVKHILQPPTIASLLAIIIGSV-PQLKSVV
+FGYDAPL-------SFITDSLNIMGSAMVPSVMLVLGGMLSEGPNESTLGLRTTIGI--------SVARLLV
+LPLVGIGIVMSAD------KLGLISSADPMFKFVLLLQYSTPSAILLGAIASLRGYAVREASALLFWQHIFA
+LLSLTFYI
+>PILS6_ARATH/30-423
+IAVMPIAKVFTMCFLGLLMASKYVNILPPSGRKLLNGLVFSLLLPCLIFSQLGQAVTLQKMLQWWFIPVNVV
+LGTISGSIIGFIVAS-IVRPPYPYFKFTIIQIGVGNIGNVPLVLLAALCRD------TSNPFGDSEKCSIDG
+TAYISFGQWVGAIILYTYVY------------------QMFAPPPEGFDAEEENLALKTLPVDAAPEQVPLL
+TQNFPKDFSPTQDL--------------------------------LPVQSTEPRGRGVSRKGKIAQ-----
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+------------------------------------------------------------------------
+---------------------------------IFVFLYEKLKLKQIVQPAIVASILAMILGAI-PFTKKLI
+FTNGAPL-------FFFTDSCMILGDAMIPCILLALGGNLINGPGSSKLGFKTTAAI--------IIGRLVL
+VPPVGLGIVTVAD------KLGFLPADDKMFRFVLLLQHTMPTSVLSGAVANLRGCG-RESAAVLFWVHIFA
+IFSMAGWM
+>PIN4_ARATH/9-611
+TVLTAVVPLYVAMILA-YGSVQWWKIFSPDQCSGINRFVAIFAVPLLSFHFISTNDPYAMNFRFVAADTLQK
+IIMLVLLALWANLTK---NGSLEWMITIFSLSTLPNTLVMGIPLLIAMYGT-------------------YA
+GSLMVQVVVLQCIIWYTLLL------------------FLFEYRGAKLLIMEQFP-ETGASIVSFKVESDVV
+SLDGHD-FLETDAEIGNDGKLHVTVRKSNASRRSLMM--------------TPRPSNLTGAEIYSLS----S
+TPRGSNFNHSDFY---------------SVMGFPGGRLSNFGPADLY-------------SVQSSRGPTPRP
+SNFEENNAVKYGFYNNTNSSVPAAGSYPAPNPEFSTGTGVSTKPNKIPKENQQQLQEKDSKASHDAKELHMF
+VWSSSASPVSDVFGGGAGDNVATEQSEQGAKEIRMVVSDQPRKSNARGGGDDIGGLDSGEGEREIEKATAGL
+NKMGSNSTAELEAAG-G-DGGGNNGTHMPPTSVMTRLILIMVWRKLIRNPNTYSSLIGLIWALV-AYRWHVA
+MP------------KILQQSISILSDAGLGMAMFSLGLFMALQPKIIACGNSVATFA--------MAVRFIT
+GPAIMAVAGIAIGLHGD-LLRIAIVQ------------AALPQGIVPFVFAKEYNVHPTILSTGVIFGMLIA
+LPITLVYY
+>PIN7_ARATH/9-614
+TVLTAVIPLYVAMILA-YGSVRWWKIFSPDQCSGINRFVAIFAVPLLSFHFISSNNPYAMNLRFIAADTLQK
+LIMLTLLIIWANFTR---SGSLEWSITIFSLSTLPNTLVMGIPLLIAMYGE-------------------YS
+GSLMVQIVVLQCIIWYTLLL------------------FLFEYRGAKILIMEQFP-ETGASIVSFKVESDVV
+SLDGHD-FLETDAQIGDDGKLHVTVRKSNASRRSFYG--------GGGTNMTPRPSNLTGAEIYSL----NT
+TPRGSNFNHSDFY---------------SMMGFPGGRLSNFGPADMY-------------SVQSSRGPTPRP
+SNFEESCAMASSPRFGYYPGGAPGSYPAPNPEFSTGNKTGSKAPKENHHHVGKSNSNDAKELHMFVWGSNGS
+PV-----SDRAGLQVDNGANEQVGKSDQGGAKEIRMLISDHTQNGENKAGPMNGDYGGEEESERVKEVPNGL
+HKLRCNSTAELNPKEAIETGETVPVKHMPPASVMTRLILIMVWRKLIRNPNTYSSLIGLIWALV-AFRWDVA
+MP------------KIIQQSISILSDAGLGMAMFSLGLFMALQPKLIACGNSTATFA--------MAVRFFT
+GPAVMAVAAMAIGLRGD-LLRVAIVQ------------AALPQGIVPFVFAKEYNVHPAILSTGVIFGMLIA
+LPITLVYY